{"id":16087,"date":"2024-01-20T16:33:29","date_gmt":"2024-01-20T13:03:29","guid":{"rendered":"https:\/\/rasanegar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/"},"modified":"2024-01-20T16:33:29","modified_gmt":"2024-01-20T13:03:29","slug":"%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9","status":"publish","type":"post","link":"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/","title":{"rendered":"\u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP: \u06a9\u0627\u0631 \u0628\u0627 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 FastText \u0641\u06cc\u0633 \u0628\u0648\u06a9"},"content":{"rendered":"<div id=\"ez-toc-container\" class=\"ez-toc-v2_0_85 counter-hierarchy ez-toc-counter ez-toc-custom ez-toc-container-direction\">\n<div class=\"ez-toc-title-container\"><p class=\"ez-toc-title\" style=\"cursor:inherit\">\u0633\u0631\u0641\u0635\u0644\u0647\u0627\u06cc \u0645\u0637\u0644\u0628<\/p>\n<\/div><nav><ul class='ez-toc-list ez-toc-list-level-1 ' ><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-1\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/#fasttext_%d8%a8%d8%b1%d8%a7%db%8c_%d8%aa%d8%b4%d8%a7%d8%a8%d9%87_%d9%85%d8%b9%d9%86%d8%a7%db%8c%db%8c\" >FastText \u0628\u0631\u0627\u06cc \u062a\u0634\u0627\u0628\u0647 
\u0645\u0639\u0646\u0627\u06cc\u06cc<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-2\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/#%d9%88%d8%a7%d8%b1%d8%af%d8%a7%d8%aa_%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87_%d9%87%d8%a7\" >\u0648\u0627\u0631\u062f\u0627\u062a \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-3\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/#%d8%ae%d8%b1%d8%a7%d8%b4_%d8%af%d8%a7%d8%af%d9%86_%d9%85%d9%82%d8%a7%d9%84%d8%a7%d8%aa_%d9%88%db%8c%da%a9%db%8c_%d9%be%d8%af%db%8c%d8%a7\" >\u062e\u0631\u0627\u0634 \u062f\u0627\u062f\u0646 \u0645\u0642\u0627\u0644\u0627\u062a \u0648\u06cc\u06a9\u06cc \u067e\u062f\u06cc\u0627<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-4\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/#%d9%be%db%8c%d8%b4_%d9%be%d8%b1%d8%af%d8%a7%d8%b2%d8%b4_%d8%af%d8%a7%d8%af%d9%87_%d9%87%d8%a7\" >\u067e\u06cc\u0634 \u067e\u0631\u062f\u0627\u0632\u0634 \u062f\u0627\u062f\u0647 \u0647\u0627<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-5\" 
href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/#%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%d8%a8%d8%a7%d8%b2%d9%86%d9%85%d8%a7%db%8c%db%8c_%da%a9%d9%84%d9%85%d8%a7%d8%aa\" >\u0627\u06cc\u062c\u0627\u062f \u0628\u0627\u0632\u0646\u0645\u0627\u06cc\u06cc \u06a9\u0644\u0645\u0627\u062a<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-6\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/#%d8%aa%d8%ac%d8%b3%d9%85_%d8%b4%d8%a8%d8%a7%d9%87%d8%aa_%d9%87%d8%a7%db%8c_%da%a9%d9%84%d9%85%d9%87\" >\u062a\u062c\u0633\u0645 \u0634\u0628\u0627\u0647\u062a \u0647\u0627\u06cc \u06a9\u0644\u0645\u0647<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-7\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/#fasttext_%d8%a8%d8%b1%d8%a7%db%8c_%d8%b7%d8%a8%d9%82%d9%87_%d8%a8%d9%86%d8%af%db%8c_%d9%85%d8%aa%d9%86\" >FastText \u0628\u0631\u0627\u06cc \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-8\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/#%d9%85%d8%ac%d9%85%d9%88%d8%b9%d9%87_%d8%af%d8%a7%d8%af%d9%87\" 
>\u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-9\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/#%d9%86%d8%b5%d8%a8_fasttext\" >\u0646\u0635\u0628 FastText<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-10\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/#%d8%b7%d8%a8%d9%82%d9%87_%d8%a8%d9%86%d8%af%db%8c_%d9%85%d8%aa%d9%86\" >\u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-11\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%da%a9%d8%a7%d8%b1-%d8%a8%d8%a7-%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87-fasttext-%d9%81%db%8c%d8%b3-%d8%a8%d9%88%da%a9\/#%d9%86%d8%aa%db%8c%d8%ac%d9%87\" >\u0646\u062a\u06cc\u062c\u0647<\/a><\/li><\/ul><\/nav><\/div>\n<span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 12<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span><p> <br \/>\n<\/p>\n<div><noscript><\/noscript><\/p>\n<p>\u0627\u06cc\u0646 \u0628\u06cc\u0633\u062a\u0645\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0632 \u0633\u0631\u06cc \u0645\u0642\u0627\u0644\u0627\u062a \u0645\u0646 \u0627\u0633\u062a 
\u0631\u0648\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP.  \u062f\u0631 \u0686\u0646\u062f \u0645\u0642\u0627\u0644\u0647 \u0627\u062e\u06cc\u0631\u060c \u062a\u06a9\u0646\u06cc\u06a9 \u0647\u0627\u06cc \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0639\u0645\u06cc\u0642 \u0631\u0627 \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0627\u0646\u0648\u0627\u0639 \u0648\u0638\u0627\u06cc\u0641 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 \u0628\u0631\u0631\u0633\u06cc \u06a9\u0631\u062f\u0647 \u0627\u06cc\u0645 \u0648 \u0647\u0645\u0686\u0646\u06cc\u0646 \u0628\u0627\u06cc\u062f \u0628\u0627 \u0645\u0641\u0647\u0648\u0645 \u062c\u0627\u0633\u0627\u0632\u06cc \u06a9\u0644\u0645\u0627\u062a \u0622\u0634\u0646\u0627 \u0628\u0627\u0634\u06cc\u062f.  \u062c\u0627\u0633\u0627\u0632\u06cc \u06a9\u0644\u0645\u0647 \u0631\u0627\u0647\u06cc \u0628\u0631\u0627\u06cc \u062a\u0628\u062f\u06cc\u0644 \u0627\u0637\u0644\u0627\u0639\u0627\u062a \u0645\u062a\u0646\u06cc \u0628\u0647 \u0634\u06a9\u0644 \u0639\u062f\u062f\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0647 \u0646\u0648\u0628\u0647 \u062e\u0648\u062f \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0648\u0631\u0648\u062f\u06cc \u0628\u0647 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u0647\u0627\u06cc \u0622\u0645\u0627\u0631\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0634\u0648\u062f.  
\u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0645\u0646 \u0631\u0648\u06cc \u062c\u0627\u0633\u0627\u0632\u06cc \u06a9\u0644\u0645\u0647\u060c \u0645\u0646 \u062a\u0648\u0636\u06cc\u062d \u062f\u0627\u062f\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u062c\u0627\u0633\u0627\u0632\u06cc \u0647\u0627\u06cc \u06a9\u0644\u0645\u0647 \u062e\u0648\u062f \u0631\u0627 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645 \u0648 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0632 \u062c\u0627\u0633\u0627\u0632\u06cc \u0647\u0627\u06cc \u06a9\u0644\u0645\u0647 \u062f\u0627\u062e\u0644\u06cc \u0645\u0627\u0646\u0646\u062f <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/nlp.stanford.edu\/projects\/glove\/\">GloVe<\/a> \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0642\u0635\u062f \u062f\u0627\u0631\u06cc\u0645 \u0628\u0647 \u0645\u0637\u0627\u0644\u0639\u0647 \u0628\u067e\u0631\u062f\u0627\u0632\u06cc\u0645 <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/fasttext.cc\/\" class=\"broken_link\">FastText<\/a> \u06a9\u0647 \u06cc\u06a9\u06cc \u062f\u06cc\u06af\u0631 \u0627\u0632 \u0645\u0627\u0698\u0648\u0644 \u0647\u0627\u06cc \u0628\u0633\u06cc\u0627\u0631 \u0645\u0641\u06cc\u062f \u0628\u0631\u0627\u06cc \u062c\u0627\u0633\u0627\u0632\u06cc \u06a9\u0644\u0645\u0627\u062a \u0648 \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646 \u0627\u0633\u062a.  
FastText \u062a\u0648\u0633\u0637 \u0641\u06cc\u0633 \u0628\u0648\u06a9 \u062a\u0648\u0633\u0639\u0647 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a \u0648 \u0646\u062a\u0627\u06cc\u062c \u0628\u0633\u06cc\u0627\u0631 \u062e\u0648\u0628\u06cc \u0627\u0632 \u062e\u0648\u062f \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0627\u0633\u062a \u0631\u0648\u06cc \u0628\u0633\u06cc\u0627\u0631\u06cc \u0627\u0632 \u0645\u0634\u06a9\u0644\u0627\u062a NLP\u060c \u0645\u0627\u0646\u0646\u062f \u062a\u0634\u062e\u06cc\u0635 \u0634\u0628\u0627\u0647\u062a \u0645\u0639\u0646\u0627\u06cc\u06cc \u0648 \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646.<\/p>\n<p>\u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0628\u0647 \u0637\u0648\u0631 \u062e\u0644\u0627\u0635\u0647 \u0628\u0647 \u0628\u0631\u0631\u0633\u06cc \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 FastText \u0645\u06cc \u067e\u0631\u062f\u0627\u0632\u06cc\u0645.  \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0628\u0647 \u062f\u0648 \u0628\u062e\u0634 \u062a\u0642\u0633\u06cc\u0645 \u0634\u062f\u0647 \u0627\u0633\u062a.  \u062f\u0631 \u0628\u062e\u0634 \u0627\u0648\u0644\u060c \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 FastText \u0646\u0645\u0627\u06cc\u0634 \u0647\u0627\u06cc \u0628\u0631\u062f\u0627\u0631\u06cc \u0627\u06cc\u062c\u0627\u062f \u0645\u06cc \u06a9\u0646\u062f \u06a9\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0628\u0631\u0627\u06cc \u06cc\u0627\u0641\u062a\u0646 \u0634\u0628\u0627\u0647\u062a \u0647\u0627\u06cc \u0645\u0639\u0646\u0627\u06cc\u06cc \u0628\u06cc\u0646 \u06a9\u0644\u0645\u0627\u062a \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0634\u0648\u062f.  
\u062f\u0631 \u0628\u062e\u0634 \u062f\u0648\u0645 \u06a9\u0627\u0631\u0628\u0631\u062f \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 FastText \u0628\u0631\u0627\u06cc \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0648\u0646 \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.<\/p>\n<h2 id=\"fasttextforsemanticsimilarity\"><span class=\"ez-toc-section\" id=\"fasttext_%d8%a8%d8%b1%d8%a7%db%8c_%d8%aa%d8%b4%d8%a7%d8%a8%d9%87_%d9%85%d8%b9%d9%86%d8%a7%db%8c%db%8c\"><\/span>FastText \u0628\u0631\u0627\u06cc \u062a\u0634\u0627\u0628\u0647 \u0645\u0639\u0646\u0627\u06cc\u06cc<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>FastText \u0627\u0632 \u0647\u0631 \u062f\u0648 \u067e\u0634\u062a\u06cc\u0628\u0627\u0646\u06cc \u0645\u06cc \u06a9\u0646\u062f <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Word2vec#CBOW_and_skip_grams\">\u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a \u067e\u06cc\u0648\u0633\u062a\u0647 \u0648 \u0645\u062f\u0644 \u0647\u0627\u06cc Skip-Gram<\/a>.  \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0645\u062f\u0644 skip-gram \u0631\u0627 \u0628\u0631\u0627\u06cc \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0646\u0645\u0627\u06cc\u0634 \u0628\u0631\u062f\u0627\u0631\u06cc \u06a9\u0644\u0645\u0627\u062a \u0627\u0632 \u0645\u0642\u0627\u0644\u0627\u062a \u0648\u06cc\u06a9\u06cc \u067e\u062f\u06cc\u0627 \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645. 
\u0631\u0648\u06cc <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Artificial_intelligence\">\u0647\u0648\u0634 \u0645\u0635\u0646\u0648\u0639\u06cc<\/a>\u060c <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Machine_learning\">\u0641\u0631\u0627\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646<\/a>\u060c <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Deep_learning\">\u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0639\u0645\u06cc\u0642<\/a>\u060c \u0648 <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Artificial_neural_network\">\u0634\u0628\u06a9\u0647 \u0647\u0627\u06cc \u0639\u0635\u0628\u06cc<\/a>.  \u0627\u0632 \u0622\u0646\u062c\u0627\u06cc\u06cc \u06a9\u0647 \u0627\u06cc\u0646 \u0645\u0648\u0636\u0648\u0639\u0627\u062a \u06a9\u0627\u0645\u0644\u0627 \u0645\u0634\u0627\u0628\u0647 \u0647\u0633\u062a\u0646\u062f\u060c \u0645\u0627 \u0627\u06cc\u0646 \u0645\u0648\u0636\u0648\u0639\u0627\u062a \u0631\u0627 \u0628\u0631\u0627\u06cc \u062f\u0627\u0634\u062a\u0646 \u062d\u062c\u0645 \u0642\u0627\u0628\u0644 \u062a\u0648\u062c\u0647\u06cc \u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0628\u0631\u0627\u06cc \u0627\u06cc\u062c\u0627\u062f \u06cc\u06a9 \u0645\u062c\u0645\u0648\u0639\u0647 \u0627\u0646\u062a\u062e\u0627\u0628 \u06a9\u0631\u062f\u06cc\u0645.  
\u062f\u0631 \u0635\u0648\u0631\u062a \u062a\u0645\u0627\u06cc\u0644 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0645\u0648\u0636\u0648\u0639\u0627\u062a \u0628\u06cc\u0634\u062a\u0631\u06cc \u0628\u0627 \u0645\u0627\u0647\u06cc\u062a \u0645\u0634\u0627\u0628\u0647 \u0627\u0636\u0627\u0641\u0647 \u06a9\u0646\u06cc\u062f.<\/p>\n<p>\u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0627\u0648\u0644\u06cc\u0646 \u0642\u062f\u0645\u060c \u0645\u0627 \u0646\u06cc\u0627\u0632 \u062f\u0627\u0631\u06cc\u0645 import \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632  \u0645\u0627 \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0648\u06cc\u06a9\u06cc\u200c\u067e\u062f\u06cc\u0627 \u0628\u0631\u0627\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f \u06a9\u0647 \u0627\u0632 \u0637\u0631\u06cc\u0642 \u062f\u0633\u062a\u0648\u0631 \u0632\u06cc\u0631 \u0642\u0627\u0628\u0644 \u062f\u0627\u0646\u0644\u0648\u062f \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-meta\">$<\/span><span class=\"bash\"> pip install wikipedia<\/span>\n<\/code><\/pre>\n<h3 id=\"importinglibraries\"><span class=\"ez-toc-section\" id=\"%d9%88%d8%a7%d8%b1%d8%af%d8%a7%d8%aa_%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87_%d9%87%d8%a7\"><\/span>\u0648\u0627\u0631\u062f\u0627\u062a \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632 \u0631\u0627 \u0628\u0647 \u0628\u0631\u0646\u0627\u0645\u0647 \u0645\u0627 \u0648\u0627\u0631\u062f \u0645\u06cc \u06a9\u0646\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">from<\/span> keras.preprocessing.text <span 
class=\"hljs-keyword\">import<\/span> Tokenizer\n<span class=\"hljs-keyword\">from<\/span> gensim.models.fasttext <span class=\"hljs-keyword\">import<\/span> FastText\n<span class=\"hljs-keyword\">import<\/span> numpy <span class=\"hljs-keyword\">as<\/span> np\n<span class=\"hljs-keyword\">import<\/span> matplotlib.pyplot <span class=\"hljs-keyword\">as<\/span> plt\n<span class=\"hljs-keyword\">import<\/span> nltk\n<span class=\"hljs-keyword\">from<\/span> string <span class=\"hljs-keyword\">import<\/span> punctuation\n<span class=\"hljs-keyword\">from<\/span> nltk.corpus <span class=\"hljs-keyword\">import<\/span> stopwords\n<span class=\"hljs-keyword\">from<\/span> nltk.tokenize <span class=\"hljs-keyword\">import<\/span> word_tokenize\n<span class=\"hljs-keyword\">from<\/span> nltk.stem <span class=\"hljs-keyword\">import<\/span> WordNetLemmatizer\n<span class=\"hljs-keyword\">from<\/span> nltk.tokenize <span class=\"hljs-keyword\">import<\/span> sent_tokenize\n<span class=\"hljs-keyword\">from<\/span> nltk <span class=\"hljs-keyword\">import<\/span> WordPunctTokenizer\n\n<span class=\"hljs-keyword\">import<\/span> wikipedia\n<span class=\"hljs-keyword\">import<\/span> nltk\nnltk.download(<span class=\"hljs-string\">'punkt'<\/span>)\nnltk.download(<span class=\"hljs-string\">'wordnet'<\/span>)\nnltk.download(<span class=\"hljs-string\">'stopwords'<\/span>)\nen_stop = <span class=\"hljs-built_in\">set<\/span>(nltk.corpus.stopwords.words(<span class=\"hljs-string\">'english'<\/span>))\n\n%matplotlib inline\n<\/code><\/pre>\n<p>\u0645\u06cc \u0628\u06cc\u0646\u06cc\u062f \u06a9\u0647 \u0645\u0627 \u0627\u0632 \u0622\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645 <code>FastText<\/code> \u0645\u0627\u0698\u0648\u0644 \u0627\u0632 <code>gensim.models.fasttext<\/code> \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647  \u0628\u0631\u0627\u06cc \u0628\u0627\u0632\u0646\u0645\u0627\u06cc\u06cc \u06a9\u0644\u0645\u0647 \u0648 
\u0634\u0628\u0627\u0647\u062a \u0645\u0639\u0646\u0627\u06cc\u06cc\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646 \u0627\u0632 \u0645\u062f\u0644 Gensim \u0628\u0631\u0627\u06cc FastText \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.  \u0627\u06cc\u0646 \u0645\u062f\u0644 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0627\u062c\u0631\u0627 \u0634\u0648\u062f \u0631\u0648\u06cc \u0648\u06cc\u0646\u062f\u0648\u0632\u060c \u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u0628\u0631\u0627\u06cc \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646\u060c \u0645\u0627 \u0628\u0627\u06cc\u062f \u0627\u0632 \u067e\u0644\u062a \u0641\u0631\u0645 \u0644\u06cc\u0646\u0648\u06a9\u0633 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645.  \u0622\u0646 \u0631\u0627 \u062f\u0631 \u0628\u062e\u0634 \u0628\u0639\u062f\u06cc \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f.<\/p>\n<h3 id=\"scrapingwikipediaarticles\"><span class=\"ez-toc-section\" id=\"%d8%ae%d8%b1%d8%a7%d8%b4_%d8%af%d8%a7%d8%af%d9%86_%d9%85%d9%82%d8%a7%d9%84%d8%a7%d8%aa_%d9%88%db%8c%da%a9%db%8c_%d9%be%d8%af%db%8c%d8%a7\"><\/span>\u062e\u0631\u0627\u0634 \u062f\u0627\u062f\u0646 \u0645\u0642\u0627\u0644\u0627\u062a \u0648\u06cc\u06a9\u06cc \u067e\u062f\u06cc\u0627<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u062f\u0631 \u0627\u06cc\u0646 \u0645\u0631\u062d\u0644\u0647\u060c \u0645\u0642\u0627\u0644\u0627\u062a \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632 \u0648\u06cc\u06a9\u06cc\u200c\u067e\u062f\u06cc\u0627 \u0631\u0627 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0645\u06cc\u200c\u06a9\u0646\u06cc\u0645.  
\u0628\u0647 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">artificial_intelligence = wikipedia.page(<span class=\"hljs-string\">\"Artificial Intelligence\"<\/span>).content\nmachine_learning = wikipedia.page(<span class=\"hljs-string\">\"Machine Learning\"<\/span>).content\ndeep_learning = wikipedia.page(<span class=\"hljs-string\">\"Deep Learning\"<\/span>).content\nneural_network = wikipedia.page(<span class=\"hljs-string\">\"Neural Network\"<\/span>).content\n\nartificial_intelligence = sent_tokenize(artificial_intelligence)\nmachine_learning = sent_tokenize(machine_learning)\ndeep_learning = sent_tokenize(deep_learning)\nneural_network = sent_tokenize(neural_network)\n\nartificial_intelligence.extend(machine_learning)\nartificial_intelligence.extend(deep_learning)\nartificial_intelligence.extend(neural_network)\n<\/code><\/pre>\n<p>\u0628\u0631\u0627\u06cc \u062e\u0631\u0627\u0634\u06cc\u062f\u0646 \u0648\u06cc\u06a9\u06cc \u067e\u062f\u06cc\u0627 page\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645 <code>page<\/code> \u0631\u0648\u0634 \u0627\u0632 <code>wikipedia<\/code> \u0645\u062f\u0648\u0644.  \u0646\u0627\u0645 page \u06a9\u0647 \u0645\u06cc \u062e\u0648\u0627\u0647\u06cc\u062f \u0636\u0627\u06cc\u0639 \u06a9\u0646\u06cc\u062f \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u0628\u0647 \u0622\u0646 \u0627\u0631\u0633\u0627\u0644 \u0645\u06cc \u0634\u0648\u062f <code>page<\/code> \u0631\u0648\u0634.  
\u0631\u0648\u0634 \u0628\u0631\u0645\u06cc \u06af\u0631\u062f\u062f <code>WikipediaPage<\/code> \u0634\u06cc\u060c \u06a9\u0647 \u0633\u067e\u0633 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0632 \u0622\u0646 \u0628\u0631\u0627\u06cc \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f page \u0645\u0637\u0627\u0644\u0628 \u0627\u0632 \u0637\u0631\u06cc\u0642 <code>content<\/code> \u0648\u06cc\u0698\u06af\u06cc\u060c \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a.<\/p>\n<p>\u0633\u067e\u0633 \u0645\u062d\u062a\u0648\u0627\u06cc \u062e\u0631\u0627\u0634\u06cc\u062f\u0647 \u0634\u062f\u0647 \u0627\u0632 \u0686\u0647\u0627\u0631 \u0635\u0641\u062d\u0647 \u0648\u06cc\u06a9\u06cc\u200c\u067e\u062f\u06cc\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0622\u0646 \u0628\u0647 \u062c\u0645\u0644\u0627\u062a \u062a\u0628\u062f\u06cc\u0644 \u0645\u06cc\u200c\u0634\u0648\u062f <code>sent_tokenize<\/code> \u0631\u0648\u0634.  \u0631\u0627 <code>sent_tokenize<\/code> \u0645\u062a\u062f \u0644\u06cc\u0633\u062a \u062c\u0645\u0644\u0627\u062a \u0631\u0627 \u0628\u0631\u0645\u06cc \u06af\u0631\u062f\u0627\u0646\u062f.  \u062c\u0645\u0644\u0627\u062a \u0686\u0647\u0627\u0631 \u0635\u0641\u062d\u0647 \u0628\u0647 \u0637\u0648\u0631 \u062c\u062f\u0627\u06af\u0627\u0646\u0647 \u0646\u0634\u0627\u0646\u0647 \u06af\u0630\u0627\u0631\u06cc \u0645\u06cc \u0634\u0648\u0646\u062f.  
\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u062c\u0645\u0644\u0627\u062a \u0627\u0632 \u0686\u0647\u0627\u0631 \u0645\u0642\u0627\u0644\u0647 \u0627\u0632 \u0637\u0631\u06cc\u0642 <code>extend<\/code> \u0631\u0648\u0634.<\/p>\n<h3 id=\"datapreprocessing\"><span class=\"ez-toc-section\" id=\"%d9%be%db%8c%d8%b4_%d9%be%d8%b1%d8%af%d8%a7%d8%b2%d8%b4_%d8%af%d8%a7%d8%af%d9%87_%d9%87%d8%a7\"><\/span>\u067e\u06cc\u0634 \u067e\u0631\u062f\u0627\u0632\u0634 \u062f\u0627\u062f\u0647 \u0647\u0627<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u06af\u0627\u0645 \u0628\u0639\u062f\u06cc \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u062a\u0646\u06cc \u062e\u0648\u062f \u0631\u0627 \u0628\u0627 \u062d\u0630\u0641 \u0639\u0644\u0627\u0626\u0645 \u0646\u06af\u0627\u0631\u0634\u06cc \u0648 \u0627\u0639\u062f\u0627\u062f \u067e\u0627\u06a9 \u06a9\u0646\u06cc\u0645.  \u0647\u0645\u0686\u0646\u06cc\u0646 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u0628\u0647 \u062d\u0631\u0648\u0641 \u06a9\u0648\u0686\u06a9 \u062a\u0628\u062f\u06cc\u0644 \u0645\u06cc \u06a9\u0646\u06cc\u0645.  \u06a9\u0644\u0645\u0627\u062a \u0645\u0648\u062c\u0648\u062f \u062f\u0631 \u062f\u0627\u062f\u0647\u200c\u0647\u0627\u06cc \u0645\u0627 \u0628\u0647 \u0622\u0646\u0647\u0627 \u062a\u0628\u062f\u06cc\u0644 \u062e\u0648\u0627\u0647\u0646\u062f \u0634\u062f root \u0641\u0631\u0645.  
\u0647\u0645\u0686\u0646\u06cc\u0646 \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641 \u0648 \u06a9\u0644\u0645\u0627\u062a \u0628\u0627 \u0637\u0648\u0644 \u06a9\u0645\u062a\u0631 \u0627\u0632 4 \u0627\u0632 \u0645\u062c\u0645\u0648\u0639\u0647 \u062d\u0630\u0641 \u0645\u06cc \u0634\u0648\u0646\u062f.<\/p>\n<p>\u062a\u0627\u0628\u0639 <code>preprocess_text<\/code>\u060c \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u0631 \u0632\u06cc\u0631 \u062a\u0639\u0631\u06cc\u0641 \u0634\u062f\u0647 \u0627\u0633\u062a\u060c \u0648\u0638\u0627\u06cc\u0641 \u067e\u06cc\u0634 \u067e\u0631\u062f\u0627\u0632\u0634 \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u0645\u06cc \u062f\u0647\u062f.<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> re\n<span class=\"hljs-keyword\">from<\/span> nltk.stem <span class=\"hljs-keyword\">import<\/span> WordNetLemmatizer\n\nstemmer = WordNetLemmatizer()\n\n<span class=\"hljs-function\"><span class=\"hljs-keyword\">def<\/span> <span class=\"hljs-title\">preprocess_text<\/span>(<span class=\"hljs-params\">document<\/span>):<\/span>\n        \n        document = re.sub(<span class=\"hljs-string\">r'\\W'<\/span>, <span class=\"hljs-string\">' '<\/span>, <span class=\"hljs-built_in\">str<\/span>(document))\n\n        \n        document = re.sub(<span class=\"hljs-string\">r'\\s+[a-zA-Z]\\s+'<\/span>, <span class=\"hljs-string\">' '<\/span>, document)\n\n        \n        document = re.sub(<span class=\"hljs-string\">r'\\^[a-zA-Z]\\s+'<\/span>, <span class=\"hljs-string\">' '<\/span>, document)\n\n        \n        document = re.sub(<span class=\"hljs-string\">r'\\s+'<\/span>, <span class=\"hljs-string\">' '<\/span>, document, flags=re.I)\n\n        \n        document = re.sub(<span class=\"hljs-string\">r'^b\\s+'<\/span>, <span class=\"hljs-string\">''<\/span>, document)\n\n        \n        document = document.lower()\n\n        \n        tokens = document.split()\n        tokens = 
(stemmer.lemmatize(word) <span class=\"hljs-keyword\">for<\/span> word <span class=\"hljs-keyword\">in<\/span> tokens)\n        tokens = (word <span class=\"hljs-keyword\">for<\/span> word <span class=\"hljs-keyword\">in<\/span> tokens <span class=\"hljs-keyword\">if<\/span> word <span class=\"hljs-keyword\">not<\/span> <span class=\"hljs-keyword\">in<\/span> en_stop)\n        tokens = (word <span class=\"hljs-keyword\">for<\/span> word <span class=\"hljs-keyword\">in<\/span> tokens <span class=\"hljs-keyword\">if<\/span> <span class=\"hljs-built_in\">len<\/span>(word) &gt; <span class=\"hljs-number\">3<\/span>)\n\n        preprocessed_text = <span class=\"hljs-string\">' '<\/span>.join(tokens)\n\n        <span class=\"hljs-keyword\">return<\/span> preprocessed_text\n<\/code><\/pre>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0628\u06cc\u0646\u06cc\u0645 \u06a9\u0647 \u0622\u06cc\u0627 \u062a\u0627\u0628\u0639 \u0645\u0627 \u0628\u0627 \u067e\u06cc\u0634 \u067e\u0631\u062f\u0627\u0632\u0634 \u06cc\u06a9 \u062c\u0645\u0644\u0647 \u0633\u0627\u062e\u062a\u06af\u06cc \u0648\u0638\u06cc\u0641\u0647 \u0645\u0648\u0631\u062f \u0646\u0638\u0631 \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u0645\u06cc \u062f\u0647\u062f:<\/p>\n<pre><code class=\"hljs\">\nsent = preprocess_text(<span class=\"hljs-string\">\"Artificial intelligence, is the most advanced technology of the present era\"<\/span>)\n<span class=\"hljs-built_in\">print<\/span>(sent)\n\n\nfinal_corpus = (preprocess_text(sentence) <span class=\"hljs-keyword\">for<\/span> sentence <span class=\"hljs-keyword\">in<\/span> artificial_intelligence <span class=\"hljs-keyword\">if<\/span> sentence.strip() !=<span class=\"hljs-string\">''<\/span>)\n\nword_punctuation_tokenizer = nltk.WordPunctTokenizer()\nword_tokenized_corpus = (word_punctuation_tokenizer.tokenize(sent) <span class=\"hljs-keyword\">for<\/span> sent <span class=\"hljs-keyword\">in<\/span> final_corpus)\n\n<\/code><\/pre>\n<p>\u062c\u0645\u0644\u0647 
\u0627\u0632 \u067e\u06cc\u0634 \u067e\u0631\u062f\u0627\u0632\u0634 \u0634\u062f\u0647 \u0628\u0647 \u0627\u06cc\u0646 \u0635\u0648\u0631\u062a \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">artificial intelligence advanced technology present\n<\/code><\/pre>\n<p>\u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0628\u06cc\u0646\u06cc\u062f \u06a9\u0647 \u0639\u0644\u0627\u0626\u0645 \u0646\u06af\u0627\u0631\u0634\u06cc \u0648 \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641 \u062d\u0630\u0641 \u0634\u062f\u0647\u200c\u0627\u0646\u062f \u0648 \u062c\u0645\u0644\u0627\u062a \u0628\u0647 \u0635\u0648\u0631\u062a \u06a9\u0644\u0645\u0647\u200c\u0646\u0648\u06cc\u0633\u06cc \u0634\u062f\u0647\u200c\u0627\u0646\u062f.  \u0647\u0645\u0686\u0646\u06cc\u0646 \u06a9\u0644\u0645\u0627\u062a \u0628\u0627 \u0637\u0648\u0644 \u06a9\u0645\u062a\u0631 \u0627\u0632 4 \u0645\u0627\u0646\u0646\u062f &#8220;era&#8221; \u0646\u06cc\u0632 \u062d\u0630\u0641 \u0634\u062f\u0647 \u0627\u0633\u062a.  
\u0627\u06cc\u0646 \u0627\u0646\u062a\u062e\u0627\u0628\u200c\u0647\u0627 \u0628\u0647\u200c\u0637\u0648\u0631 \u062a\u0635\u0627\u062f\u0641\u06cc \u0628\u0631\u0627\u06cc \u0627\u06cc\u0646 \u0622\u0632\u0645\u0648\u0646 \u0627\u0646\u062a\u062e\u0627\u0628 \u0634\u062f\u0647\u200c\u0627\u0646\u062f\u060c \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u06a9\u0644\u0645\u0627\u062a\u06cc \u0628\u0627 \u0637\u0648\u0644\u200c\u0647\u0627\u06cc \u06a9\u0648\u0686\u06a9\u200c\u062a\u0631 \u06cc\u0627 \u0628\u0632\u0631\u06af\u200c\u062a\u0631 \u0631\u0627 \u062f\u0631 \u0645\u062c\u0645\u0648\u0639\u0647 \u0645\u062c\u0627\u0632 \u06a9\u0646\u06cc\u062f.<\/p>\n<h3 id=\"creatingwordsrepresentation\"><span class=\"ez-toc-section\" id=\"%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%d8%a8%d8%a7%d8%b2%d9%86%d9%85%d8%a7%db%8c%db%8c_%da%a9%d9%84%d9%85%d8%a7%d8%aa\"><\/span>\u0627\u06cc\u062c\u0627\u062f \u0628\u0627\u0632\u0646\u0645\u0627\u06cc\u06cc \u06a9\u0644\u0645\u0627\u062a<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0645\u0627 \u0645\u062c\u0645\u0648\u0639\u0647 \u062e\u0648\u062f \u0631\u0627 \u0627\u0632 \u0642\u0628\u0644 \u067e\u0631\u062f\u0627\u0632\u0634 \u06a9\u0631\u062f\u0647 \u0627\u06cc\u0645.  \u0627\u06a9\u0646\u0648\u0646 \u0632\u0645\u0627\u0646 \u0627\u06cc\u062c\u0627\u062f \u0646\u0645\u0627\u06cc\u0634 \u06a9\u0644\u0645\u0627\u062a \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 FastText \u0627\u0633\u062a.  
\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u0628\u062a\u062f\u0627 \u067e\u0627\u0631\u0627\u0645\u062a\u0631\u0647\u0627\u06cc \u0641\u0648\u0642 \u0631\u0627 \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 FastText \u062e\u0648\u062f \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">embedding_size = <span class=\"hljs-number\">60<\/span>\nwindow_size = <span class=\"hljs-number\">40<\/span>\nmin_word = <span class=\"hljs-number\">5<\/span>\ndown_sampling = <span class=\"hljs-number\">1e-2<\/span>\n<\/code><\/pre>\n<p>\u0627\u06cc\u0646\u062c\u0627 <code>embedding_size<\/code> \u0627\u0646\u062f\u0627\u0632\u0647 \u0628\u0631\u062f\u0627\u0631 \u062c\u0627\u0633\u0627\u0632\u06cc \u0627\u0633\u062a.  \u0628\u0647 \u0639\u0628\u0627\u0631\u062a \u062f\u06cc\u06af\u0631\u060c \u0647\u0631 \u06a9\u0644\u0645\u0647 \u062f\u0631 \u067e\u06cc\u06a9\u0631\u0647 \u0645\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06cc\u06a9 \u0628\u0631\u062f\u0627\u0631 60 \u0628\u0639\u062f\u06cc \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f.  \u0631\u0627 <code>window_size<\/code> \u0627\u0646\u062f\u0627\u0632\u0647 \u062a\u0639\u062f\u0627\u062f \u06a9\u0644\u0645\u0627\u062a\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0642\u0628\u0644 \u0648 \u0628\u0639\u062f \u0627\u0632 \u06a9\u0644\u0645\u0647 \u0628\u0631 \u0627\u0633\u0627\u0633 \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f \u0631\u0648\u06cc \u06a9\u0647 \u0628\u0627\u0632\u0646\u0645\u0648\u062f\u0647\u0627\u06cc \u06a9\u0644\u0645\u0647 \u0628\u0631\u0627\u06cc \u06a9\u0644\u0645\u0647 \u06cc\u0627\u062f \u062e\u0648\u0627\u0647\u062f \u06af\u0631\u0641\u062a.  
\u0627\u06cc\u0646 \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u0645\u0634\u06a9\u0644 \u0628\u0647 \u0646\u0638\u0631 \u0628\u0631\u0633\u062f\u060c \u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644 \u062f\u0631 \u0645\u062f\u0644 skip-gram \u06cc\u06a9 \u06a9\u0644\u0645\u0647 \u0631\u0627 \u0628\u0647 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u0648\u0627\u0631\u062f \u0645\u06cc\u200c\u06a9\u0646\u06cc\u0645 \u0648 \u062e\u0631\u0648\u062c\u06cc \u06a9\u0644\u0645\u0627\u062a \u0645\u062a\u0646 \u0627\u0633\u062a.  \u0627\u06af\u0631 \u0627\u0646\u062f\u0627\u0632\u0647 \u067e\u0646\u062c\u0631\u0647 40 \u0628\u0627\u0634\u062f\u060c \u0628\u0631\u0627\u06cc \u0647\u0631 \u0648\u0631\u0648\u062f\u06cc 80 \u062e\u0631\u0648\u062c\u06cc \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f: 40 \u06a9\u0644\u0645\u0647 \u0642\u0628\u0644 \u0627\u0632 \u06a9\u0644\u0645\u0647 \u0648\u0631\u0648\u062f\u06cc \u0648 40 \u06a9\u0644\u0645\u0647 \u0628\u0639\u062f \u0627\u0632 \u06a9\u0644\u0645\u0647 \u0648\u0631\u0648\u062f\u06cc.  
\u0648\u0627\u0698\u0647 embeddings \u0628\u0631\u0627\u06cc \u06a9\u0644\u0645\u0647 \u0648\u0631\u0648\u062f\u06cc \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0627\u06cc\u0646 80 \u06a9\u0644\u0645\u0647 \u062e\u0631\u0648\u062c\u06cc \u0622\u0645\u0648\u062e\u062a\u0647 \u0645\u06cc \u0634\u0648\u062f.<\/p>\n<p>\u0647\u0627\u06cc\u067e\u0631\u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u0628\u0639\u062f\u06cc \u0639\u0628\u0627\u0631\u062a \u0627\u0633\u062a \u0627\u0632 <code>min_word<\/code>\u060c \u06a9\u0647 \u062d\u062f\u0627\u0642\u0644 \u0641\u0631\u06a9\u0627\u0646\u0633 \u06cc\u06a9 \u06a9\u0644\u0645\u0647 \u0631\u0627 \u062f\u0631 \u0645\u062c\u0645\u0648\u0639\u0647 \u0627\u06cc \u06a9\u0647 \u0646\u0645\u0627\u06cc\u0634 \u0647\u0627\u06cc \u06a9\u0644\u0645\u0647 \u0628\u0631\u0627\u06cc \u0622\u0646 \u062a\u0648\u0644\u06cc\u062f \u0645\u06cc \u0634\u0648\u062f \u0631\u0627 \u0645\u0634\u062e\u0635 \u0645\u06cc \u06a9\u0646\u062f.  \u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u06a9\u0644\u0645\u0647 \u0627\u06cc \u06a9\u0647 \u0628\u06cc\u0634\u062a\u0631\u06cc\u0646 \u062a\u06a9\u0631\u0627\u0631 \u0631\u0627 \u062f\u0627\u0631\u062f \u0628\u0627 \u0639\u062f\u062f\u06cc \u06a9\u0647 \u062a\u0648\u0633\u0637 \u06a9\u0644\u0645\u0647 \u0645\u0634\u062e\u0635 \u0634\u062f\u0647 \u0627\u0633\u062a\u060c \u0646\u0645\u0648\u0646\u0647 \u0628\u0631\u062f\u0627\u0631\u06cc \u0645\u06cc \u0634\u0648\u062f <code>down_sampling<\/code> \u0635\u0641\u062a.<\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u06a9\u0646\u0648\u0646 \u062e\u0648\u062f \u0631\u0627 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645 <code>FastText<\/code> \u0645\u062f\u0644\u06cc \u0628\u0631\u0627\u06cc \u0628\u0627\u0632\u0646\u0645\u0627\u06cc\u06cc \u06a9\u0644\u0645\u0627\u062a<\/p>\n<pre><code class=\"hljs\">%%time\nft_model = FastText(word_tokenized_corpus,\n                      size=embedding_size,\n                      
window=window_size,\n                      min_count=min_word,\n                      sample=down_sampling,\n                      sg=<span class=\"hljs-number\">1<\/span>,\n                      <span class=\"hljs-built_in\">iter<\/span>=<span class=\"hljs-number\">100<\/span>)\n<\/code><\/pre>\n<p>\u062a\u0645\u0627\u0645 \u067e\u0627\u0631\u0627\u0645\u062a\u0631\u0647\u0627\u06cc \u0645\u0648\u062c\u0648\u062f \u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0628\u0647 \u062c\u0632 <code>sg<\/code>.  \u0631\u0627 <code>sg<\/code> \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u0646\u0648\u0639 \u0645\u062f\u0644\u06cc \u0631\u0627 \u06a9\u0647 \u0645\u06cc \u062e\u0648\u0627\u0647\u06cc\u0645 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645 \u0631\u0627 \u0645\u0634\u062e\u0635 \u0645\u06cc \u06a9\u0646\u062f.  \u0645\u0642\u062f\u0627\u0631 1 \u0645\u0634\u062e\u0635 \u0645\u06cc \u06a9\u0646\u062f \u06a9\u0647 \u0645\u06cc \u062e\u0648\u0627\u0647\u06cc\u0645 \u0645\u062f\u0644 skip-gram \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645.  \u062f\u0631 \u062d\u0627\u0644\u06cc \u06a9\u0647 \u0635\u0641\u0631 \u0645\u062f\u0644 \u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a \u0631\u0627 \u0645\u0634\u062e\u0635 \u0645\u06cc \u06a9\u0646\u062f \u06a9\u0647 \u0645\u0642\u062f\u0627\u0631 \u067e\u06cc\u0634 \u0641\u0631\u0636 \u0646\u06cc\u0632 \u0645\u06cc \u0628\u0627\u0634\u062f.<\/p>\n<p>\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f  \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u0645\u062f\u062a\u06cc \u0637\u0648\u0644 \u0628\u06a9\u0634\u062f \u062a\u0627 \u0627\u062c\u0631\u0627 \u0634\u0648\u062f.  
\u062f\u0631 \u062f\u0633\u062a\u06af\u0627\u0647 \u0645\u0646 \u0622\u0645\u0627\u0631 \u0632\u0645\u0627\u0646 \u0627\u062c\u0631\u0627\u06cc \u06a9\u062f \u0628\u0627\u0644\u0627 \u0628\u0647 \u0634\u0631\u062d \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">CPU times: user 1min 45s, sys: 434 ms, total: 1min 45s\nWall time: 57.2 s\n<\/code><\/pre>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u06a9\u0646\u0648\u0646 \u06a9\u0644\u0645\u0647 \u0646\u0645\u0627\u06cc\u0646\u062f\u06af\u06cc \u0628\u0631\u0627\u06cc \u06a9\u0644\u0645\u0647 &#8220;\u0645\u0635\u0646\u0648\u0639\u06cc&#8221; \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u0645.  \u0628\u0631\u0627\u06cc \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0632 <code>wv<\/code> \u0631\u0648\u0634 \u0627\u0632 <code>FastText<\/code> \u0634\u06cc\u0621 \u06a9\u0646\u06cc\u062f \u0648 \u0646\u0627\u0645 \u06a9\u0644\u0645\u0647 \u0631\u0627 \u062f\u0631 \u06cc\u06a9 \u0644\u06cc\u0633\u062a \u0627\u0631\u0633\u0627\u0644 \u06a9\u0646\u06cc\u062f.<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-built_in\">print<\/span>(ft_model.wv[<span class=\"hljs-string\">'artificial'<\/span>])\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">[-3.7653010e-02 -4.5558015e-01  3.2035065e-01 -1.5289043e-01\n  4.0645871e-02 -1.8946664e-01  7.0426887e-01  2.8806925e-01\n -1.8166199e-01  1.7566417e-01  1.1522485e-01 -3.6525184e-01\n -6.4378887e-01 -1.6650060e-01  7.4625671e-01 -4.8166099e-01\n  2.0884991e-01  1.8067230e-01 -6.2647951e-01  2.7614883e-01\n -3.6478557e-02  1.4782918e-02 -3.3124462e-01  1.9372456e-01\n  4.3028224e-02 -8.2326338e-02  1.0356739e-01  4.0792203e-01\n -2.0596240e-02 -3.5974573e-02  9.9928051e-02  1.7191900e-01\n -2.1196717e-01  6.4424530e-02 -4.4705093e-02  9.7391091e-02\n -2.8846195e-01  8.8607501e-03  1.6514034e-01 -3.6626378e-01\n 
-6.2017748e-04 -1.5083785e-01 -1.7499258e-01  7.1994811e-02\n -1.9868813e-01 -3.1733567e-01  1.9832127e-01  1.2799081e-01\n -7.6522082e-01  5.2335665e-02 -4.5766738e-01 -2.7947658e-01\n  3.7890410e-03 -3.8761377e-01 -9.3001537e-02 -1.7128626e-01\n -1.2923178e-01  3.9627206e-01 -3.6673656e-01  2.2755004e-01]\n<\/code><\/pre>\n<p>\u062f\u0631 \u062e\u0631\u0648\u062c\u06cc \u0628\u0627\u0644\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u06cc\u06a9 \u0648\u06a9\u062a\u0648\u0631 60 \u0628\u0639\u062f\u06cc \u0628\u0631\u0627\u06cc \u06a9\u0644\u0645\u0647 &#8220;\u0645\u0635\u0646\u0648\u0639\u06cc&#8221; \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0646\u06cc\u062f.<\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u06a9\u0646\u0648\u0646 5 \u06a9\u0644\u0645\u0647 \u0645\u0634\u0627\u0628\u0647 \u0631\u0627 \u0628\u0631\u0627\u06cc \u06a9\u0644\u0645\u0627\u062a &#8220;\u0645\u0635\u0646\u0648\u0639\u06cc&#8221;\u060c &#8220;\u0647\u0648\u0634&#8221;\u060c &#8220;\u0645\u0627\u0634\u06cc\u0646&#8221;\u060c &#8220;\u0634\u0628\u06a9\u0647&#8221;\u060c &#8220;\u062a\u06a9\u0631\u0627\u0631 \u06a9\u0646\u0646\u062f\u0647&#8221;\u060c &#8220;\u0639\u0645\u06cc\u0642&#8221; \u067e\u06cc\u062f\u0627 \u06a9\u0646\u06cc\u0645.  \u0634\u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0647\u0631 \u062a\u0639\u062f\u0627\u062f \u06a9\u0644\u0645\u0647 \u0631\u0627 \u0627\u0646\u062a\u062e\u0627\u0628 \u06a9\u0646\u06cc\u062f.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u06a9\u0644\u0645\u0627\u062a \u0645\u0634\u062e\u0635 \u0634\u062f\u0647 \u0631\u0627 \u0628\u0647 \u0647\u0645\u0631\u0627\u0647 5 \u06a9\u0644\u0645\u0647 \u0645\u0634\u0627\u0628\u0647 \u0686\u0627\u067e \u0645\u06cc \u06a9\u0646\u062f.<\/p>\n<pre><code class=\"hljs\">semantically_similar_words = {words: [item[<span class=\"hljs-number\">0<\/span>] <span class=\"hljs-keyword\">for<\/span> item <span class=\"hljs-keyword\">in<\/span> ft_model.wv.most_similar([words], topn=<span class=\"hljs-number\">5<\/span>)]\n                  <span class=\"hljs-keyword\">for<\/span> words <span class=\"hljs-keyword\">in<\/span> [<span class=\"hljs-string\">'artificial'<\/span>, <span class=\"hljs-string\">'intelligence'<\/span>, <span class=\"hljs-string\">'machine'<\/span>, <span class=\"hljs-string\">'network'<\/span>, <span class=\"hljs-string\">'recurrent'<\/span>, <span class=\"hljs-string\">'deep'<\/span>]}\n\n<span class=\"hljs-keyword\">for<\/span> k,v <span class=\"hljs-keyword\">in<\/span> semantically_similar_words.items():\n    <span class=\"hljs-built_in\">print<\/span>(k+<span class=\"hljs-string\">\":\"<\/span>+<span class=\"hljs-built_in\">str<\/span>(v))\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0628\u0647 \u0635\u0648\u0631\u062a \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">artificial:['intelligence', 'inspired', 'book', 'academic', 'biological']\nintelligence:['artificial', 'human', 'people', 'intelligent', 'general']\nmachine:['ethic', 'learning', 'concerned', 'argument', 'intelligence']\nnetwork:['neural', 'forward', 'deep', 'backpropagation', 'hidden']\nrecurrent:['rnns', 'short', 'schmidhuber', 'shown', 'feedforward']\ndeep:['convolutional', 'speech', 'network', 'generative', 'neural']\n<\/code><\/pre>\n<p>\u0645\u0627 \u0647\u0645\u0686\u0646\u06cc\u0646 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0634\u0628\u0627\u0647\u062a 
\u06a9\u0633\u06cc\u0646\u0648\u0633 \u0628\u06cc\u0646 \u0628\u0631\u062f\u0627\u0631\u0647\u0627 \u0631\u0627 \u0628\u0631\u0627\u06cc \u0647\u0631 \u062f\u0648 \u06a9\u0644\u0645\u0647 \u067e\u06cc\u062f\u0627 \u06a9\u0646\u06cc\u0645\u060c \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u0631 \u0632\u06cc\u0631 \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-built_in\">print<\/span>(ft_model.wv.similarity(w1=<span class=\"hljs-string\">'artificial'<\/span>, w2=<span class=\"hljs-string\">'intelligence'<\/span>))\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0645\u0642\u062f\u0627\u0631 &#8220;0.7481&#8221; \u0631\u0627 \u0646\u0634\u0627\u0646 \u0645\u06cc \u062f\u0647\u062f.  \u0645\u0642\u062f\u0627\u0631 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0628\u06cc\u0646 -1 \u0648 1 \u0628\u0627\u0634\u062f. \u0645\u0642\u062f\u0627\u0631 \u0628\u0627\u0644\u0627\u062a\u0631 \u0628\u0647 \u0645\u0639\u0646\u0627\u06cc \u0634\u0628\u0627\u0647\u062a \u0628\u06cc\u0634\u062a\u0631 \u0627\u0633\u062a.<\/p>\n<h3 id=\"visualizingwordsimilarities\"><span class=\"ez-toc-section\" id=\"%d8%aa%d8%ac%d8%b3%d9%85_%d8%b4%d8%a8%d8%a7%d9%87%d8%aa_%d9%87%d8%a7%db%8c_%da%a9%d9%84%d9%85%d9%87\"><\/span>\u062a\u062c\u0633\u0645 \u0634\u0628\u0627\u0647\u062a \u0647\u0627\u06cc \u06a9\u0644\u0645\u0647<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0627\u06af\u0631\u0686\u0647 \u0647\u0631 \u06a9\u0644\u0645\u0647 \u062f\u0631 \u0645\u062f\u0644 \u0645\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0628\u0631\u062f\u0627\u0631 60 \u0628\u0639\u062f\u06cc \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0632 \u062a\u06a9\u0646\u06cc\u06a9 \u062a\u062d\u0644\u06cc\u0644 \u0645\u0648\u0644\u0641\u0647 \u0627\u0635\u0644\u06cc \u0628\u0631\u0627\u06cc 
\u06cc\u0627\u0641\u062a\u0646 \u062f\u0648 \u062c\u0632\u0621 \u0627\u0635\u0644\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645.  \u0633\u067e\u0633 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 \u062f\u0648 \u062c\u0632\u0621 \u0627\u0635\u0644\u06cc \u0628\u0631\u0627\u06cc \u062a\u0631\u0633\u06cc\u0645 \u06a9\u0644\u0645\u0627\u062a \u062f\u0631 \u06cc\u06a9 \u0641\u0636\u0627\u06cc \u062f\u0648 \u0628\u0639\u062f\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.  \u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u0627\u0628\u062a\u062f\u0627 \u0628\u0627\u06cc\u062f \u0644\u06cc\u0633\u062a\u06cc \u0627\u0632 \u062a\u0645\u0627\u0645 \u06a9\u0644\u0645\u0627\u062a \u0645\u0648\u062c\u0648\u062f \u062f\u0631 \u0622\u0646 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645 <code>semantically_similar_words<\/code> \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a.  \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u0645\u06cc \u062f\u0647\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">from<\/span> sklearn.decomposition <span class=\"hljs-keyword\">import<\/span> PCA\n\nall_similar_words = <span class=\"hljs-built_in\">sum<\/span>([[k] + v <span class=\"hljs-keyword\">for<\/span> k, v <span class=\"hljs-keyword\">in<\/span> semantically_similar_words.items()], [])\n\n<span class=\"hljs-built_in\">print<\/span>(all_similar_words)\n<span class=\"hljs-built_in\">print<\/span>(<span class=\"hljs-built_in\">type<\/span>(all_similar_words))\n<span class=\"hljs-built_in\">print<\/span>(<span class=\"hljs-built_in\">len<\/span>(all_similar_words))\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627\u060c \u062a\u0645\u0627\u0645 \u062c\u0641\u062a\u200c\u0647\u0627\u06cc \u06a9\u0644\u06cc\u062f-\u0645\u0642\u062f\u0627\u0631 \u062f\u0631 
\u0631\u0627 \u062a\u06a9\u0631\u0627\u0631 \u0645\u06cc\u200c\u06a9\u0646\u06cc\u0645 <code>semantically_similar_words<\/code> \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a.  \u0647\u0631 \u06a9\u0644\u06cc\u062f \u062f\u0631 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u06cc\u06a9 \u06a9\u0644\u0645\u0647 \u0627\u0633\u062a.  \u0645\u0642\u062f\u0627\u0631 \u0645\u0631\u0628\u0648\u0637\u0647 \u0641\u0647\u0631\u0633\u062a\u06cc \u0627\u0632 \u062a\u0645\u0627\u0645 \u06a9\u0644\u0645\u0627\u062a \u0645\u0634\u0627\u0628\u0647 \u0645\u0639\u0646\u0627\u06cc\u06cc \u0627\u0633\u062a.  \u0627\u0632 \u0622\u0646\u062c\u0627\u06cc\u06cc \u06a9\u0647 \u0645\u0627 5 \u06a9\u0644\u0645\u0647 \u0645\u0634\u0627\u0628\u0647 \u0631\u0627 \u0628\u0631\u0627\u06cc \u0644\u06cc\u0633\u062a\u06cc \u0627\u0632 6 \u06a9\u0644\u0645\u0647 \u067e\u06cc\u062f\u0627 \u06a9\u0631\u062f\u06cc\u0645\u060c \u06cc\u0639\u0646\u06cc \u00ab\u0645\u0635\u0646\u0648\u0639\u06cc\u00bb\u060c \u00ab\u0647\u0648\u0634\u00bb\u060c \u00ab\u0645\u0627\u0634\u06cc\u0646\u00bb\u060c \u00ab\u0634\u0628\u06a9\u0647\u00bb\u060c \u00ab\u062a\u06a9\u0631\u0627\u0631\u06a9\u0646\u0646\u062f\u0647\u00bb\u060c \u00ab\u0639\u0645\u06cc\u0642\u00bb\u060c \u062e\u0648\u0627\u0647\u06cc\u062f \u062f\u06cc\u062f \u06a9\u0647 30 \u0645\u0648\u0631\u062f \u062f\u0631 \u0627\u06cc\u0646 \u0641\u0647\u0631\u0633\u062a \u0648\u062c\u0648\u062f \u062e\u0648\u0627\u0647\u062f \u062f\u0627\u0634\u062a. 
\u0631\u0627 <code>all_similar_words<\/code> \u0641\u0647\u0631\u0633\u062a<\/p>\n<p>\u062f\u0631 \u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u060c \u0645\u0627 \u0628\u0627\u06cc\u062f \u06a9\u0644\u0645\u0647 \u0628\u0631\u062f\u0627\u0631 \u0631\u0627 \u0628\u0631\u0627\u06cc \u062a\u0645\u0627\u0645 \u0627\u06cc\u0646 30 \u06a9\u0644\u0645\u0647 \u067e\u06cc\u062f\u0627 \u06a9\u0646\u06cc\u0645 \u0648 \u0633\u067e\u0633 \u0627\u0632 PCA \u0628\u0631\u0627\u06cc \u06a9\u0627\u0647\u0634 \u0627\u0628\u0639\u0627\u062f \u0628\u0631\u062f\u0627\u0631\u0647\u0627\u06cc \u06a9\u0644\u0645\u0647 \u0627\u0632 60 \u0628\u0647 2 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645. \u0633\u067e\u0633 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0632 <code>plt<\/code> \u0645\u062a\u062f\u060c \u06a9\u0647 \u0646\u0627\u0645 \u0645\u0633\u062a\u0639\u0627\u0631 <code>matplotlib.pyplot<\/code> \u0631\u0648\u0634 \u0631\u0633\u0645 \u06a9\u0644\u0645\u0627\u062a \u0631\u0648\u06cc \u06cc\u06a9 \u0641\u0636\u0627\u06cc \u0628\u0631\u062f\u0627\u0631\u06cc \u062f\u0648 \u0628\u0639\u062f\u06cc<\/p>\n<p>\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0628\u0631\u0627\u06cc \u062a\u062c\u0633\u0645 \u06a9\u0644\u0645\u0627\u062a \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">word_vectors = ft_model.wv[all_similar_words]\n\npca = PCA(n_components=<span class=\"hljs-number\">2<\/span>)\n\np_comps = pca.fit_transform(word_vectors)\nword_names = all_similar_words\n\nplt.figure(figsize=(<span class=\"hljs-number\">18<\/span>, <span class=\"hljs-number\">10<\/span>))\nplt.scatter(p_comps[:, <span class=\"hljs-number\">0<\/span>], p_comps[:, <span class=\"hljs-number\">1<\/span>], c=<span class=\"hljs-string\">'red'<\/span>)\n\n<span class=\"hljs-keyword\">for<\/span> word_names, x, y <span class=\"hljs-keyword\">in<\/span> <span class=\"hljs-built_in\">zip<\/span>(word_names, 
p_comps[:, <span class=\"hljs-number\">0<\/span>], p_comps[:, <span class=\"hljs-number\">1<\/span>]):\n    plt.annotate(word_names, xy=(x+<span class=\"hljs-number\">0.06<\/span>, y+<span class=\"hljs-number\">0.03<\/span>), xytext=(<span class=\"hljs-number\">0<\/span>, <span class=\"hljs-number\">0<\/span>), textcoords=<span class=\"hljs-string\">'offset points'<\/span>)\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<p><img decoding=\"async\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/Python-for-NLP-Working-with-Facebook-FastText-Library-1.PNG\" alt=\"\" title=\"\"><\/p>\n<p>\u062f\u0631 \u0635\u0641\u062d\u0647 \u062f\u0648\u0628\u0639\u062f\u06cc \u0646\u06cc\u0632 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u06a9\u0644\u0645\u0627\u062a\u06cc \u0631\u0627 \u06a9\u0647 \u0627\u063a\u0644\u0628 \u0628\u0627 \u0647\u0645 \u062f\u0631 \u0645\u062a\u0646 \u0627\u062a\u0641\u0627\u0642 \u0645\u06cc\u200c\u0627\u0641\u062a\u0646\u062f\u060c \u0646\u0632\u062f\u06cc\u06a9 \u0628\u0647 \u0647\u0645 \u0628\u0628\u06cc\u0646\u06cc\u062f.  \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u06a9\u0644\u0645\u0627\u062a &#8220;\u0639\u0645\u06cc\u0642&#8221; \u0648 &#8220;\u0634\u0628\u06a9\u0647&#8221; \u062a\u0642\u0631\u06cc\u0628\u0627\u064b \u0647\u0645\u067e\u0648\u0634\u0627\u0646\u06cc \u062f\u0627\u0631\u0646\u062f.  
\u0628\u0647 \u0647\u0645\u06cc\u0646 \u062a\u0631\u062a\u06cc\u0628\u060c \u06a9\u0644\u0645\u0627\u062a &#8220;\u0641\u06cc\u062f \u0641\u0648\u0631\u0648\u0627\u0631\u062f&#8221; \u0648 &#8220;\u067e\u0633 \u0627\u0646\u062a\u0634\u0627\u0631&#8221; \u0646\u06cc\u0632 \u0628\u0633\u06cc\u0627\u0631 \u0646\u0632\u062f\u06cc\u06a9 \u0647\u0633\u062a\u0646\u062f.<\/p>\n<p>\u0627\u06a9\u0646\u0648\u0646 \u0645\u06cc \u062f\u0627\u0646\u06cc\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 FastText \u062c\u0627\u0633\u0627\u0632\u06cc \u0647\u0627\u06cc \u06a9\u0644\u0645\u0647 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645.  \u062f\u0631 \u0628\u062e\u0634 \u0628\u0639\u062f\u06cc \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 FastText \u0628\u0631\u0627\u06cc \u06a9\u0627\u0631\u0647\u0627\u06cc \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.<\/p>\n<h2 id=\"fasttextfortextclassification\"><span class=\"ez-toc-section\" id=\"fasttext_%d8%a8%d8%b1%d8%a7%db%8c_%d8%b7%d8%a8%d9%82%d9%87_%d8%a8%d9%86%d8%af%db%8c_%d9%85%d8%aa%d9%86\"><\/span>FastText \u0628\u0631\u0627\u06cc \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646 \u0628\u0647 \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u062a\u0646\u06cc \u0628\u0647 \u062f\u0633\u062a\u0647 \u0647\u0627\u06cc \u0627\u0632 \u067e\u06cc\u0634 \u062a\u0639\u0631\u06cc\u0641 \u0634\u062f\u0647 \u0628\u0631 \u0627\u0633\u0627\u0633 \u0627\u0634\u0627\u0631\u0647 \u062f\u0627\u0631\u062f \u0631\u0648\u06cc \u0645\u062d\u062a\u0648\u06cc\u0627\u062a \u0645\u062a\u0646  
\u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a\u060c \u062a\u0634\u062e\u06cc\u0635 \u0647\u0631\u0632\u0646\u0627\u0645\u0647\u060c \u0648 \u062a\u0634\u062e\u06cc\u0635 \u0628\u0631\u0686\u0633\u0628 \u0628\u0631\u062e\u06cc \u0627\u0632 \u0631\u0627\u06cc\u062c \u062a\u0631\u06cc\u0646 \u0646\u0645\u0648\u0646\u0647 \u0647\u0627\u06cc \u0645\u0648\u0627\u0631\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0628\u0631\u0627\u06cc \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646 \u0647\u0633\u062a\u0646\u062f.<\/p>\n<p>\u0645\u0627\u0698\u0648\u0644 \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646 FastText \u0641\u0642\u0637 \u0627\u0632 \u0637\u0631\u06cc\u0642 \u0644\u06cc\u0646\u0648\u06a9\u0633 \u06cc\u0627 OSX \u0642\u0627\u0628\u0644 \u0627\u062c\u0631\u0627 \u0627\u0633\u062a.  \u0627\u06af\u0631 \u06a9\u0627\u0631\u0628\u0631 \u0648\u06cc\u0646\u062f\u0648\u0632 \u0647\u0633\u062a\u06cc\u062f\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/colab.research.google.com\" class=\"broken_link\">Google Colaboratory<\/a> \u0628\u0631\u0627\u06cc \u0627\u062c\u0631\u0627\u06cc \u0645\u0627\u0698\u0648\u0644 \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646 FastText.  
\u062a\u0645\u0627\u0645 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0647\u0627\u06cc \u0627\u06cc\u0646 \u0628\u062e\u0634 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 Google Colaboratory \u0627\u062c\u0631\u0627 \u0634\u062f\u0647 \u0627\u0646\u062f.<\/p>\n<h3 id=\"thedataset\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%ac%d9%85%d9%88%d8%b9%d9%87_%d8%af%d8%a7%d8%af%d9%87\"><\/span>\u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0631\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0632 \u0627\u06cc\u0646\u062c\u0627 \u062f\u0627\u0646\u0644\u0648\u062f \u06a9\u0646\u06cc\u062f <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/www.kaggle.com\/yelp-dataset\/yelp-dataset\/version\/4#yelp_review.csv\" class=\"broken_link\">\u0644\u06cc\u0646\u06a9 \u06a9\u0627\u06af\u0644<\/a>.  \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0634\u0627\u0645\u0644 \u0686\u0646\u062f\u06cc\u0646 \u0641\u0627\u06cc\u0644 \u0627\u0633\u062a\u060c \u0627\u0645\u0627 \u0645\u0627 \u0641\u0642\u0637 \u0628\u0647 \u0622\u0646 \u0639\u0644\u0627\u0642\u0647 \u062f\u0627\u0631\u06cc\u0645 <code>yelp_review.csv<\/code> \u0641\u0627\u06cc\u0644.  
\u0627\u06cc\u0646 \u0641\u0627\u06cc\u0644 \u062d\u0627\u0648\u06cc \u0628\u06cc\u0634 \u0627\u0632 5.2 \u0645\u06cc\u0644\u06cc\u0648\u0646 \u0628\u0631\u0631\u0633\u06cc \u062f\u0631 \u0645\u0648\u0631\u062f \u0645\u0634\u0627\u063a\u0644 \u0645\u062e\u062a\u0644\u0641 \u0627\u0632 \u062c\u0645\u0644\u0647 \u0631\u0633\u062a\u0648\u0631\u0627\u0646 \u0647\u0627\u060c \u06a9\u0627\u0641\u0647 \u0647\u0627\u060c \u062f\u0646\u062f\u0627\u0646\u067e\u0632\u0634\u06a9\u0627\u0646\u060c \u067e\u0632\u0634\u06a9\u0627\u0646\u060c \u0633\u0627\u0644\u0646 \u0647\u0627\u06cc \u0632\u06cc\u0628\u0627\u06cc\u06cc \u0648 \u063a\u06cc\u0631\u0647 \u0627\u0633\u062a. \u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u0628\u0647 \u062f\u0644\u06cc\u0644 \u0645\u062d\u062f\u0648\u062f\u06cc\u062a \u0647\u0627\u06cc \u062d\u0627\u0641\u0638\u0647\u060c \u0645\u0627 \u0641\u0642\u0637 \u0627\u0632 50000 \u0631\u06a9\u0648\u0631\u062f \u0627\u0648\u0644 \u0628\u0631\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u0645\u062f\u0644 \u062e\u0648\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.  
\u062f\u0631 \u0635\u0648\u0631\u062a \u062a\u0645\u0627\u06cc\u0644 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0627 \u0631\u06a9\u0648\u0631\u062f\u0647\u0627\u06cc \u0628\u06cc\u0634\u062a\u0631\u06cc \u0627\u0645\u062a\u062d\u0627\u0646 \u06a9\u0646\u06cc\u062f.<\/p>\n<p>\u0627\u062c\u0627\u0632\u0647 \u062f\u0647\u06cc\u062f import \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632 \u0648 \u0628\u0627\u0631\u06af\u0630\u0627\u0631\u06cc \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> pandas <span class=\"hljs-keyword\">as<\/span> pd\n<span class=\"hljs-keyword\">import<\/span> numpy <span class=\"hljs-keyword\">as<\/span> np\n\nyelp_reviews = pd.read_csv(<span class=\"hljs-string\">\"\/content\/drive\/My Drive\/Colab Datasets\/yelp_review_short.csv\"<\/span>)\n\nbins = [<span class=\"hljs-number\">0<\/span>,<span class=\"hljs-number\">2<\/span>,<span class=\"hljs-number\">5<\/span>]\nreview_names = [<span class=\"hljs-string\">'negative'<\/span>, <span class=\"hljs-string\">'positive'<\/span>]\n\nyelp_reviews[<span class=\"hljs-string\">'reviews_score'<\/span>] = pd.cut(yelp_reviews[<span class=\"hljs-string\">'stars'<\/span>], bins, labels=review_names)\n\nyelp_reviews.head()\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0645\u0627 \u0628\u0627\u0631\u06af\u0630\u0627\u0631\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645 <code>yelp_review_short.csv<\/code> \u0641\u0627\u06cc\u0644\u06cc \u06a9\u0647 \u0634\u0627\u0645\u0644 50000 \u0628\u0631\u0631\u0633\u06cc \u0628\u0627 <code>pd.read_csv<\/code> \u062a\u0627\u0628\u0639.<\/p>\n<p>\u0645\u0627 \u0645\u0634\u06a9\u0644 \u062e\u0648\u062f \u0631\u0627 \u0628\u0627 \u062a\u0628\u062f\u06cc\u0644 \u0645\u0642\u0627\u062f\u06cc\u0631 \u0639\u062f\u062f\u06cc \u0628\u0631\u0631\u0633\u06cc 
\u0647\u0627 \u0628\u0647 \u0645\u0642\u0648\u0644\u0647 \u0627\u06cc \u0633\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645.  \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0628\u0627 \u0627\u0636\u0627\u0641\u0647 \u06a9\u0631\u062f\u0646 \u06cc\u06a9 \u0633\u062a\u0648\u0646 \u062c\u062f\u06cc\u062f \u0627\u0646\u062c\u0627\u0645 \u0645\u06cc \u0634\u0648\u062f\u060c<code>reviews_score<\/code>\u060c \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0645\u0627.  \u0627\u06af\u0631 \u0646\u0638\u0631 \u06a9\u0627\u0631\u0628\u0631 \u062f\u0627\u0631\u0627\u06cc \u0645\u0642\u062f\u0627\u0631\u06cc \u0628\u06cc\u0646 1-2 \u0628\u0627\u0634\u062f <code>Stars<\/code> \u0633\u062a\u0648\u0646 (\u06a9\u0647 \u06a9\u0633\u0628 \u0648 \u06a9\u0627\u0631 \u0631\u0627 \u0631\u062a\u0628\u0647 \u0628\u0646\u062f\u06cc \u0645\u06cc \u06a9\u0646\u062f \u0631\u0648\u06cc \u0645\u0642\u06cc\u0627\u0633 1-5)\u060c <code>reviews_score<\/code> \u0633\u062a\u0648\u0646 \u06cc\u06a9 \u0645\u0642\u062f\u0627\u0631 \u0631\u0634\u062a\u0647 \u0627\u06cc \u062e\u0648\u0627\u0647\u062f \u062f\u0627\u0634\u062a <code>negative<\/code>.  \u0627\u06af\u0631 \u0627\u0645\u062a\u06cc\u0627\u0632 \u0628\u06cc\u0646 3-5 \u062f\u0631 <code>Stars<\/code> \u0633\u062a\u0648\u0646\u060c <code>reviews_score<\/code> \u0633\u062a\u0648\u0646 \u062d\u0627\u0648\u06cc \u06cc\u06a9 \u0645\u0642\u062f\u0627\u0631 \u062e\u0648\u0627\u0647\u062f \u0628\u0648\u062f <code>positive<\/code>.  
\u0627\u06cc\u0646 \u0628\u0627\u0639\u062b \u0645\u06cc \u0634\u0648\u062f \u0645\u0634\u06a9\u0644 \u0645\u0627 \u06cc\u06a9 \u0645\u0634\u06a9\u0644 \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0628\u0627\u06cc\u0646\u0631\u06cc \u0628\u0627\u0634\u062f.<\/p>\n<p>\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a \u0647\u062f\u0631 \u062f\u06cc\u062a\u0627\u0641\u0631\u06cc\u0645 \u0645\u0637\u0627\u0628\u0642 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0686\u0627\u067e \u0645\u06cc \u0634\u0648\u062f:<\/p>\n<p><img decoding=\"async\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/Python-for-NLP-Working-with-Facebook-FastText-Library-2.PNG\" alt=\"\" title=\"\"><\/p>\n<h3 id=\"installingfasttext\"><span class=\"ez-toc-section\" id=\"%d9%86%d8%b5%d8%a8_fasttext\"><\/span>\u0646\u0635\u0628 FastText<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u06cc \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 import \u0645\u062f\u0644 \u0647\u0627\u06cc FastText\u060c \u06a9\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u0646\u062f \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 <code>wget<\/code> \u062f\u0633\u062a\u0648\u0631 \u0627\u0632 \u0645\u062e\u0632\u0646 GitHub\u060c \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">!wget https:\/\/github.com\/facebookresearch\/fastText\/archive\/v0.1.0.zip\n<\/code><\/pre>\n<p><strong>\u062a\u0648\u062c\u0647 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f<\/strong>: \u0627\u06af\u0631 \u062f\u0633\u062a\u0648\u0631 \u0628\u0627\u0644\u0627 \u0631\u0627 \u0627\u0632 \u0644\u06cc\u0646\u0648\u06a9\u0633 \u0627\u062c\u0631\u0627 \u0645\u06cc \u06a9\u0646\u06cc\u062f terminal\u060c \u0644\u0627\u0632\u0645 
\u0646\u06cc\u0633\u062a \u067e\u06cc\u0634\u0648\u0646\u062f \u0628\u0632\u0646\u06cc\u062f <code>!<\/code> \u0642\u0628\u0644 \u0627\u0632 \u062f\u0633\u062a\u0648\u0631 \u0628\u0627\u0644\u0627  \u062f\u0631 Google Colaboratory notebook\u060c \u0647\u0631 \u062f\u0633\u062a\u0648\u0631\u06cc \u0628\u0639\u062f \u0627\u0632 <code>!<\/code> \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06cc\u06a9 \u0641\u0631\u0645\u0627\u0646 \u067e\u0648\u0633\u062a\u0647 \u0648 \u0646\u0647 \u062f\u0631 \u0645\u0641\u0633\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0627\u062c\u0631\u0627 \u0645\u06cc \u0634\u0648\u062f.  \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u062a\u0645\u0627\u0645 \u062f\u0633\u062a\u0648\u0631\u0627\u062a \u063a\u06cc\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u0628\u0627 \u067e\u06cc\u0634\u0648\u0646\u062f \u0647\u0633\u062a\u0646\u062f <code>!<\/code>.<\/p>\n<p>\u0627\u06af\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f \u0648 \u0646\u062a\u0627\u06cc\u062c \u0632\u06cc\u0631 \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0646\u06cc\u062f\u060c \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0639\u0646\u06cc \u0627\u0633\u062a \u06a9\u0647 FastText \u0628\u0627 \u0645\u0648\u0641\u0642\u06cc\u062a \u062f\u0627\u0646\u0644\u0648\u062f \u0634\u062f\u0647 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">--2019-08-16 15:05:05--  https:\/\/github.com\/facebookresearch\/fastText\/archive\/v0.1.0.zip\nResolving github.com (github.com)... 140.82.113.4\nConnecting to github.com (github.com)|140.82.113.4|:443... connected.\nHTTP request sent, awaiting response... 302 Found\nLocation: https:\/\/codeload.github.com\/facebookresearch\/fastText\/zip\/v0.1.0 (following)\n--2019-08-16 15:05:05--  https:\/\/codeload.github.com\/facebookresearch\/fastText\/zip\/v0.1.0\nResolving codeload.github.com (codeload.github.com)... 
192.30.255.121\nConnecting to codeload.github.com (codeload.github.com)|192.30.255.121|:443... connected.\nHTTP request sent, awaiting response... 200 OK\nLength: unspecified (application\/zip)\nSaving to: \u2018v0.1.0.zip\u2019\n\nv0.1.0.zip              ( &lt;=&gt;                )  92.06K  --.-KB\/s    in 0.03s\n\n2019-08-16 15:05:05 (3.26 MB\/s) - \u2018v0.1.0.zip\u2019 saved (94267)\n<\/code><\/pre>\n<p>\u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u06cc \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 \u0645\u0627\u0698\u0648\u0644 \u0647\u0627\u06cc FastText \u0631\u0627 \u0627\u0632 \u062d\u0627\u0644\u062a \u0641\u0634\u0631\u062f\u0647 \u062e\u0627\u0631\u062c \u06a9\u0646\u06cc\u062f.  \u0628\u0647 \u0633\u0627\u062f\u06af\u06cc \u062f\u0633\u062a\u0648\u0631 \u0632\u06cc\u0631 \u0631\u0627 \u062a\u0627\u06cc\u067e \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">!unzip v0.1.0.zip\n<\/code><\/pre>\n<p>\u062f\u0631 \u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u060c \u0628\u0627\u06cc\u062f \u0628\u0647 \u062f\u0627\u06cc\u0631\u06a9\u062a\u0648\u0631\u06cc \u06a9\u0647 \u062f\u0631 \u0622\u0646 FastText \u0631\u0627 \u062f\u0627\u0646\u0644\u0648\u062f \u06a9\u0631\u062f\u0647 \u0627\u06cc\u062f \u0628\u0631\u0648\u06cc\u062f \u0648 \u0633\u067e\u0633 \u0622\u0646 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f <code>!make<\/code> \u062f\u0633\u062a\u0648\u0631 \u0627\u062c\u0631\u0627\u06cc \u0628\u0627\u06cc\u0646\u0631\u06cc \u0647\u0627\u06cc ++C.  
\u0645\u0631\u0627\u062d\u0644 \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">cd fastText-0.1.0\n!make\n<\/code><\/pre>\n<p>\u0627\u06af\u0631 \u062e\u0631\u0648\u062c\u06cc \u0632\u06cc\u0631 \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0631\u062f\u06cc\u062f\u060c \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0639\u0646\u06cc \u0627\u0633\u062a \u06a9\u0647 FastText \u0628\u0627 \u0645\u0648\u0641\u0642\u06cc\u062a \u0646\u0635\u0628 \u0634\u062f\u0647 \u0627\u0633\u062a \u0631\u0648\u06cc \u0645\u0627\u0634\u06cc\u0646 \u0634\u0645\u0627<\/p>\n<pre><code class=\"hljs\">c++ -pthread -std=c++0x -O3 -funroll-loops -c src\/args.cc\nc++ -pthread -std=c++0x -O3 -funroll-loops -c src\/dictionary.cc\nc++ -pthread -std=c++0x -O3 -funroll-loops -c src\/productquantizer.cc\nc++ -pthread -std=c++0x -O3 -funroll-loops -c src\/matrix.cc\nc++ -pthread -std=c++0x -O3 -funroll-loops -c src\/qmatrix.cc\nc++ -pthread -std=c++0x -O3 -funroll-loops -c src\/vector.cc\nc++ -pthread -std=c++0x -O3 -funroll-loops -c src\/model.cc\nc++ -pthread -std=c++0x -O3 -funroll-loops -c src\/utils.cc\nc++ -pthread -std=c++0x -O3 -funroll-loops -c src\/fasttext.cc\nc++ -pthread -std=c++0x -O3 -funroll-loops args.o dictionary.o productquantizer.o matrix.o qmatrix.o vector.o model.o utils.o fasttext.o src\/main.cc -o fasttext\n<\/code><\/pre>\n<p>\u0628\u0631\u0627\u06cc \u062a\u0627\u06cc\u06cc\u062f \u0646\u0635\u0628\u060c \u062f\u0633\u062a\u0648\u0631 \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">!.\/fasttext\n<\/code><\/pre>\n<p>\u0628\u0627\u06cc\u062f \u0628\u0628\u06cc\u0646\u06cc\u062f \u06a9\u0647 \u0627\u06cc\u0646 \u062f\u0633\u062a\u0648\u0631\u0627\u062a \u062a\u0648\u0633\u0637 FastText \u067e\u0634\u062a\u06cc\u0628\u0627\u0646\u06cc \u0645\u06cc \u0634\u0648\u0646\u062f:<\/p>\n<pre><code class=\"hljs\">usage: fasttext &lt;command&gt; 
&lt;args&gt;\n\nThe commands supported by FastText are:\n\n  supervised              train a supervised classifier\n  quantize                quantize a model to reduce the memory usage\n  test                    evaluate a supervised classifier\n  predict                 predict most likely labels\n  predict-prob            predict most likely labels with probabilities\n  skipgram                train a skipgram model\n  cbow                    train a cbow model\n  print-word-vectors      print word vectors given a trained model\n  print-sentence-vectors  print sentence vectors given a trained model\n  nn                      query for nearest neighbors\n  analogies               query for analogies\n<\/code><\/pre>\n<h3 id=\"textclassification\"><span class=\"ez-toc-section\" id=\"%d8%b7%d8%a8%d9%82%d9%87_%d8%a8%d9%86%d8%af%db%8c_%d9%85%d8%aa%d9%86\"><\/span>\u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0642\u0628\u0644 \u0627\u0632 \u0622\u0645\u0648\u0632\u0634 \u0645\u062f\u0644 \u0647\u0627\u06cc FastText \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646\u060c \u0644\u0627\u0632\u0645 \u0628\u0647 \u0630\u06a9\u0631 \u0627\u0633\u062a \u06a9\u0647 FastText \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u062f\u0631 \u0642\u0627\u0644\u0628 \u062e\u0627\u0635\u06cc \u0645\u06cc \u067e\u0630\u06cc\u0631\u062f \u06a9\u0647 \u0628\u0647 \u0634\u0631\u062d \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">__label__tag This is sentence 1\n__label__tag2 This is sentence 2.\n<\/code><\/pre>\n<p>\u0627\u06af\u0631 \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u062e\u0648\u062f \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u0645\u060c \u062f\u0631 \u0642\u0627\u0644\u0628 \u0645\u0648\u0631\u062f \u0646\u0638\u0631 \u0646\u06cc\u0633\u062a.  
\u0645\u062a\u0646 \u0628\u0627 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0645\u062b\u0628\u062a \u0628\u0627\u06cc\u062f \u0628\u0647 \u0627\u06cc\u0646 \u0635\u0648\u0631\u062a \u0628\u0627\u0634\u062f:<\/p>\n<pre><code class=\"hljs\">__label__positive burgers are very big portions here.\n<\/code><\/pre>\n<p>\u0628\u0647 \u0637\u0648\u0631 \u0645\u0634\u0627\u0628\u0647\u060c \u0646\u0638\u0631\u0627\u062a \u0645\u0646\u0641\u06cc \u0628\u0627\u06cc\u062f \u0628\u0647 \u0627\u06cc\u0646 \u0635\u0648\u0631\u062a \u0628\u0627\u0634\u062f:<\/p>\n<pre><code class=\"hljs\">__label__negative They do not use organic ingredients, but I thi...\n<\/code><\/pre>\n<p>\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0641\u06cc\u0644\u062a\u0631 \u0645\u06cc \u06a9\u0646\u062f <code>reviews_score<\/code> \u0648 <code>text<\/code> \u0633\u062a\u0648\u0646 \u0647\u0627\u06cc\u06cc \u0627\u0632 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0648 \u0633\u067e\u0633 \u067e\u06cc\u0634\u0648\u0646\u062f\u0647\u0627 <code>__label__<\/code> \u0642\u0628\u0644 \u0627\u0632 \u062a\u0645\u0627\u0645 \u0645\u0642\u0627\u062f\u06cc\u0631 \u0645\u0648\u062c\u0648\u062f \u062f\u0631 <code>reviews_score<\/code> \u0633\u062a\u0648\u0646  \u0628\u0647 \u0637\u0648\u0631 \u0645\u0634\u0627\u0628\u0647\u060c <code>\\n<\/code> \u0648 <code>\\t<\/code> \u0628\u0627 \u06cc\u06a9 \u0641\u0627\u0635\u0644\u0647 \u062f\u0631 \u062c\u0627\u06cc\u06af\u0632\u06cc\u0646 \u0645\u06cc \u0634\u0648\u0646\u062f <code>text<\/code> \u0633\u062a\u0648\u0646  \u062f\u0631 \u0646\u0647\u0627\u06cc\u062a \u062f\u06cc\u062a\u0627\u0641\u0631\u06cc\u0645 \u0628\u0647 \u0631\u0648\u0632 \u0634\u062f\u0647 \u0628\u0647 \u0634\u06a9\u0644 \u0631\u0648\u06cc \u062f\u06cc\u0633\u06a9 \u0646\u0648\u0634\u062a\u0647 \u0645\u06cc \u0634\u0648\u062f <code>yelp_reviews_updated.txt<\/code>.<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> pandas <span 
class=\"hljs-keyword\">as<\/span> pd\n<span class=\"hljs-keyword\">from<\/span> io <span class=\"hljs-keyword\">import<\/span> StringIO\n<span class=\"hljs-keyword\">import<\/span> csv\n\ncol = [<span class=\"hljs-string\">'reviews_score'<\/span>, <span class=\"hljs-string\">'text'<\/span>]\n\nyelp_reviews = yelp_reviews[col]\nyelp_reviews[<span class=\"hljs-string\">'reviews_score'<\/span>]=[<span class=\"hljs-string\">'__label__'<\/span>+ s <span class=\"hljs-keyword\">for<\/span> s <span class=\"hljs-keyword\">in<\/span> yelp_reviews[<span class=\"hljs-string\">'reviews_score'<\/span>]]\nyelp_reviews[<span class=\"hljs-string\">'text'<\/span>]= yelp_reviews[<span class=\"hljs-string\">'text'<\/span>].replace(<span class=\"hljs-string\">'\\n'<\/span>,<span class=\"hljs-string\">' '<\/span>, regex=<span class=\"hljs-literal\">True<\/span>).replace(<span class=\"hljs-string\">'\\t'<\/span>,<span class=\"hljs-string\">' '<\/span>, regex=<span class=\"hljs-literal\">True<\/span>)\nyelp_reviews.to_csv(<span class=\"hljs-string\">r'\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_updated.txt'<\/span>, index=<span class=\"hljs-literal\">False<\/span>, sep=<span class=\"hljs-string\">' '<\/span>, header=<span class=\"hljs-literal\">False<\/span>, quoting=csv.QUOTE_NONE, quotechar=<span class=\"hljs-string\">\"\"<\/span>, escapechar=<span class=\"hljs-string\">\" \"<\/span>)\n<\/code><\/pre>\n<p>\u062d\u0627\u0644\u0627 \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0633\u0631 \u062f\u06cc\u062a\u0627\u0641\u0631\u06cc\u0645 \u0628\u0647 \u0631\u0648\u0632 \u0634\u062f\u0647 <code>yelp_reviews<\/code> \u0631\u0627 \u0686\u0627\u067e \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">yelp_reviews.head()\n<\/code><\/pre>\n<p>\u0634\u0645\u0627 \u0628\u0627\u06cc\u062f \u0646\u062a\u0627\u06cc\u062c \u0632\u06cc\u0631 \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">reviews_score   text\n0   __label__positive   Super simple place but amazing nonetheless. 
It...\n1   __label__positive   Small unassuming place that changes their menu...\n2   __label__positive   Lester's is located in a beautiful neighborhoo...\n3   __label__positive   Love coming here. Yes the place always needs t...\n4   __label__positive   Had their chocolate almond croissant and it wa...\n<\/code><\/pre>\n<p>\u0628\u0647 \u0637\u0648\u0631 \u0645\u0634\u0627\u0628\u0647\u060c \u062f\u0645 \u062f\u06cc\u062a\u0627\u0641\u0631\u06cc\u0645 \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">    reviews_score   text\n49995   __label__positive   This is an awesome consignment store! They hav...\n49996   __label__positive   Awesome laid back atmosphere with made-to-orde...\n49997   __label__positive   Today was my first appointment and I can hones...\n49998   __label__positive   I love this chic salon. They use the best prod...\n49999   __label__positive   This place is delicious. All their meats and s...\n<\/code><\/pre>\n<p>\u0645\u0627 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u062e\u0648\u062f \u0631\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632 \u062a\u0628\u062f\u06cc\u0644 \u06a9\u0631\u062f\u0647 \u0627\u06cc\u0645.  \u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u06cc \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062e\u0648\u062f \u0631\u0627 \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u0647\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u0648 \u0622\u0632\u0645\u0627\u06cc\u0634 \u062a\u0642\u0633\u06cc\u0645 \u06a9\u0646\u06cc\u0645.  
80% \u062f\u0627\u062f\u0647 \u06cc\u0639\u0646\u06cc 40000 \u0631\u06a9\u0648\u0631\u062f \u0627\u0648\u0644 \u0627\u0632 50000 \u0631\u06a9\u0648\u0631\u062f \u0628\u0631\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u062f \u0634\u062f\u060c \u062f\u0631 \u062d\u0627\u0644\u06cc \u06a9\u0647 20% \u062f\u0627\u062f\u0647 (10000 \u0631\u06a9\u0648\u0631\u062f \u0622\u062e\u0631) \u0628\u0631\u0627\u06cc \u0627\u0631\u0632\u06cc\u0627\u0628\u06cc \u0639\u0645\u0644\u06a9\u0631\u062f \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u062f \u0634\u062f.<\/p>\n<p>\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u0647\u0627\u06cc \u0622\u0645\u0648\u0632\u0634\u06cc \u0648 \u0622\u0632\u0645\u0627\u06cc\u0634\u06cc \u062a\u0642\u0633\u06cc\u0645 \u0645\u06cc \u06a9\u0646\u062f:<\/p>\n<pre><code class=\"hljs\">!head -n 40000 \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_updated.txt\" &gt; \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_train.txt\"\n!tail -n 10000 \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_updated.txt\" &gt; \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_test.txt\"\n<\/code><\/pre>\n<p>\u067e\u0633 \u0627\u0632 \u0627\u062c\u0631\u0627\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627\u060c <code>yelp_reviews_train.txt<\/code> \u0641\u0627\u06cc\u0644\u06cc \u062a\u0648\u0644\u06cc\u062f \u062e\u0648\u0627\u0647\u062f \u0634\u062f \u06a9\u0647 \u062d\u0627\u0648\u06cc \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0622\u0645\u0648\u0632\u0634\u06cc \u0627\u0633\u062a.  
\u0628\u0647 \u0637\u0648\u0631 \u0645\u0634\u0627\u0628\u0647\u060c \u0628\u0647 \u062a\u0627\u0632\u06af\u06cc \u062a\u0648\u0644\u06cc\u062f \u0634\u062f\u0647 \u0627\u0633\u062a <code>yelp_reviews_test.txt<\/code> \u0641\u0627\u06cc\u0644 \u062d\u0627\u0648\u06cc \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0622\u0632\u0645\u0627\u06cc\u0634\u06cc \u062e\u0648\u0627\u0647\u062f \u0628\u0648\u062f.<\/p>\n<p>\u0627\u06a9\u0646\u0648\u0646 \u0632\u0645\u0627\u0646 \u0622\u0645\u0648\u0632\u0634 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646 FastText \u0627\u0633\u062a.<\/p>\n<pre><code class=\"hljs\">%%time\n!.\/fasttext supervised -<span class=\"hljs-built_in\">input<\/span> <span class=\"hljs-string\">\"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_train.txt\"<\/span> -output model_yelp_reviews\n<\/code><\/pre>\n<p>\u0628\u0631\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u0628\u0627\u06cc\u062f \u0627\u0632 \u0622\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645 <code>supervised<\/code> \u062f\u0633\u062a\u0648\u0631 \u062f\u0627\u062f\u0647 \u0648 \u0641\u0627\u06cc\u0644 \u0648\u0631\u0648\u062f\u06cc \u0631\u0627 \u0627\u0631\u0633\u0627\u0644 \u06a9\u0646\u06cc\u062f.  \u0646\u0627\u0645 \u0645\u062f\u0644 \u0628\u0639\u062f \u0627\u0632 \u0622\u0646 \u0645\u0634\u062e\u0635 \u0645\u06cc \u0634\u0648\u062f <code>-output<\/code> \u06a9\u0644\u0645\u0647 \u06a9\u0644\u06cc\u062f\u06cc.  \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0645\u0646\u062c\u0631 \u0628\u0647 \u06cc\u06a9 \u0645\u062f\u0644 \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646 \u0622\u0645\u0648\u0632\u0634 \u062f\u06cc\u062f\u0647 \u0628\u0647 \u0646\u0627\u0645 \u0645\u06cc \u0634\u0648\u062f <code>model_yelp_reviews.bin<\/code>.  
\u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0622\u0645\u062f\u0647 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">Read 4M words\nNumber of words:  177864\nNumber of labels: 2\nProgress: 100.0%  words\/sec\/thread: 2548017  lr: 0.000000  loss: 0.246120  eta: 0h0m\nCPU times: user 212 ms, sys: 48.6 ms, total: 261 ms\nWall time: 15.6 s\n<\/code><\/pre>\n<p>\u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0632 \u0637\u0631\u06cc\u0642 \u0627\u06cc\u0646 \u0645\u062f\u0644 \u0646\u06af\u0627\u0647\u06cc \u0628\u06cc\u0646\u062f\u0627\u0632\u06cc\u062f <code>!ls<\/code> \u062f\u0633\u062a\u0648\u0631 \u0645\u0637\u0627\u0628\u0642 \u0634\u06a9\u0644 \u0632\u06cc\u0631:<\/p>\n<pre><code class=\"hljs\">!ls\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">args.o             Makefile         quantization-results.sh\nclassification-example.sh  matrix.o         README.md\nclassification-results.sh  model.o          src\nCONTRIBUTING.md        model_yelp_reviews.bin   tutorials\ndictionary.o           model_yelp_reviews.vec   utils.o\neval.py            PATENTS          vector.o\nfasttext           pretrained-vectors.md    wikifil.pl\nfasttext.o         productquantizer.o       word-vector-example.sh\nget-wikimedia.sh       qmatrix.o            yelp_reviews_train.txt\nLICENSE            quantization-example.sh\n<\/code><\/pre>\n<p>\u0645\u06cc \u062a\u0648\u0627\u0646\u06cc \u0628\u0628\u06cc\u0646\u06cc <code>model_yelp_reviews.bin<\/code> \u062f\u0631 \u0644\u06cc\u0633\u062a \u0627\u0633\u0646\u0627\u062f \u0628\u0627\u0644\u0627<\/p>\n<p>\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a \u0628\u0631\u0627\u06cc \u062a\u0633\u062a \u0645\u062f\u0644 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0632 <code>test<\/code> \u0641\u0631\u0645\u0627\u0646  
\u0634\u0645\u0627 \u0628\u0627\u06cc\u062f \u0646\u0627\u0645 \u0645\u062f\u0644 \u0648 \u0641\u0627\u06cc\u0644 \u062a\u0633\u062a \u0631\u0627 \u0628\u0639\u062f \u0627\u0632 \u0622\u0646 \u0645\u0634\u062e\u0635 \u06a9\u0646\u06cc\u062f <code>test<\/code> \u062f\u0633\u062a\u0648\u0631\u060c \u0645\u0637\u0627\u0628\u0642 \u0634\u06a9\u0644 \u0632\u06cc\u0631:<\/p>\n<pre><code class=\"hljs\">!.\/fasttext test model_yelp_reviews.bin \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_test.txt\"\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">N   10000\nP@1 0.909\nR@1 0.909\nNumber of examples: 10000\n<\/code><\/pre>\n<p>\u0627\u06cc\u0646\u062c\u0627 <code>P@1<\/code> \u0627\u0634\u0627\u0631\u0647 \u0628\u0647 \u062f\u0642\u062a \u0648 <code>R@1<\/code>\u0628\u0647 \u06cc\u0627\u062f\u0622\u0648\u0631\u06cc \u0627\u0634\u0627\u0631\u0647 \u062f\u0627\u0631\u062f.  
\u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0628\u06cc\u0646\u06cc\u062f \u06a9\u0647 \u0645\u062f\u0644 \u0645\u0627 \u0628\u0647 \u062f\u0642\u062a \u0648 \u0641\u0631\u0627\u062e\u0648\u0627\u0646\u06cc 0.909 \u0645\u06cc \u0631\u0633\u062f \u06a9\u0647 \u0628\u0633\u06cc\u0627\u0631 \u062e\u0648\u0628 \u0627\u0633\u062a.<\/p>\n<p>\u0627\u06a9\u0646\u0648\u0646 \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0633\u0639\u06cc \u06a9\u0646\u06cc\u0645 \u0645\u062a\u0646 \u062e\u0648\u062f \u0631\u0627 \u0627\u0632 \u0639\u0644\u0627\u0626\u0645 \u0646\u06af\u0627\u0631\u0634\u06cc\u060c \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc \u062e\u0627\u0635 \u067e\u0627\u06a9 \u06a9\u0646\u06cc\u0645 \u0648 \u0622\u0646 \u0631\u0627 \u0628\u0647 \u062d\u0631\u0648\u0641 \u06a9\u0648\u0686\u06a9 \u062a\u0628\u062f\u06cc\u0644 \u06a9\u0646\u06cc\u0645 \u062a\u0627 \u06cc\u06a9\u0646\u0648\u0627\u062e\u062a\u06cc \u0645\u062a\u0646 \u0628\u0647\u0628\u0648\u062f \u06cc\u0627\u0628\u062f.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0645\u062c\u0645\u0648\u0639\u0647 \u0622\u0645\u0648\u0632\u0634\u06cc \u0631\u0627 \u062a\u0645\u06cc\u0632 \u0645\u06cc \u06a9\u0646\u062f:<\/p>\n<pre><code class=\"hljs\">!cat \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_train.txt\" | sed -e \"s\/\\([.\\!?,\u2019\/()]\\)\/ \\1 \/g\" | tr \"[:upper:]\" \"[:lower:]\" &gt; \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_train_clean.txt\"\n<\/code><\/pre>\n<p>\u0648 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0645\u062c\u0645\u0648\u0639\u0647 \u062a\u0633\u062a \u0631\u0627 \u067e\u0627\u06a9 \u0645\u06cc \u06a9\u0646\u062f:<\/p>\n<pre><code class=\"hljs\">!cat \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_test.txt\" | sed -e \"s\/\\([.\\!?,\u2019\/()]\\)\/ \\1 \/g\" | tr \"[:upper:]\" \"[:lower:]\" &gt; \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_test_clean.txt\"\n<\/code><\/pre>\n<p>\u0627\u06a9\u0646\u0648\u0646 \u0628\u0647 \u0622\u0645\u0648\u0632\u0634 \u0645\u062f\u0644 \u0645\u06cc \u067e\u0631\u062f\u0627\u0632\u06cc\u0645 \u0631\u0648\u06cc \u0645\u062c\u0645\u0648\u0639\u0647 \u0622\u0645\u0648\u0632\u0634\u06cc \u062a\u0645\u06cc\u0632 \u0634\u062f\u0647:<\/p>\n<pre><code class=\"hljs\">%%time\n!.\/fasttext supervised -input \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_train_clean.txt\" -output model_yelp_reviews\n<\/code><\/pre>\n<p>\u0648 \u062f\u0631 \u0646\u0647\u0627\u06cc\u062a \u0627\u0632 \u0645\u062f\u0644 \u0622\u0645\u0648\u0632\u0634 \u062f\u06cc\u062f\u0647 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f \u0631\u0648\u06cc \u0645\u062c\u0645\u0648\u0639\u0647 \u0622\u0645\u0648\u0632\u0634\u06cc \u062a\u0645\u06cc\u0632 \u0634\u062f\u0647 \u0628\u0631\u0627\u06cc \u067e\u06cc\u0634 \u0628\u06cc\u0646\u06cc \u0631\u0648\u06cc \u0645\u062c\u0645\u0648\u0639\u0647 \u062a\u0633\u062a \u062a\u0645\u06cc\u0632 
\u0634\u062f\u0647:<\/p>\n<pre><code class=\"hljs\">!.\/fasttext test model_yelp_reviews.bin \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_test_clean.txt\"\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0641\u0648\u0642 \u0628\u0647 \u0635\u0648\u0631\u062a \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">N   10000\nP@1 0.915\nR@1 0.915\nNumber of examples: 10000\n<\/code><\/pre>\n<p>\u0634\u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0641\u0632\u0627\u06cc\u0634 \u062c\u0632\u0626\u06cc \u062f\u0631 \u062f\u0642\u062a \u0648 \u06cc\u0627\u062f\u0622\u0648\u0631\u06cc \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0646\u06cc\u062f.  \u0628\u0631\u0627\u06cc \u0628\u0647\u0628\u0648\u062f \u0628\u06cc\u0634\u062a\u0631 \u0645\u062f\u0644\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u062f\u0648\u0631\u0647 \u0647\u0627 \u0648 \u0645\u06cc\u0632\u0627\u0646 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u062f\u0644 \u0631\u0627 \u0627\u0641\u0632\u0627\u06cc\u0634 \u062f\u0647\u06cc\u062f.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u062a\u0639\u062f\u0627\u062f \u062f\u0648\u0631\u0647 \u0647\u0627 \u0631\u0627 30 \u0648 \u0646\u0631\u062e \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0631\u0627 0.5 \u062a\u0646\u0638\u06cc\u0645 \u0645\u06cc \u06a9\u0646\u062f.<\/p>\n<pre><code class=\"hljs\">%%time\n!.\/fasttext supervised -input \"\/content\/drive\/My Drive\/Colab Datasets\/yelp_reviews_train_clean.txt\" -output model_yelp_reviews -epoch 30 -lr 0.5\n<\/code><\/pre>\n<p>\u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0639\u062f\u0627\u062f \u0645\u062e\u062a\u0644\u0641 \u0631\u0627 \u0627\u0645\u062a\u062d\u0627\u0646 \u06a9\u0646\u06cc\u062f \u0648 \u0628\u0628\u06cc\u0646\u06cc\u062f \u0622\u06cc\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0646\u062a\u0627\u06cc\u062c \u0628\u0647\u062a\u0631\u06cc \u0628\u06af\u06cc\u0631\u06cc\u062f.  \u0641\u0631\u0627\u0645\u0648\u0634 \u0646\u06a9\u0646\u06cc\u062f \u06a9\u0647 \u0646\u062a\u0627\u06cc\u062c \u062e\u0648\u062f \u0631\u0627 \u062f\u0631 \u0646\u0638\u0631\u0627\u062a \u0628\u0647 \u0627\u0634\u062a\u0631\u0627\u06a9 \u0628\u06af\u0630\u0627\u0631\u06cc\u062f!<\/p>\n<h2 id=\"conclusion\"><span class=\"ez-toc-section\" id=\"%d9%86%d8%aa%db%8c%d8%ac%d9%87\"><\/span>\u0646\u062a\u06cc\u062c\u0647<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0645\u062f\u0644 FastText \u0627\u062e\u06cc\u0631\u0627\u064b \u062f\u0631 \u0632\u0645\u06cc\u0646\u0647 \u062a\u0639\u0628\u06cc\u0647 \u06a9\u0644\u0645\u0627\u062a \u0648 \u0648\u0638\u0627\u06cc\u0641 \u0637\u0628\u0642\u0647\u200c\u0628\u0646\u062f\u06cc \u0645\u062a\u0646 \u0628\u0647 \u0628\u0647\u062a\u0631\u06cc\u0646 \u0634\u06a9\u0644 \u0628\u0647 \u0627\u062b\u0628\u0627\u062a \u0631\u0633\u06cc\u062f\u0647 \u0627\u0633\u062a \u0631\u0648\u06cc \u0628\u0633\u06cc\u0627\u0631\u06cc \u0627\u0632 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627  
\u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0622\u0646 \u062f\u0631 \u0645\u0642\u0627\u06cc\u0633\u0647 \u0628\u0627 \u0633\u0627\u06cc\u0631 \u0645\u062f\u0644 \u0647\u0627\u06cc \u062c\u0627\u0633\u0627\u0632\u06cc \u06a9\u0644\u0645\u0647 \u0628\u0633\u06cc\u0627\u0631 \u0622\u0633\u0627\u0646 \u0648 \u0633\u0631\u06cc\u0639 \u0627\u0633\u062a.<\/p>\n<p>\u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0628\u0647 \u0637\u0648\u0631 \u062e\u0644\u0627\u0635\u0647 \u0631\u0648\u0634 \u06cc\u0627\u0641\u062a\u0646 \u0634\u0628\u0627\u0647\u062a \u0647\u0627\u06cc \u0645\u0639\u0646\u0627\u06cc\u06cc \u0628\u06cc\u0646 \u06a9\u0644\u0645\u0627\u062a \u0645\u062e\u062a\u0644\u0641 \u0628\u0627 \u0627\u06cc\u062c\u0627\u062f \u062c\u0627\u0633\u0627\u0632\u06cc \u06a9\u0644\u0645\u0627\u062a \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 FastText \u0631\u0627 \u0628\u0631\u0631\u0633\u06cc \u06a9\u0631\u062f\u06cc\u0645.  \u0642\u0633\u0645\u062a \u062f\u0648\u0645 \u0645\u0642\u0627\u0644\u0647 \u0631\u0648\u0634 \u0627\u0646\u062c\u0627\u0645 \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646 \u0627\u0632 \u0637\u0631\u06cc\u0642 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 FastText \u0631\u0627 \u062a\u0648\u0636\u06cc\u062d \u0645\u06cc \u062f\u0647\u062f.<\/p>\n<\/div>\n<p><script>\n                        !function(f,b,e,v,n,t,s)\n                        {if(f.fbq)return;n=f.fbq=function(){n.callMethod?\n                        n.callMethod.apply(n,arguments):n.queue.push(arguments)};\n                        if(!f._fbq)f._fbq=n;n.push=n;n.loaded=!0;n.version='2.0';\n                        n.queue=();t=b.createElement(e);t.async=!0;\n                        t.src=v;s=b.getElementsByTagName(e)(0);\n                        s.parentNode.insertBefore(t,s)}(window, document,'script',\n                        'https:\/\/connect.facebook.net\/en_US\/fbevents.js');\n                        
fbq('init', '525232124909042');\n                        fbq('track', 'PageView');\n                    <\/script>    (\u0628\u0631\u0686\u0633\u0628\u200c\u0647\u0627 \u0628\u0647 \u062a\u0631\u062c\u0645\u0647)# python<br \/>\n<br \/><br \/>\n<br \/>\u0645\u0646\u062a\u0634\u0631 \u0634\u062f\u0647 \u062f\u0631 1403-01-20 16:33:09<br \/>\n<\/p>\n\n\n<div class=\"kk-star-ratings kksr-auto kksr-align-center kksr-valign-bottom\"\n    data-payload='{&quot;align&quot;:&quot;center&quot;,&quot;id&quot;:&quot;16087&quot;,&quot;slug&quot;:&quot;default&quot;,&quot;valign&quot;:&quot;bottom&quot;,&quot;ignore&quot;:&quot;&quot;,&quot;reference&quot;:&quot;auto&quot;,&quot;class&quot;:&quot;&quot;,&quot;count&quot;:&quot;0&quot;,&quot;legendonly&quot;:&quot;&quot;,&quot;readonly&quot;:&quot;&quot;,&quot;score&quot;:&quot;0&quot;,&quot;starsonly&quot;:&quot;&quot;,&quot;best&quot;:&quot;5&quot;,&quot;gap&quot;:&quot;5&quot;,&quot;greet&quot;:&quot;\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628&quot;,&quot;legend&quot;:&quot;0\\\/5 (0 \u0631\u0627\u06cc)&quot;,&quot;size&quot;:&quot;30&quot;,&quot;title&quot;:&quot;\u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP: \u06a9\u0627\u0631 \u0628\u0627 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 FastText \u0641\u06cc\u0633 \u0628\u0648\u06a9&quot;,&quot;width&quot;:&quot;0&quot;,&quot;_legend&quot;:&quot;{score}\\\/{best} ({count} \u0631\u0627\u06cc)&quot;,&quot;font_factor&quot;:&quot;1.25&quot;}'>\n            \n<div class=\"kksr-stars\">\n    \n<div class=\"kksr-stars-inactive\">\n            <div class=\"kksr-star\" data-star=\"1\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"2\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        
<\/div>\n            <div class=\"kksr-star\" data-star=\"3\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"4\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"5\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n    \n<div class=\"kksr-stars-active\" style=\"width: 0px;\">\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n<\/div>\n                \n\n<div class=\"kksr-legend\" style=\"font-size: 24px;\">\n            <span class=\"kksr-muted\">\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628<\/span>\n    <\/div>\n    <\/div>\n","protected":false},"excerpt":{"rendered":"<p><span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 
\u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 12<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span>\u0627\u06cc\u0646 \u0628\u06cc\u0633\u062a\u0645\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0632 \u0633\u0631\u06cc \u0645\u0642\u0627\u0644\u0627\u062a \u0645\u0646 \u0627\u0633\u062a \u0631\u0648\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP. \u062f\u0631 \u0686\u0646\u062f \u0645\u0642\u0627\u0644\u0647 \u0627\u062e\u06cc\u0631\u060c \u062a\u06a9\u0646\u06cc\u06a9 \u0647\u0627\u06cc \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0639\u0645\u06cc\u0642 \u0631\u0627 \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0627\u0646\u0648\u0627\u0639 \u0648\u0638\u0627\u06cc\u0641 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 \u0628\u0631\u0631\u0633\u06cc \u06a9\u0631\u062f\u0647 \u0627\u06cc\u0645 \u0648 \u0647\u0645\u0686\u0646\u06cc\u0646 \u0628\u0627\u06cc\u062f \u0628\u0627 \u0645\u0641\u0647\u0648\u0645 \u062c\u0627\u0633\u0627\u0632\u06cc \u06a9\u0644\u0645\u0627\u062a \u0622\u0634\u0646\u0627 \u0628\u0627\u0634\u06cc\u062f. 
\u062c\u0627\u0633\u0627\u0632\u06cc \u06a9\u0644\u0645\u0647 \u0631\u0627\u0647\u06cc \u0628\u0631\u0627\u06cc \u062a\u0628\u062f\u06cc\u0644 \u0627\u0637\u0644\u0627\u0639\u0627\u062a \u0645\u062a\u0646\u06cc \u0628\u0647 \u0634\u06a9\u0644 \u0639\u062f\u062f\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0647 \u0646\u0648\u0628\u0647 \u062e\u0648\u062f \u0645\u06cc [&hellip;]<\/p>\n","protected":false},"author":3,"featured_media":16088,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1743,620,1686],"tags":[],"class_list":["post-16087","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-python","category-programming","category-ai"],"acf":[],"_links":{"self":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/16087","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/users\/3"}],"replies":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/comments?post=16087"}],"version-history":[{"count":0,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/16087\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media\/16088"}],"wp:attachment":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media?parent=16087"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/categories?post=16087"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/tags?post=16087"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}