{"id":12575,"date":"2023-12-31T08:41:14","date_gmt":"2023-12-31T05:11:14","guid":{"rendered":"https:\/\/rasanegar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/"},"modified":"2023-12-31T08:41:14","modified_gmt":"2023-12-31T05:11:14","slug":"nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization","status":"publish","type":"post","link":"https:\/\/rasanegaar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/","title":{"rendered":"NLP \u0633\u0627\u062f\u0647 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0627 TextBlob: Lemmatization"},"content":{"rendered":"<div id=\"ez-toc-container\" class=\"ez-toc-v2_0_85 counter-hierarchy ez-toc-counter ez-toc-custom ez-toc-container-direction\">\n<div class=\"ez-toc-title-container\"><p class=\"ez-toc-title\" style=\"cursor:inherit\">\u0633\u0631\u0641\u0635\u0644\u0647\u0627\u06cc \u0645\u0637\u0644\u0628<\/p>\n<\/div><nav><ul class='ez-toc-list ez-toc-list-level-1 ' ><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-1\" href=\"https:\/\/rasanegaar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/#%d9%85%d8%b9%d8%b1%d9%81%db%8c\" >\u0645\u0639\u0631\u0641\u06cc<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-2\" href=\"https:\/\/rasanegaar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/#%d9%86%d8%b5%d8%a8_textblob\" >\u0646\u0635\u0628 TextBlob<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-3\" 
href=\"https:\/\/rasanegaar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/#lemmatization_%da%86%db%8c%d8%b3%d8%aa%d8%9f\" >Lemmatization \u0686\u06cc\u0633\u062a\u061f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-4\" href=\"https:\/\/rasanegaar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/#%d9%be%db%8c%d8%a7%d8%af%d9%87_%d8%b3%d8%a7%d8%b2%db%8c_lemmatization_%d8%af%d8%b1_%da%a9%d8%af\" >\u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc Lemmatization \u062f\u0631 \u06a9\u062f<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-5\" href=\"https:\/\/rasanegaar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/#%d8%a7%d9%86%d8%aa%d8%ae%d8%a7%d8%a8_%db%8c%da%a9_%d8%a8%d8%b1%d8%b1%d8%b3%db%8c_%d8%a7%d8%b2_nltk_corpus\" >\u0627\u0646\u062a\u062e\u0627\u0628 \u06cc\u06a9 \u0628\u0631\u0631\u0633\u06cc \u0627\u0632 NLTK Corpus<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-6\" href=\"https:\/\/rasanegaar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/#%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%db%8c%da%a9_%d8%b4%db%8c%d8%a1_textblob\" >\u0627\u06cc\u062c\u0627\u062f \u06cc\u06a9 \u0634\u06cc\u0621 TextBlob<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-7\" href=\"https:\/\/rasanegaar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/#%d8%ae%d9%84%d8%a7%d8%b5%d9%87_%d8%b3%d8%a7%d8%b2%db%8c_%db%8c%da%a9_%d8%ac%d9%85%d9%84%d9%87\" >\u062e\u0644\u0627\u0635\u0647 \u0633\u0627\u0632\u06cc 
\u06cc\u06a9 \u062c\u0645\u0644\u0647<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-8\" href=\"https:\/\/rasanegaar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/#%d8%aa%d9%81%d8%a7%d9%88%d8%aa_%d8%a8%db%8c%d9%86_lemmatization_%d9%88_stemming\" >\u062a\u0641\u0627\u0648\u062a \u0628\u06cc\u0646 Lemmatization \u0648 Stemming<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-9\" href=\"https:\/\/rasanegaar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/#%d8%ae%d9%84%d8%a7%d8%b5%d9%87_%d8%b3%d8%a7%d8%b2%db%8c_%db%8c%da%a9_%d8%a8%d8%b1%d8%b1%d8%b3%db%8c\" >\u062e\u0644\u0627\u0635\u0647 \u0633\u0627\u0632\u06cc \u06cc\u06a9 \u0628\u0631\u0631\u0633\u06cc<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-10\" href=\"https:\/\/rasanegaar.com\/blog\/nlp-%d8%b3%d8%a7%d8%af%d9%87-%d8%af%d8%b1-%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%a7-textblob-lemmatization\/#%d9%86%d8%aa%db%8c%d8%ac%d9%87\" >\u0646\u062a\u06cc\u062c\u0647<\/a><\/li><\/ul><\/nav><\/div>\n<span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 9<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span><p> <br \/>\n<\/p>\n<div><noscript><\/noscript><\/p>\n<h2 id=\"introduction\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%b9%d8%b1%d9%81%db%8c\"><\/span>\u0645\u0639\u0631\u0641\u06cc<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>TextBlob \u06cc\u06a9 \u0628\u0633\u062a\u0647 \u0633\u0627\u062e\u062a\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a 
\u0631\u0648\u06cc \u062f\u0631 \u0628\u0627\u0644\u0627\u06cc \u062f\u0648 \u0628\u0633\u062a\u0647 \u062f\u06cc\u06af\u0631\u060c \u06cc\u06a9\u06cc \u0627\u0632 \u0622\u0646\u0647\u0627 Natural Language Toolkit \u0646\u0627\u0645 \u062f\u0627\u0631\u062f \u06a9\u0647 \u0639\u0645\u062f\u062a\u0627\u064b \u0628\u0647 \u0635\u0648\u0631\u062a \u0645\u062e\u0641\u0641 \u0622\u0646 \u0634\u0646\u0627\u062e\u062a\u0647 \u0645\u06cc \u0634\u0648\u062f. <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/www.nltk.org\/\">NLTK<\/a>\u060c \u0648 \u062f\u06cc\u06af\u0631\u06cc \u0627\u0633\u062a <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/github.com\/clips\/pattern\/\">\u0627\u0644\u06af\u0648<\/a>.  NLTK \u06cc\u06a9 \u0628\u0633\u062a\u0647 \u0633\u0646\u062a\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0631\u0627\u06cc \u067e\u0631\u062f\u0627\u0632\u0634 \u0645\u062a\u0646 \u06cc\u0627 <em>\u067e\u0631\u062f\u0627\u0632\u0634 \u0632\u0628\u0627\u0646 \u0637\u0628\u06cc\u0639\u06cc (NLP)<\/em>\u0648 Pattern \u0639\u0645\u062f\u062a\u0627\u064b \u0628\u0631\u0627\u06cc \u0648\u0628 \u06a9\u0627\u0648\u06cc \u0633\u0627\u062e\u062a\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a.<\/p>\n<p>TextBlob \u0628\u0647 \u06af\u0648\u0646\u0647\u200c\u0627\u06cc \u0637\u0631\u0627\u062d\u06cc \u0634\u062f\u0647 \u0627\u0633\u062a \u06a9\u0647 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0648 \u062f\u0633\u062a\u06a9\u0627\u0631\u06cc \u0622\u0646 \u0622\u0633\u0627\u0646\u200c\u062a\u0631 \u0627\u0632 NLTK \u0628\u0627\u0634\u062f\u060c \u062f\u0631 \u062d\u0627\u0644\u06cc \u06a9\u0647 \u0647\u0645\u0627\u0646 \u0648\u0638\u0627\u06cc\u0641 \u0645\u0647\u0645 NLP \u0645\u0627\u0646\u0646\u062f \u0648\u0627\u0698\u0647\u200c\u0633\u0627\u0632\u06cc\u060c \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a\u060c \u0631\u06cc\u0634\u0647\u200c\u06af\u0630\u0627\u0631\u06cc\u060c 
\u0628\u0631\u0686\u0633\u0628\u200c\u06af\u0630\u0627\u0631\u06cc POS\u060c \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0639\u0628\u0627\u0631\u062a \u0627\u0633\u0645\u06cc\u060c \u0637\u0628\u0642\u0647\u200c\u0628\u0646\u062f\u06cc\u060c \u062a\u0631\u062c\u0645\u0647 \u0648 \u0645\u0648\u0627\u0631\u062f \u062f\u06cc\u06af\u0631 \u0631\u0627 \u062d\u0641\u0638 \u0645\u06cc\u200c\u06a9\u0646\u062f.  \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0644\u06cc\u0633\u062a \u06a9\u0627\u0645\u0644\u06cc \u0627\u0632 \u0648\u0638\u0627\u06cc\u0641 \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0646\u06cc\u062f \u0631\u0648\u06cc \u0631\u0627 <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/pypi.org\/project\/textblob\/\">TextBlob PyPI page<\/a>.<\/p>\n<p>\u0627\u06af\u0631 \u0628\u0647 \u062f\u0646\u0628\u0627\u0644 \u06cc\u06a9 \u0646\u0645\u0627\u06cc \u06a9\u0644\u06cc \u0627\u0632 \u0628\u0633\u06cc\u0627\u0631\u06cc \u0627\u0632 \u0648\u0638\u0627\u06cc\u0641 NLP \u0647\u0633\u062a\u06cc\u062f \u06a9\u0647 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u0646\u062f \u0628\u0627 TextBlob \u0627\u062c\u0631\u0627 \u0634\u0648\u0646\u062f\u060c \u0628\u0647 \u0631\u0627\u0647\u0646\u0645\u0627\u06cc \u00abPython for NLP: \u0645\u0642\u062f\u0645\u0647\u200c\u0627\u06cc \u0628\u0631 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 TextBlob\u00bb \u0646\u06af\u0627\u0647\u06cc \u0628\u06cc\u0646\u062f\u0627\u0632\u06cc\u062f.<\/p>\n<p>\u0647\u06cc\u0686 \u067e\u06cc\u0634 \u0646\u06cc\u0627\u0632 \u0641\u0646\u06cc \u062e\u0627\u0635\u06cc \u0628\u0631\u0627\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 TextBlob \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632 \u0646\u06cc\u0633\u062a.  
\u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u0628\u0633\u062a\u0647 \u0628\u0631\u0627\u06cc \u0647\u0631 \u062f\u0648 \u067e\u0627\u06cc\u062a\u0648\u0646 2 \u0648 3 \u0642\u0627\u0628\u0644 \u0627\u062c\u0631\u0627 \u0627\u0633\u062a (Python >= 2.7 \u06cc\u0627 >= 3.5).<\/p>\n<p>\u0647\u0645\u0686\u0646\u06cc\u0646\u060c \u062f\u0631 \u0635\u0648\u0631\u062a\u06cc \u06a9\u0647 \u0647\u06cc\u0686 \u06af\u0648\u0646\u0647 \u0627\u0637\u0644\u0627\u0639\u0627\u062a \u0645\u062a\u0646\u06cc \u062f\u0631 \u062f\u0633\u062a\u0631\u0633 \u0646\u062f\u0627\u0631\u06cc\u062f\u060c TextBlob \u0645\u062c\u0645\u0648\u0639\u0647 \u0647\u0627\u06cc \u0644\u0627\u0632\u0645 \u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0632\u0628\u0627\u0646 (\u0645\u0639\u0645\u0648\u0644\u0627\u064b \u0645\u062a\u0648\u0646) \u0631\u0627 \u0627\u0631\u0627\u0626\u0647 \u0645\u06cc \u062f\u0647\u062f \u06a9\u0647 \u0628\u0647 \u0646\u0627\u0645 <em>\u0628\u062f\u0646\u0647 \u0647\u0627<\/em>\u060c \u0627\u0632 \u067e\u0627\u06cc\u06af\u0627\u0647 \u062f\u0627\u062f\u0647 NLTK.<\/p>\n<h2 id=\"installingtextblob\"><span class=\"ez-toc-section\" id=\"%d9%86%d8%b5%d8%a8_textblob\"><\/span>\u0646\u0635\u0628 TextBlob<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0627 \u0646\u0635\u0628 TextBlob \u0634\u0631\u0648\u0639 \u06a9\u0646\u06cc\u0645.  
\u0627\u06af\u0631 \u0627\u0632 a \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u062f terminal\u060c command-line\u060c \u06cc\u0627 \u062e\u0637 \u0641\u0631\u0645\u0627\u0646\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-meta\">$<\/span><span class=\"bash\"> pip install textblob<\/span>\n<\/code><\/pre>\n<p>\u062f\u0631 \u063a\u06cc\u0631 \u0627\u06cc\u0646 \u0635\u0648\u0631\u062a\u060c \u0627\u06af\u0631 \u0627\u0632 a Jupyter Notebook\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u062f\u0633\u062a\u0648\u0631 \u0631\u0627 \u0645\u0633\u062a\u0642\u06cc\u0645\u0627\u064b \u0627\u0632 notebook \u0628\u0627 \u0627\u0636\u0627\u0641\u0647 \u06a9\u0631\u062f\u0646 \u0639\u0644\u0627\u0645\u062a \u062a\u0639\u062c\u0628 <code>!<\/code> \u062f\u0631 \u0627\u0628\u062a\u062f\u0627\u06cc \u0622\u0645\u0648\u0632\u0634:<\/p>\n<pre><code class=\"hljs\">!pip install textblob\n<\/code><\/pre>\n<div class=\"alert alert-note\">\n<div class=\"flex\">\n<div class=\"flex-shrink-0 mr-3\"><\/div>\n<div class=\"w-full\">\n<p>\u062a\u0648\u062c\u0647: \u0627\u06cc\u0646 process \u0628\u0647 \u062f\u0644\u06cc\u0644 \u062a\u0639\u062f\u0627\u062f \u0632\u06cc\u0627\u062f \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645\u200c\u0647\u0627 \u0648 \u0645\u062c\u0645\u0648\u0639\u0647\u200c\u0647\u0627\u06cc\u06cc \u06a9\u0647 \u0627\u06cc\u0646 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u062f\u0627\u0631\u062f\u060c \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u06a9\u0645\u06cc \u0637\u0648\u0644 \u0628\u06a9\u0634\u062f.<\/p>\n<\/p><\/div><\/div><\/div>\n<p>\u067e\u0633 \u0627\u0632 \u0646\u0635\u0628 TextBlob\u060c \u0628\u0631\u0627\u06cc \u062f\u0627\u0634\u062a\u0646 \u0646\u0645\u0648\u0646\u0647 \u0645\u062a\u0646\u06cc\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0627 \u0627\u062c\u0631\u0627\u06cc 
\u062f\u0633\u062a\u0648\u0631\u0627\u062a \u0645\u062a\u0646\u06cc \u0631\u0627 \u062f\u0627\u0646\u0644\u0648\u062f \u06a9\u0646\u06cc\u062f. <code>python -m textblob.download_corpora<\/code> \u0641\u0631\u0645\u0627\u0646  \u06cc\u06a9 \u0628\u0627\u0631 \u062f\u06cc\u06af\u0631\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0622\u0646 \u0631\u0627 \u0645\u0633\u062a\u0642\u06cc\u0645\u0627\u064b \u062f\u0631 \u062e\u0637 \u0641\u0631\u0645\u0627\u0646 \u06cc\u0627 \u062f\u0631 a \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f notebook \u0642\u0628\u0644 \u0627\u0632 \u0622\u0646 \u0628\u0627 \u0639\u0644\u0627\u0645\u062a \u062a\u0639\u062c\u0628.<\/p>\n<p>\u0647\u0646\u06af\u0627\u0645 \u0627\u062c\u0631\u0627\u06cc \u062f\u0633\u062a\u0648\u0631\u060c \u0628\u0627\u06cc\u062f \u062e\u0631\u0648\u062c\u06cc \u0632\u06cc\u0631 \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-meta\">$<\/span><span class=\"bash\"> python -m textblob.download_corpora<\/span>\n[nltk_data] Downloading package brown to \/Users\/csamp\/nltk_data...\n[nltk_data]   Package brown is already up-to-date!\n[nltk_data] Downloading package punkt to \/Users\/csamp\/nltk_data...\n[nltk_data]   Package punkt is already up-to-date!\n[nltk_data] Downloading package wordnet to \/Users\/csamp\/nltk_data...\n[nltk_data]   Package wordnet is already up-to-date!\n[nltk_data] Downloading package averaged_perceptron_tagger to\n[nltk_data]     \/Users\/csamp\/nltk_data...\n[nltk_data]   Package averaged_perceptron_tagger is already up-to-\n[nltk_data]       date!\n[nltk_data] Downloading package conll2000 to \/Users\/csamp\/nltk_data...\n[nltk_data]   Unzipping corpora\/conll2000.zip.\n[nltk_data] Downloading package movie_reviews to\n[nltk_data]     \/Users\/csamp\/nltk_data...\n[nltk_data]   Unzipping corpora\/movie_reviews.zip.\nFinished.\n<\/code><\/pre>\n<p>\u0645\u0627 \u0642\u0628\u0644\u0627 \u0628\u0633\u062a\u0647 TextBlob \u0648 
\u0645\u062c\u0645\u0648\u0639\u0647 \u0647\u0627\u06cc \u0622\u0646 \u0631\u0627 \u0646\u0635\u0628 \u06a9\u0631\u062f\u0647 \u0627\u06cc\u0645.  \u062d\u0627\u0644\u060c \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u06cc\u0634\u062a\u0631 \u062f\u0631 \u0645\u0648\u0631\u062f \u0644\u0645\u062a \u0633\u0627\u0632\u06cc \u0628\u062f\u0627\u0646\u06cc\u0645.<\/p>\n<blockquote>\n<p>\u0628\u0631\u0627\u06cc \u0645\u062d\u062a\u0648\u0627\u06cc \u0628\u06cc\u0634\u062a\u0631 TextBlob\u060c NLP \u0633\u0627\u062f\u0647 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0627 TextBlob: Tokenization\u060c NLP \u0633\u0627\u062f\u0647 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0627 TextBlob: \u062a\u0634\u062e\u06cc\u0635 N-Grams \u0648 \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0627 \u0631\u0627\u0647\u0646\u0645\u0627\u06cc TextBlob \u0631\u0627 \u0628\u0631\u0631\u0633\u06cc \u06a9\u0646\u06cc\u062f.<\/p>\n<\/blockquote>\n<h2 id=\"whatislemmatization\"><span class=\"ez-toc-section\" id=\"lemmatization_%da%86%db%8c%d8%b3%d8%aa%d8%9f\"><\/span>Lemmatization \u0686\u06cc\u0633\u062a\u061f<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0642\u0628\u0644 \u0627\u0632 \u0627\u06cc\u0646\u06a9\u0647 \u0639\u0645\u06cc\u0642 \u062a\u0631 \u0628\u0647 \u062d\u0648\u0632\u0647 NLP \u0628\u0631\u0648\u06cc\u062f\u060c \u0628\u0627\u06cc\u062f \u0628\u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0631\u062e\u06cc \u0627\u0632 \u0627\u0635\u0637\u0644\u0627\u062d\u0627\u062a \u06a9\u0644\u06cc\u062f\u06cc \u0631\u0627 \u0628\u0634\u0646\u0627\u0633\u06cc\u062f:<\/p>\n<p><strong>\u0645\u062c\u0645\u0648\u0639\u0647 \u0646\u0648\u0634\u062a\u0647 \u0647\u0627<\/strong> (\u06cc\u0627 \u067e\u06cc\u06a9\u0631\u0647\u0627 \u0628\u0647 \u0635\u0648\u0631\u062a \u062c\u0645\u0639) &#8211; \u0645\u062c\u0645\u0648\u0639\u0647 
\u062e\u0627\u0635\u06cc \u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0632\u0628\u0627\u0646 (\u0645\u062b\u0644\u0627\u064b \u0645\u062a\u0648\u0646) \u0627\u0633\u062a.  \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c Corpora \u0645\u0639\u0645\u0648\u0644\u0627\u064b \u0628\u0631\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u0645\u062f\u0644\u200c\u0647\u0627\u06cc \u0645\u062e\u062a\u0644\u0641 \u0637\u0628\u0642\u0647\u200c\u0628\u0646\u062f\u06cc \u0645\u062a\u0646 \u06cc\u0627 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc\u200c\u0634\u0648\u062f.<\/p>\n<p><strong>\u0644\u0645\u0627<\/strong> &#8211; \u06a9\u0644\u0645\u0647 \u0627\u06cc \u0627\u0633\u062a \u06a9\u0647 \u062f\u0631 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0628\u0647 \u062f\u0646\u0628\u0627\u0644 \u0622\u0646 \u0645\u06cc \u06af\u0631\u062f\u06cc\u062f.  \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u0627\u06af\u0631 \u0645\u06cc \u062e\u0648\u0627\u0647\u06cc\u062f \u0628\u0647 \u062a\u0639\u0631\u06cc\u0641 \u0641\u0639\u0644 &#8220;runs&#8221; \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u062f\u060c \u0628\u0627\u06cc\u062f &#8220;run&#8221; \u0631\u0627 \u062c\u0633\u062a\u062c\u0648 \u06a9\u0646\u06cc\u062f.<\/p>\n<p><strong>\u0633\u0627\u0642\u0647<\/strong> &#8211; \u0628\u062e\u0634\u06cc \u0627\u0632 \u06cc\u06a9 \u06a9\u0644\u0645\u0647 \u0627\u0633\u062a \u06a9\u0647 \u0647\u0631\u06af\u0632 \u062a\u063a\u06cc\u06cc\u0631 \u0646\u0645\u06cc \u06a9\u0646\u062f.<\/p>\n<p>\u062e\u0648\u062f \u0644\u0645\u0627\u062a\u06cc\u0632\u0627\u0633\u06cc\u0648\u0646 \u0686\u06cc\u0633\u062a\u061f<\/p>\n<blockquote>\n<p>Lemmatization \u0627\u0633\u062a process \u0628\u0647 \u062f\u0633\u062a \u0622\u0648\u0631\u062f\u0646 \u0644\u0645 \u06a9\u0644\u0645\u0627\u062a \u0627\u0632 \u06cc\u06a9 
\u067e\u06cc\u06a9\u0631\u0647.<\/p>\n<\/blockquote>\n<p>\u0646\u0645\u0648\u0646\u0647 \u0627\u06cc \u0627\u0632 \u0627\u06cc\u0646 \u0645\u0648\u0636\u0648\u0639 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u062c\u0645\u0644\u0647 \u0632\u06cc\u0631 \u0628\u0627\u0634\u062f:<\/p>\n<ul>\n<li>\u0648\u0631\u0648\u062f\u06cc (\u062c\u0633\u0645): \u0622\u0644\u06cc\u0633 \u0641\u06a9\u0631 \u0645\u06cc \u06a9\u0646\u062f \u06af\u0645 \u0634\u062f\u0647 \u0627\u0633\u062a\u060c \u0627\u0645\u0627 \u0628\u0639\u062f \u0634\u0631\u0648\u0639 \u0628\u0647 \u06cc\u0627\u0641\u062a\u0646 \u062e\u0648\u062f \u0645\u06cc \u06a9\u0646\u062f<\/li>\n<li>\u062e\u0631\u0648\u062c\u06cc (\u0644\u0645): |  \u0622\u0644\u06cc\u0633 |  \u0641\u06a9\u0631 \u06a9\u0646 |  \u0627\u0648 |  \u0627\u0633\u062a |  \u06af\u0645 \u0634\u062f\u0647 |  \u0627\u0645\u0627 |  \u0633\u067e\u0633 |  \u0634\u0631\u0648\u0639 |  \u0628\u0647 |  \u067e\u06cc\u062f\u0627 \u06a9\u0631\u062f\u0646 |  \u062e\u0648\u062f\u0634 |<\/li>\n<\/ul>\n<p>\u062a\u0648\u062c\u0647 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f \u06a9\u0647 \u0647\u0631 \u06a9\u0644\u0645\u0647 \u062f\u0631 \u062c\u0645\u0644\u0647 \u0648\u0631\u0648\u062f\u06cc \u0628\u0627 \u062a\u0648\u062c\u0647 \u0628\u0647 \u0628\u0627\u0641\u062a \u0622\u0646 \u062f\u0631 \u062c\u0645\u0644\u0647 \u0627\u0635\u0644\u06cc \u0628\u0647 \u0635\u0648\u0631\u062a \u0644\u0645\u0627\u062a\u06cc\u0632\u0647 \u0645\u06cc \u0634\u0648\u062f.  
\u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c &#8220;\u0622\u0644\u06cc\u0633&#8221; \u06cc\u06a9 \u0627\u0633\u0645 \u062e\u0627\u0635 \u0627\u0633\u062a\u060c \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u062b\u0627\u0628\u062a \u0645\u06cc \u0645\u0627\u0646\u062f \u0648 \u0627\u0641\u0639\u0627\u0644 &#8220;\u0641\u06a9\u0631 \u0645\u06cc \u06a9\u0646\u062f&#8221; \u0648 &#8220;\u0634\u0631\u0648\u0639 \u0645\u06cc \u06a9\u0646\u062f&#8221; \u062f\u0631 \u0634\u06a9\u0644 \u0647\u0627\u06cc \u067e\u0627\u06cc\u0647 \u062e\u0648\u062f &#8220;\u0627\u0646\u062f\u06cc\u0634\u06cc\u062f\u0646&#8221; \u0648 &#8220;\u0634\u0631\u0648\u0639&#8221; \u0627\u0631\u062c\u0627\u0639 \u0645\u06cc \u0634\u0648\u0646\u062f.<\/p>\n<p>Lemmatization \u06cc\u06a9\u06cc \u0627\u0632 \u0645\u0631\u0627\u062d\u0644 \u0627\u0633\u0627\u0633\u06cc \u067e\u0631\u062f\u0627\u0632\u0634 \u0632\u0628\u0627\u0646 \u0627\u0633\u062a.  \u06a9\u0644\u0645\u0627\u062a \u0631\u0627 \u0628\u0631\u0627\u06cc \u0622\u0646\u0647\u0627 \u0628\u0647 \u0627\u0631\u0645\u063a\u0627\u0646 \u0645\u06cc \u0622\u0648\u0631\u062f root \u0641\u0631\u0645 \u0647\u0627 \u06cc\u0627 <em>\u0644\u0645 \u0647\u0627<\/em>\u060c \u06a9\u0647 \u0627\u06af\u0631 \u062f\u0631 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0628\u0647 \u062f\u0646\u0628\u0627\u0644 \u0622\u0646\u0647\u0627 \u0628\u0627\u0634\u06cc\u0645\u060c \u0622\u0646\u0647\u0627 \u0631\u0627 \u067e\u06cc\u062f\u0627 \u0645\u06cc \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u062f\u0631 \u0645\u0648\u0631\u062f TextBlob\u060c \u0648\u0627\u0698\u0647\u200c\u0633\u0627\u0632\u06cc \u0645\u0628\u062a\u0646\u06cc \u0627\u0633\u062a \u0631\u0648\u06cc \u067e\u0627\u06cc\u06af\u0627\u0647 \u062f\u0627\u062f\u0647 \u0627\u06cc \u0628\u0647 \u0646\u0627\u0645 <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/wordnet.princeton.edu\/\">\u0648\u0631\u062f \u0646\u062a<\/a>\u06a9\u0647 \u062a\u0648\u0633\u0637 
\u062f\u0627\u0646\u0634\u06af\u0627\u0647 \u067e\u0631\u06cc\u0646\u0633\u062a\u0648\u0646 \u062a\u0648\u0633\u0639\u0647 \u0648 \u0646\u06af\u0647\u062f\u0627\u0631\u06cc \u0645\u06cc \u0634\u0648\u062f.  \u062f\u0631 \u067e\u0634\u062a \u0635\u062d\u0646\u0647\u060c TextBlob \u0627\u0632 WordNet \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u062f <a target=\"_blank\" rel=\"nofollow noopener\" href=\"https:\/\/wordnet.princeton.edu\/documentation\/morphy7wn\">\u0645\u0648\u0631\u0641\u06cc<\/a> \u067e\u0631\u062f\u0627\u0632\u0646\u062f\u0647 \u0628\u0631\u0627\u06cc \u0628\u0647 \u062f\u0633\u062a \u0622\u0648\u0631\u062f\u0646 \u0644\u0645 \u0628\u0631\u0627\u06cc \u06cc\u06a9 \u06a9\u0644\u0645\u0647.<\/p>\n<div class=\"alert alert-note\">\n<div class=\"flex\">\n<div class=\"flex-shrink-0 mr-3\"><\/div>\n<div class=\"w-full\">\n<p><strong>\u062a\u0648\u062c\u0647 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f<\/strong>: \u062c\u0647\u062a \u0645\u0631\u0627\u062c\u0639\u0647 \u0628\u06cc\u0634\u062a\u0631 \u0631\u0648\u06cc \u0631\u0648\u0634 \u0639\u0645\u0644\u06a9\u0631\u062f \u0648\u0627\u0698\u0647\u200c\u0633\u0627\u0632\u06cc \u062f\u0631 TextBlob\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u0646\u06af\u0627\u0647\u06cc \u0628\u0647 \u0622\u0646 \u0628\u06cc\u0646\u062f\u0627\u0632\u06cc\u062f <a target=\"_blank\" rel=\"nofollow noopener\" href=\"https:\/\/textblob.readthedocs.io\/en\/dev\/_modules\/textblob\/blob.html#Word.lemmatize\">\u0645\u0633\u062a\u0646\u062f\u0627\u062a<\/a>.<\/p>\n<\/p><\/div><\/div><\/div>\n<p>\u0627\u062d\u062a\u0645\u0627\u0644\u0627\u064b \u062a\u063a\u06cc\u06cc\u0631\u0627\u062a \u0642\u0627\u0628\u0644 \u062a\u0648\u062c\u0647\u06cc \u0631\u0627 \u0628\u0627 \u06a9\u0644\u0645\u0647 \u0646\u0648\u06cc\u0633\u06cc \u0645\u062a\u0648\u062c\u0647 \u0646\u062e\u0648\u0627\u0647\u06cc\u062f \u0634\u062f \u0645\u06af\u0631 \u0627\u06cc\u0646\u06a9\u0647 \u0628\u0627 
\u062d\u062c\u0645 \u0632\u06cc\u0627\u062f\u06cc \u0627\u0632 \u0645\u062a\u0646 \u06a9\u0627\u0631 \u06a9\u0646\u06cc\u062f.  \u062f\u0631 \u0622\u0646 \u0635\u0648\u0631\u062a\u060c \u0648\u0627\u0698\u0647\u200c\u0633\u0627\u0632\u06cc \u0628\u0647 \u06a9\u0627\u0647\u0634 \u0627\u0646\u062f\u0627\u0632\u0647 \u06a9\u0644\u0645\u0627\u062a\u06cc \u06a9\u0647 \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u062f\u0631 \u062c\u0633\u062a\u062c\u0648\u06cc \u0622\u0646\u0647\u0627 \u0628\u0627\u0634\u06cc\u0645 \u06a9\u0645\u06a9 \u0645\u06cc\u200c\u06a9\u0646\u062f \u0648 \u062f\u0631 \u0639\u06cc\u0646 \u062d\u0627\u0644 \u0633\u0639\u06cc \u0645\u06cc\u200c\u06a9\u0646\u06cc\u0645 \u0645\u062a\u0646 \u0622\u0646\u0647\u0627 \u0631\u0627 \u062f\u0631 \u062c\u0645\u0644\u0647 \u062d\u0641\u0638 \u06a9\u0646\u06cc\u0645.  \u0645\u06cc\u200c\u062a\u0648\u0627\u0646 \u0622\u0646 \u0631\u0627 \u0628\u06cc\u0634\u062a\u0631 \u062f\u0631 \u062a\u0648\u0633\u0639\u0647 \u0645\u062f\u0644\u200c\u0647\u0627\u06cc \u062a\u0631\u062c\u0645\u0647 \u0645\u0627\u0634\u06cc\u0646\u06cc\u060c \u0628\u0647\u06cc\u0646\u0647\u200c\u0633\u0627\u0632\u06cc \u0645\u0648\u062a\u0648\u0631\u0647\u0627\u06cc \u062c\u0633\u062a\u062c\u0648 \u06cc\u0627 \u0633\u0624\u0627\u0644\u0627\u062a \u0645\u062e\u062a\u0644\u0641 \u062a\u062c\u0627\u0631\u06cc \u0628\u0647 \u06a9\u0627\u0631 \u0628\u0631\u062f.<\/p>\n<h2 id=\"implementinglemmatizationincode\"><span class=\"ez-toc-section\" id=\"%d9%be%db%8c%d8%a7%d8%af%d9%87_%d8%b3%d8%a7%d8%b2%db%8c_lemmatization_%d8%af%d8%b1_%da%a9%d8%af\"><\/span>\u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc Lemmatization \u062f\u0631 \u06a9\u062f<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0627\u0648\u0644 \u0627\u0632 \u0647\u0645\u0647\u060c \u0644\u0627\u0632\u0645 \u0627\u0633\u062a \u06cc\u06a9 \u0634\u06cc TextBlob \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f \u0648 \u06cc\u06a9 \u067e\u06cc\u06a9\u0631\u0647 
\u0646\u0645\u0648\u0646\u0647 \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u062f \u06a9\u0647 \u0628\u0639\u062f\u0627\u064b \u0628\u0647 \u0635\u0648\u0631\u062a \u0644\u0645\u0627\u062a\u06cc\u0632\u0647 \u062e\u0648\u0627\u0647\u062f \u0634\u062f.  \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0631\u062d\u0644\u0647 \u0627\u0648\u0644\u06cc\u0647\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u06cc\u06a9 \u0631\u0634\u062a\u0647 \u0645\u062a\u0646 \u0628\u0631\u0627\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0628\u0646\u0648\u06cc\u0633\u06cc\u062f \u06cc\u0627 \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u062f (\u0645\u0627\u0646\u0646\u062f \u0627\u06cc\u0646 \u0631\u0627\u0647\u0646\u0645\u0627)\u060c \u06cc\u0627 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0632 \u0646\u0645\u0648\u0646\u0647\u200c\u0627\u06cc \u0627\u0632 \u0645\u062c\u0645\u0648\u0639\u0647 NLTK \u06a9\u0647 \u062f\u0627\u0646\u0644\u0648\u062f \u06a9\u0631\u062f\u0647\u200c\u0627\u06cc\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645.  \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0627 \u062f\u0648\u0645\u06cc \u0628\u0631\u0648\u06cc\u0645.<\/p>\n<h3 id=\"choosingareviewfromthenltkcorpus\"><span class=\"ez-toc-section\" id=\"%d8%a7%d9%86%d8%aa%d8%ae%d8%a7%d8%a8_%db%8c%da%a9_%d8%a8%d8%b1%d8%b1%d8%b3%db%8c_%d8%a7%d8%b2_nltk_corpus\"><\/span>\u0627\u0646\u062a\u062e\u0627\u0628 \u06cc\u06a9 \u0628\u0631\u0631\u0633\u06cc \u0627\u0632 NLTK Corpus<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0633\u0639\u06cc \u06a9\u0646\u06cc\u0645 \u0644\u0645 \u0647\u0627\u06cc \u06cc\u06a9 \u0646\u0642\u062f \u0641\u06cc\u0644\u0645 \u0631\u0627 \u06a9\u0647 \u062f\u0631 \u0645\u062c\u0645\u0648\u0639\u0647 \u0627\u0633\u062a \u0628\u0647 \u062f\u0633\u062a \u0622\u0648\u0631\u06cc\u0645.  
\u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0627\u06cc\u0646 \u06a9\u0627\u0631\u060c \u0645\u0627 import \u0647\u0645 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 TextBlob \u0648 \u0647\u0645 <code>movie_reviews<\/code> \u0627\u0632 <code>nltk.corpus<\/code> \u0628\u0633\u062a\u0647:<\/p>\n<pre><code class=\"hljs\">\n<span class=\"hljs-keyword\">from<\/span> textblob <span class=\"hljs-keyword\">import<\/span> TextBlob\n<span class=\"hljs-keyword\">from<\/span> nltk.corpus <span class=\"hljs-keyword\">import<\/span> movie_reviews\n<\/code><\/pre>\n<p>\u067e\u0633 \u0627\u0632 \u0648\u0627\u0631\u062f \u06a9\u0631\u062f\u0646\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0646\u06af\u0627\u0647\u06cc \u0628\u0647 \u0641\u0627\u06cc\u0644\u200c\u0647\u0627\u06cc \u0646\u0642\u062f \u0641\u06cc\u0644\u0645 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0622\u0646 \u0628\u06cc\u0627\u0646\u062f\u0627\u0632\u06cc\u0645 <code>fileids()<\/code> \u0631\u0648\u0634.  
\u0627\u0632 \u0622\u0646\u062c\u0627\u06cc\u06cc \u06a9\u0647 \u0627\u06cc\u0646 \u06a9\u062f \u062f\u0631 a \u0627\u062c\u0631\u0627 \u0645\u06cc \u0634\u0648\u062f Jupyter \u0646\u0648\u062a \u0628\u0648\u06a9\u060c \u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0645\u0633\u062a\u0642\u06cc\u0645\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">movie_reviews.fileids()\n<\/code><\/pre>\n<p>\u0628\u0627 \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0644\u06cc\u0633\u062a\u06cc \u0627\u0632 2000 \u0646\u0627\u0645 \u0641\u0627\u06cc\u0644 \u0645\u062a\u0646\u06cc \u062d\u0627\u0648\u06cc \u0646\u0638\u0631\u0627\u062a \u0645\u0646\u0641\u06cc \u0648 \u0645\u062b\u0628\u062a \u0628\u0627\u0632 \u0645\u06cc \u06af\u0631\u062f\u062f:<\/p>\n<pre><code class=\"hljs\">['neg\/cv000_29416.txt',\n 'neg\/cv001_19502.txt',\n 'neg\/cv002_17424.txt',\n 'neg\/cv003_12683.txt',\n 'neg\/cv004_12641.txt',\n 'neg\/cv005_29357.txt',\n 'neg\/cv006_17022.txt',\n 'neg\/cv007_4992.txt',\n 'neg\/cv008_29326.txt',\n 'neg\/cv009_29417.txt',\n ...]\n<\/code><\/pre>\n<div class=\"alert alert-note\">\n<div class=\"flex\">\n<div class=\"flex-shrink-0 mr-3\"><\/div>\n<div class=\"w-full\">\n<p><strong>\u062a\u0648\u062c\u0647 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f<\/strong>: \u0627\u06af\u0631 \u06a9\u062f \u0631\u0627 \u0628\u0647 \u0631\u0648\u0634 \u062f\u06cc\u06af\u0631\u06cc \u0627\u062c\u0631\u0627 \u0645\u06cc \u06a9\u0646\u06cc\u062f\u060c \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u062f\u0631 a terminal \u06cc\u0627 IDE\u060c \u0634\u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f print \u067e\u0627\u0633\u062e \u0628\u0627 \u0627\u062c\u0631\u0627 <code>print(movie_reviews.fileids())<\/code>.<\/p>\n<\/p><\/div><\/div><\/div>\n<p>\u0628\u0627 \u0646\u06af\u0627\u0647 \u06a9\u0631\u062f\u0646 \u0628\u0647 <strong>neg<\/strong> \u062f\u0631 
\u0646\u0627\u0645 \u0641\u0627\u06cc\u0644\u060c \u0645\u06cc \u062a\u0648\u0627\u0646 \u0641\u0631\u0636 \u06a9\u0631\u062f \u06a9\u0647 \u0644\u06cc\u0633\u062a \u0628\u0627 \u0628\u0631\u0631\u0633\u06cc \u0647\u0627\u06cc \u0645\u0646\u0641\u06cc \u0634\u0631\u0648\u0639 \u0645\u06cc \u0634\u0648\u062f \u0648 \u0628\u0627 \u0628\u0631\u0631\u0633\u06cc \u0647\u0627\u06cc \u0645\u062b\u0628\u062a \u0628\u0647 \u067e\u0627\u06cc\u0627\u0646 \u0645\u06cc \u0631\u0633\u062f.  \u0628\u0627 \u0646\u0645\u0627\u06cc\u0647 \u0633\u0627\u0632\u06cc \u0627\u0632 \u0627\u0646\u062a\u0647\u0627\u06cc \u0644\u06cc\u0633\u062a \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0628\u0647 \u0628\u0631\u0631\u0633\u06cc \u0645\u062b\u0628\u062a \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u0645.  \u062f\u0631 \u0627\u06cc\u0646\u062c\u0627\u060c \u0645\u0627 1989\u0645\u06cc\u0646 \u0628\u0631\u0631\u0633\u06cc \u0631\u0627 \u0627\u0646\u062a\u062e\u0627\u0628 \u0645\u06cc \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">movie_reviews.fileids()[-<span class=\"hljs-number\">10<\/span>]\n<\/code><\/pre>\n<p>\u0627\u06cc\u0646 \u0645\u0646\u062c\u0631 \u0628\u0647:<\/p>\n<pre><code class=\"hljs\">'pos\/cv990_11591.txt'\n<\/code><\/pre>\n<p>\u0628\u0631\u0627\u06cc \u0628\u0631\u0631\u0633\u06cc \u062c\u0645\u0644\u0627\u062a \u0645\u0631\u0648\u0631\u06cc\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0646\u0627\u0645 \u0646\u0642\u062f \u0631\u0627 \u0628\u0647 \u0622\u0646 \u0645\u0646\u062a\u0642\u0644 \u06a9\u0646\u06cc\u0645 <code>.sents()<\/code> \u0645\u062a\u062f\u060c \u06a9\u0647 \u0644\u06cc\u0633\u062a\u06cc \u0627\u0632 \u062a\u0645\u0627\u0645 \u062c\u0645\u0644\u0627\u062a \u0628\u0627\u0632\u0628\u06cc\u0646\u06cc \u0631\u0627 \u062e\u0631\u0648\u062c\u06cc \u0645\u06cc \u062f\u0647\u062f:<\/p>\n<pre><code class=\"hljs\">movie_reviews.sents(<span class=\"hljs-string\">'pos\/cv990_11591.txt'<\/span>)\n<\/code><\/pre>\n<pre><code 
class=\"hljs\">(('the', 'relaxed', 'dude', 'rides', 'a', 'roller', 'coaster',\n'the', 'big', 'lebowski', 'a', 'film', 'review', 'by', 'michael',\n'redman', 'copyright', '1998', 'by', 'michael', 'redman', 'the',\n'most', 'surreal', 'situations', 'are', 'ordinary', 'everyday',\n'life', 'as', 'viewed', 'by', 'an', 'outsider', '.'), ('when',\n'those', 'observers', 'are', 'joel', 'and', 'ethan', 'coen', ',',\n'the', 'surreal', 'becomes', 'bizarre', '.'), ...)\n<\/code><\/pre>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u06cc\u0646 \u0644\u06cc\u0633\u062a \u0631\u0627 \u062f\u0631 \u0645\u062a\u063a\u06cc\u0631\u06cc \u0628\u0647 \u0646\u0627\u0645 \u0630\u062e\u06cc\u0631\u0647 \u06a9\u0646\u06cc\u0645 <code>pos_review<\/code>:<\/p>\n<pre><code class=\"hljs\">pos_review = movie_reviews.sents(<span class=\"hljs-string\">\"pos\/cv990_11591.txt\"<\/span>)\n<span class=\"hljs-built_in\">len<\/span>(pos_review) \n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u0645\u06cc \u0628\u06cc\u0646\u06cc\u0645 \u06a9\u0647 63 \u062c\u0645\u0644\u0647 \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f.  
\u0627\u06a9\u0646\u0648\u0646 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u06cc\u06a9 \u062c\u0645\u0644\u0647 \u0631\u0627 \u0628\u0631\u0627\u06cc \u06a9\u0644\u0645\u0647\u200c\u0633\u0627\u0632\u06cc \u0627\u0646\u062a\u062e\u0627\u0628 \u06a9\u0646\u06cc\u0645\u060c \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u062c\u0645\u0644\u0647 \u0647\u0641\u062f\u0647\u0645:<\/p>\n<pre><code class=\"hljs\">sentence = pos_review[<span class=\"hljs-number\">16<\/span>]\n<span class=\"hljs-built_in\">type<\/span>(sentence) \n<\/code><\/pre>\n<h3 id=\"creatingatextblobobject\"><span class=\"ez-toc-section\" id=\"%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%db%8c%da%a9_%d8%b4%db%8c%d8%a1_textblob\"><\/span>\u0627\u06cc\u062c\u0627\u062f \u06cc\u06a9 \u0634\u06cc\u0621 TextBlob<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u067e\u0633 \u0627\u0632 \u0627\u0646\u062a\u062e\u0627\u0628 \u062c\u0645\u0644\u0647\u060c \u0628\u0627\u06cc\u062f \u06cc\u06a9 \u0634\u06cc TextBlob \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645 \u062a\u0627 \u0628\u062a\u0648\u0627\u0646\u06cc\u0645 \u0628\u0647 \u0622\u0646 \u062f\u0633\u062a\u0631\u0633\u06cc \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u0645 <code>.lemmatize()<\/code> \u0631\u0648\u0634.  \u0627\u0634\u06cc\u0627\u0621 TextBlob \u0628\u0627\u06cc\u062f \u0627\u0632 \u0631\u0634\u062a\u0647 \u0647\u0627 \u0627\u06cc\u062c\u0627\u062f \u0634\u0648\u0646\u062f.  
\u0627\u0632 \u0622\u0646\u062c\u0627\u06cc\u06cc \u06a9\u0647 \u0645\u0627 \u06cc\u06a9 \u0644\u06cc\u0633\u062a \u062f\u0627\u0631\u06cc\u0645\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0622\u0646 \u0631\u0627 \u0628\u0647 \u06cc\u06a9 \u0631\u0634\u062a\u0647 \u062a\u0628\u062f\u06cc\u0644 \u06a9\u0646\u06cc\u0645 <code>string.join()<\/code> \u0631\u0648\u0634\u060c \u067e\u06cc\u0648\u0633\u062a\u0646 \u0628\u0631 \u0627\u0633\u0627\u0633 \u0631\u0648\u06cc \u0641\u0636\u0627\u0647\u0627\u06cc \u062e\u0627\u0644\u06cc:<\/p>\n<pre><code class=\"hljs\">sentence_string = <span class=\"hljs-string\">' '<\/span>.join(sentence)\n<\/code><\/pre>\n<p>\u0627\u06a9\u0646\u0648\u0646 \u06a9\u0647 \u0631\u0634\u062a\u0647 \u062c\u0645\u0644\u0647 \u062e\u0648\u062f \u0631\u0627 \u062f\u0627\u0631\u06cc\u0645\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0622\u0646 \u0631\u0627 \u0628\u0647 \u0633\u0627\u0632\u0646\u062f\u0647 TextBlob \u0627\u0631\u0633\u0627\u0644 \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">blob_object = TextBlob(sentence_string)\n<\/code><\/pre>\n<p>\u0647\u0646\u06af\u0627\u0645\u06cc \u06a9\u0647 \u0634\u06cc TextBlob \u0631\u0627 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u0645\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0639\u0645\u0644\u06cc\u0627\u062a \u0645\u062e\u062a\u0644\u0641\u06cc \u0645\u0627\u0646\u0646\u062f lemmatization \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u062f\u0647\u06cc\u0645.<\/p>\n<h3 id=\"lemmatizationofasentence\"><span class=\"ez-toc-section\" id=\"%d8%ae%d9%84%d8%a7%d8%b5%d9%87_%d8%b3%d8%a7%d8%b2%db%8c_%db%8c%da%a9_%d8%ac%d9%85%d9%84%d9%87\"><\/span>\u062e\u0644\u0627\u0635\u0647 \u0633\u0627\u0632\u06cc \u06cc\u06a9 \u062c\u0645\u0644\u0647<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0628\u0631\u0627\u06cc \u0628\u0647 \u062f\u0633\u062a \u0622\u0648\u0631\u062f\u0646 
\u0648\u0627\u0698\u0647\u200c\u0647\u0627\u06cc \u0648\u0627\u0698\u0647\u200c\u0628\u0646\u062f\u06cc\u060c \u0628\u0647 \u0633\u0627\u062f\u06af\u06cc \u0639\u0628\u0627\u0631\u062a \u0631\u0627 \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0645\u06cc\u200c\u06a9\u0646\u06cc\u0645 <code>words<\/code> \u0648\u06cc\u0698\u06af\u06cc \u0627\u06cc\u062c\u0627\u062f \u0634\u062f\u0647 <code>blob_object<\/code>.  \u0627\u06cc\u0646 \u0644\u06cc\u0633\u062a\u06cc \u062d\u0627\u0648\u06cc \u0627\u0634\u06cc\u0627\u0621 Word \u0628\u0647 \u0645\u0627 \u0645\u06cc \u062f\u0647\u062f \u06a9\u0647 \u0628\u0633\u06cc\u0627\u0631 \u0634\u0628\u06cc\u0647 \u0628\u0647 \u0627\u0634\u06cc\u0627\u0621 \u0631\u0634\u062a\u0647 \u0627\u06cc \u0639\u0645\u0644 \u0645\u06cc \u06a9\u0646\u0646\u062f:<\/p>\n<pre><code class=\"hljs\">\ncorpus_words = blob_object.words\n\n<span class=\"hljs-built_in\">print<\/span>(<span class=\"hljs-string\">'sentence:'<\/span>, corpus_words)\n\nnumber_of_tokens = <span class=\"hljs-built_in\">len<\/span>(corpus_words)\n<span class=\"hljs-built_in\">print<\/span>(<span class=\"hljs-string\">'\\nnumber of tokens:'<\/span>, number_of_tokens)\n<\/code><\/pre>\n<p>\u062f\u0633\u062a\u0648\u0631\u0627\u062a \u062e\u0631\u0648\u062c\u06cc \u0628\u0627\u06cc\u062f \u0645\u0648\u0627\u0631\u062f \u0632\u06cc\u0631 \u0631\u0627 \u0628\u0647 \u0634\u0645\u0627 \u0628\u062f\u0647\u062f:<\/p>\n<pre><code class=\"hljs\">sentence: (<span class=\"hljs-string\">'the'<\/span>, <span class=\"hljs-string\">'carpet'<\/span>, <span class=\"hljs-string\">'is'<\/span>, <span class=\"hljs-string\">'important'<\/span>, <span class=\"hljs-string\">'to'<\/span>, <span class=\"hljs-string\">'him'<\/span>, <span class=\"hljs-string\">'because'<\/span>, <span class=\"hljs-string\">'it'<\/span>, <span class=\"hljs-string\">'pulls'<\/span>, <span class=\"hljs-string\">'the'<\/span>, <span class=\"hljs-string\">'room'<\/span>, <span class=\"hljs-string\">'together'<\/span>, <span 
class=\"hljs-string\">'not'<\/span>, <span class=\"hljs-string\">'surprisingly'<\/span>, <span class=\"hljs-string\">'since'<\/span>, <span class=\"hljs-string\">'it'<\/span>, <span class=\"hljs-string\">'s'<\/span>, <span class=\"hljs-string\">'virtually'<\/span>, <span class=\"hljs-string\">'the'<\/span>, <span class=\"hljs-string\">'only'<\/span>, <span class=\"hljs-string\">'object'<\/span>, <span class=\"hljs-string\">'there'<\/span>)\n\nnumber of tokens: <span class=\"hljs-number\">22<\/span>\n<\/code><\/pre>\n<p>\u0628\u0631\u0627\u06cc \u0645\u0641\u0647\u0648\u0645 \u0633\u0627\u0632\u06cc \u06a9\u0644\u0645\u0627\u062a\u060c \u0641\u0642\u0637 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0632 \u0622\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645 <code>.lemmatize()<\/code> \u0631\u0648\u0634:<\/p>\n<pre><code class=\"hljs\">corpus_words.lemmatize()\n<\/code><\/pre>\n<p>\u0627\u06cc\u0646 \u0628\u0647 \u0645\u0627 \u06cc\u06a9 \u0634\u06cc WordList \u0627\u0635\u0637\u0644\u0627\u062d\u06cc \u0645\u06cc \u062f\u0647\u062f:<\/p>\n<pre><code class=\"hljs\">WordList(('the', 'carpet', 'is', 'important', 'to', 'him', 'because', 'it', 'pull', 'the',\n'room', 'together', 'not', 'surprisingly', 'since', 'it', 's', 'virtually', 'the', 'only',\n'object', 'there'))\n<\/code><\/pre>\n<p>\u0627\u0632 \u0622\u0646\u062c\u0627\u06cc\u06cc \u06a9\u0647 \u062e\u0648\u0627\u0646\u062f\u0646 \u0627\u06cc\u0646 \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u06a9\u0645\u06cc \u062f\u0634\u0648\u0627\u0631 \u0628\u0627\u0634\u062f\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u06cc\u06a9 \u062d\u0644\u0642\u0647 \u0648 \u0627\u0646\u062c\u0627\u0645 \u062f\u0647\u06cc\u0645 print \u0647\u0631 \u06a9\u0644\u0645\u0647 \u0642\u0628\u0644 \u0648 \u0628\u0639\u062f \u0627\u0632 \u06a9\u0644\u0645\u0647 \u0646\u0648\u06cc\u0633\u06cc:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">for<\/span> word <span 
class=\"hljs-keyword\">in<\/span> corpus_words:\n    <span class=\"hljs-built_in\">print<\/span>(<span class=\"hljs-string\">f'<span class=\"hljs-subst\">{word}<\/span> | <span class=\"hljs-subst\">{word.lemmatize()}<\/span>'<\/span>)\n<\/code><\/pre>\n<p>\u0627\u06cc\u0646 \u0645\u0646\u062c\u0631 \u0628\u0647:<\/p>\n<pre><code class=\"hljs\">the | the\ncarpet | carpet\nis | is\nimportant | important\nto | to\nhim | him\nbecause | because\nit | it\npulls | pull\nthe | the\nroom | room\ntogether | together\nnot | not\nsurprisingly | surprisingly\nsince | since\nit | it\ns | s\nvirtually | virtually\nthe | the\nonly | only\nobject | object\nthere | there\n<\/code><\/pre>\n<p>\u062a\u0648\u062c\u0647 \u06a9\u0646\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 &#8220;pulls&#8221; \u0628\u0647 &#8220;pull&#8221; \u062a\u063a\u06cc\u06cc\u0631 \u06a9\u0631\u062f.  \u06a9\u0644\u0645\u0627\u062a \u062f\u06cc\u06af\u0631\u060c \u0639\u0644\u0627\u0648\u0647 \u0628\u0631 &#8220;it's&#8221;\u060c \u0646\u06cc\u0632 \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u0627\u0646\u062a\u0638\u0627\u0631 \u0645\u06cc \u0631\u0641\u062a\u060c \u0628\u0647 \u0635\u0648\u0631\u062a \u0644\u0645\u0627\u062a\u06cc\u06a9 \u0634\u062f\u0646\u062f.  \u0647\u0645\u0686\u0646\u06cc\u0646 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0628\u0628\u06cc\u0646\u06cc\u0645 \u06a9\u0647 \u00abit's\u00bb \u0628\u0647 \u062f\u0644\u06cc\u0644 \u0622\u067e\u0633\u062a\u0631\u0648\u0641 \u0627\u0632 \u0647\u0645 \u062c\u062f\u0627 \u0634\u062f\u0647 \u0627\u0633\u062a.  
\u0627\u06cc\u0646 \u0646\u0634\u0627\u0646 \u0645\u06cc \u062f\u0647\u062f \u06a9\u0647 \u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u062c\u0645\u0644\u0647 \u0631\u0627 \u0628\u06cc\u0634\u062a\u0631 \u067e\u06cc\u0634\u200c\u067e\u0631\u062f\u0627\u0632\u0634 \u06a9\u0646\u06cc\u0645\u060c \u0628\u0647 \u0637\u0648\u0631\u06cc \u06a9\u0647 \u00abit's\u00bb \u0628\u0647 \u062c\u0627\u06cc \u00abit\u00bb \u0648 \u00abs\u00bb \u06cc\u06a9 \u06a9\u0644\u0645\u0647 \u062f\u0631 \u0646\u0638\u0631 \u06af\u0631\u0641\u062a\u0647 \u0634\u0648\u062f.<\/p>\n<h3 id=\"differencebetweenlemmatizationandstemming\"><span class=\"ez-toc-section\" id=\"%d8%aa%d9%81%d8%a7%d9%88%d8%aa_%d8%a8%db%8c%d9%86_lemmatization_%d9%88_stemming\"><\/span>\u062a\u0641\u0627\u0648\u062a \u0628\u06cc\u0646 Lemmatization \u0648 Stemming<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>Lemmatization \u0627\u063a\u0644\u0628 \u0628\u0627 \u062a\u06a9\u0646\u06cc\u06a9 \u062f\u06cc\u06af\u0631\u06cc \u0628\u0647 \u0646\u0627\u0645 stemming \u0627\u0634\u062a\u0628\u0627\u0647 \u06af\u0631\u0641\u062a\u0647 \u0645\u06cc \u0634\u0648\u062f.  \u0627\u06cc\u0646 \u0633\u0631\u062f\u0631\u06af\u0645\u06cc \u0628\u0647 \u0627\u06cc\u0646 \u062f\u0644\u06cc\u0644 \u0631\u062e \u0645\u06cc \u062f\u0647\u062f \u06a9\u0647 \u0647\u0631 \u062f\u0648 \u062a\u06a9\u0646\u06cc\u06a9 \u0645\u0639\u0645\u0648\u0644\u0627\u064b \u0628\u0631\u0627\u06cc \u06a9\u0627\u0647\u0634 \u06a9\u0644\u0645\u0627\u062a \u0628\u0647 \u06a9\u0627\u0631 \u0645\u06cc \u0631\u0648\u0646\u062f.  
\u062f\u0631 \u062d\u0627\u0644\u06cc \u06a9\u0647 \u0648\u0627\u0698\u0647 \u0633\u0627\u0632\u06cc \u0627\u0632 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0648 \u062a\u0645\u0631\u06a9\u0632 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u062f \u0631\u0648\u06cc \u0628\u0627\u0641\u062a \u06a9\u0644\u0645\u0627\u062a \u062f\u0631 \u06cc\u06a9 \u062c\u0645\u0644\u0647\u060c \u062a\u0644\u0627\u0634 \u0628\u0631\u0627\u06cc \u062d\u0641\u0638 \u0622\u0646\u060c \u0631\u06cc\u0634\u0647 \u06cc\u0627\u0628\u06cc \u0627\u0632 \u0642\u0648\u0627\u0646\u06cc\u0646 \u0628\u0631\u0627\u06cc \u062d\u0630\u0641 \u067e\u0633\u0648\u0646\u062f\u0647\u0627\u06cc \u06a9\u0644\u0645\u0647 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u062f\u060c \u062a\u0645\u0631\u06a9\u0632 \u0631\u0648\u06cc \u0628\u0647 \u062f\u0633\u062a \u0622\u0648\u0631\u062f\u0646 \u0631\u06cc\u0634\u0647 \u06cc\u06a9 \u06a9\u0644\u0645\u0647<\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0647 \u0633\u0631\u0639\u062a \u062d\u0644\u0642\u0647 for \u062e\u0648\u062f \u0631\u0627 \u062a\u063a\u06cc\u06cc\u0631 \u062f\u0647\u06cc\u0645 \u062a\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u062a\u0641\u0627\u0648\u062a \u0647\u0627 \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-built_in\">print<\/span>(<span class=\"hljs-string\">'word | lemma | stem\\n'<\/span>)\n<span class=\"hljs-keyword\">for<\/span> word <span class=\"hljs-keyword\">in<\/span> corpus_words:\n    <span class=\"hljs-built_in\">print<\/span>(<span class=\"hljs-string\">f'<span class=\"hljs-subst\">{word}<\/span> | <span class=\"hljs-subst\">{word.lemmatize()}<\/span> | <span class=\"hljs-subst\">{word.stem()}<\/span>'<\/span>)\n<\/code><\/pre>\n<p>\u0627\u06cc\u0646 \u062e\u0631\u0648\u062c\u06cc:<\/p>\n<pre><code class=\"hljs\">the | the | the\ncarpet | carpet | carpet\nis | is | is\nimportant | important | import\nto | to | 
to\nhim | him | him\nbecause | because | becaus\nit | it | it\npulls | pull | pull\nthe | the | the\nroom | room | room\ntogether | together | togeth\nnot | not | not\nsurprisingly | surprisingly | surprisingli\nsince | since | sinc\nit | it | it\ns | s | s\nvirtually | virtually | virtual\nthe | the | the\nonly | only | onli\nobject | object | object\nthere | there | there\n<\/code><\/pre>\n<p>\u0648\u0642\u062a\u06cc \u0628\u0647 \u062e\u0631\u0648\u062c\u06cc \u0628\u0627\u0644\u0627 \u0646\u06af\u0627\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0628\u0628\u06cc\u0646\u06cc\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 stemming \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0645\u0634\u06a9\u0644 \u0633\u0627\u0632 \u0628\u0627\u0634\u062f.  \u00abimportant\u00bb \u0631\u0627 \u0628\u0647 \u00abimport\u00bb \u06a9\u0627\u0647\u0634 \u0645\u06cc \u062f\u0647\u062f \u0648 \u062a\u0645\u0627\u0645 \u0645\u0639\u0646\u06cc \u06a9\u0644\u0645\u0647 \u0627\u0632 \u062f\u0633\u062a \u0645\u06cc \u0631\u0648\u062f\u060c \u062a\u0627 \u062c\u0627\u06cc\u06cc \u06a9\u0647 \u062d\u062a\u06cc \u0645\u06cc \u062a\u0648\u0627\u0646 \u0622\u0646 \u0631\u0627 \u0627\u06a9\u0646\u0648\u0646 \u06cc\u06a9 \u0641\u0639\u0644 \u062f\u0631 \u0646\u0638\u0631 \u06af\u0631\u0641\u062a\u061b \u00abbecause\u00bb \u0628\u0647 \u00abbecaus\u00bb \u062a\u0628\u062f\u06cc\u0644 \u0645\u06cc \u0634\u0648\u062f \u06a9\u0647 \u06a9\u0644\u0645\u0647 \u0627\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0648\u062c\u0648\u062f \u0646\u062f\u0627\u0631\u062f\u060c \u0648 \u0647\u0645\u06cc\u0646 \u0637\u0648\u0631 \u00abtogeth\u00bb\u060c \u00absurprisingli\u00bb\u060c \u00absinc\u00bb \u0648 \u00abonli\u00bb.<\/p>\n<p>\u062a\u0641\u0627\u0648\u062a \u0647\u0627\u06cc \u0648\u0627\u0636\u062d\u06cc \u0628\u06cc\u0646 lemmatization \u0648 stemming \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f.  
\u062f\u0631\u06a9 \u0632\u0645\u0627\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0647\u0631 \u062a\u06a9\u0646\u06cc\u06a9 \u06a9\u0644\u06cc\u062f \u0627\u0635\u0644\u06cc \u0627\u0633\u062a.  \u0641\u0631\u0636 \u06a9\u0646\u06cc\u062f \u062f\u0631 \u062d\u0627\u0644 \u0628\u0647\u06cc\u0646\u0647 \u0633\u0627\u0632\u06cc \u062c\u0633\u062a\u062c\u0648\u06cc \u06a9\u0644\u0645\u0647 \u0647\u0633\u062a\u06cc\u062f \u0648 \u062a\u0645\u0631\u06a9\u0632 \u0631\u0648\u06cc \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 \u0628\u062a\u0648\u0627\u0646\u06cc\u062f \u062d\u062f\u0627\u06a9\u062b\u0631 \u062a\u0639\u062f\u0627\u062f \u06a9\u0644\u0645\u0627\u062a \u0645\u0634\u0627\u0628\u0647 \u0631\u0627 \u067e\u06cc\u0634\u0646\u0647\u0627\u062f \u062f\u0647\u06cc\u062f\u060c \u0627\u0632 \u06a9\u062f\u0627\u0645 \u062a\u06a9\u0646\u06cc\u06a9 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u062f\u061f  \u0648\u0642\u062a\u06cc \u0628\u0627\u0641\u062a \u06a9\u0644\u0645\u0647 \u0645\u0647\u0645 \u0646\u06cc\u0633\u062a\u060c \u0648 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u00abimportant\u00bb \u0631\u0627 \u0628\u0627 \u0639\u0628\u0627\u0631\u062a \u062c\u0633\u062a\u062c\u0648\u06cc \u00abimport\u00bb \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u06a9\u0646\u06cc\u0645\u060c \u0627\u0646\u062a\u062e\u0627\u0628 \u0648\u0627\u0636\u062d stemming \u0627\u0633\u062a. 
\u0627\u0632 \u0637\u0631\u0641 \u062f\u06cc\u06af\u0631\u060c \u0627\u06af\u0631 \u0634\u0645\u0627 \u06a9\u0627\u0631 \u0645\u06cc \u06a9\u0646\u06cc\u062f \u0631\u0648\u06cc \u0645\u0642\u0627\u06cc\u0633\u0647 \u0645\u062a\u0646 \u0633\u0646\u062f\u060c \u06a9\u0647 \u062f\u0631 \u0622\u0646 \u0645\u0648\u0642\u0639\u06cc\u062a \u06a9\u0644\u0645\u0627\u062a \u062f\u0631 \u06cc\u06a9 \u062c\u0645\u0644\u0647 \u0645\u0647\u0645 \u0627\u0633\u062a\u060c \u0648 \u0633\u06cc\u0627\u0642 &#8220;importance&#8221; \u0628\u0627\u06cc\u062f \u062d\u0641\u0638 \u0634\u0648\u062f \u0648 \u0628\u0627 \u0641\u0639\u0644 &#8220;import&#8221; \u0627\u0634\u062a\u0628\u0627\u0647 \u06af\u0631\u0641\u062a\u0647 \u0646\u0634\u0648\u062f\u060c \u0628\u0647\u062a\u0631\u06cc\u0646 \u0627\u0646\u062a\u062e\u0627\u0628 lemmatization \u0627\u0633\u062a.<\/p>\n<p>\u062f\u0631 \u0622\u062e\u0631\u06cc\u0646 \u0633\u0646\u0627\u0631\u06cc\u0648\u060c \u0641\u0631\u0636 \u06a9\u0646\u06cc\u062f \u062f\u0631 \u062d\u0627\u0644 \u06a9\u0627\u0631 \u0647\u0633\u062a\u06cc\u062f \u0631\u0648\u06cc \u06cc\u06a9 \u062c\u0633\u062a\u062c\u0648\u06cc \u06a9\u0644\u0645\u0647 \u0648 \u0633\u067e\u0633 \u0645\u0642\u0627\u06cc\u0633\u0647 \u0645\u062a\u0646 \u0633\u0646\u062f \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0634\u062f\u0647\u060c \u0627\u0632 \u0686\u0647 \u0686\u06cc\u0632\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u062f \u06a9\u0631\u062f\u061f  \u0647\u0645 stemming \u0648 \u0647\u0645 lemmatization.<\/p>\n<p>\u0645\u0627 \u062a\u0641\u0627\u0648\u062a \u0647\u0627\u06cc \u0628\u06cc\u0646 stemming \u0648 lemmatization \u0631\u0627 \u062f\u0631\u06a9 \u06a9\u0631\u062f\u0647 \u0627\u06cc\u0645.  
\u062d\u0627\u0644\u0627 \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0628\u06cc\u0646\u06cc\u0645 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0628\u0647 \u062c\u0627\u06cc \u06cc\u06a9 \u062c\u0645\u0644\u0647\u060c \u06a9\u0644 \u0628\u0631\u0631\u0633\u06cc \u0631\u0627 \u0628\u0647 \u0635\u0648\u0631\u062a \u0645\u0641\u0647\u0648\u0645\u06cc \u0628\u06cc\u0627\u0646 \u06a9\u0646\u06cc\u0645.<\/p>\n<h3 id=\"lemmatizationofareview\"><span class=\"ez-toc-section\" id=\"%d8%ae%d9%84%d8%a7%d8%b5%d9%87_%d8%b3%d8%a7%d8%b2%db%8c_%db%8c%da%a9_%d8%a8%d8%b1%d8%b1%d8%b3%db%8c\"><\/span>\u062e\u0644\u0627\u0635\u0647 \u0633\u0627\u0632\u06cc \u06cc\u06a9 \u0628\u0631\u0631\u0633\u06cc<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0628\u0631\u0627\u06cc \u0628\u06cc\u0627\u0646 \u0645\u0641\u0647\u0648\u0645\u06cc \u06a9\u0644 \u0628\u0631\u0631\u0633\u06cc\u060c \u0641\u0642\u0637 \u0628\u0627\u06cc\u062f \u0622\u0646 \u0631\u0627 \u0627\u0635\u0644\u0627\u062d \u06a9\u0646\u06cc\u0645 <code>.join()<\/code>.  
\u0628\u0647 \u062c\u0627\u06cc \u067e\u06cc\u0648\u0633\u062a\u0646 \u06a9\u0644\u0645\u0627\u062a \u062f\u0631 \u06cc\u06a9 \u062c\u0645\u0644\u0647\u060c \u062c\u0645\u0644\u0627\u062a \u0631\u0627 \u062f\u0631 \u06cc\u06a9 \u0645\u0631\u0648\u0631 \u0645\u06cc\u200c\u067e\u06cc\u0648\u0646\u062f\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">\ncorpus_words = <span class=\"hljs-string\">'\\n'<\/span>.join(<span class=\"hljs-string\">' '<\/span>.join(sentence) <span class=\"hljs-keyword\">for<\/span> sentence <span class=\"hljs-keyword\">in<\/span> pos_review)\n<\/code><\/pre>\n<p>\u067e\u0633 \u0627\u0632 \u062a\u0628\u062f\u06cc\u0644 \u067e\u06cc\u06a9\u0631\u0647 \u0628\u0647 \u06cc\u06a9 \u0631\u0634\u062a\u0647\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0628\u0647 \u0647\u0645\u0627\u0646 \u0631\u0648\u0634\u06cc \u06a9\u0647 \u0628\u0631\u0627\u06cc \u062c\u0645\u0644\u0647\u200c\u0627\u06cc \u0628\u0648\u062f\u060c \u0622\u0646 \u0631\u0627 \u0628\u0647 \u0635\u0648\u0631\u062a \u06a9\u0644\u0645\u0647\u200c\u0628\u0646\u062f\u06cc \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">blob_object = TextBlob(corpus_words)\ncorpus_words = blob_object.words\ncorpus_words.lemmatize()\n<\/code><\/pre>\n<p>\u0627\u06cc\u0646 \u06cc\u06a9 \u0634\u06cc WordList \u0628\u0627 \u0645\u062a\u0646 \u0628\u0631\u0631\u0633\u06cc \u06a9\u0627\u0645\u0644 \u0627\u06cc\u062c\u0627\u062f \u0645\u06cc \u06a9\u0646\u062f.  
\u062f\u0631 \u0627\u06cc\u0646\u062c\u0627\u060c \u0645\u0627 \u0628\u0631\u062e\u06cc \u0627\u0632 \u0642\u0633\u0645\u062a \u0647\u0627 \u0631\u0627 \u0628\u0627 \u0628\u06cc\u0636\u06cc \u062d\u0630\u0641 \u0645\u06cc \u06a9\u0646\u06cc\u0645 <code>(...)<\/code> \u0627\u0632 \u0622\u0646\u062c\u0627\u06cc\u06cc \u06a9\u0647 \u0628\u0631\u0631\u0633\u06cc \u0628\u0632\u0631\u06af \u0627\u0633\u062a\u060c \u0627\u0645\u0627 \u0634\u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0622\u0646 \u0631\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u06cc\u06a9\u067e\u0627\u0631\u0686\u0647 \u0622\u0646 \u0628\u0628\u06cc\u0646\u06cc\u062f.  \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u062c\u0645\u0644\u0647 \u062e\u0648\u062f \u0631\u0627 \u062f\u0631 \u0648\u0633\u0637 \u0622\u0646 \u0628\u0628\u06cc\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">WordList(('the', 'relaxed', 'dude', 'rides', 'a', 'roller', 'coaster', 'the', 'big',\n'lebowski', 'a', 'film', 'review', 'by', 'michael', 'redman', 'copyright', '1998', 'by',\n'michael', 'redman', 'the', 'most', 'surreal', 'situations', 'are', 'ordinary', 'everyday',\n'life', 'as', 'viewed', 'by', 'an', 'outsider', 'when', 'those', 'observers', 'are', 'joel',\n(...) 
\n\n'the', 'carpet', 'is', 'important', 'to', 'him', 'because', 'it', 'pulls', 'the', 'room',\n'together', 'not', 'surprisingly', 'since', 'it', 's', 'virtually', 'the', 'only', 'object',\n'there'\n\n(...)\n'com', 'is', 'the', 'eaddress', 'for', 'estuff'))\n<\/code><\/pre>\n<h2 id=\"conclusion\"><span class=\"ez-toc-section\" id=\"%d9%86%d8%aa%db%8c%d8%ac%d9%87\"><\/span>\u0646\u062a\u06cc\u062c\u0647<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u067e\u0633 \u0627\u0632 \u0648\u0627\u0698\u0647 \u0633\u0627\u0632\u06cc \u062c\u0645\u0644\u0647 \u0648 \u0628\u0631\u0631\u0633\u06cc\u060c \u0645\u06cc \u0628\u06cc\u0646\u06cc\u0645 \u06a9\u0647 \u0647\u0631 \u062f\u0648 \u0627\u0628\u062a\u062f\u0627 \u06a9\u0644\u0645\u0627\u062a \u067e\u06cc\u06a9\u0631\u0647 \u0631\u0627 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0645\u06cc \u06a9\u0646\u0646\u062f.  \u0627\u06cc\u0646 \u0628\u062f\u0627\u0646 \u0645\u0639\u0646\u0627\u0633\u062a \u06a9\u0647 \u0648\u0627\u0698\u0647\u200c\u0633\u0627\u0632\u06cc \u062f\u0631 \u0633\u0637\u062d \u06a9\u0644\u0645\u0647 \u0627\u062a\u0641\u0627\u0642 \u0645\u06cc\u200c\u0627\u0641\u062a\u062f\u060c \u06a9\u0647 \u0647\u0645\u0686\u0646\u06cc\u0646 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0639\u0646\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646 \u0622\u0646 \u0631\u0627 \u0628\u0647 \u06cc\u06a9 \u06a9\u0644\u0645\u0647\u060c \u06cc\u06a9 \u062c\u0645\u0644\u0647 \u06cc\u0627 \u06cc\u06a9 \u0645\u062a\u0646 \u06a9\u0627\u0645\u0644 \u0627\u0639\u0645\u0627\u0644 \u06a9\u0631\u062f.  
\u0628\u0631\u0627\u06cc \u06cc\u06a9 \u06a9\u0644\u0645\u0647 \u06cc\u0627 \u0647\u0631 \u0645\u062c\u0645\u0648\u0639\u0647 \u0627\u06cc \u0627\u0632 \u06a9\u0644\u0645\u0627\u062a \u06a9\u0627\u0631 \u0645\u06cc \u06a9\u0646\u062f.<\/p>\n<p>\u0627\u06cc\u0646 \u0647\u0645\u0686\u0646\u06cc\u0646 \u0646\u0634\u0627\u0646 \u0645\u06cc \u062f\u0647\u062f \u06a9\u0647 \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u06a9\u0646\u062f\u062a\u0631 \u0628\u0627\u0634\u062f \u0632\u06cc\u0631\u0627 \u0644\u0627\u0632\u0645 \u0627\u0633\u062a \u0627\u0628\u062a\u062f\u0627 \u0645\u062a\u0646 \u0631\u0627 \u0628\u0647 \u0646\u0634\u0627\u0646\u0647 \u0647\u0627 \u062a\u0642\u0633\u06cc\u0645 \u06a9\u0646\u06cc\u062f \u062a\u0627 \u0628\u0639\u062f\u0627\u064b \u0622\u0646 \u0631\u0627 \u0627\u0639\u0645\u0627\u0644 \u06a9\u0646\u06cc\u062f.  \u0648 \u0627\u0632 \u0622\u0646\u062c\u0627\u06cc\u06cc \u06a9\u0647 \u0648\u0627\u0698\u0647\u200c\u0633\u0627\u0632\u06cc \u0645\u062e\u062a\u0635 \u0628\u0647 \u0632\u0645\u06cc\u0646\u0647 \u0627\u0633\u062a\u060c \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u06cc\u062f\u06cc\u0645\u060c \u067e\u06cc\u0634\u200c\u067e\u0631\u062f\u0627\u0632\u0634 \u062e\u0648\u0628 \u0645\u062a\u0646 \u0642\u0628\u0644 \u0627\u0632 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0622\u0646\u060c \u062d\u0635\u0648\u0644 \u0627\u0637\u0645\u06cc\u0646\u0627\u0646 \u0627\u0632 \u062a\u0641\u06a9\u06cc\u06a9 \u0635\u062d\u06cc\u062d \u0628\u0647 \u0646\u0634\u0627\u0646\u0647\u200c\u0647\u0627 \u0648 \u0628\u062e\u0634 \u0645\u0646\u0627\u0633\u0628 \u0628\u0631\u0686\u0633\u0628\u200c\u06af\u0630\u0627\u0631\u06cc \u06af\u0641\u062a\u0627\u0631 \u0646\u06cc\u0632 \u0628\u0633\u06cc\u0627\u0631 \u0645\u0647\u0645 \u0627\u0633\u062a.  
\u0647\u0631 \u062f\u0648 \u0646\u062a\u0627\u06cc\u062c \u0631\u0627 \u0627\u0641\u0632\u0627\u06cc\u0634 \u0645\u06cc \u062f\u0647\u0646\u062f.<\/p>\n<blockquote>\n<p>\u0627\u06af\u0631 \u0628\u0627 \u0628\u0631\u0686\u0633\u0628 \u06af\u0630\u0627\u0631\u06cc \u0628\u062e\u0634\u06cc \u0627\u0632 \u06af\u0641\u062a\u0627\u0631 (\u0628\u0631\u0686\u0633\u0628 \u06af\u0630\u0627\u0631\u06cc POS) \u0622\u0634\u0646\u0627 \u0646\u06cc\u0633\u062a\u06cc\u062f\u060c \u0631\u0627\u0647\u0646\u0645\u0627\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0645\u0627 \u0631\u0627 \u0628\u0631\u0627\u06cc NLP: \u0642\u0633\u0645\u062a \u0647\u0627\u06cc\u06cc \u0627\u0632 \u0628\u0631\u0686\u0633\u0628 \u0632\u062f\u0646 \u06af\u0641\u062a\u0627\u0631 \u0648 \u0631\u0627\u0647\u0646\u0645\u0627\u06cc \u062a\u0634\u062e\u06cc\u0635 \u0646\u0647\u0627\u062f \u0646\u0627\u0645\u06af\u0630\u0627\u0631\u06cc \u0634\u062f\u0647 \u0628\u0631\u0631\u0633\u06cc \u06a9\u0646\u06cc\u062f.<\/p>\n<\/blockquote>\n<p>\u0645\u0627 \u0647\u0645\u0686\u0646\u06cc\u0646 \u062f\u06cc\u062f\u0647\u200c\u0627\u06cc\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0648\u0627\u0698\u0647\u200c\u0633\u0627\u0632\u06cc \u0628\u0627 \u0631\u06cc\u0634\u0647 \u06a9\u0631\u062f\u0646\u060c \u062a\u06a9\u0646\u06cc\u06a9 \u062f\u06cc\u06af\u0631\u06cc \u0628\u0631\u0627\u06cc \u06a9\u0627\u0647\u0634 \u06a9\u0644\u0645\u0627\u062a \u06a9\u0647 \u0628\u0627\u0641\u062a \u0622\u0646\u0647\u0627 \u0631\u0627 \u062d\u0641\u0638 \u0646\u0645\u06cc\u200c\u06a9\u0646\u062f\u060c \u0645\u062a\u0641\u0627\u0648\u062a \u0627\u0633\u062a.  
\u0628\u0647 \u0647\u0645\u06cc\u0646 \u062f\u0644\u06cc\u0644 \u0645\u0639\u0645\u0648\u0644\u0627\u064b \u0633\u0631\u06cc\u0639\u062a\u0631 \u0627\u0633\u062a.<\/p>\n<p>\u0631\u0627\u0647 \u0647\u0627\u06cc \u0632\u06cc\u0627\u062f\u06cc \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0648\u0627\u0698\u0647 \u0633\u0627\u0632\u06cc \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f \u0648 TextBlob \u06cc\u06a9 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0639\u0627\u0644\u06cc \u0628\u0631\u0627\u06cc \u0634\u0631\u0648\u0639 \u06a9\u0627\u0631 \u0628\u0627 NLP \u0627\u0633\u062a.  \u0627\u06cc\u0646 \u06cc\u06a9 API \u0633\u0627\u062f\u0647 \u0627\u0631\u0627\u0626\u0647 \u0645\u06cc \u062f\u0647\u062f \u06a9\u0647 \u0628\u0647 \u06a9\u0627\u0631\u0628\u0631\u0627\u0646 \u0627\u062c\u0627\u0632\u0647 \u0645\u06cc \u062f\u0647\u062f \u062a\u0627 \u0628\u0647 \u0633\u0631\u0639\u062a \u0634\u0631\u0648\u0639 \u0628\u0647 \u06a9\u0627\u0631 \u06a9\u0646\u0646\u062f \u0631\u0648\u06cc \u0648\u0638\u0627\u06cc\u0641 NLP  \u0627\u06af\u0631 \u062f\u0631 \u067e\u0631\u0648\u0698\u0647\u200c\u0627\u06cc \u0627\u0632 \u0648\u0627\u0698\u0647\u200c\u0633\u0627\u0632\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f\u0647\u200c\u0627\u06cc\u062f \u06cc\u0627 \u0642\u0635\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0622\u0646 \u0631\u0627 \u062f\u0627\u0631\u06cc\u062f\u060c \u0646\u0638\u0631 \u0628\u062f\u0647\u06cc\u062f.<\/p>\n<p>\u06a9\u062f \u0646\u0648\u06cc\u0633\u06cc \u0645\u0628\u0627\u0631\u06a9!<\/p>\n<\/div>\n<p><script>\n                        !function(f,b,e,v,n,t,s)\n                        {if(f.fbq)return;n=f.fbq=function(){n.callMethod?\n                        n.callMethod.apply(n,arguments):n.queue.push(arguments)};\n                        if(!f._fbq)f._fbq=n;n.push=n;n.loaded=!0;n.version='2.0';\n                        n.queue=();t=b.createElement(e);t.async=!0;\n                        
t.src=v;s=b.getElementsByTagName(e)(0);\n                        s.parentNode.insertBefore(t,s)}(window, document,'script',\n                        'https:\/\/connect.facebook.net\/en_US\/fbevents.js');\n                        fbq('init', '525232124909042');\n                        fbq('track', 'PageView');\n                    <\/script>    (\u0628\u0631\u0686\u0633\u0628\u200c\u0647\u0627 \u0628\u0647 \u062a\u0631\u062c\u0645\u0647)# python<br \/>\n<br \/><br \/>\n<br \/>\u0645\u0646\u062a\u0634\u0631 \u0634\u062f\u0647 \u062f\u0631 1402-12-31 08:41:04<br \/>\n<\/p>\n\n\n<div class=\"kk-star-ratings kksr-auto kksr-align-center kksr-valign-bottom\"\n    data-payload='{&quot;align&quot;:&quot;center&quot;,&quot;id&quot;:&quot;12575&quot;,&quot;slug&quot;:&quot;default&quot;,&quot;valign&quot;:&quot;bottom&quot;,&quot;ignore&quot;:&quot;&quot;,&quot;reference&quot;:&quot;auto&quot;,&quot;class&quot;:&quot;&quot;,&quot;count&quot;:&quot;0&quot;,&quot;legendonly&quot;:&quot;&quot;,&quot;readonly&quot;:&quot;&quot;,&quot;score&quot;:&quot;0&quot;,&quot;starsonly&quot;:&quot;&quot;,&quot;best&quot;:&quot;5&quot;,&quot;gap&quot;:&quot;5&quot;,&quot;greet&quot;:&quot;\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628&quot;,&quot;legend&quot;:&quot;0\\\/5 (0 \u0631\u0627\u06cc)&quot;,&quot;size&quot;:&quot;30&quot;,&quot;title&quot;:&quot;NLP \u0633\u0627\u062f\u0647 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0627 TextBlob: Lemmatization&quot;,&quot;width&quot;:&quot;0&quot;,&quot;_legend&quot;:&quot;{score}\\\/{best} ({count} \u0631\u0627\u06cc)&quot;,&quot;font_factor&quot;:&quot;1.25&quot;}'>\n            \n<div class=\"kksr-stars\">\n    \n<div class=\"kksr-stars-inactive\">\n            <div class=\"kksr-star\" data-star=\"1\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div 
class=\"kksr-star\" data-star=\"2\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"3\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"4\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"5\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n    \n<div class=\"kksr-stars-active\" style=\"width: 0px;\">\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n<\/div>\n                \n\n<div class=\"kksr-legend\" style=\"font-size: 24px;\">\n            <span class=\"kksr-muted\">\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628<\/span>\n    <\/div>\n    <\/div>\n","protected":false},"excerpt":{"rendered":"<p><span 
class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 9<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span>\u0645\u0639\u0631\u0641\u06cc TextBlob \u06cc\u06a9 \u0628\u0633\u062a\u0647 \u0633\u0627\u062e\u062a\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a \u0631\u0648\u06cc \u062f\u0631 \u0628\u0627\u0644\u0627\u06cc \u062f\u0648 \u0628\u0633\u062a\u0647 \u062f\u06cc\u06af\u0631\u060c \u06cc\u06a9\u06cc \u0627\u0632 \u0622\u0646\u0647\u0627 Natural Language Toolkit \u0646\u0627\u0645 \u062f\u0627\u0631\u062f \u06a9\u0647 \u0639\u0645\u062f\u062a\u0627\u064b \u0628\u0647 \u0635\u0648\u0631\u062a \u0645\u062e\u0641\u0641 \u0622\u0646 \u0634\u0646\u0627\u062e\u062a\u0647 \u0645\u06cc \u0634\u0648\u062f. NLTK\u060c \u0648 \u062f\u06cc\u06af\u0631\u06cc \u0627\u0633\u062a \u0627\u0644\u06af\u0648. 
NLTK \u06cc\u06a9 \u0628\u0633\u062a\u0647 \u0633\u0646\u062a\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0631\u0627\u06cc \u067e\u0631\u062f\u0627\u0632\u0634 \u0645\u062a\u0646 \u06cc\u0627 \u067e\u0631\u062f\u0627\u0632\u0634 \u0632\u0628\u0627\u0646 \u0637\u0628\u06cc\u0639\u06cc (NLP)\u0648 Pattern \u0639\u0645\u062f\u062a\u0627\u064b \u0628\u0631\u0627\u06cc \u0648\u0628 \u06a9\u0627\u0648\u06cc \u0633\u0627\u062e\u062a\u0647 [&hellip;]<\/p>\n","protected":false},"author":3,"featured_media":9162,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1743,620],"tags":[],"class_list":["post-12575","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-python","category-programming"],"acf":[],"_links":{"self":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/12575","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/users\/3"}],"replies":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/comments?post=12575"}],"version-history":[{"count":0,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/12575\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media\/9162"}],"wp:attachment":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media?parent=12575"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/categories?post=12575"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/tags?post=12575"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}