{"id":16341,"date":"2024-01-23T19:05:37","date_gmt":"2024-01-23T15:35:37","guid":{"rendered":"https:\/\/rasanegar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/"},"modified":"2024-01-23T19:05:37","modified_gmt":"2024-01-23T15:35:37","slug":"%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l","status":"publish","type":"post","link":"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/","title":{"rendered":"\u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP: \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0628\u0627 Scikit-Learn"},"content":{"rendered":"<div id=\"ez-toc-container\" class=\"ez-toc-v2_0_85 counter-hierarchy ez-toc-counter ez-toc-custom ez-toc-container-direction\">\n<div class=\"ez-toc-title-container\"><p class=\"ez-toc-title\" style=\"cursor:inherit\">\u0633\u0631\u0641\u0635\u0644\u0647\u0627\u06cc \u0645\u0637\u0644\u0628<\/p>\n<\/div><nav><ul class='ez-toc-list ez-toc-list-level-1 ' ><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-1\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/#%d8%aa%d8%b9%d8%b1%db%8c%d9%81_%d9%85%d8%b4%da%a9%d9%84\" >\u062a\u0639\u0631\u06cc\u0641 \u0645\u0634\u06a9\u0644<\/a><\/li><li class='ez-toc-page-1 
ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-2\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/#%d8%b1%d8%a7%d9%87_%d8%ad%d9%84\" >\u0631\u0627\u0647 \u062d\u0644<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-3\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/#%d9%88%d8%a7%d8%b1%d8%af%d8%a7%d8%aa_%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87_%d9%87%d8%a7%db%8c_%d9%85%d9%88%d8%b1%d8%af_%d9%86%db%8c%d8%a7%d8%b2\" >\u0648\u0627\u0631\u062f\u0627\u062a \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-4\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/#%d9%88%d8%a7%d8%b1%d8%af_%da%a9%d8%b1%d8%af%d9%86_%d9%85%d8%ac%d9%85%d9%88%d8%b9%d9%87_%d8%af%d8%a7%d8%af%d9%87\" >\u0648\u0627\u0631\u062f \u06a9\u0631\u062f\u0646 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-5\" 
href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/#%d8%aa%d8%ad%d9%84%db%8c%d9%84_%d8%af%d8%a7%d8%af%d9%87_%d9%87%d8%a7\" >\u062a\u062d\u0644\u06cc\u0644 \u062f\u0627\u062f\u0647 \u0647\u0627<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-6\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/#%d9%be%d8%a7%da%a9%d8%b3%d8%a7%d8%b2%db%8c_%d8%af%d8%a7%d8%af%d9%87_%d9%87%d8%a7\" >\u067e\u0627\u06a9\u0633\u0627\u0632\u06cc \u062f\u0627\u062f\u0647 \u0647\u0627<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-7\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/#%d9%86%d9%85%d8%a7%db%8c%d8%b4_%d9%85%d8%aa%d9%86_%d8%a8%d9%87_%d8%b4%da%a9%d9%84_%d8%b9%d8%af%d8%af%db%8c\" >\u0646\u0645\u0627\u06cc\u0634 \u0645\u062a\u0646 \u0628\u0647 \u0634\u06a9\u0644 \u0639\u062f\u062f\u06cc<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-8\" 
href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/#%d8%aa%d9%82%d8%b3%db%8c%d9%85_%d8%af%d8%a7%d8%af%d9%87_%d9%87%d8%a7_%d8%a8%d9%87_%d9%85%d8%ac%d9%85%d9%88%d8%b9%d9%87_%d9%87%d8%a7%db%8c_%d8%a2%d9%85%d9%88%d8%b2%d8%b4%db%8c_%d9%88_%d8%a2%d8%b2%d9%85%d8%a7%db%8c%d8%b4%db%8c\" >\u062a\u0642\u0633\u06cc\u0645 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u0647\u0627\u06cc \u0622\u0645\u0648\u0632\u0634\u06cc \u0648 \u0622\u0632\u0645\u0627\u06cc\u0634\u06cc<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-9\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/#%d8%a2%d9%85%d9%88%d8%b2%d8%b4_%d9%85%d8%af%d9%84\" >\u0622\u0645\u0648\u0632\u0634 \u0645\u062f\u0644<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-10\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/#%d9%be%db%8c%d8%b4_%d8%a8%db%8c%d9%86%db%8c_%d9%88_%d8%a7%d8%b1%d8%b2%db%8c%d8%a7%d8%a8%db%8c_%d9%85%d8%af%d9%84\" >\u067e\u06cc\u0634 \u0628\u06cc\u0646\u06cc \u0648 \u0627\u0631\u0632\u06cc\u0627\u0628\u06cc \u0645\u062f\u0644<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-11\" 
href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%ac%d8%b2%db%8c%d9%87-%d9%88-%d8%aa%d8%ad%d9%84%db%8c%d9%84-%d8%a7%d8%ad%d8%b3%d8%a7%d8%b3%d8%a7%d8%aa-%d8%a8%d8%a7-scikit-l\/#%d9%86%d8%aa%db%8c%d8%ac%d9%87\" >\u0646\u062a\u06cc\u062c\u0647<\/a><\/li><\/ul><\/nav><\/div>\n<span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 8<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span><p> <br \/>\n<\/p>\n<div><noscript><\/noscript><\/p>\n<p>\u0627\u06cc\u0646 \u067e\u0646\u062c\u0645\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0632 \u0645\u062c\u0645\u0648\u0639\u0647 \u0645\u0642\u0627\u0644\u0627\u062a \u0627\u0633\u062a \u0631\u0648\u06cc NLP \u0628\u0631\u0627\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646.  \u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0642\u0628\u0644\u06cc \u062e\u0648\u062f \u062a\u0648\u0636\u06cc\u062d \u062f\u0627\u062f\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646 \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 spaCy \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0628\u062e\u0634\u200c\u0647\u0627\u06cc\u06cc \u0627\u0632 \u0628\u0631\u0686\u0633\u0628\u200c\u06af\u0630\u0627\u0631\u06cc \u06af\u0641\u062a\u0627\u0631 \u0648 \u0634\u0646\u0627\u0633\u0627\u06cc\u06cc \u0645\u0648\u062c\u0648\u062f\u06cc\u062a \u0646\u0627\u0645\u200c\u06af\u0630\u0627\u0631\u06cc \u0634\u062f\u0647 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.  
\u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647\u060c \u0631\u0648\u0634 \u0627\u0646\u062c\u0627\u0645 \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062a\u0648\u06cc\u06cc\u062a\u0631 \u0631\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 Scikit-Learn \u0646\u0634\u0627\u0646 \u062e\u0648\u0627\u0647\u0645 \u062f\u0627\u062f.<\/p>\n<p>\u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0628\u0647 \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u06cc\u06a9 \u0646\u0638\u0631 \u06cc\u0627 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u062f\u0631 \u0645\u0648\u0631\u062f \u0686\u06cc\u0632\u06cc \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc\u06cc \u0645\u0627\u0646\u0646\u062f \u0645\u062a\u0646 \u06cc\u0627 \u062a\u0635\u0627\u0648\u06cc\u0631\u060c \u062a\u0642\u0631\u06cc\u0628\u0627\u064b \u062f\u0631 \u0645\u0648\u0631\u062f \u0647\u0631 \u0686\u06cc\u0632\u06cc \u0627\u0634\u0627\u0631\u0647 \u062f\u0627\u0631\u062f.  \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0628\u0647 \u0634\u0631\u06a9\u062a \u0647\u0627 \u062f\u0631 \u0641\u0631\u0622\u06cc\u0646\u062f \u062a\u0635\u0645\u06cc\u0645 \u06af\u06cc\u0631\u06cc \u06a9\u0645\u06a9 \u0645\u06cc \u06a9\u0646\u062f.  
\u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u0627\u06af\u0631 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0639\u0645\u0648\u0645\u06cc \u0646\u0633\u0628\u062a \u0628\u0647 \u06cc\u06a9 \u0645\u062d\u0635\u0648\u0644 \u0686\u0646\u062f\u0627\u0646 \u062e\u0648\u0628 \u0646\u0628\u0627\u0634\u062f\u060c \u06cc\u06a9 \u0634\u0631\u06a9\u062a \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u0633\u0639\u06cc \u06a9\u0646\u062f \u0645\u062d\u0635\u0648\u0644 \u0631\u0627 \u0627\u0635\u0644\u0627\u062d \u06a9\u0646\u062f \u06cc\u0627 \u062a\u0648\u0644\u06cc\u062f \u0631\u0627 \u0628\u0647 \u0637\u0648\u0631 \u06a9\u0627\u0645\u0644 \u0645\u062a\u0648\u0642\u0641 \u06a9\u0646\u062f \u062a\u0627 \u0627\u0632 \u0636\u0631\u0631 \u062c\u0644\u0648\u06af\u06cc\u0631\u06cc \u06a9\u0646\u062f.<\/p>\n<p>\u0645\u0646\u0627\u0628\u0639 \u0632\u06cc\u0627\u062f\u06cc \u0628\u0631\u0627\u06cc \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0639\u0645\u0648\u0645\u06cc \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f\u060c \u0645\u0627\u0646\u0646\u062f \u0645\u0635\u0627\u062d\u0628\u0647 \u0647\u0627\u06cc \u0639\u0645\u0648\u0645\u06cc\u060c \u0646\u0638\u0631\u0633\u0646\u062c\u06cc \u0647\u0627\u060c \u067e\u06cc\u0645\u0627\u06cc\u0634 \u0647\u0627\u060c \u0648 \u063a\u06cc\u0631\u0647. 
\u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u0628\u0627 \u067e\u06cc\u0648\u0633\u062a\u0646 \u0627\u0641\u0631\u0627\u062f \u0628\u06cc\u0634\u062a\u0631 \u0648 \u0628\u06cc\u0634\u062a\u0631 \u0628\u0647 \u067e\u0644\u062a \u0641\u0631\u0645 \u0647\u0627\u06cc \u0631\u0633\u0627\u0646\u0647 \u0647\u0627\u06cc \u0627\u062c\u062a\u0645\u0627\u0639\u06cc\u060c \u0648\u0628 \u0633\u0627\u06cc\u062a \u0647\u0627\u06cc\u06cc \u0645\u0627\u0646\u0646\u062f \u0641\u06cc\u0633 \u0628\u0648\u06a9 \u0648 \u062a\u0648\u06cc\u06cc\u062a\u0631 \u0645\u06cc \u062a\u0648\u0627\u0646\u0646\u062f \u0628\u0631\u0627\u06cc \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0639\u0645\u0648\u0645\u06cc \u062a\u062c\u0632\u06cc\u0647 \u0634\u0648\u0646\u062f.<\/p>\n<p>\u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u062a\u0646\u06cc \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u062f\u0647\u06cc\u0645.<\/p>\n<h2 id=\"problemdefinition\"><span class=\"ez-toc-section\" id=\"%d8%aa%d8%b9%d8%b1%db%8c%d9%81_%d9%85%d8%b4%da%a9%d9%84\"><\/span>\u062a\u0639\u0631\u06cc\u0641 \u0645\u0634\u06a9\u0644<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0628\u0627 \u062a\u0648\u062c\u0647 \u0628\u0647 \u062a\u0648\u06cc\u06cc\u062a\u200c\u0647\u0627\u06cc\u06cc \u062f\u0631\u0628\u0627\u0631\u0647 \u0634\u0634 \u0634\u0631\u06a9\u062a \u0647\u0648\u0627\u067e\u06cc\u0645\u0627\u06cc\u06cc \u0627\u06cc\u0627\u0644\u0627\u062a \u0645\u062a\u062d\u062f\u0647\u060c \u0648\u0638\u06cc\u0641\u0647 \u067e\u06cc\u0634\u200c\u0628\u06cc\u0646\u06cc \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 \u0622\u06cc\u0627 \u06cc\u06a9 \u062a\u0648\u06cc\u06cc\u062a \u062d\u0627\u0648\u06cc 
\u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0645\u062b\u0628\u062a\u060c \u0645\u0646\u0641\u06cc \u06cc\u0627 \u062e\u0646\u062b\u06cc \u062f\u0631\u0628\u0627\u0631\u0647 \u0634\u0631\u06a9\u062a \u0647\u0648\u0627\u067e\u06cc\u0645\u0627\u06cc\u06cc \u0627\u0633\u062a.  \u0627\u06cc\u0646 \u06cc\u06a9 \u06a9\u0627\u0631 \u0622\u0645\u0648\u0632\u0634\u06cc \u0628\u0627 \u0646\u0638\u0627\u0631\u062a \u0645\u0639\u0645\u0648\u0644\u06cc \u0627\u0633\u062a \u06a9\u0647 \u062f\u0631 \u0622\u0646 \u0628\u0627 \u062a\u0648\u062c\u0647 \u0628\u0647 \u06cc\u06a9 \u0631\u0634\u062a\u0647 \u0645\u062a\u0646\u060c \u0628\u0627\u06cc\u062f \u0631\u0634\u062a\u0647 \u0645\u062a\u0646 \u0631\u0627 \u0628\u0647 \u062f\u0633\u062a\u0647 \u0647\u0627\u06cc \u0627\u0632 \u067e\u06cc\u0634 \u062a\u0639\u0631\u06cc\u0641 \u0634\u062f\u0647 \u062f\u0633\u062a\u0647 \u0628\u0646\u062f\u06cc \u06a9\u0646\u06cc\u0645.<\/p>\n<h2 id=\"solution\"><span class=\"ez-toc-section\" id=\"%d8%b1%d8%a7%d9%87_%d8%ad%d9%84\"><\/span>\u0631\u0627\u0647 \u062d\u0644<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0628\u0631\u0627\u06cc \u062d\u0644 \u0627\u06cc\u0646 \u0645\u0634\u06a9\u0644\u060c \u062e\u0637 \u0644\u0648\u0644\u0647 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 \u0645\u0639\u0645\u0648\u0644\u06cc \u0631\u0627 \u062f\u0646\u0628\u0627\u0644 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.  
\u0627\u0628\u062a\u062f\u0627 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f import \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632 \u0648 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647  \u0633\u067e\u0633 \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u062f\u0627\u062f\u0647\u200c\u0647\u0627\u06cc \u0627\u06a9\u062a\u0634\u0627\u0641\u06cc \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u0627\u062f \u062a\u0627 \u0628\u0628\u06cc\u0646\u06cc\u0645 \u0622\u06cc\u0627 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u06af\u0631\u0627\u06cc\u0634\u200c\u0647\u0627\u06cc\u06cc \u0631\u0627 \u062f\u0631 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u067e\u06cc\u062f\u0627 \u06a9\u0646\u06cc\u0645.  \u062f\u0631 \u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u060c \u067e\u06cc\u0634 \u067e\u0631\u062f\u0627\u0632\u0634 \u0645\u062a\u0646 \u0631\u0627 \u0628\u0631\u0627\u06cc \u062a\u0628\u062f\u06cc\u0644 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u062a\u0646\u06cc \u0628\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0639\u062f\u062f\u06cc \u06a9\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u062a\u0648\u0633\u0637 \u06cc\u06a9 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0634\u0648\u062f\u060c \u0627\u0646\u062c\u0627\u0645 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u0627\u062f.  
\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0645\u0627 \u0627\u0632 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645\u200c\u0647\u0627\u06cc \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 \u0628\u0631\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u0648 \u0622\u0632\u0645\u0627\u06cc\u0634 \u0645\u062f\u0644\u200c\u0647\u0627\u06cc \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u062e\u0648\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.<\/p>\n<h3 id=\"importingtherequiredlibraries\"><span class=\"ez-toc-section\" id=\"%d9%88%d8%a7%d8%b1%d8%af%d8%a7%d8%aa_%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87_%d9%87%d8%a7%db%8c_%d9%85%d9%88%d8%b1%d8%af_%d9%86%db%8c%d8%a7%d8%b2\"><\/span>\u0648\u0627\u0631\u062f\u0627\u062a \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0627\u0648\u0644\u06cc\u0646 \u0642\u062f\u0645 \u0645\u062b\u0644 \u0647\u0645\u06cc\u0634\u0647 \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 import \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> numpy <span class=\"hljs-keyword\">as<\/span> np \n<span class=\"hljs-keyword\">import<\/span> pandas <span class=\"hljs-keyword\">as<\/span> pd \n<span class=\"hljs-keyword\">import<\/span> re\n<span class=\"hljs-keyword\">import<\/span> nltk \n<span class=\"hljs-keyword\">import<\/span> matplotlib.pyplot <span class=\"hljs-keyword\">as<\/span> plt\n%matplotlib inline\n<\/code><\/pre>\n<p><strong>\u062a\u0648\u062c\u0647 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f:<\/strong> \u062a\u0645\u0627\u0645 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0647\u0627\u06cc \u0645\u0642\u0627\u0644\u0647 \u0628\u0627 
\u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 Jupyter \u0646\u0648\u062a \u0628\u0648\u06a9.<\/p>\n<h3 id=\"importingthedataset\"><span class=\"ez-toc-section\" id=\"%d9%88%d8%a7%d8%b1%d8%af_%da%a9%d8%b1%d8%af%d9%86_%d9%85%d8%ac%d9%85%d9%88%d8%b9%d9%87_%d8%af%d8%a7%d8%af%d9%87\"><\/span>\u0648\u0627\u0631\u062f \u06a9\u0631\u062f\u0646 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0627\u06cc \u06a9\u0647 \u0645\u0627 \u0645\u06cc \u062e\u0648\u0627\u0647\u06cc\u0645 \u0628\u0631\u0627\u06cc \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645 \u0628\u0647 \u0635\u0648\u0631\u062a \u0631\u0627\u06cc\u06af\u0627\u0646 \u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u0645\u0648\u062c\u0648\u062f \u0627\u0633\u062a <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/github.com\/satyajeetkrjha\/kaggle-Twitter-US-Airline-Sentiment-\/blob\/master\/Tweets.csv\">\u0644\u06cc\u0646\u06a9 GitHub<\/a>.<\/p>\n<p>\u0628\u0647 import \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647\u060c \u0627\u0632 \u067e\u0627\u0646\u062f\u0627\u0647\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f <code>read_csv<\/code> \u0639\u0645\u0644\u06a9\u0631\u062f\u060c \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u0631 \u0632\u06cc\u0631 \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">data_source_url = <span class=\"hljs-string\">\"https:\/\/raw.githubusercontent.com\/kolaveridi\/kaggle-Twitter-US-Airline-Sentiment-\/master\/Tweets.csv\"<\/span>\nairline_tweets = pd.read_csv(data_source_url)\n<\/code><\/pre>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u0628\u062a\u062f\u0627 \u0628\u0628\u06cc\u0646\u06cc\u0645 \u06a9\u0647 
\u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0686\u06af\u0648\u0646\u0647 \u0628\u0647 \u0646\u0638\u0631 \u0645\u06cc \u0631\u0633\u062f <code>head()<\/code> \u0631\u0648\u0634:<\/p>\n<pre><code class=\"hljs\">airline_tweets.head()\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<p><img decoding=\"async\" class=\"img-responsive\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/python-nlp-sentiment-analysis-scikit-learn-1.png\" alt=\"\" title=\"\"><\/p>\n<h3 id=\"dataanalysis\"><span class=\"ez-toc-section\" id=\"%d8%aa%d8%ad%d9%84%db%8c%d9%84_%d8%af%d8%a7%d8%af%d9%87_%d9%87%d8%a7\"><\/span>\u062a\u062d\u0644\u06cc\u0644 \u062f\u0627\u062f\u0647 \u0647\u0627<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u06a9\u0645\u06cc \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0631\u0627 \u0628\u0631\u0631\u0633\u06cc \u06a9\u0646\u06cc\u0645 \u062a\u0627 \u0628\u0628\u06cc\u0646\u06cc\u0645 \u0622\u06cc\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u06af\u0631\u0627\u06cc\u0634 \u0647\u0627\u06cc\u06cc \u0631\u0627 \u067e\u06cc\u062f\u0627 \u06a9\u0646\u06cc\u0645.  \u0627\u0645\u0627 \u0642\u0628\u0644 \u0627\u0632 \u0622\u0646\u060c \u0627\u0646\u062f\u0627\u0632\u0647 \u0637\u0631\u062d \u067e\u06cc\u0634 \u0641\u0631\u0636 \u0631\u0627 \u062a\u063a\u06cc\u06cc\u0631 \u0645\u06cc \u062f\u0647\u06cc\u0645 \u062a\u0627 \u062f\u06cc\u062f \u0628\u0647\u062a\u0631\u06cc \u0646\u0633\u0628\u062a \u0628\u0647 \u0646\u0645\u0648\u062f\u0627\u0631\u0647\u0627 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u0645.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">plot_size = plt.rcParams[<span class=\"hljs-string\">\"figure.figsize\"<\/span>] \n<span class=\"hljs-built_in\">print<\/span>(plot_size[<span class=\"hljs-number\">0<\/span>]) \n<span class=\"hljs-built_in\">print<\/span>(plot_size[<span class=\"hljs-number\">1<\/span>])\n\nplot_size[<span class=\"hljs-number\">0<\/span>] = <span class=\"hljs-number\">8<\/span>\nplot_size[<span class=\"hljs-number\">1<\/span>] = <span class=\"hljs-number\">6<\/span>\nplt.rcParams[<span class=\"hljs-string\">\"figure.figsize\"<\/span>] = plot_size \n<\/code><\/pre>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u0628\u062a\u062f\u0627 \u062a\u0639\u062f\u0627\u062f \u062a\u0648\u06cc\u06cc\u062a \u0647\u0627\u06cc \u0647\u0631 \u0627\u06cc\u0631\u0644\u0627\u06cc\u0646 \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u0645.  \u06cc\u06a9 \u0646\u0645\u0648\u062f\u0627\u0631 \u062f\u0627\u06cc\u0631\u0647 \u0627\u06cc \u0628\u0631\u0627\u06cc \u0622\u0646 \u062a\u0631\u0633\u06cc\u0645 \u0645\u06cc \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">airline_tweets.airline.value_counts().plot(kind=<span class=\"hljs-string\">'pie'<\/span>, autopct=<span class=\"hljs-string\">'%1.0f%%'<\/span>)\n<\/code><\/pre>\n<p>\u062f\u0631 \u062e\u0631\u0648\u062c\u06cc \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u062f\u0631\u0635\u062f \u062a\u0648\u06cc\u06cc\u062a\u200c\u0647\u0627\u06cc \u0639\u0645\u0648\u0645\u06cc \u0628\u0631\u0627\u06cc \u0647\u0631 \u0634\u0631\u06a9\u062a \u0647\u0648\u0627\u067e\u06cc\u0645\u0627\u06cc\u06cc \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u062f.  
\u06cc\u0648\u0646\u0627\u06cc\u062a\u062f \u0627\u06cc\u0631\u0644\u0627\u06cc\u0646 \u0628\u06cc\u0634\u062a\u0631\u06cc\u0646 \u062a\u0639\u062f\u0627\u062f \u062a\u0648\u06cc\u06cc\u062a \u06cc\u0639\u0646\u06cc 26 \u062f\u0631\u0635\u062f \u0631\u0627 \u062f\u0627\u0631\u062f \u0648 \u067e\u0633 \u0627\u0632 \u0622\u0646 US Airways (20 \u062f\u0631\u0635\u062f) \u0642\u0631\u0627\u0631 \u062f\u0627\u0631\u062f.<\/p>\n<p><img decoding=\"async\" class=\"img-responsive\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/python-nlp-sentiment-analysis-scikit-learn-2.png\" alt=\"\" title=\"\"><\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u06a9\u0646\u0648\u0646 \u062a\u0648\u0632\u06cc\u0639 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u062f\u0631 \u0647\u0645\u0647 \u062a\u0648\u06cc\u06cc\u062a \u0647\u0627 \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u0645.  \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">airline_tweets.airline_sentiment.value_counts().plot(kind=<span class=\"hljs-string\">'pie'<\/span>, autopct=<span class=\"hljs-string\">'%1.0f%%'<\/span>, colors=(<span class=\"hljs-string\">\"red\"<\/span>, <span class=\"hljs-string\">\"yellow\"<\/span>, <span class=\"hljs-string\">\"green\"<\/span>))\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<p><img decoding=\"async\" class=\"img-responsive\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/python-nlp-sentiment-analysis-scikit-learn-3.png\" alt=\"\" title=\"\"><\/p>\n<p>\u0627\u0632 \u062e\u0631\u0648\u062c\u06cc \u0645\u0634\u0627\u0647\u062f\u0647 \u0645\u06cc\u200c\u06a9\u0646\u06cc\u062f \u06a9\u0647 \u0627\u06a9\u062b\u0631 \u062a\u0648\u06cc\u06cc\u062a\u200c\u0647\u0627 \u0645\u0646\u0641\u06cc 
\u0647\u0633\u062a\u0646\u062f (63%)\u060c \u067e\u0633 \u0627\u0632 \u0622\u0646 \u062a\u0648\u06cc\u06cc\u062a\u200c\u0647\u0627\u06cc \u062e\u0646\u062b\u06cc (21%) \u0648 \u0633\u067e\u0633 \u062a\u0648\u06cc\u06cc\u062a\u200c\u0647\u0627\u06cc \u0645\u062b\u0628\u062a (16%) \u0647\u0633\u062a\u0646\u062f.<\/p>\n<p>\u062f\u0631 \u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u060c \u0628\u06cc\u0627\u06cc\u06cc\u062f \u062a\u0648\u0632\u06cc\u0639 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0628\u0631\u0627\u06cc \u0647\u0631 \u0634\u0631\u06a9\u062a \u0647\u0648\u0627\u067e\u06cc\u0645\u0627\u06cc\u06cc \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u0645\u060c<\/p>\n<pre><code class=\"hljs\">airline_sentiment = airline_tweets.groupby([<span class=\"hljs-string\">'airline'<\/span>, <span class=\"hljs-string\">'airline_sentiment'<\/span>]).airline_sentiment.count().unstack()\nairline_sentiment.plot(kind=<span class=\"hljs-string\">'bar'<\/span>)\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<p><img decoding=\"async\" class=\"img-responsive\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/python-nlp-sentiment-analysis-scikit-learn-4.png\" alt=\"\" title=\"\"><\/p>\n<p>\u0627\u0632 \u062e\u0631\u0648\u062c\u06cc \u0645\u0634\u062e\u0635 \u0627\u0633\u062a \u06a9\u0647 \u062a\u0642\u0631\u06cc\u0628\u0627\u064b \u0628\u0631\u0627\u06cc \u0647\u0645\u0647 \u062e\u0637\u0648\u0637 \u0647\u0648\u0627\u06cc\u06cc\u060c \u0627\u06a9\u062b\u0631 \u062a\u0648\u06cc\u06cc\u062a\u200c\u0647\u0627 \u0645\u0646\u0641\u06cc \u0647\u0633\u062a\u0646\u062f \u0648 \u0628\u0647 \u062f\u0646\u0628\u0627\u0644 \u0622\u0646 \u062a\u0648\u06cc\u06cc\u062a\u200c\u0647\u0627\u06cc \u062e\u0646\u062b\u06cc \u0648 \u0645\u062b\u0628\u062a \u0647\u0633\u062a\u0646\u062f.  
\u0648\u06cc\u0631\u062c\u06cc\u0646 \u0622\u0645\u0631\u06cc\u06a9\u0627 \u0627\u062d\u062a\u0645\u0627\u0644\u0627 \u062a\u0646\u0647\u0627 \u0634\u0631\u06a9\u062a \u0647\u0648\u0627\u067e\u06cc\u0645\u0627\u06cc\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0646\u0633\u0628\u062a \u0627\u06cc\u0646 \u0633\u0647 \u0627\u062d\u0633\u0627\u0633 \u062a\u0627 \u062d\u062f\u0648\u062f\u06cc \u0645\u0634\u0627\u0628\u0647 \u0627\u0633\u062a.<\/p>\n<p>\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 Seaborn \u0628\u0631\u0627\u06cc \u0645\u0634\u0627\u0647\u062f\u0647 \u0645\u06cc\u0627\u0646\u06af\u06cc\u0646 \u0633\u0637\u062d \u0627\u0637\u0645\u06cc\u0646\u0627\u0646 \u0628\u0631\u0627\u06cc \u062a\u0648\u06cc\u06cc\u062a\u200c\u0647\u0627\u06cc \u0645\u062a\u0639\u0644\u0642 \u0628\u0647 \u0633\u0647 \u062f\u0633\u062a\u0647 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> seaborn <span class=\"hljs-keyword\">as<\/span> sns\n\nsns.barplot(x=<span class=\"hljs-string\">'airline_sentiment'<\/span>, y=<span class=\"hljs-string\">'airline_sentiment_confidence'<\/span> , data=airline_tweets)\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<p><img decoding=\"async\" class=\"img-responsive\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/python-nlp-sentiment-analysis-scikit-learn-5.png\" alt=\"\" title=\"\"><\/p>\n<p>\u0627\u0632 \u062e\u0631\u0648\u062c\u06cc \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0645\u062a\u0648\u062c\u0647 \u0634\u0648\u06cc\u062f \u06a9\u0647 \u0633\u0637\u062d \u0627\u0637\u0645\u06cc\u0646\u0627\u0646 \u0628\u0631\u0627\u06cc \u062a\u0648\u06cc\u06cc\u062a \u0647\u0627\u06cc \u0645\u0646\u0641\u06cc \u062f\u0631 \u0645\u0642\u0627\u06cc\u0633\u0647 \u0628\u0627 \u062a\u0648\u06cc\u06cc\u062a \u0647\u0627\u06cc \u0645\u062b\u0628\u062a \u0648 \u062e\u0646\u062b\u06cc \u0628\u0627\u0644\u0627\u062a\u0631 \u0627\u0633\u062a.<\/p>\n<p>\u0628\u0647 \u0627\u0646\u062f\u0627\u0632\u0647 \u06a9\u0627\u0641\u06cc \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0627\u06a9\u062a\u0634\u0627\u0641\u06cc\u060c \u06af\u0627\u0645 \u0628\u0639\u062f\u06cc \u0645\u0627 \u0627\u0646\u062c\u0627\u0645 \u0628\u0631\u062e\u06cc \u067e\u06cc\u0634 \u067e\u0631\u062f\u0627\u0632\u0634 \u0627\u0633\u062a \u0631\u0648\u06cc \u062f\u0627\u062f\u0647 \u0648 \u0633\u067e\u0633 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0639\u062f\u062f\u06cc \u0631\u0627 \u0645\u0637\u0627\u0628\u0642 
\u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0628\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u062a\u0646\u06cc \u062a\u0628\u062f\u06cc\u0644 \u06a9\u0646\u06cc\u062f.<\/p>\n<h3 id=\"datacleaning\"><span class=\"ez-toc-section\" id=\"%d9%be%d8%a7%da%a9%d8%b3%d8%a7%d8%b2%db%8c_%d8%af%d8%a7%d8%af%d9%87_%d9%87%d8%a7\"><\/span>\u067e\u0627\u06a9\u0633\u0627\u0632\u06cc \u062f\u0627\u062f\u0647 \u0647\u0627<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u062a\u0648\u06cc\u06cc\u062a \u0647\u0627 \u062d\u0627\u0648\u06cc \u06a9\u0644\u0645\u0627\u062a \u0639\u0627\u0645\u06cc\u0627\u0646\u0647 \u0648 \u0639\u0644\u0627\u0626\u0645 \u0646\u06af\u0627\u0631\u0634\u06cc \u0632\u06cc\u0627\u062f\u06cc \u0647\u0633\u062a\u0646\u062f.  \u0645\u0627 \u0628\u0627\u06cc\u062f \u062a\u0648\u06cc\u06cc\u062a\u200c\u0647\u0627\u06cc\u0645\u0627\u0646 \u0631\u0627 \u0642\u0628\u0644 \u0627\u0632 \u0627\u06cc\u0646\u06a9\u0647 \u0628\u062a\u0648\u0627\u0646\u06cc\u0645 \u0628\u0631\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u0645\u062f\u0644 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645\u060c \u067e\u0627\u06a9 \u06a9\u0646\u06cc\u0645.  
\u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u0642\u0628\u0644 \u0627\u0632 \u067e\u0627\u06a9 \u06a9\u0631\u062f\u0646 \u062a\u0648\u06cc\u06cc\u062a\u200c\u0647\u0627\u060c \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647\u200c\u0647\u0627\u06cc \u062e\u0648\u062f \u0631\u0627 \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647\u200c\u0647\u0627\u06cc \u0648\u06cc\u0698\u06af\u06cc \u0648 \u0628\u0631\u0686\u0633\u0628 \u062a\u0642\u0633\u06cc\u0645 \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u0645\u062c\u0645\u0648\u0639\u0647 \u0648\u06cc\u0698\u06af\u06cc \u0647\u0627\u06cc \u0645\u0627 \u0641\u0642\u0637 \u0627\u0632 \u062a\u0648\u06cc\u06cc\u062a \u0647\u0627 \u062a\u0634\u06a9\u06cc\u0644 \u0645\u06cc \u0634\u0648\u062f.  \u0627\u06af\u0631 \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u062e\u0648\u062f \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u0645\u060c \u0633\u062a\u0648\u0646 \u06cc\u0627\u0632\u062f\u0647\u0645 \u062d\u0627\u0648\u06cc \u0645\u062a\u0646 \u062a\u0648\u06cc\u06cc\u062a \u0627\u0633\u062a.  \u062a\u0648\u062c\u0647 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f \u06a9\u0647 \u0634\u0627\u062e\u0635 \u0633\u062a\u0648\u0646 10 \u062e\u0648\u0627\u0647\u062f \u0628\u0648\u062f \u0632\u06cc\u0631\u0627 \u0633\u062a\u0648\u0646 \u0647\u0627\u06cc \u067e\u0627\u0646\u062f\u0627\u0647\u0627 \u0627\u0632 \u0637\u0631\u062d \u0646\u0645\u0627\u06cc\u0647 \u0633\u0627\u0632\u06cc \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u0635\u0641\u0631 \u067e\u06cc\u0631\u0648\u06cc \u0645\u06cc \u06a9\u0646\u0646\u062f \u06a9\u0647 \u062f\u0631 \u0622\u0646 \u0633\u062a\u0648\u0646 \u0627\u0648\u0644 \u0633\u062a\u0648\u0646 0 \u0646\u0627\u0645\u06cc\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f.  
\u0645\u062c\u0645\u0648\u0639\u0647 \u0628\u0631\u0686\u0633\u0628 \u0645\u0627 \u0634\u0627\u0645\u0644 \u0627\u062d\u0633\u0627\u0633 \u062a\u0648\u06cc\u06cc\u062a\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0627\u06cc\u062f \u067e\u06cc\u0634 \u0628\u06cc\u0646\u06cc \u06a9\u0646\u06cc\u0645.  \u0627\u062d\u0633\u0627\u0633 \u062a\u0648\u06cc\u06cc\u062a \u062f\u0631 \u0633\u062a\u0648\u0646 \u062f\u0648\u0645 (\u0634\u0627\u062e\u0635 1) \u0642\u0631\u0627\u0631 \u062f\u0627\u0631\u062f.  \u0628\u0631\u0627\u06cc \u0627\u06cc\u062c\u0627\u062f \u06cc\u06a9 \u0648\u06cc\u0698\u06af\u06cc \u0648 \u06cc\u06a9 \u0645\u062c\u0645\u0648\u0639\u0647 \u0628\u0631\u0686\u0633\u0628\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0632 \u0631\u0648\u0634 <code>iloc<\/code> \u0642\u0627\u0628 \u062f\u0627\u062f\u0647 \u067e\u0627\u0646\u062f\u0627\u0647\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">features = airline_tweets.iloc[:, <span class=\"hljs-number\">10<\/span>].values\nlabels = airline_tweets.iloc[:, <span class=\"hljs-number\">1<\/span>].values\n<\/code><\/pre>\n<p>\u0647\u0646\u06af\u0627\u0645\u06cc \u06a9\u0647 \u062f\u0627\u062f\u0647\u200c\u0647\u0627 \u0631\u0627 \u0628\u0647 \u0648\u06cc\u0698\u06af\u06cc\u200c\u0647\u0627 \u0648 \u0645\u062c\u0645\u0648\u0639\u0647 \u0622\u0645\u0648\u0632\u0634\u06cc \u062a\u0642\u0633\u06cc\u0645 \u0645\u06cc\u200c\u06a9\u0646\u06cc\u0645\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u062f\u0627\u062f\u0647\u200c\u0647\u0627 \u0631\u0627 \u0628\u0631\u0627\u06cc \u067e\u0627\u06a9 \u06a9\u0631\u062f\u0646 \u0622\u0646\u200c\u0647\u0627 \u0627\u0632 \u0642\u0628\u0644 \u067e\u0631\u062f\u0627\u0632\u0634 \u06a9\u0646\u06cc\u0645.  
\u0628\u0631\u0627\u06cc \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0627\u0632 \u0639\u0628\u0627\u0631\u0627\u062a \u0645\u0646\u0638\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645.  \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647 \u0628\u06cc\u0634\u062a\u0631 \u062f\u0631 \u0645\u0648\u0631\u062f \u0639\u0628\u0627\u0631\u0627\u062a \u0645\u0646\u0638\u0645\u060c \u0644\u0637\u0641\u0627\u064b \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0646\u06af\u0627\u0647\u06cc \u0628\u06cc\u0646\u062f\u0627\u0632\u06cc\u062f \u0631\u0648\u06cc \u0639\u0628\u0627\u0631\u0627\u062a \u0628\u0627 \u0642\u0627\u0639\u062f\u0647.<\/p>\n<pre><code class=\"hljs\">processed_features = []\n\n<span class=\"hljs-keyword\">for<\/span> sentence <span class=\"hljs-keyword\">in<\/span> <span class=\"hljs-built_in\">range<\/span>(<span class=\"hljs-number\">0<\/span>, <span class=\"hljs-built_in\">len<\/span>(features)):\n    \n    processed_feature = re.sub(<span class=\"hljs-string\">r'\\W'<\/span>, <span class=\"hljs-string\">' '<\/span>, <span class=\"hljs-built_in\">str<\/span>(features[sentence]))\n\n    \n    processed_feature= re.sub(<span class=\"hljs-string\">r'\\s+[a-zA-Z]\\s+'<\/span>, <span class=\"hljs-string\">' '<\/span>, processed_feature)\n\n    \n    processed_feature = re.sub(<span class=\"hljs-string\">r'\\^[a-zA-Z]\\s+'<\/span>, <span class=\"hljs-string\">' '<\/span>, processed_feature) \n\n    \n    processed_feature = re.sub(<span class=\"hljs-string\">r'\\s+'<\/span>, <span class=\"hljs-string\">' '<\/span>, processed_feature, flags=re.I)\n\n    \n    processed_feature = re.sub(<span class=\"hljs-string\">r'^b\\s+'<\/span>, <span class=\"hljs-string\">''<\/span>, processed_feature)\n\n    \n    processed_feature = processed_feature.lower()\n\n    processed_features.append(processed_feature)\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a 
\u0628\u0627\u0644\u0627\u060c \u0628\u0627 \u062d\u0630\u0641 \u062a\u0645\u0627\u0645 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc \u062e\u0627\u0635 \u0627\u0632 \u062a\u0648\u06cc\u06cc\u062a \u0647\u0627 \u0634\u0631\u0648\u0639 \u0645\u06cc \u06a9\u0646\u06cc\u0645.  \u0628\u06cc\u0627\u0646 \u0645\u0646\u0638\u0645 <code>re.sub(r'\\W', ' ', str(features[sentence]))<\/code> \u0622\u0646 \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u0645\u06cc \u062f\u0647\u062f.<\/p>\n<p>\u062f\u0631 \u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u060c \u062a\u0645\u0627\u0645 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc \u062a\u06a9 \u0628\u0627\u0642\u06cc \u0645\u0627\u0646\u062f\u0647 \u062f\u0631 \u0646\u062a\u06cc\u062c\u0647 \u062d\u0630\u0641 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0648\u06cc\u0698\u0647 \u0631\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0639\u0628\u0627\u0631\u062a \u0645\u0646\u0638\u0645 <code>re.sub(r'\\s+[a-zA-Z]\\s+', ' ', processed_feature)<\/code> \u062d\u0630\u0641 \u0645\u06cc \u06a9\u0646\u06cc\u0645.  \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u0627\u06af\u0631 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0648\u06cc\u0698\u0647 \u0631\u0627 \u062d\u0630\u0641 \u06a9\u0646\u06cc\u0645 <code>'<\/code> \u0627\u0632 \u062c\u0627\u0646\u0628 <code>Jack's<\/code> \u0648 \u062c\u0627\u06cc \u0622\u0646 \u0631\u0627 \u0628\u0627 \u0641\u0636\u0627 \u062c\u0627\u06cc\u06af\u0632\u06cc\u0646 \u06a9\u0646\u06cc\u062f\u060c \u0645\u0627 \u0645\u0627\u0646\u062f\u0647 \u0627\u06cc\u0645 <code>Jack s<\/code>.  
\u0627\u06cc\u0646\u062c\u0627 <code>s<\/code> \u0645\u0639\u0646\u06cc \u0646\u062f\u0627\u0631\u062f\u060c \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u0628\u0627 \u062c\u0627\u06cc\u06af\u0632\u06cc\u0646 \u06a9\u0631\u062f\u0646 \u062a\u0645\u0627\u0645 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc \u0645\u0646\u0641\u0631\u062f \u0628\u0627 \u06cc\u06a9 \u0641\u0627\u0635\u0644\u0647\u060c \u0622\u0646 \u0631\u0627 \u062d\u0630\u0641 \u0645\u06cc \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u0627\u06af\u0631 \u0647\u0645\u0647 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc \u0645\u0646\u0641\u0631\u062f \u0631\u0627 \u0628\u0627 \u0641\u0627\u0635\u0644\u0647 \u062c\u0627\u06cc\u06af\u0632\u06cc\u0646 \u06a9\u0646\u06cc\u0645\u060c \u0686\u0646\u062f\u06cc\u0646 \u0641\u0627\u0635\u0644\u0647 \u0627\u06cc\u062c\u0627\u062f \u0645\u06cc \u0634\u0648\u062f.  \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646\u060c \u0647\u0645\u0647 \u0641\u0636\u0627\u0647\u0627\u06cc \u0686\u0646\u062f\u06af\u0627\u0646\u0647 \u0631\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0641\u0636\u0627\u0647\u0627\u06cc \u062a\u06a9 \u062c\u0627\u06cc\u06af\u0632\u06cc\u0646 \u0645\u06cc \u06a9\u0646\u06cc\u0645 <code>re.sub(r'\\s+', ' ', processed_feature, flags=re.I)<\/code> regex  \u0639\u0644\u0627\u0648\u0647 \u0628\u0631 \u0627\u06cc\u0646\u060c \u0627\u06af\u0631 \u0631\u0634\u062a\u0647 \u0645\u062a\u0646 \u0634\u0645\u0627 \u062f\u0631 \u0628\u0627\u06cc\u062a \u0628\u0627\u0634\u062f\u060c \u06cc\u06a9 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0631\u0627 \u0641\u0631\u0645\u062a \u06a9\u0646\u06cc\u062f <code>b<\/code> \u0628\u0647 \u0631\u0634\u062a\u0647 \u0627\u0636\u0627\u0641\u0647 \u0645\u06cc \u0634\u0648\u062f.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 regex \u0622\u0646 \u0631\u0627 \u062d\u0630\u0641 \u0645\u06cc \u06a9\u0646\u062f <code>re.sub(r'^b\\s+', '', processed_feature)<\/code>.<\/p>\n<p>\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0645\u062a\u0646 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u062d\u0631\u0648\u0641 \u06a9\u0648\u0686\u06a9 \u062a\u0628\u062f\u06cc\u0644 \u0645\u06cc \u0634\u0648\u062f <code>lower()<\/code> \u062a\u0627\u0628\u0639.<\/p>\n<h3 id=\"representingtextinnumericform\"><span class=\"ez-toc-section\" id=\"%d9%86%d9%85%d8%a7%db%8c%d8%b4_%d9%85%d8%aa%d9%86_%d8%a8%d9%87_%d8%b4%da%a9%d9%84_%d8%b9%d8%af%d8%af%db%8c\"><\/span>\u0646\u0645\u0627\u06cc\u0634 \u0645\u062a\u0646 \u0628\u0647 \u0634\u06a9\u0644 \u0639\u062f\u062f\u06cc<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u0647\u0627\u06cc \u0622\u0645\u0627\u0631\u06cc \u0627\u0632 \u0631\u06cc\u0627\u0636\u06cc\u0627\u062a \u0628\u0631\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u0645\u062f\u0644 \u0647\u0627\u06cc \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u0646\u062f.  \u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u0631\u06cc\u0627\u0636\u06cc\u0627\u062a \u0641\u0642\u0637 \u0628\u0627 \u0627\u0639\u062f\u0627\u062f \u06a9\u0627\u0631 \u0645\u06cc \u06a9\u0646\u062f.  \u0628\u0631\u0627\u06cc \u0627\u06cc\u0646\u06a9\u0647 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u0647\u0627\u06cc \u0622\u0645\u0627\u0631\u06cc \u0628\u0627 \u0645\u062a\u0646 \u06a9\u0627\u0631 \u06a9\u0646\u0646\u062f\u060c \u0627\u0628\u062a\u062f\u0627 \u0628\u0627\u06cc\u062f \u0645\u062a\u0646 \u0631\u0627 \u0628\u0647 \u0639\u062f\u062f \u062a\u0628\u062f\u06cc\u0644 \u06a9\u0646\u06cc\u0645.  
\u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0627\u06cc\u0646 \u06a9\u0627\u0631\u060c \u0633\u0647 \u0631\u0648\u06cc\u06a9\u0631\u062f \u0627\u0635\u0644\u06cc \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f \u06a9\u0647 \u0639\u0628\u0627\u0631\u062a\u0646\u062f \u0627\u0632 Bag of Words\u060c TF-IDF \u0648 Word2Vec.  \u062f\u0631 \u0627\u06cc\u0646 \u0628\u062e\u0634 \u0628\u0647 \u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a \u0648 \u0637\u0631\u062d TF-IDF \u0645\u06cc \u067e\u0631\u062f\u0627\u0632\u06cc\u0645.<\/p>\n<h4 id=\"bagofwords\">\u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a<\/h4>\n<p>\u0637\u0631\u062d \u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a \u0633\u0627\u062f\u0647 \u062a\u0631\u06cc\u0646 \u0631\u0627\u0647 \u0628\u0631\u0627\u06cc \u062a\u0628\u062f\u06cc\u0644 \u0645\u062a\u0646 \u0628\u0647 \u0627\u0639\u062f\u0627\u062f \u0627\u0633\u062a.<\/p>\n<p>\u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u0634\u0645\u0627 \u0633\u0647 \u0633\u0646\u062f \u062f\u0627\u0631\u06cc\u062f:<\/p>\n<ul>\n<li>Doc1 = &#8220;\u0645\u0646 \u062f\u0648\u0633\u062a \u062f\u0627\u0631\u0645 \u0641\u0648\u062a\u0628\u0627\u0644 \u0628\u0627\u0632\u06cc \u06a9\u0646\u0645&#8221;<\/li>\n<li>Doc2 = &#8220;\u0628\u0627\u0632\u06cc \u062e\u0648\u0628\u06cc \u0627\u0633\u062a&#8221;<\/li>\n<li>Doc3 = &#8220;\u0645\u0646 \u0641\u0648\u062a\u0628\u0627\u0644 \u0631\u0627 \u0628\u0647 \u0631\u0627\u06af\u0628\u06cc \u062a\u0631\u062c\u06cc\u062d \u0645\u06cc \u062f\u0647\u0645&#8221;<\/li>\n<\/ul>\n<p>\u062f\u0631 \u0631\u0648\u06cc\u06a9\u0631\u062f \u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a\u060c \u0627\u0648\u0644\u06cc\u0646 \u0642\u062f\u0645 \u0627\u06cc\u062c\u0627\u062f \u0648\u0627\u0698\u06af\u0627\u0646\u06cc \u0627\u0632 \u062a\u0645\u0627\u0645 \u06a9\u0644\u0645\u0627\u062a \u0645\u0646\u062d\u0635\u0631 \u0628\u0647 \u0641\u0631\u062f \u0627\u0633\u062a.  
\u0628\u0631\u0627\u06cc \u0633\u0647 \u0633\u0646\u062f \u0641\u0648\u0642\u060c \u0648\u0627\u0698\u06af\u0627\u0646 \u0645\u0627 \u0628\u0647 \u0635\u0648\u0631\u062a \u0632\u06cc\u0631 \u062e\u0648\u0627\u0647\u062f \u0628\u0648\u062f:<\/p>\n<pre><code class=\"hljs\">Vocab = (I, like, to, play, football, it, is, a, good, game, prefer, over, rugby)\n<\/code><\/pre>\n<p>\u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u06cc \u062a\u0628\u062f\u06cc\u0644 \u0647\u0631 \u0633\u0646\u062f \u0628\u0647 \u06cc\u06a9 \u0628\u0631\u062f\u0627\u0631 \u0648\u06cc\u0698\u06af\u06cc \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0648\u0627\u0698\u06af\u0627\u0646 \u0627\u0633\u062a.  \u0637\u0648\u0644 \u0647\u0631 \u0628\u0631\u062f\u0627\u0631 \u0648\u06cc\u0698\u06af\u06cc \u0628\u0631\u0627\u0628\u0631 \u0627\u0633\u062a \u0628\u0627 \u0637\u0648\u0644 \u0648\u0627\u0698\u06af\u0627\u0646.  \u0641\u0631\u0627\u0648\u0627\u0646\u06cc \u06a9\u0644\u0645\u0647 \u062f\u0631 \u0633\u0646\u062f \u062c\u0627\u06cc\u06af\u0632\u06cc\u0646 \u06a9\u0644\u0645\u0647 \u0648\u0627\u0642\u0639\u06cc \u062f\u0631 \u0648\u0627\u0698\u06af\u0627\u0646 \u0645\u06cc \u0634\u0648\u062f.  \u0627\u06af\u0631 \u06a9\u0644\u0645\u0647 \u0627\u06cc \u062f\u0631 \u0648\u0627\u0698\u06af\u0627\u0646 \u062f\u0631 \u0633\u0646\u062f \u0645\u0631\u0628\u0648\u0637\u0647 \u06cc\u0627\u0641\u062a \u0646\u0634\u062f\u060c \u0628\u0631\u062f\u0627\u0631 \u0648\u06cc\u0698\u06af\u06cc \u0633\u0646\u062f \u062f\u0631 \u0622\u0646 \u0645\u06a9\u0627\u0646 \u0635\u0641\u0631 \u062e\u0648\u0627\u0647\u062f \u0628\u0648\u062f.  
\u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u0628\u0631\u0627\u06cc Doc1\u060c \u0628\u0631\u062f\u0627\u0631 \u0648\u06cc\u0698\u06af\u06cc \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u062e\u0648\u0627\u0647\u062f \u0628\u0648\u062f:<\/p>\n<pre><code class=\"hljs\">(1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0)\n<\/code><\/pre>\n<h4 id=\"tfidf\">TF-IDF<\/h4>\n<p>\u062f\u0631 \u0631\u0648\u06cc\u06a9\u0631\u062f \u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a\u060c \u0647\u0631 \u06a9\u0644\u0645\u0647 \u0648\u0632\u0646 \u06cc\u06a9\u0633\u0627\u0646\u06cc \u062f\u0627\u0631\u062f.  \u0627\u06cc\u062f\u0647 \u067e\u0634\u062a \u0631\u0648\u06cc\u06a9\u0631\u062f TF-IDF \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 \u06a9\u0644\u0645\u0627\u062a\u06cc \u06a9\u0647 \u06a9\u0645\u062a\u0631 \u062f\u0631 \u0647\u0645\u0647 \u0627\u0633\u0646\u0627\u062f \u0648 \u0628\u06cc\u0634\u062a\u0631 \u062f\u0631 \u0627\u0633\u0646\u0627\u062f \u062c\u062f\u0627\u06af\u0627\u0646\u0647 \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u0646\u062f\u060c \u0628\u06cc\u0634\u062a\u0631 \u0628\u0647 \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u06a9\u0645\u06a9 \u0645\u06cc \u06a9\u0646\u0646\u062f.<\/p>\n<p>TF-IDF \u062a\u0631\u06a9\u06cc\u0628\u06cc \u0627\u0632 \u062f\u0648 \u0639\u0628\u0627\u0631\u062a \u0627\u0633\u062a: \u0628\u0633\u0627\u0645\u062f \u0648\u0627\u0698\u0647 (Term Frequency) \u0648 \u0628\u0633\u0627\u0645\u062f \u0645\u0639\u06a9\u0648\u0633 \u0633\u0646\u062f (Inverse Document Frequency).  
\u0622\u0646\u0647\u0627 \u0631\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0628\u0647 \u0635\u0648\u0631\u062a \u0632\u06cc\u0631 \u0645\u062d\u0627\u0633\u0628\u0647 \u06a9\u0631\u062f:<\/p>\n<pre><code class=\"hljs\">TF  = (Frequency of a word in the document)\/(Total words in the document)\n\nIDF = Log((Total number of docs)\/(Number of docs containing the word))\n<\/code><\/pre>\n<h4 id=\"tfidfusingthescikitlearnlibrary\">TF-IDF \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 Scikit-Learn<\/h4>\n<p>\u062e\u0648\u0634\u0628\u062e\u062a\u0627\u0646\u0647 \u0628\u0631\u0627\u06cc \u0645\u0627\u060c \u067e\u0627\u06cc\u062a\u0648\u0646 <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/scikit-learn.org\/stable\/\">Scikit-Learn<\/a> \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0634\u0627\u0645\u0644 <code>TfidfVectorizer<\/code> \u06a9\u0644\u0627\u0633\u06cc \u06a9\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0628\u0631\u0627\u06cc \u062a\u0628\u062f\u06cc\u0644 \u0648\u06cc\u0698\u06af\u06cc \u0647\u0627\u06cc \u0645\u062a\u0646 \u0628\u0647 \u0628\u0631\u062f\u0627\u0631\u0647\u0627\u06cc \u0648\u06cc\u0698\u06af\u06cc TF-IDF \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0634\u0648\u062f.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u0645\u06cc \u062f\u0647\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">from<\/span> nltk.corpus <span class=\"hljs-keyword\">import<\/span> stopwords\n<span class=\"hljs-keyword\">from<\/span> sklearn.feature_extraction.text <span class=\"hljs-keyword\">import<\/span> TfidfVectorizer\n\nvectorizer = TfidfVectorizer (max_features=<span class=\"hljs-number\">2500<\/span>, min_df=<span class=\"hljs-number\">7<\/span>, max_df=<span class=\"hljs-number\">0.8<\/span>, stop_words=stopwords.words(<span class=\"hljs-string\">'english'<\/span>))\nprocessed_features = vectorizer.fit_transform(processed_features).toarray()\n<\/code><\/pre>\n<p>\u062f\u0631 \u06a9\u062f \u0628\u0627\u0644\u0627 \u062a\u0639\u0631\u06cc\u0641 \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u06a9\u0647 <code>max_features<\/code> \u0628\u0627\u06cc\u062f 2500 \u0628\u0627\u0634\u062f\u060c \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0639\u0646\u06cc \u06a9\u0647 \u0641\u0642\u0637 \u0627\u0632 2500 \u06a9\u0644\u0645\u0647 \u0645\u062a\u062f\u0627\u0648\u0644 \u0628\u0631\u0627\u06cc \u0627\u06cc\u062c\u0627\u062f \u0628\u0631\u062f\u0627\u0631 \u0648\u06cc\u0698\u06af\u06cc &#8220;\u06a9\u06cc\u0641 \u06a9\u0644\u0645\u0627\u062a&#8221; \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u062f.  
\u06a9\u0644\u0645\u0627\u062a\u06cc \u06a9\u0647 \u06a9\u0645\u062a\u0631 \u062f\u06cc\u062f\u0647 \u0645\u06cc \u0634\u0648\u0646\u062f \u0628\u0631\u0627\u06cc \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0686\u0646\u062f\u0627\u0646 \u0645\u0641\u06cc\u062f \u0646\u06cc\u0633\u062a\u0646\u062f.<\/p>\n<p>\u0628\u0647 \u0647\u0645\u06cc\u0646 \u062a\u0631\u062a\u06cc\u0628\u060c <code>max_df<\/code> \u0645\u0634\u062e\u0635 \u0645\u06cc \u06a9\u0646\u062f \u06a9\u0647 \u0641\u0642\u0637 \u0627\u0632 \u06a9\u0644\u0645\u0627\u062a\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0634\u0648\u062f \u06a9\u0647 \u062d\u062f\u0627\u06a9\u062b\u0631 \u062f\u0631 80\u066a \u0627\u0633\u0646\u0627\u062f \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f.  \u06a9\u0644\u0645\u0627\u062a\u06cc \u06a9\u0647 \u062f\u0631 \u0647\u0645\u0647 \u0627\u0633\u0646\u0627\u062f \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f \u0628\u0633\u06cc\u0627\u0631 \u0631\u0627\u06cc\u062c \u0647\u0633\u062a\u0646\u062f \u0648 \u0628\u0631\u0627\u06cc \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0686\u0646\u062f\u0627\u0646 \u0645\u0641\u06cc\u062f \u0646\u06cc\u0633\u062a\u0646\u062f.  
\u0628\u0647 \u0647\u0645\u06cc\u0646 \u062a\u0631\u062a\u06cc\u0628\u060c <code>min_df<\/code> \u0631\u0648\u06cc 7 \u062a\u0646\u0638\u06cc\u0645 \u0634\u062f\u0647 \u0627\u0633\u062a \u06a9\u0647 \u0646\u0634\u0627\u0646 \u0645\u06cc \u062f\u0647\u062f \u06a9\u0644\u0645\u0627\u062a\u06cc \u0631\u0627 \u06a9\u0647 \u062f\u0631 \u062d\u062f\u0627\u0642\u0644 7 \u0633\u0646\u062f \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u0646\u062f \u0634\u0627\u0645\u0644 \u0645\u06cc \u0634\u0648\u062f.<\/p>\n<h3 id=\"dividingdataintotrainingandtestsets\"><span class=\"ez-toc-section\" id=\"%d8%aa%d9%82%d8%b3%db%8c%d9%85_%d8%af%d8%a7%d8%af%d9%87_%d9%87%d8%a7_%d8%a8%d9%87_%d9%85%d8%ac%d9%85%d9%88%d8%b9%d9%87_%d9%87%d8%a7%db%8c_%d8%a2%d9%85%d9%88%d8%b2%d8%b4%db%8c_%d9%88_%d8%a2%d8%b2%d9%85%d8%a7%db%8c%d8%b4%db%8c\"><\/span>\u062a\u0642\u0633\u06cc\u0645 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u0647\u0627\u06cc \u0622\u0645\u0648\u0632\u0634\u06cc \u0648 \u0622\u0632\u0645\u0627\u06cc\u0634\u06cc<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u062f\u0631 \u0642\u0633\u0645\u062a \u0642\u0628\u0644 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u0639\u062f\u062f\u06cc \u062a\u0628\u062f\u06cc\u0644 \u06a9\u0631\u062f\u06cc\u0645.  \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0622\u062e\u0631\u06cc\u0646 \u0645\u0631\u062d\u0644\u0647 \u0642\u0628\u0644 \u0627\u0632 \u0622\u0645\u0648\u0632\u0634 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u0647\u0627\u06cc \u062e\u0648\u062f\u060c \u0628\u0627\u06cc\u062f \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062e\u0648\u062f \u0631\u0627 \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u0647\u0627\u06cc \u0622\u0645\u0648\u0632\u0634\u06cc \u0648 \u0622\u0632\u0645\u0627\u06cc\u0634\u06cc \u062a\u0642\u0633\u06cc\u0645 \u06a9\u0646\u06cc\u0645.  
\u0645\u062c\u0645\u0648\u0639\u0647 \u0622\u0645\u0648\u0632\u0634\u06cc \u0628\u0631\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u062f \u0634\u062f \u062f\u0631 \u062d\u0627\u0644\u06cc \u06a9\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u062a\u0633\u062a \u0628\u0631\u0627\u06cc \u0627\u0631\u0632\u06cc\u0627\u0628\u06cc \u0639\u0645\u0644\u06a9\u0631\u062f \u0645\u062f\u0644 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u062f \u0634\u062f.<\/p>\n<p>\u06a9\u062f \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">from<\/span> sklearn.model_selection <span class=\"hljs-keyword\">import<\/span> train_test_split\n\nX_train, X_test, y_train, y_test = train_test_split(processed_features, labels, test_size=<span class=\"hljs-number\">0.2<\/span>, random_state=<span class=\"hljs-number\">0<\/span>)\n<\/code><\/pre>\n<p>\u062f\u0631 \u06a9\u062f \u0628\u0627\u0644\u0627 \u0645\u0627 \u0627\u0632 <code>train_test_split<\/code> \u06a9\u0644\u0627\u0633 \u0627\u0632 <code>sklearn.model_selection<\/code> \u0645\u0627\u0698\u0648\u0644 \u0628\u0631\u0627\u06cc \u062a\u0642\u0633\u06cc\u0645 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u0627 \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u0647\u0627\u06cc \u0622\u0645\u0648\u0632\u0634\u06cc \u0648 \u0622\u0632\u0645\u0627\u06cc\u0634\u06cc.  
\u0627\u06cc\u0646 \u0631\u0648\u0634 \u0645\u062c\u0645\u0648\u0639\u0647 \u0648\u06cc\u0698\u06af\u06cc \u0631\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u0627\u0648\u0644\u060c \u0645\u062c\u0645\u0648\u0639\u0647 \u0628\u0631\u0686\u0633\u0628 \u0631\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u062f\u0648\u0645 \u0648 \u0645\u0642\u062f\u0627\u0631\u06cc \u0628\u0631\u0627\u06cc \u067e\u0627\u0631\u0627\u0645\u062a\u0631 <code>test_size<\/code> \u0645\u06cc \u06af\u06cc\u0631\u062f.  \u0645\u0627 \u0645\u0642\u062f\u0627\u0631 0.2 \u0631\u0627 \u0628\u0631\u0627\u06cc <code>test_size<\/code> \u0645\u0634\u062e\u0635 \u06a9\u0631\u062f\u06cc\u0645\u060c \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0639\u0646\u06cc \u06a9\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u0627 \u0628\u0647 \u062f\u0648 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc 80% \u0648 20% \u062a\u0642\u0633\u06cc\u0645 \u0645\u06cc \u0634\u0648\u062f.  
\u0645\u0627 \u0627\u0632 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 80% \u0628\u0631\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u0648 20% \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0628\u0631\u0627\u06cc \u0622\u0632\u0645\u0627\u06cc\u0634 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.<\/p>\n<h3 id=\"trainingthemodel\"><span class=\"ez-toc-section\" id=\"%d8%a2%d9%85%d9%88%d8%b2%d8%b4_%d9%85%d8%af%d9%84\"><\/span>\u0622\u0645\u0648\u0632\u0634 \u0645\u062f\u0644<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0647\u0646\u06af\u0627\u0645\u06cc \u06a9\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u0647\u0627\u06cc \u0622\u0645\u0648\u0632\u0634\u06cc \u0648 \u0622\u0632\u0645\u0627\u06cc\u0634\u06cc \u062a\u0642\u0633\u06cc\u0645 \u0645\u06cc \u0634\u0648\u0646\u062f\u060c \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u0647\u0627\u06cc \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 \u0628\u0631\u0627\u06cc \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0622\u0645\u0648\u0632\u0634\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.  \u0634\u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0632 \u0647\u0631 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f.  
\u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u0645\u0627 \u0627\u0632 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 Random Forest \u0628\u0647 \u062f\u0644\u06cc\u0644 \u062a\u0648\u0627\u0646\u0627\u06cc\u06cc \u0622\u0646 \u062f\u0631 \u0639\u0645\u0644 \u0628\u0631 \u0631\u0648\u06cc \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0646\u0631\u0645\u0627\u0644\u200c\u0646\u0634\u062f\u0647 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.<\/p>\n<p>\u0645\u0627\u0698\u0648\u0644 <code>sklearn.ensemble<\/code> \u0634\u0627\u0645\u0644 \u06a9\u0644\u0627\u0633 <code>RandomForestClassifier<\/code> \u0627\u0633\u062a \u06a9\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0628\u0631\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u0645\u062f\u0644 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u062c\u0646\u06af\u0644 \u062a\u0635\u0627\u062f\u0641\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0634\u0648\u062f.  \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0627\u06cc\u0646 \u06a9\u0627\u0631\u060c \u0628\u0627\u06cc\u062f \u0645\u062a\u062f <code>fit<\/code> \u0631\u0627 \u0631\u0648\u06cc \u06a9\u0644\u0627\u0633 <code>RandomForestClassifier<\/code> \u0641\u0631\u0627\u062e\u0648\u0627\u0646\u06cc \u06a9\u0646\u06cc\u062f \u0648 \u0648\u06cc\u0698\u06af\u06cc\u200c\u0647\u0627 \u0648 \u0628\u0631\u0686\u0633\u0628\u200c\u0647\u0627\u06cc \u0622\u0645\u0648\u0632\u0634\u06cc \u0645\u0627 \u0631\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u0627\u0631\u0633\u0627\u0644 \u06a9\u0646\u06cc\u062f.  
\u0628\u0647 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">from<\/span> sklearn.ensemble <span class=\"hljs-keyword\">import<\/span> RandomForestClassifier\n\ntext_classifier = RandomForestClassifier(n_estimators=<span class=\"hljs-number\">200<\/span>, random_state=<span class=\"hljs-number\">0<\/span>)\ntext_classifier.fit(X_train, y_train)\n<\/code><\/pre>\n<h3 id=\"makingpredictionsandevaluatingthemodel\"><span class=\"ez-toc-section\" id=\"%d9%be%db%8c%d8%b4_%d8%a8%db%8c%d9%86%db%8c_%d9%88_%d8%a7%d8%b1%d8%b2%db%8c%d8%a7%d8%a8%db%8c_%d9%85%d8%af%d9%84\"><\/span>\u067e\u06cc\u0634 \u0628\u06cc\u0646\u06cc \u0648 \u0627\u0631\u0632\u06cc\u0627\u0628\u06cc \u0645\u062f\u0644<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0647\u0646\u06af\u0627\u0645\u06cc \u06a9\u0647 \u0645\u062f\u0644 \u0622\u0645\u0648\u0632\u0634 \u062f\u0627\u062f\u0647 \u0634\u062f\u060c \u0622\u062e\u0631\u06cc\u0646 \u0645\u0631\u062d\u0644\u0647 \u067e\u06cc\u0634 \u0628\u06cc\u0646\u06cc \u0627\u0633\u062a \u0631\u0648\u06cc \u0645\u062f\u0644.  
\u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0627\u06cc\u0646 \u06a9\u0627\u0631\u060c \u0628\u0627\u06cc\u062f \u0645\u062a\u062f <code>predict<\/code> \u0631\u0627 \u0631\u0648\u06cc \u0634\u06cc\u0621 \u06a9\u0644\u0627\u0633 <code>RandomForestClassifier<\/code> \u06a9\u0647 \u0628\u0631\u0627\u06cc \u0622\u0645\u0648\u0632\u0634 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f\u06cc\u0645 \u0641\u0631\u0627\u062e\u0648\u0627\u0646\u06cc \u06a9\u0646\u06cc\u062f.  \u0628\u0647 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">predictions = text_classifier.predict(X_test)\n<\/code><\/pre>\n<p>\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0628\u0631\u0627\u06cc \u0627\u0631\u0632\u06cc\u0627\u0628\u06cc \u0639\u0645\u0644\u06a9\u0631\u062f \u0645\u062f\u0644\u200c\u0647\u0627\u06cc \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0632 \u0645\u0639\u06cc\u0627\u0631\u0647\u0627\u06cc \u0637\u0628\u0642\u0647\u200c\u0628\u0646\u062f\u06cc \u0645\u0627\u0646\u0646\u062f <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Confusion_matrix\">\u0645\u0627\u062a\u0631\u06cc\u0633 \u062f\u0631\u0647\u0645\u200c\u0631\u06cc\u062e\u062a\u06af\u06cc<\/a>\u060c <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/F1_score\">\u0627\u0646\u062f\u0627\u0632\u0647 \u06af\u06cc\u0631\u06cc F1<\/a>\u060c \u062f\u0642\u062a \u0648 \u063a\u06cc\u0631\u0647 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u0628\u0631\u0627\u06cc \u06cc\u0627\u0641\u062a\u0646 \u0645\u0642\u0627\u062f\u06cc\u0631 \u0627\u06cc\u0646 \u0645\u0639\u06cc\u0627\u0631\u0647\u0627\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645 
<code>classification_report<\/code>\u060c <code>confusion_matrix<\/code>\u060c \u0648 <code>accuracy_score<\/code> \u062a\u0648\u0627\u0628\u0639 \u06a9\u0645\u06a9\u06cc \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 <code>sklearn.metrics<\/code>.  \u0628\u0647 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">from<\/span> sklearn.metrics <span class=\"hljs-keyword\">import<\/span> classification_report, confusion_matrix, accuracy_score\n\n<span class=\"hljs-built_in\">print<\/span>(confusion_matrix(y_test,predictions))\n<span class=\"hljs-built_in\">print<\/span>(classification_report(y_test,predictions))\n<span class=\"hljs-built_in\">print<\/span>(accuracy_score(y_test, predictions))\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">[[1724  101   45]\n [ 329  237   48]\n [ 142   58  244]]\n              precision    recall  f1-score   support\n\n    negative       0.79      0.92      0.85      1870\n     neutral       0.60      0.39      0.47       614\n    positive       0.72      0.55      0.62       444\n\n   micro avg       0.75      0.75      0.75      2928\n   macro avg       0.70      0.62      0.65      2928\nweighted avg       0.74      0.75      0.73      2928\n\n0.7530737704918032\n<\/code><\/pre>\n<p>\u0627\u0632 \u062e\u0631\u0648\u062c\u06cc \u0645\u06cc \u0628\u06cc\u0646\u06cc\u062f \u06a9\u0647 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645 \u0645\u0627 \u0628\u0647 \u062f\u0642\u062a 75.30\u066a \u062f\u0633\u062a \u06cc\u0627\u0641\u062a\u0647 \u0627\u0633\u062a.<\/p>\n<h2 id=\"conclusion\"><span class=\"ez-toc-section\" id=\"%d9%86%d8%aa%db%8c%d8%ac%d9%87\"><\/span>\u0646\u062a\u06cc\u062c\u0647<span 
class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u06cc\u06a9\u06cc \u0627\u0632 \u0645\u062a\u062f\u0627\u0648\u0644 \u062a\u0631\u06cc\u0646 \u06a9\u0627\u0631\u0647\u0627\u06cc NLP \u0627\u0633\u062a \u06a9\u0647 \u0628\u0647 \u062a\u0639\u06cc\u06cc\u0646 \u0627\u0641\u06a9\u0627\u0631 \u0639\u0645\u0648\u0645\u06cc \u062f\u0631 \u0645\u0648\u0631\u062f \u06cc\u06a9 \u0645\u0648\u0636\u0648\u0639 \u062e\u0627\u0635 \u06a9\u0645\u06a9 \u0645\u06cc \u06a9\u0646\u062f.<\/p>\n<p>\u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647\u060c \u062f\u06cc\u062f\u06cc\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647\u200c\u0647\u0627\u06cc \u0645\u062e\u062a\u0644\u0641 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0647 \u0627\u0646\u062c\u0627\u0645 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u06a9\u0645\u06a9 \u0645\u06cc\u200c\u06a9\u0646\u0646\u062f.  \u0645\u0627 \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u062a\u0648\u06cc\u06cc\u062a \u0647\u0627\u06cc \u0639\u0645\u0648\u0645\u06cc \u062f\u0631 \u0645\u0648\u0631\u062f \u0634\u0634 \u0634\u0631\u06a9\u062a \u0647\u0648\u0627\u067e\u06cc\u0645\u0627\u06cc\u06cc \u0627\u06cc\u0627\u0644\u0627\u062a \u0645\u062a\u062d\u062f\u0647 \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u062f\u0627\u062f\u06cc\u0645 \u0648 \u0628\u0647 \u062f\u0642\u062a \u062d\u062f\u0648\u062f 75\u066a \u0631\u0633\u06cc\u062f\u06cc\u0645.  
\u0645\u0646 \u0628\u0647 \u0634\u0645\u0627 \u062a\u0648\u0635\u06cc\u0647 \u0645\u06cc\u200c\u06a9\u0646\u0645 \u0627\u0632 \u0627\u0644\u06af\u0648\u0631\u06cc\u062a\u0645\u200c\u0647\u0627\u06cc \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 \u062f\u06cc\u06af\u0631\u06cc \u0645\u0627\u0646\u0646\u062f \u0631\u06af\u0631\u0633\u06cc\u0648\u0646 \u0644\u062c\u0633\u062a\u06cc\u06a9\u060c SVM \u06cc\u0627 KNN \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f \u0648 \u0628\u0628\u06cc\u0646\u06cc\u062f \u0622\u06cc\u0627 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u0646\u062a\u0627\u06cc\u062c \u0628\u0647\u062a\u0631\u06cc \u0628\u06af\u06cc\u0631\u06cc\u062f.<\/p>\n<p>\u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0628\u0639\u062f\u06cc \u0631\u0648\u0634 \u0627\u0646\u062c\u0627\u0645 \u0645\u062f\u0644\u200c\u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0628\u0627 Scikit-Learn \u0631\u0627 \u0646\u0634\u0627\u0646 \u062e\u0648\u0627\u0647\u0645 \u062f\u0627\u062f\u060c \u06a9\u0647 \u06cc\u06a9 \u062a\u06a9\u0646\u06cc\u06a9 \u0628\u062f\u0648\u0646 \u0646\u0638\u0627\u0631\u062a \u0628\u0631\u0627\u06cc \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u062d\u062c\u0645 \u0632\u06cc\u0627\u062f\u06cc \u0627\u0632 \u062f\u0627\u062f\u0647\u200c\u0647\u0627\u06cc \u0645\u062a\u0646\u06cc \u0628\u0627 \u062e\u0648\u0634\u0647\u200c\u0628\u0646\u062f\u06cc \u0627\u0633\u0646\u0627\u062f \u062f\u0631 \u06af\u0631\u0648\u0647\u200c\u0647\u0627 \u0627\u0633\u062a.<\/p>\n<\/div>\n<p><script>\n                        !function(f,b,e,v,n,t,s)\n                        {if(f.fbq)return;n=f.fbq=function(){n.callMethod?\n                        n.callMethod.apply(n,arguments):n.queue.push(arguments)};\n                        if(!f._fbq)f._fbq=n;n.push=n;n.loaded=!0;n.version='2.0';\n                        n.queue=[];t=b.createElement(e);t.async=!0;\n                        
t.src=v;s=b.getElementsByTagName(e)[0];\n                        s.parentNode.insertBefore(t,s)}(window, document,'script',\n                        'https:\/\/connect.facebook.net\/en_US\/fbevents.js');\n                        fbq('init', '525232124909042');\n                        fbq('track', 'PageView');\n                    <\/script>    (\u0628\u0631\u0686\u0633\u0628\u200c\u0647\u0627 \u0628\u0647 \u062a\u0631\u062c\u0645\u0647)# python<br \/>\n<br \/><br \/>\n<br \/>\u0645\u0646\u062a\u0634\u0631 \u0634\u062f\u0647 \u062f\u0631 1403-01-23 19:05:08<br \/>\n<\/p>\n\n\n<div class=\"kk-star-ratings kksr-auto kksr-align-center kksr-valign-bottom\"\n    data-payload='{&quot;align&quot;:&quot;center&quot;,&quot;id&quot;:&quot;16341&quot;,&quot;slug&quot;:&quot;default&quot;,&quot;valign&quot;:&quot;bottom&quot;,&quot;ignore&quot;:&quot;&quot;,&quot;reference&quot;:&quot;auto&quot;,&quot;class&quot;:&quot;&quot;,&quot;count&quot;:&quot;0&quot;,&quot;legendonly&quot;:&quot;&quot;,&quot;readonly&quot;:&quot;&quot;,&quot;score&quot;:&quot;0&quot;,&quot;starsonly&quot;:&quot;&quot;,&quot;best&quot;:&quot;5&quot;,&quot;gap&quot;:&quot;5&quot;,&quot;greet&quot;:&quot;\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628&quot;,&quot;legend&quot;:&quot;0\\\/5 (0 \u0631\u0627\u06cc)&quot;,&quot;size&quot;:&quot;30&quot;,&quot;title&quot;:&quot;\u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP: \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0628\u0627 Scikit-Learn&quot;,&quot;width&quot;:&quot;0&quot;,&quot;_legend&quot;:&quot;{score}\\\/{best} ({count} \u0631\u0627\u06cc)&quot;,&quot;font_factor&quot;:&quot;1.25&quot;}'>\n            \n<div class=\"kksr-stars\">\n    \n<div class=\"kksr-stars-inactive\">\n            <div class=\"kksr-star\" data-star=\"1\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" 
style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"2\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"3\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"4\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"5\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n    \n<div class=\"kksr-stars-active\" style=\"width: 0px;\">\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n<\/div>\n                \n\n<div class=\"kksr-legend\" style=\"font-size: 24px;\">\n            <span class=\"kksr-muted\">\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 
\u0645\u0637\u0644\u0628<\/span>\n    <\/div>\n    <\/div>\n","protected":false},"excerpt":{"rendered":"<p><span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 8<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span>\u0627\u06cc\u0646 \u067e\u0646\u062c\u0645\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0632 \u0645\u062c\u0645\u0648\u0639\u0647 \u0645\u0642\u0627\u0644\u0627\u062a \u0627\u0633\u062a \u0631\u0648\u06cc NLP \u0628\u0631\u0627\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646. \u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0642\u0628\u0644\u06cc \u062e\u0648\u062f \u062a\u0648\u0636\u06cc\u062d \u062f\u0627\u062f\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646 \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 spaCy \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0628\u062e\u0634\u200c\u0647\u0627\u06cc\u06cc \u0627\u0632 \u0628\u0631\u0686\u0633\u0628\u200c\u06af\u0630\u0627\u0631\u06cc \u06af\u0641\u062a\u0627\u0631 \u0648 \u0634\u0646\u0627\u0633\u0627\u06cc\u06cc \u0645\u0648\u062c\u0648\u062f\u06cc\u062a \u0646\u0627\u0645\u200c\u06af\u0630\u0627\u0631\u06cc \u0634\u062f\u0647 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f. 
\u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647\u060c \u0631\u0648\u0634 \u0627\u0646\u062c\u0627\u0645 \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062a\u0648\u06cc\u06cc\u062a\u0631 \u0631\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 [&hellip;]<\/p>\n","protected":false},"author":3,"featured_media":16342,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1743,620],"tags":[],"class_list":["post-16341","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-python","category-programming"],"acf":[],"_links":{"self":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/16341","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/users\/3"}],"replies":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/comments?post=16341"}],"version-history":[{"count":0,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/16341\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media\/16342"}],"wp:attachment":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media?parent=16341"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/categories?post=16341"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/tags?post=16341"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}