{"id":16336,"date":"2024-01-23T18:04:14","date_gmt":"2024-01-23T14:34:14","guid":{"rendered":"https:\/\/rasanegar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d9%85%d8%af%d9%84%d8%b3%d8%a7%d8%b2%db%8c-%d9%85%d9%88%d8%b6%d9%88%d8%b9\/"},"modified":"2024-01-23T18:04:14","modified_gmt":"2024-01-23T14:34:14","slug":"%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d9%85%d8%af%d9%84%d8%b3%d8%a7%d8%b2%db%8c-%d9%85%d9%88%d8%b6%d9%88%d8%b9","status":"publish","type":"post","link":"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d9%85%d8%af%d9%84%d8%b3%d8%a7%d8%b2%db%8c-%d9%85%d9%88%d8%b6%d9%88%d8%b9\/","title":{"rendered":"\u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP: \u0645\u062f\u0644\u200c\u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639"},"content":{"rendered":"<div id=\"ez-toc-container\" class=\"ez-toc-v2_0_85 counter-hierarchy ez-toc-counter ez-toc-custom ez-toc-container-direction\">\n<div class=\"ez-toc-title-container\"><p class=\"ez-toc-title\" style=\"cursor:inherit\">\u0633\u0631\u0641\u0635\u0644\u0647\u0627\u06cc \u0645\u0637\u0644\u0628<\/p>\n<\/div><nav><ul class='ez-toc-list ez-toc-list-level-1 ' ><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-1\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d9%85%d8%af%d9%84%d8%b3%d8%a7%d8%b2%db%8c-%d9%85%d9%88%d8%b6%d9%88%d8%b9\/#%d9%85%d8%af%d9%84%d8%b3%d8%a7%d8%b2%db%8c_%d9%85%d9%88%d8%b6%d9%88%d8%b9_%da%86%db%8c%d8%b3%d8%aa%d8%9f\" >\u0645\u062f\u0644\u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0686\u06cc\u0633\u062a\u061f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-2\" 
href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d9%85%d8%af%d9%84%d8%b3%d8%a7%d8%b2%db%8c-%d9%85%d9%88%d8%b6%d9%88%d8%b9\/#%d8%aa%d8%ae%d8%b5%db%8c%d8%b5_%d8%af%db%8c%d8%b1%db%8c%da%a9%d9%84%d9%87_%d9%86%d9%87%d9%81%d8%aa%d9%87_lda\" >\u062a\u062e\u0635\u06cc\u0635 \u062f\u06cc\u0631\u06cc\u06a9\u0644\u0647 \u0646\u0647\u0641\u062a\u0647 (LDA)<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-3\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d9%85%d8%af%d9%84%d8%b3%d8%a7%d8%b2%db%8c-%d9%85%d9%88%d8%b6%d9%88%d8%b9\/#lda_%d8%a8%d8%b1%d8%a7%db%8c_%d9%85%d8%af%d9%84_%d8%b3%d8%a7%d8%b2%db%8c_%d9%85%d9%88%d8%b6%d9%88%d8%b9_%d8%af%d8%b1_%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86\" >LDA \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-4\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d9%85%d8%af%d9%84%d8%b3%d8%a7%d8%b2%db%8c-%d9%85%d9%88%d8%b6%d9%88%d8%b9\/#%d9%81%d8%a7%da%a9%d8%aa%d9%88%d8%b1%d8%b3%d8%a7%d8%b2%db%8c_%d9%85%d8%a7%d8%aa%d8%b1%db%8c%d8%b3_%d8%ba%db%8c%d8%b1_%d9%85%d9%86%d9%81%db%8c_nmf\" >\u0641\u0627\u06a9\u062a\u0648\u0631\u0633\u0627\u0632\u06cc \u0645\u0627\u062a\u0631\u06cc\u0633 \u063a\u06cc\u0631 \u0645\u0646\u0641\u06cc (NMF)<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-5\" 
href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d9%85%d8%af%d9%84%d8%b3%d8%a7%d8%b2%db%8c-%d9%85%d9%88%d8%b6%d9%88%d8%b9\/#nmf_%d8%a8%d8%b1%d8%a7%db%8c_%d9%85%d8%af%d9%84_%d8%b3%d8%a7%d8%b2%db%8c_%d9%85%d9%88%d8%b6%d9%88%d8%b9_%d8%af%d8%b1_%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86\" >NMF \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-6\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d9%85%d8%af%d9%84%d8%b3%d8%a7%d8%b2%db%8c-%d9%85%d9%88%d8%b6%d9%88%d8%b9\/#%d9%86%d8%aa%db%8c%d8%ac%d9%87\" >\u0646\u062a\u06cc\u062c\u0647<\/a><\/li><\/ul><\/nav><\/div>\n<span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 8<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span><p> <br \/>\n<\/p>\n<div><noscript><\/noscript><\/p>\n<p>\u0627\u06cc\u0646 \u0634\u0634\u0645\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0632 \u0633\u0631\u06cc \u0645\u0642\u0627\u0644\u0627\u062a \u0645\u0646 \u0627\u0633\u062a \u0631\u0648\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP.  
\u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0642\u0628\u0644\u06cc \u062e\u0648\u062f\u060c \u062f\u0631 \u0645\u0648\u0631\u062f \u0686\u06af\u0648\u0646\u06af\u06cc \u0627\u0646\u062c\u0627\u0645 \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062a\u0648\u06cc\u06cc\u062a\u0631 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 Scikit-Learn \u067e\u0627\u06cc\u062a\u0648\u0646 \u0635\u062d\u0628\u062a \u06a9\u0631\u062f\u0645.  \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0628\u0647 \u0628\u0631\u0631\u0633\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0645\u06cc \u067e\u0631\u062f\u0627\u0632\u06cc\u0645 \u06a9\u0647 \u06cc\u06a9\u06cc \u062f\u06cc\u06af\u0631 \u0627\u0632 \u06a9\u0627\u0631\u0628\u0631\u062f\u0647\u0627\u06cc \u0628\u0633\u06cc\u0627\u0631 \u0645\u0647\u0645 NLP \u0627\u0633\u062a.  
\u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0631\u0627 \u0628\u0627 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0627\u0646\u062c\u0627\u0645 \u062f\u0627\u062f.<\/p>\n<h2 id=\"whatistopicmodeling\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%af%d9%84%d8%b3%d8%a7%d8%b2%db%8c_%d9%85%d9%88%d8%b6%d9%88%d8%b9_%da%86%db%8c%d8%b3%d8%aa%d8%9f\"><\/span>\u0645\u062f\u0644\u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0686\u06cc\u0633\u062a\u061f<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0645\u062f\u0644\u200c\u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u06cc\u06a9 \u062a\u06a9\u0646\u06cc\u06a9 \u0628\u062f\u0648\u0646 \u0646\u0638\u0627\u0631\u062a \u0627\u0633\u062a \u06a9\u0647 \u0642\u0635\u062f \u062f\u0627\u0631\u062f \u062d\u062c\u0645 \u0632\u06cc\u0627\u062f\u06cc \u0627\u0632 \u062f\u0627\u062f\u0647\u200c\u0647\u0627\u06cc \u0645\u062a\u0646\u06cc \u0631\u0627 \u0628\u0627 \u062e\u0648\u0634\u0647\u200c\u0628\u0646\u062f\u06cc \u0627\u0633\u0646\u0627\u062f \u062f\u0631 \u06af\u0631\u0648\u0647\u200c\u0647\u0627 \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u06a9\u0646\u062f.  \u062f\u0631 \u0645\u0648\u0631\u062f \u0645\u062f\u0644\u200c\u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639\u060c \u062f\u0627\u062f\u0647\u200c\u0647\u0627\u06cc \u0645\u062a\u0646\u06cc \u0647\u06cc\u0686 \u0628\u0631\u0686\u0633\u0628\u06cc \u0628\u0647 \u0622\u0646 \u0645\u062a\u0635\u0644 \u0646\u06cc\u0633\u062a\u0646\u062f.  
\u062f\u0631 \u0639\u0648\u0636\u060c \u0645\u062f\u0644\u200c\u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0633\u0639\u06cc \u0645\u06cc\u200c\u06a9\u0646\u062f \u0627\u0633\u0646\u0627\u062f \u0631\u0627 \u062f\u0631 \u062e\u0648\u0634\u0647\u200c\u0647\u0627 \u06af\u0631\u0648\u0647\u200c\u0628\u0646\u062f\u06cc \u06a9\u0646\u062f \u0631\u0648\u06cc \u0648\u06cc\u0698\u06af\u06cc \u0647\u0627\u06cc \u0645\u0634\u0627\u0628\u0647<\/p>\n<p>\u06cc\u06a9 \u0645\u062b\u0627\u0644 \u0645\u0639\u0645\u0648\u0644\u06cc \u0627\u0632 \u0645\u062f\u0644\u200c\u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639\u060c \u062e\u0648\u0634\u0647\u200c\u0628\u0646\u062f\u06cc \u062a\u0639\u062f\u0627\u062f \u0632\u06cc\u0627\u062f\u06cc \u0627\u0632 \u0645\u0642\u0627\u0644\u0627\u062a \u0631\u0648\u0632\u0646\u0627\u0645\u0647\u200c\u0627\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0647 \u0647\u0645\u0627\u0646 \u062f\u0633\u062a\u0647 \u062a\u0639\u0644\u0642 \u062f\u0627\u0631\u0646\u062f.  \u0628\u0647 \u0639\u0628\u0627\u0631\u062a \u062f\u06cc\u06af\u0631\u060c \u0627\u0633\u0646\u0627\u062f\u06cc \u0631\u0627 \u06a9\u0647 \u0645\u0648\u0636\u0648\u0639 \u06cc\u06a9\u0633\u0627\u0646\u06cc \u062f\u0627\u0631\u0646\u062f\u060c \u062e\u0648\u0634\u0647 \u0628\u0646\u062f\u06cc \u06a9\u0646\u06cc\u062f.  \u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u0630\u06a9\u0631 \u0627\u06cc\u0646 \u0646\u06a9\u062a\u0647 \u0636\u0631\u0648\u0631\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0627\u0631\u0632\u06cc\u0627\u0628\u06cc \u0639\u0645\u0644\u06a9\u0631\u062f \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0628\u0633\u06cc\u0627\u0631 \u062f\u0634\u0648\u0627\u0631 \u0627\u0633\u062a \u0632\u06cc\u0631\u0627 \u067e\u0627\u0633\u062e \u062f\u0631\u0633\u062a\u06cc \u0648\u062c\u0648\u062f \u0646\u062f\u0627\u0631\u062f.  
\u0627\u06cc\u0646 \u0628\u0633\u062a\u06af\u06cc \u0628\u0647 \u06a9\u0627\u0631\u0628\u0631 \u062f\u0627\u0631\u062f \u06a9\u0647 \u0648\u06cc\u0698\u06af\u06cc \u0647\u0627\u06cc \u0645\u0634\u0627\u0628\u0647\u06cc \u0631\u0627 \u0628\u06cc\u0646 \u0627\u0633\u0646\u0627\u062f \u06cc\u06a9 \u062e\u0648\u0634\u0647 \u0628\u06cc\u0627\u0628\u062f \u0648 \u06cc\u06a9 \u0628\u0631\u0686\u0633\u0628 \u06cc\u0627 \u0645\u0648\u0636\u0648\u0639 \u0645\u0646\u0627\u0633\u0628 \u0628\u0647 \u0622\u0646 \u0627\u062e\u062a\u0635\u0627\u0635 \u062f\u0647\u062f.<\/p>\n<p>\u062f\u0648 \u0631\u0648\u06cc\u06a9\u0631\u062f \u0639\u0645\u062f\u062a\u0627 \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f: <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Latent_Dirichlet_allocation\">\u062a\u062e\u0635\u06cc\u0635 \u062f\u06cc\u0631\u06cc\u06a9\u0644\u0647 \u0646\u0647\u0641\u062a\u0647<\/a> \u0648 <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Non-negative_matrix_factorization\">\u0641\u0627\u06a9\u062a\u0648\u0631\u0633\u0627\u0632\u06cc \u0645\u0627\u062a\u0631\u06cc\u0633 \u063a\u06cc\u0631 \u0645\u0646\u0641\u06cc<\/a>.  
\u062f\u0631 \u0628\u062e\u0634\u200c\u0647\u0627\u06cc \u0628\u0639\u062f\u06cc\u060c \u0647\u0631 \u062f\u0648\u06cc \u0627\u06cc\u0646 \u0631\u0648\u06cc\u06a9\u0631\u062f\u0647\u0627 \u0631\u0627 \u0628\u0647 \u0627\u062e\u062a\u0635\u0627\u0631 \u0628\u0631\u0631\u0633\u06cc \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f \u0648 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646 \u0622\u0646\u0647\u0627 \u0631\u0627 \u0628\u0631\u0627\u06cc \u0645\u062f\u0644\u200c\u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0647 \u06a9\u0627\u0631 \u0628\u0631\u062f.<\/p>\n<h2 id=\"latentdirichletallocationlda\"><span class=\"ez-toc-section\" id=\"%d8%aa%d8%ae%d8%b5%db%8c%d8%b5_%d8%af%db%8c%d8%b1%db%8c%da%a9%d9%84%d9%87_%d9%86%d9%87%d9%81%d8%aa%d9%87_lda\"><\/span>\u062a\u062e\u0635\u06cc\u0635 \u062f\u06cc\u0631\u06cc\u06a9\u0644\u0647 \u0646\u0647\u0641\u062a\u0647 (LDA)<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>LDA \u0628\u0631 \u062f\u0648 \u0641\u0631\u0636 \u06a9\u0644\u06cc \u0627\u0633\u062a\u0648\u0627\u0631 \u0627\u0633\u062a:<\/p>\n<ul>\n<li>\u0627\u0633\u0646\u0627\u062f\u06cc \u06a9\u0647 \u062f\u0627\u0631\u0627\u06cc \u06a9\u0644\u0645\u0627\u062a \u0645\u0634\u0627\u0628\u0647 \u0647\u0633\u062a\u0646\u062f \u0645\u0639\u0645\u0648\u0644\u0627\u064b \u0645\u0648\u0636\u0648\u0639 \u06cc\u06a9\u0633\u0627\u0646\u06cc \u062f\u0627\u0631\u0646\u062f<\/li>\n<li>\u0627\u0633\u0646\u0627\u062f\u06cc \u06a9\u0647 \u062f\u0627\u0631\u0627\u06cc \u06af\u0631\u0648\u0647\u200c\u0647\u0627\u06cc\u06cc \u0627\u0632 \u06a9\u0644\u0645\u0627\u062a \u0647\u0633\u062a\u0646\u062f \u06a9\u0647 \u0627\u063a\u0644\u0628 \u062f\u0631 \u06a9\u0646\u0627\u0631 \u0647\u0645 \u0642\u0631\u0627\u0631 \u0645\u06cc\u200c\u06af\u06cc\u0631\u0646\u062f\u060c \u0645\u0639\u0645\u0648\u0644\u0627\u064b 
\u0645\u0648\u0636\u0648\u0639 \u06cc\u06a9\u0633\u0627\u0646\u06cc \u062f\u0627\u0631\u0646\u062f.<\/li>\n<\/ul>\n<p>\u0627\u06cc\u0646 \u0645\u0641\u0631\u0648\u0636\u0627\u062a \u0645\u0646\u0637\u0642\u06cc \u0647\u0633\u062a\u0646\u062f \u0632\u06cc\u0631\u0627 \u0627\u0633\u0646\u0627\u062f\u06cc \u06a9\u0647 \u0645\u0648\u0636\u0648\u0639 \u06cc\u06a9\u0633\u0627\u0646\u06cc \u062f\u0627\u0631\u0646\u062f\u060c \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u0645\u0648\u0636\u0648\u0639\u0627\u062a \u062a\u062c\u0627\u0631\u06cc \u062f\u0627\u0631\u0627\u06cc \u06a9\u0644\u0645\u0627\u062a\u06cc \u0645\u0627\u0646\u0646\u062f &#8220;\u0627\u0642\u062a\u0635\u0627\u062f&#8221;\u060c &#8220;\u0633\u0648\u062f&#8221;\u060c &#8220;\u0628\u0627\u0632\u0627\u0631 \u0633\u0647\u0627\u0645&#8221;\u060c &#8220;\u0632\u06cc\u0627\u0646&#8221; \u0648 \u063a\u06cc\u0631\u0647 \u062e\u0648\u0627\u0647\u0646\u062f \u0628\u0648\u062f. \u0641\u0631\u0636 \u062f\u0648\u0645 \u0628\u06cc\u0627\u0646 \u0645\u06cc \u06a9\u0646\u062f \u06a9\u0647 \u0627\u06af\u0631 \u0627\u06cc\u0646 \u0645\u0648\u0627\u0631\u062f \u06a9\u0644\u0645\u0627\u062a \u0627\u063a\u0644\u0628 \u0628\u0627 \u0647\u0645 \u062f\u0631 \u0686\u0646\u062f\u06cc\u0646 \u0633\u0646\u062f \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u0646\u062f\u060c \u0622\u0646 \u0627\u0633\u0646\u0627\u062f \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u0645\u062a\u0639\u0644\u0642 \u0628\u0647 \u06cc\u06a9 \u062f\u0633\u062a\u0647 \u0628\u0627\u0634\u0646\u062f.<\/p>\n<p>\u0627\u0632 \u0646\u0638\u0631 \u0631\u06cc\u0627\u0636\u06cc\u060c \u062f\u0648 \u0641\u0631\u0636 \u0628\u0627\u0644\u0627 \u0631\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0628\u0647 \u0635\u0648\u0631\u062a \u0632\u06cc\u0631 \u0646\u0634\u0627\u0646 \u062f\u0627\u062f:<\/p>\n<ul>\n<li>\u0627\u0633\u0646\u0627\u062f \u062a\u0648\u0632\u06cc\u0639 \u0627\u062d\u062a\u0645\u0627\u0644 \u0628\u0631 \u0631\u0648\u06cc 
\u0645\u0648\u0636\u0648\u0639\u0627\u062a \u067e\u0646\u0647\u0627\u0646 \u0647\u0633\u062a\u0646\u062f<\/li>\n<li>\u0645\u0648\u0636\u0648\u0639\u0627\u062a \u062a\u0648\u0632\u06cc\u0639 \u0627\u062d\u062a\u0645\u0627\u0644 \u0628\u0631 \u0631\u0648\u06cc \u06a9\u0644\u0645\u0627\u062a \u0647\u0633\u062a\u0646\u062f<\/li>\n<\/ul>\n<h3 id=\"ldafortopicmodelinginpython\"><span class=\"ez-toc-section\" id=\"lda_%d8%a8%d8%b1%d8%a7%db%8c_%d9%85%d8%af%d9%84_%d8%b3%d8%a7%d8%b2%db%8c_%d9%85%d9%88%d8%b6%d9%88%d8%b9_%d8%af%d8%b1_%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86\"><\/span>LDA \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u062f\u0631 \u0627\u06cc\u0646 \u0628\u062e\u0634 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc LDA \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.  \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/www.kaggle.com\/sdxingaijing\/topic-model-lda-algorithm\/data\">\u06a9\u0627\u06af\u0644<\/a> \u062f\u0627\u0646\u0644\u0648\u062f \u06a9\u0631\u062f.<\/p>\n<p>\u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0634\u0627\u0645\u0644 \u0646\u0638\u0631\u0627\u062a \u06a9\u0627\u0631\u0628\u0631\u0627\u0646 \u0628\u0631\u0627\u06cc \u0645\u062d\u0635\u0648\u0644\u0627\u062a \u0645\u062e\u062a\u0644\u0641 \u062f\u0631 \u062f\u0633\u062a\u0647 \u0645\u0648\u0627\u062f \u063a\u0630\u0627\u06cc\u06cc \u0627\u0633\u062a.  
\u0645\u0627 \u0627\u0632 LDA \u0628\u0631\u0627\u06cc \u06af\u0631\u0648\u0647 \u0628\u0646\u062f\u06cc \u0646\u0638\u0631\u0627\u062a \u06a9\u0627\u0631\u0628\u0631\u0627\u0646 \u062f\u0631 5 \u062f\u0633\u062a\u0647 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u0627\u0648\u0644\u06cc\u0646 \u0642\u062f\u0645\u060c \u0645\u062b\u0644 \u0647\u0645\u06cc\u0634\u0647\u060c \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 import \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0628\u0647 \u0647\u0645\u0631\u0627\u0647 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632  \u0628\u0631\u0627\u06cc \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> pandas <span class=\"hljs-keyword\">as<\/span> pd\n<span class=\"hljs-keyword\">import<\/span> numpy <span class=\"hljs-keyword\">as<\/span> np\n\nreviews_datasets = pd.read_csv(<span class=\"hljs-string\">r'E:\\Datasets\\Reviews.csv'<\/span>)\nreviews_datasets = reviews_datasets.head(<span class=\"hljs-number\">20000<\/span>)\nreviews_datasets.dropna()\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0645\u0627 import \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 <code>read_csv<\/code> \u0631\u0648\u0634 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u067e\u0627\u0646\u062f\u0627\u0647\u0627  \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0627\u0635\u0644\u06cc \u0634\u0627\u0645\u0644 \u062d\u062f\u0648\u062f 500 \u0647\u0632\u0627\u0631 \u0628\u0631\u0631\u0633\u06cc \u0627\u0633\u062a.  
\u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u0628\u0647 \u062f\u0644\u06cc\u0644 \u0645\u062d\u062f\u0648\u062f\u06cc\u062a \u062d\u0627\u0641\u0638\u0647\u060c \u0645\u0646 \u0641\u0642\u0637 LDA \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u062e\u0648\u0627\u0647\u0645 \u062f\u0627\u062f \u0631\u0648\u06cc 20 \u0647\u0632\u0627\u0631 \u0631\u06a9\u0648\u0631\u062f \u0627\u0648\u0644  \u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0645\u0627 20 \u0647\u0632\u0627\u0631 \u0631\u062f\u06cc\u0641 \u0627\u0648\u0644 \u0631\u0627 \u0641\u06cc\u0644\u062a\u0631 \u06a9\u0631\u062f\u0647 \u0648 \u0633\u067e\u0633 \u0645\u0642\u0627\u062f\u06cc\u0631 null \u0631\u0627 \u0627\u0632 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u062d\u0630\u0641 \u0645\u06cc \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u0628\u0639\u062f\u060c \u0645\u0627 print \u067e\u0646\u062c \u0631\u062f\u06cc\u0641 \u0627\u0648\u0644 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 <code>head()<\/code> \u0639\u0645\u0644\u06a9\u0631\u062f \u0628\u0627\u0632\u0631\u0633\u06cc \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u0627:<\/p>\n<pre><code class=\"hljs\">reviews_datasets.head()\n<\/code><\/pre>\n<p>\u062f\u0631 \u062e\u0631\u0648\u062c\u06cc \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0632\u06cc\u0631 \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u062f \u06a9\u0631\u062f:<\/p>\n<p><img decoding=\"async\" class=\"img-responsive\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/python-nlp-topic-modeling-1.png\" alt=\"\" title=\"\"><\/p>\n<p>\u0645\u0627 LDA \u0631\u0627 \u0627\u0639\u0645\u0627\u0644 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f \u0631\u0648\u06cc \u0633\u062a\u0648\u0646 &#8220;\u0645\u062a\u0646&#8221; \u0627\u0632 \u0622\u0646\u062c\u0627\u06cc\u06cc \u06a9\u0647 
\u062d\u0627\u0648\u06cc \u0646\u0638\u0631\u0627\u062a \u0627\u0633\u062a\u060c \u0628\u0642\u06cc\u0647 \u0633\u062a\u0648\u0646 \u0647\u0627 \u0646\u0627\u062f\u06cc\u062f\u0647 \u06af\u0631\u0641\u062a\u0647 \u0645\u06cc \u0634\u0648\u0646\u062f.<\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0631\u0631\u0633\u06cc \u0634\u0645\u0627\u0631\u0647 350 \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u0645.<\/p>\n<pre><code class=\"hljs\">reviews_datasets[<span class=\"hljs-string\">'Text'<\/span>][<span class=\"hljs-number\">350<\/span>]\n<\/code><\/pre>\n<p>\u062f\u0631 \u062e\u0631\u0648\u062c\u06cc\u060c \u0645\u062a\u0646 \u0628\u0631\u0631\u0633\u06cc \u0632\u06cc\u0631 \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u062f \u06a9\u0631\u062f:<\/p>\n<pre><code class=\"hljs\">'These chocolate covered espresso beans are wonderful!  The chocolate is very dark and rich and the \"bean\" inside is a very delightful blend of flavors with just enough caffine to really give it a zing.'\n<\/code><\/pre>\n<p>\u0642\u0628\u0644 \u0627\u0632 \u0627\u06cc\u0646\u06a9\u0647 \u0628\u062a\u0648\u0627\u0646\u06cc\u0645 LDA \u0631\u0627 \u0627\u0639\u0645\u0627\u0644 \u06a9\u0646\u06cc\u0645\u060c \u0628\u0627\u06cc\u062f \u0648\u0627\u0698\u06af\u0627\u0646\u06cc \u0627\u0632 \u062a\u0645\u0627\u0645 \u06a9\u0644\u0645\u0627\u062a \u0645\u0648\u062c\u0648\u062f \u062f\u0631 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062e\u0648\u062f \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645.  \u0627\u0632 \u0645\u0642\u0627\u0644\u0647 \u0642\u0628\u0644\u06cc \u0628\u0647 \u06cc\u0627\u062f \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f\u060c \u0645\u0627 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0631\u0627 \u0628\u0627 \u06a9\u0645\u06a9 \u0628\u0631\u062f\u0627\u0631 \u0634\u0645\u0627\u0631\u0634 \u0627\u0646\u062c\u0627\u0645 \u062f\u0647\u06cc\u0645.  
\u0628\u0647 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">from<\/span> sklearn.feature_extraction.text <span class=\"hljs-keyword\">import<\/span> CountVectorizer\n\ncount_vect = CountVectorizer(max_df=<span class=\"hljs-number\">0.8<\/span>, min_df=<span class=\"hljs-number\">2<\/span>, stop_words=<span class=\"hljs-string\">'english'<\/span>)\ndoc_term_matrix = count_vect.fit_transform(reviews_datasets[<span class=\"hljs-string\">'Text'<\/span>].values.astype(<span class=\"hljs-string\">'U'<\/span>))\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0645\u0627 \u0627\u0632 <code>CountVectorizer<\/code> \u06a9\u0644\u0627\u0633 \u0627\u0632 <code>sklearn.feature_extraction.text<\/code> \u0645\u0627\u0698\u0648\u0644 \u0628\u0631\u0627\u06cc \u0627\u06cc\u062c\u0627\u062f \u06cc\u06a9 \u0645\u0627\u062a\u0631\u06cc\u0633 \u0633\u0646\u062f-\u062a\u0631\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645.  \u0645\u0627 \u0645\u0634\u062e\u0635 \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u06a9\u0647 \u0641\u0642\u0637 \u06a9\u0644\u0645\u0627\u062a\u06cc \u0631\u0627 \u06a9\u0647 \u062f\u0631 \u06a9\u0645\u062a\u0631 \u0627\u0632 80\u066a \u0633\u0646\u062f \u0638\u0627\u0647\u0631 \u0645\u06cc \u0634\u0648\u0646\u062f \u0648 \u062d\u062f\u0627\u0642\u0644 \u062f\u0631 2 \u0633\u0646\u062f \u0638\u0627\u0647\u0631 \u0645\u06cc \u0634\u0648\u0646\u062f \u0634\u0627\u0645\u0644 \u0634\u0648\u062f.  
\u0645\u0627 \u0647\u0645\u0686\u0646\u06cc\u0646 \u062a\u0645\u0627\u0645 \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641 \u0631\u0627 \u062d\u0630\u0641 \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u0632\u06cc\u0631\u0627 \u0622\u0646\u0647\u0627 \u0648\u0627\u0642\u0639\u0627\u064b \u0628\u0647 \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u06a9\u0645\u06a9 \u0646\u0645\u06cc \u06a9\u0646\u0646\u062f.<\/p>\n<p>\u062d\u0627\u0644\u0627 \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0647 \u0645\u0627\u062a\u0631\u06cc\u0633 \u0627\u0635\u0637\u0644\u0627\u062d \u0633\u0646\u062f \u062e\u0648\u062f \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">doc_term_matrix\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc:<\/p>\n<pre><code class=\"hljs\">&lt;20000x14546 sparse matrix of type '&lt;class 'numpy.int64'&gt;'\nwith 594703 stored elements in Compressed Sparse Row format&gt;\n<\/code><\/pre>\n<p>\u0647\u0631 \u06cc\u06a9 \u0627\u0632 20 \u0647\u0632\u0627\u0631 \u0633\u0646\u062f \u0628\u0647 \u0635\u0648\u0631\u062a \u0628\u0631\u062f\u0627\u0631 14546 \u0628\u0639\u062f\u06cc \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f\u060c \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0639\u0646\u06cc \u06a9\u0647 \u0648\u0627\u0698\u06af\u0627\u0646 \u0645\u0627 \u062f\u0627\u0631\u0627\u06cc 14546 \u06a9\u0644\u0645\u0647 \u0627\u0633\u062a.<\/p>\n<p>\u062f\u0631 \u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u060c \u0627\u0632 LDA \u0628\u0631\u0627\u06cc \u0627\u06cc\u062c\u0627\u062f \u0645\u0648\u0636\u0648\u0639\u0627\u062a \u0628\u0647 \u0647\u0645\u0631\u0627\u0647 \u062a\u0648\u0632\u06cc\u0639 \u0627\u062d\u062a\u0645\u0627\u0644 \u0628\u0631\u0627\u06cc \u0647\u0631 \u06a9\u0644\u0645\u0647 \u062f\u0631 \u0648\u0627\u0698\u06af\u0627\u0646 \u062e\u0648\u062f \u0628\u0631\u0627\u06cc \u0647\u0631 \u0645\u0648\u0636\u0648\u0639 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 
\u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.  \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">from<\/span> sklearn.decomposition <span class=\"hljs-keyword\">import<\/span> LatentDirichletAllocation\n\nLDA = LatentDirichletAllocation(n_components=<span class=\"hljs-number\">5<\/span>, random_state=<span class=\"hljs-number\">42<\/span>)\nLDA.fit(doc_term_matrix)\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0645\u0627 \u0627\u0632 <code>LatentDirichletAllocation<\/code> \u06a9\u0644\u0627\u0633 \u0627\u0632 <code>sklearn.decomposition<\/code> \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 LDA \u0631\u0648\u06cc \u0645\u0627\u062a\u0631\u06cc\u0633 \u0633\u0646\u062f &#8211; \u0645\u062f\u062a \u0645\u0627  \u067e\u0627\u0631\u0627\u0645\u062a\u0631 <code>n_components<\/code> \u062a\u0639\u062f\u0627\u062f \u062f\u0633\u062a\u0647 \u0647\u0627 \u06cc\u0627 \u0645\u0648\u0636\u0648\u0639\u0627\u062a\u06cc \u0631\u0627 \u0645\u0634\u062e\u0635 \u0645\u06cc \u06a9\u0646\u062f \u06a9\u0647 \u0645\u06cc \u062e\u0648\u0627\u0647\u06cc\u0645 \u0645\u062a\u0646 \u0645\u0627 \u0628\u0647 \u0622\u0646\u0647\u0627 \u062a\u0642\u0633\u06cc\u0645 \u0634\u0648\u062f.  
\u067e\u0627\u0631\u0627\u0645\u062a\u0631 <code>random_state<\/code> (\u0645\u0639\u0631\u0648\u0641 \u0628\u0647 <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Random_seed\">\u062f\u0627\u0646\u0647<\/a>) \u0631\u0648\u06cc 42 \u062a\u0646\u0638\u06cc\u0645 \u0634\u062f\u0647 \u0627\u0633\u062a \u062a\u0627 \u0646\u062a\u0627\u06cc\u062c\u06cc \u0645\u0634\u0627\u0628\u0647 \u0645\u0646 \u0628\u062f\u0633\u062a \u0622\u0648\u0631\u06cc\u062f.<\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0647 \u0637\u0648\u0631 \u062a\u0635\u0627\u062f\u0641\u06cc \u06a9\u0644\u0645\u0627\u062a \u0631\u0627 \u0627\u0632 \u062f\u0627\u06cc\u0631\u0647 \u0644\u063a\u0627\u062a \u062e\u0648\u062f \u0628\u06cc\u0627\u0648\u0631\u06cc\u0645.  \u0645\u06cc \u062f\u0627\u0646\u06cc\u0645 \u06a9\u0647 count vectorizer \u062a\u0645\u0627\u0645 \u06a9\u0644\u0645\u0627\u062a \u0645\u0648\u062c\u0648\u062f \u062f\u0631 \u0648\u0627\u0698\u06af\u0627\u0646 \u0645\u0627 \u0631\u0627 \u0634\u0627\u0645\u0644 \u0645\u06cc \u0634\u0648\u062f.  
\u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645 <code>get_feature_names()<\/code> \u0631\u0648\u0634 \u0648 \u0634\u0646\u0627\u0633\u0647 \u06a9\u0644\u0645\u0647 \u0627\u06cc \u0631\u0627 \u06a9\u0647 \u0645\u06cc \u062e\u0648\u0627\u0647\u06cc\u0645 \u0648\u0627\u06a9\u0634\u06cc \u06a9\u0646\u06cc\u0645 \u0628\u0647 \u0622\u0646 \u0627\u0631\u0633\u0627\u0644 \u06a9\u0646\u06cc\u062f.<\/p>\n<p>\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0628\u0647 \u0637\u0648\u0631 \u062a\u0635\u0627\u062f\u0641\u06cc 10 \u06a9\u0644\u0645\u0647 \u0631\u0627 \u0627\u0632 \u0648\u0627\u0698\u06af\u0627\u0646 \u0645\u0627 \u0645\u06cc \u0622\u0648\u0631\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> random\n\n<span class=\"hljs-keyword\">for<\/span> i <span class=\"hljs-keyword\">in<\/span> <span class=\"hljs-built_in\">range<\/span>(<span class=\"hljs-number\">10<\/span>):\n    random_id = random.randint(<span class=\"hljs-number\">0<\/span>,<span class=\"hljs-built_in\">len<\/span>(count_vect.get_feature_names()))\n    <span class=\"hljs-built_in\">print<\/span>(count_vect.get_feature_names()[random_id])\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">bribe\ntarragon\nqualifies\nprepare\nhangs\nnoted\nchurning\nbreeds\nzon\nchunkier\n<\/code><\/pre>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f 10 \u06a9\u0644\u0645\u0647 \u0628\u0627 \u0628\u06cc\u0634\u062a\u0631\u06cc\u0646 \u0627\u062d\u062a\u0645\u0627\u0644 \u0628\u0631\u0627\u06cc \u0645\u0648\u0636\u0648\u0639 \u0627\u0648\u0644 \u067e\u06cc\u062f\u0627 \u06a9\u0646\u06cc\u0645.  
\u0628\u0631\u0627\u06cc \u062f\u0631\u06cc\u0627\u0641\u062a \u0645\u0648\u0636\u0648\u0639 \u0627\u0648\u0644 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0632 <code>components_<\/code> \u0648\u06cc\u0698\u06af\u06cc \u0648 \u06cc\u06a9 \u0634\u0627\u062e\u0635 0 \u0631\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u0642\u062f\u0627\u0631 \u0627\u0631\u0633\u0627\u0644 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">first_topic = LDA.components_[<span class=\"hljs-number\">0<\/span>]\n<\/code><\/pre>\n<p>\u0645\u0628\u062d\u062b \u0627\u0648\u0644 \u0634\u0627\u0645\u0644 \u0627\u062d\u062a\u0645\u0627\u0644\u0627\u062a 14546 \u06a9\u0644\u0645\u0647 \u0628\u0631\u0627\u06cc \u0645\u0628\u062d\u062b 1 \u0627\u0633\u062a. \u0628\u0631\u0627\u06cc \u0645\u0631\u062a\u0628 \u0633\u0627\u0632\u06cc \u0634\u0627\u062e\u0635 \u0647\u0627 \u0628\u0631 \u0627\u0633\u0627\u0633 \u0645\u0642\u0627\u062f\u06cc\u0631 \u0627\u062d\u062a\u0645\u0627\u0644\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0632 <code>argsort()<\/code> \u062a\u0627\u0628\u0639 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645.  \u067e\u0633 \u0627\u0632 \u0645\u0631\u062a\u0628 \u0633\u0627\u0632\u06cc\u060c 10 \u06a9\u0644\u0645\u0647 \u0628\u0627 \u0628\u0627\u0644\u0627\u062a\u0631\u06cc\u0646 \u0627\u062d\u062a\u0645\u0627\u0644 \u0627\u06a9\u0646\u0648\u0646 \u0628\u0647 10 \u0646\u0645\u0627\u06cc\u0647 \u0622\u062e\u0631 \u0622\u0631\u0627\u06cc\u0647 \u062a\u0639\u0644\u0642 \u062f\u0627\u0631\u0646\u062f.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u0645\u0627\u06cc\u0647 \u0647\u0627\u06cc 10 \u06a9\u0644\u0645\u0647 \u0628\u0627 \u0628\u06cc\u0634\u062a\u0631\u06cc\u0646 \u0627\u062d\u062a\u0645\u0627\u0644 \u0631\u0627 \u0628\u0631\u0645\u06cc \u06af\u0631\u062f\u0627\u0646\u062f:<\/p>\n<pre><code class=\"hljs\">top_topic_words = first_topic.argsort()[-<span class=\"hljs-number\">10<\/span>:]\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc:<\/p>\n<pre><code class=\"hljs\">array([14106,  5892,  7088,  4290, 12596,  5771,  5187, 12888,  7498,\n       12921], dtype=int64)\n<\/code><\/pre>\n<p>\u0633\u067e\u0633 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 \u0627\u06cc\u0646 \u0634\u0627\u062e\u0635 \u0647\u0627 \u0628\u0631\u0627\u06cc \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0627\u0631\u0632\u0634 \u06a9\u0644\u0645\u0627\u062a \u0627\u0632 \u0642\u0633\u0645\u062a \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f <code>count_vect<\/code> \u0634\u06cc\u060c \u06a9\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0628\u0647 \u0635\u0648\u0631\u062a \u0632\u06cc\u0631 \u0627\u0646\u062c\u0627\u0645 \u0634\u0648\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">for<\/span> i <span class=\"hljs-keyword\">in<\/span> top_topic_words:\n    <span class=\"hljs-built_in\">print<\/span>(count_vect.get_feature_names()[i])\n<\/code><\/pre>\n<p>\u062f\u0631 \u062e\u0631\u0648\u062c\u06cc \u0628\u0627\u06cc\u062f \u06a9\u0644\u0645\u0627\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">water\ngreat\njust\ndrink\nsugar\ngood\nflavor\ntaste\nlike\ntea\n<\/code><\/pre>\n<p>\u06a9\u0644\u0645\u0627\u062a \u0646\u0634\u0627\u0646 \u0645\u06cc \u062f\u0647\u0646\u062f \u06a9\u0647 \u0627\u0648\u0644\u06cc\u0646 \u0645\u0648\u0636\u0648\u0639 \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u062f\u0631 \u0645\u0648\u0631\u062f \u0686\u0627\u06cc 
\u0628\u0627\u0634\u062f.<\/p>\n<p>\u0627\u062c\u0627\u0632\u0647 \u062f\u0647\u06cc\u062f print 10 \u06a9\u0644\u0645\u0647 \u0628\u0627 \u0628\u06cc\u0634\u062a\u0631\u06cc\u0646 \u0627\u062d\u062a\u0645\u0627\u0644 \u0628\u0631\u0627\u06cc \u0647\u0631 \u067e\u0646\u062c \u0645\u0648\u0636\u0648\u0639:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">for<\/span> i,topic <span class=\"hljs-keyword\">in<\/span> <span class=\"hljs-built_in\">enumerate<\/span>(LDA.components_):\n    <span class=\"hljs-built_in\">print<\/span>(<span class=\"hljs-string\">f'Top 10 words for topic #<span class=\"hljs-subst\">{i}<\/span>:'<\/span>)\n    <span class=\"hljs-built_in\">print<\/span>([count_vect.get_feature_names()[i] <span class=\"hljs-keyword\">for<\/span> i <span class=\"hljs-keyword\">in<\/span> topic.argsort()[-<span class=\"hljs-number\">10<\/span>:]])\n    <span class=\"hljs-built_in\">print<\/span>(<span class=\"hljs-string\">'\\n'<\/span>)\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">Top 10 words for topic #0:\n['water', 'great', 'just', 'drink', 'sugar', 'good', 'flavor', 'taste', 'like', 'tea']\n\n\nTop 10 words for topic #1:\n['br', 'chips', 'love', 'flavor', 'chocolate', 'just', 'great', 'taste', 'good', 'like']\n\n\nTop 10 words for topic #2:\n['just', 'drink', 'orange', 'sugar', 'soda', 'water', 'like', 'juice', 'product', 'br']\n\n\nTop 10 words for topic #3:\n['gluten', 'eat', 'free', 'product', 'like', 'dogs', 'treats', 'dog', 'br', 'food']\n\n\nTop 10 words for topic #4:\n['cups', 'price', 'great', 'like', 'amazon', 'good', 'br', 'product', 'cup', 'coffee']\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0646\u0634\u0627\u0646 \u0645\u06cc\u200c\u062f\u0647\u062f \u06a9\u0647 \u0645\u0628\u062d\u062b \u062f\u0648\u0645 \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u062d\u0627\u0648\u06cc \u0646\u0638\u0631\u0627\u062a\u06cc 
\u062f\u0631\u0628\u0627\u0631\u0647 \u0634\u06a9\u0644\u0627\u062a\u200c\u0647\u0627 \u0648 \u063a\u06cc\u0631\u0647 \u0628\u0627\u0634\u062f.  \u0645\u06cc \u0628\u06cc\u0646\u06cc\u062f \u06a9\u0647 \u0686\u0646\u062f \u06a9\u0644\u0645\u0647 \u0631\u0627\u06cc\u062c \u062f\u0631 \u0647\u0645\u0647 \u062f\u0633\u062a\u0647 \u0647\u0627 \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f.  \u0627\u06cc\u0646 \u0628\u0647 \u0627\u06cc\u0646 \u062f\u0644\u06cc\u0644 \u0627\u0633\u062a \u06a9\u0647 \u06a9\u0644\u0645\u0627\u062a \u06a9\u0645\u06cc \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f \u06a9\u0647 \u062a\u0642\u0631\u06cc\u0628\u0627\u064b \u0628\u0631\u0627\u06cc \u0647\u0645\u0647 \u0645\u0648\u0636\u0648\u0639\u0627\u062a \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f.  \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644 &#8220;\u062e\u0648\u0628&#8221;\u060c &#8220;\u0639\u0627\u0644\u06cc&#8221;\u060c &#8220;\u0645\u0627\u0646\u0646\u062f&#8221; \u0648 \u063a\u06cc\u0631\u0647.<\/p>\n<p>\u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0622\u062e\u0631\u06cc\u0646 \u0645\u0631\u062d\u0644\u0647\u060c \u06cc\u06a9 \u0633\u062a\u0648\u0646 \u0628\u0647 \u0642\u0627\u0628 \u062f\u0627\u062f\u0647 \u0627\u0635\u0644\u06cc \u0627\u0636\u0627\u0641\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u06a9\u0647 \u0645\u0648\u0636\u0648\u0639 \u0631\u0627 \u0628\u0631\u0627\u06cc \u0645\u062a\u0646 \u0630\u062e\u06cc\u0631\u0647 \u0645\u06cc \u06a9\u0646\u062f.  \u0628\u0631\u0627\u06cc \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645 <code>LDA.transform()<\/code> \u0631\u0648\u0634 \u0648 \u0645\u0627\u062a\u0631\u06cc\u0633 \u0633\u0646\u062f-\u062a\u0631\u0645 \u062e\u0648\u062f \u0631\u0627 \u0627\u0631\u0633\u0627\u0644 \u06a9\u0646\u06cc\u062f.  
\u0627\u06cc\u0646 \u0631\u0648\u0634 \u0627\u062d\u062a\u0645\u0627\u0644 \u062a\u0645\u0627\u0645 \u0645\u0648\u0636\u0648\u0639\u0627\u062a \u0631\u0627 \u0628\u0647 \u0647\u0631 \u0633\u0646\u062f \u0627\u062e\u062a\u0635\u0627\u0635 \u0645\u06cc \u062f\u0647\u062f.  \u0628\u0647 \u06a9\u062f \u0632\u06cc\u0631 \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">topic_values = LDA.transform(doc_term_matrix)\ntopic_values.shape\n<\/code><\/pre>\n<p>\u062f\u0631 \u062e\u0631\u0648\u062c\u06cc\u060c (20000\u060c 5) \u0631\u0627 \u062e\u0648\u0627\u0647\u06cc\u062f \u062f\u06cc\u062f \u06a9\u0647 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0639\u0646\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0647\u0631 \u06cc\u06a9 \u0627\u0632 \u0633\u0646\u062f \u062f\u0627\u0631\u0627\u06cc 5 \u0633\u062a\u0648\u0646 \u0627\u0633\u062a \u06a9\u0647 \u0647\u0631 \u0633\u062a\u0648\u0646 \u0628\u0627 \u0645\u0642\u062f\u0627\u0631 \u0627\u062d\u062a\u0645\u0627\u0644 \u06cc\u06a9 \u0645\u0648\u0636\u0648\u0639 \u062e\u0627\u0635 \u0645\u0637\u0627\u0628\u0642\u062a \u062f\u0627\u0631\u062f.  
\u0628\u0631\u0627\u06cc \u067e\u06cc\u062f\u0627 \u06a9\u0631\u062f\u0646 \u0634\u0627\u062e\u0635 \u0645\u0648\u0636\u0648\u0639 \u0628\u0627 \u062d\u062f\u0627\u06a9\u062b\u0631 \u0645\u0642\u062f\u0627\u0631\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0622\u0646 \u0631\u0627 \u0641\u0631\u0627\u062e\u0648\u0627\u0646\u06cc \u06a9\u0646\u06cc\u0645 <code>argmax()<\/code> \u0631\u0648\u0634 \u0648 \u0639\u062f\u062f 1 \u0631\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u0642\u062f\u0627\u0631 \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u0645\u062d\u0648\u0631 \u0627\u0631\u0633\u0627\u0644 \u06a9\u0646\u06cc\u062f.<\/p>\n<p>\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u06cc\u06a9 \u0633\u062a\u0648\u0646 \u062c\u062f\u06cc\u062f \u0628\u0631\u0627\u06cc \u0645\u0648\u0636\u0648\u0639 \u062f\u0631 \u0642\u0627\u0628 \u062f\u0627\u062f\u0647 \u0627\u0636\u0627\u0641\u0647 \u0645\u06cc \u06a9\u0646\u062f \u0648 \u0645\u0642\u062f\u0627\u0631 \u0645\u0648\u0636\u0648\u0639 \u0631\u0627 \u0628\u0647 \u0647\u0631 \u0633\u0637\u0631 \u062f\u0631 \u0633\u062a\u0648\u0646 \u0627\u062e\u062a\u0635\u0627\u0635 \u0645\u06cc \u062f\u0647\u062f:<\/p>\n<pre><code class=\"hljs\">reviews_datasets[<span class=\"hljs-string\">'Topic'<\/span>] = topic_values.argmax(axis=<span class=\"hljs-number\">1<\/span>)\n<\/code><\/pre>\n<p>\u062d\u0627\u0644 \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0628\u06cc\u0646\u06cc\u0645 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0686\u06af\u0648\u0646\u0647 \u0628\u0647 \u0646\u0638\u0631 \u0645\u06cc \u0631\u0633\u062f:<\/p>\n<pre><code class=\"hljs\">reviews_datasets.head()\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc:<\/p>\n<p><img decoding=\"async\" class=\"img-responsive\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/python-nlp-topic-modeling-2.png\" alt=\"\" title=\"\"><\/p>\n<p>\u0634\u0645\u0627 \u0645\u06cc 
\u062a\u0648\u0627\u0646\u06cc\u062f \u06cc\u06a9 \u0633\u062a\u0648\u0646 \u062c\u062f\u06cc\u062f \u0628\u0631\u0627\u06cc \u0645\u0648\u0636\u0648\u0639 \u062f\u0631 \u062e\u0631\u0648\u062c\u06cc \u0628\u0628\u06cc\u0646\u06cc\u062f.<\/p>\n<h2 id=\"nonnegativematrixfactorizationnmf\"><span class=\"ez-toc-section\" id=\"%d9%81%d8%a7%da%a9%d8%aa%d9%88%d8%b1%d8%b3%d8%a7%d8%b2%db%8c_%d9%85%d8%a7%d8%aa%d8%b1%db%8c%d8%b3_%d8%ba%db%8c%d8%b1_%d9%85%d9%86%d9%81%db%8c_nmf\"><\/span>\u0641\u0627\u06a9\u062a\u0648\u0631\u0633\u0627\u0632\u06cc \u0645\u0627\u062a\u0631\u06cc\u0633 \u063a\u06cc\u0631 \u0645\u0646\u0641\u06cc (NMF)<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u062f\u0631 \u0628\u062e\u0634 \u0642\u0628\u0644\u060c \u062f\u06cc\u062f\u06cc\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 LDA \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.  
\u062f\u0631 \u0627\u06cc\u0646 \u0628\u062e\u0634 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 \u0641\u0627\u06a9\u062a\u0648\u0631\u0633\u0627\u0632\u06cc \u0645\u0627\u062a\u0631\u06cc\u0633 \u063a\u06cc\u0631 \u0645\u0646\u0641\u06cc \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.<\/p>\n<p>\u0641\u0627\u06a9\u062a\u0648\u0631\u0633\u0627\u0632\u06cc \u0645\u0627\u062a\u0631\u06cc\u0633 \u063a\u06cc\u0631 \u0645\u0646\u0641\u06cc \u0646\u06cc\u0632 \u06cc\u06a9 \u062a\u06a9\u0646\u06cc\u06a9 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0628\u062f\u0648\u0646 \u0646\u0638\u0627\u0631\u062a \u0627\u0633\u062a \u06a9\u0647 \u062e\u0648\u0634\u0647 \u0628\u0646\u062f\u06cc \u0648 \u0647\u0645\u0686\u0646\u06cc\u0646 \u06a9\u0627\u0647\u0634 \u0627\u0628\u0639\u0627\u062f \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u0645\u06cc \u062f\u0647\u062f.  \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 \u0622\u0646 \u062f\u0631 \u062a\u0631\u06a9\u06cc\u0628 \u0628\u0627 \u0637\u0631\u062d TF-IDF \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.  
\u062f\u0631 \u0627\u06cc\u0646 \u0628\u062e\u0634 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0641\u0627\u06a9\u062a\u0648\u0631\u0633\u0627\u0632\u06cc \u0645\u0627\u062a\u0631\u06cc\u0633 \u063a\u06cc\u0631 \u0645\u0646\u0641\u06cc \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.<\/p>\n<h3 id=\"nmffortopicmodelinginpython\"><span class=\"ez-toc-section\" id=\"nmf_%d8%a8%d8%b1%d8%a7%db%8c_%d9%85%d8%af%d9%84_%d8%b3%d8%a7%d8%b2%db%8c_%d9%85%d9%88%d8%b6%d9%88%d8%b9_%d8%af%d8%b1_%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86\"><\/span>NMF \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u062f\u0631 \u0627\u06cc\u0646 \u0642\u0633\u0645\u062a \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u0645\u06cc \u062f\u0647\u06cc\u0645 \u0631\u0648\u06cc \u0647\u0645\u0627\u0646 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0627\u06cc \u06a9\u0647 \u062f\u0631 \u0628\u062e\u0634 \u0622\u062e\u0631 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f\u06cc\u0645.  
\u062e\u0648\u0627\u0647\u06cc\u062f \u062f\u06cc\u062f \u06a9\u0647 \u0645\u0631\u0627\u062d\u0644 \u0646\u06cc\u0632 \u06a9\u0627\u0645\u0644\u0627 \u0645\u0634\u0627\u0628\u0647 \u0647\u0633\u062a\u0646\u062f.<\/p>\n<p>\u0645\u0627 \u0628\u0627 \u0648\u0627\u0631\u062f \u06a9\u0631\u062f\u0646 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0634\u0631\u0648\u0639 \u0645\u06cc \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> pandas <span class=\"hljs-keyword\">as<\/span> pd\n<span class=\"hljs-keyword\">import<\/span> numpy <span class=\"hljs-keyword\">as<\/span> np\n\nreviews_datasets = pd.read_csv(<span class=\"hljs-string\">r'E:\\Datasets\\Reviews.csv'<\/span>)\nreviews_datasets = reviews_datasets.head(<span class=\"hljs-number\">20000<\/span>)\nreviews_datasets.dropna()\n<\/code><\/pre>\n<p>\u062f\u0631 \u0642\u0633\u0645\u062a \u0642\u0628\u0644 \u0627\u0632 the count vectorizer \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f\u06cc\u0645\u060c \u0627\u0645\u0627 \u062f\u0631 \u0627\u06cc\u0646 \u0628\u062e\u0634 \u0627\u0632 TFIDF vectorizer \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u0632\u06cc\u0631\u0627 NMF \u0628\u0627 TFIDF \u06a9\u0627\u0631 \u0645\u06cc \u06a9\u0646\u062f.  \u0645\u0627 \u06cc\u06a9 \u0645\u0627\u062a\u0631\u06cc\u0633 \u0627\u0635\u0637\u0644\u0627\u062d \u0633\u0646\u062f \u0628\u0627 TFIDF \u0627\u06cc\u062c\u0627\u062f \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.  
\u0628\u0647 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">from<\/span> sklearn.feature_extraction.text <span class=\"hljs-keyword\">import<\/span> TfidfVectorizer\n\ntfidf_vect = TfidfVectorizer(max_df=<span class=\"hljs-number\">0.8<\/span>, min_df=<span class=\"hljs-number\">2<\/span>, stop_words=<span class=\"hljs-string\">'english'<\/span>)\ndoc_term_matrix = tfidf_vect.fit_transform(reviews_datasets[<span class=\"hljs-string\">'Text'<\/span>].values.astype(<span class=\"hljs-string\">'U'<\/span>))\n<\/code><\/pre>\n<p>\u0647\u0646\u06af\u0627\u0645\u06cc \u06a9\u0647 \u0645\u0627\u062a\u0631\u06cc\u0633 \u0627\u0635\u0637\u0644\u0627\u062d \u0633\u0646\u062f \u0627\u06cc\u062c\u0627\u062f \u0634\u062f\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u06cc\u06a9 \u0645\u0627\u062a\u0631\u06cc\u0633 \u0627\u062d\u062a\u0645\u0627\u0644 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645 \u06a9\u0647 \u0634\u0627\u0645\u0644 \u0627\u062d\u062a\u0645\u0627\u0644\u0627\u062a \u0647\u0645\u0647 \u06a9\u0644\u0645\u0627\u062a \u062f\u0631 \u0648\u0627\u0698\u06af\u0627\u0646 \u0628\u0631\u0627\u06cc \u0647\u0645\u0647 \u0645\u0648\u0636\u0648\u0639\u0627\u062a \u0627\u0633\u062a.  \u0628\u0631\u0627\u06cc \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0632 <code>NMF<\/code> \u06a9\u0644\u0627\u0633 \u0627\u0632 <code>sklearn.decomposition<\/code> \u0645\u062f\u0648\u0644.  
\u0628\u0647 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">from<\/span> sklearn.decomposition <span class=\"hljs-keyword\">import<\/span> NMF\n\nnmf = NMF(n_components=<span class=\"hljs-number\">5<\/span>, random_state=<span class=\"hljs-number\">42<\/span>)\nnmf.fit(doc_term_matrix )\n<\/code><\/pre>\n<p>\u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u0631 \u0628\u062e\u0634 \u0642\u0628\u0644 \u0627\u0646\u062c\u0627\u0645 \u062f\u0627\u062f\u06cc\u0645\u060c \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0647 \u0637\u0648\u0631 \u062a\u0635\u0627\u062f\u0641\u06cc 10 \u06a9\u0644\u0645\u0647 \u0627\u0632 \u0648\u0627\u0698\u06af\u0627\u0646 \u062e\u0648\u062f \u0631\u0627 \u0628\u062f\u0633\u062a \u0622\u0648\u0631\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> random\n\n<span class=\"hljs-keyword\">for<\/span> i <span class=\"hljs-keyword\">in<\/span> <span class=\"hljs-built_in\">range<\/span>(<span class=\"hljs-number\">10<\/span>):\n    random_id = random.randint(<span class=\"hljs-number\">0<\/span>,<span class=\"hljs-built_in\">len<\/span>(tfidf_vect.get_feature_names()))\n    <span class=\"hljs-built_in\">print<\/span>(tfidf_vect.get_feature_names()[random_id])\n<\/code><\/pre>\n<p>\u062f\u0631 \u062e\u0631\u0648\u062c\u06cc\u060c \u06a9\u0644\u0645\u0627\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u062f \u06a9\u0631\u062f:<\/p>\n<pre><code class=\"hljs\">safest\npith\nache\nformula\nfussy\nfrontier\nburps\nspeaker\nresponsibility\ndive\n<\/code><\/pre>\n<p>\u062f\u0631 \u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u060c \u0628\u0631\u062f\u0627\u0631 \u0627\u062d\u062a\u0645\u0627\u0644 \u06a9\u0644\u0645\u0627\u062a \u0631\u0627 \u0628\u0631\u0627\u06cc \u0645\u0628\u062d\u062b \u0627\u0648\u0644 
\u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u0648 \u0634\u0627\u062e\u0635 \u0647\u0627\u06cc \u062f\u0647 \u06a9\u0644\u0645\u0647 \u0628\u0627 \u0628\u06cc\u0634\u062a\u0631\u06cc\u0646 \u0627\u062d\u062a\u0645\u0627\u0644 \u0631\u0627 \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">first_topic = nmf.components_[<span class=\"hljs-number\">0<\/span>]\ntop_topic_words = first_topic.argsort()[-<span class=\"hljs-number\">10<\/span>:]\n<\/code><\/pre>\n<p>\u0627\u06a9\u0646\u0648\u0646 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u06cc\u0646 \u0634\u0627\u062e\u0635 \u0647\u0627 \u0631\u0627 \u0628\u0647 <code>tfidf_vect<\/code> \u0628\u0631\u0627\u06cc \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u06a9\u0644\u0645\u0627\u062a \u0648\u0627\u0642\u0639\u06cc \u0627\u0631\u0633\u0627\u0644 \u06a9\u0631\u062f.  \u0628\u0647 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">for<\/span> i <span class=\"hljs-keyword\">in<\/span> top_topic_words:\n    <span class=\"hljs-built_in\">print<\/span>(tfidf_vect.get_feature_names()[i])\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">really\nchocolate\nlove\nflavor\njust\nproduct\ntaste\ngreat\ngood\nlike\n<\/code><\/pre>\n<p>\u06a9\u0644\u0645\u0627\u062a \u0645\u0648\u0636\u0648\u0639 1 \u0646\u0634\u0627\u0646 \u0645\u06cc \u062f\u0647\u062f \u06a9\u0647 \u0645\u0648\u0636\u0648\u0639 1 \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u062d\u0627\u0648\u06cc \u0646\u0638\u0631\u0627\u062a\u06cc \u0628\u0631\u0627\u06cc \u0634\u06a9\u0644\u0627\u062a \u0628\u0627\u0634\u062f.  
\u062d\u0627\u0644\u0627 \u0628\u06cc\u0627\u06cc\u06cc\u062f print \u062f\u0647 \u06a9\u0644\u0645\u0647 \u0628\u0627 \u0628\u06cc\u0634\u062a\u0631\u06cc\u0646 \u0627\u062d\u062a\u0645\u0627\u0644 \u0628\u0631\u0627\u06cc \u0647\u0631 \u06cc\u06a9 \u0627\u0632 \u0645\u0648\u0636\u0648\u0639\u0627\u062a:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">for<\/span> i,topic <span class=\"hljs-keyword\">in<\/span> <span class=\"hljs-built_in\">enumerate<\/span>(nmf.components_):\n    <span class=\"hljs-built_in\">print<\/span>(<span class=\"hljs-string\">f'Top 10 words for topic #<span class=\"hljs-subst\">{i}<\/span>:'<\/span>)\n    <span class=\"hljs-built_in\">print<\/span>([tfidf_vect.get_feature_names()[i] <span class=\"hljs-keyword\">for<\/span> i <span class=\"hljs-keyword\">in<\/span> topic.argsort()[-<span class=\"hljs-number\">10<\/span>:]])\n    <span class=\"hljs-built_in\">print<\/span>(<span class=\"hljs-string\">'\\n'<\/span>)\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">Top 10 words for topic #0:\n['really', 'chocolate', 'love', 'flavor', 'just', 'product', 'taste', 'great', 'good', 'like']\n\n\nTop 10 words for topic #1:\n['like', 'keurig', 'roast', 'flavor', 'blend', 'bold', 'strong', 'cups', 'cup', 'coffee']\n\n\nTop 10 words for topic #2:\n['com', 'amazon', 'orange', 'switch', 'water', 'drink', 'soda', 'sugar', 'juice', 'br']\n\n\nTop 10 words for topic #3:\n['bags', 'flavor', 'drink', 'iced', 'earl', 'loose', 'grey', 'teas', 'green', 'tea']\n\n\nTop 10 words for topic #4:\n['old', 'love', 'cat', 'eat', 'treat', 'loves', 'dogs', 'food', 'treats', 'dog']\n<\/code><\/pre>\n<p>\u06a9\u0644\u0645\u0627\u062a \u0645\u0631\u0628\u0648\u0637 \u0628\u0647 \u0645\u0628\u062d\u062b 1 \u0646\u0634\u0627\u0646 \u0645\u06cc \u062f\u0647\u062f \u06a9\u0647 \u0627\u06cc\u0646 
\u0645\u0648\u0636\u0648\u0639 \u062d\u0627\u0648\u06cc \u0646\u0638\u0631\u0627\u062a\u06cc \u062f\u0631 \u0645\u0648\u0631\u062f \u0642\u0647\u0648\u0647 \u0627\u0633\u062a.  \u0628\u0647 \u0637\u0648\u0631 \u0645\u0634\u0627\u0628\u0647\u060c \u0648\u0627\u0698\u0647\u200c\u0647\u0627\u06cc \u0645\u0628\u062d\u062b 2 \u0646\u0634\u0627\u0646 \u0645\u06cc\u200c\u062f\u0647\u062f \u06a9\u0647 \u062d\u0627\u0648\u06cc \u0646\u0638\u0631\u0627\u062a\u06cc \u062f\u0631\u0628\u0627\u0631\u0647 \u0646\u0648\u0634\u0627\u0628\u0647\u200c\u0647\u0627 \u0648 \u0622\u0628\u0645\u06cc\u0648\u0647\u200c\u0647\u0627 \u0627\u0633\u062a.  \u0645\u0648\u0636\u0648\u0639 3 \u062f\u0648\u0628\u0627\u0631\u0647 \u062d\u0627\u0648\u06cc \u0646\u0638\u0631\u0627\u062a\u06cc \u062f\u0631 \u0645\u0648\u0631\u062f \u0646\u0648\u0634\u06cc\u062f\u0646\u06cc \u0627\u0633\u062a.  \u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0645\u0628\u062d\u062b 4 \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u062d\u0627\u0648\u06cc \u0646\u0638\u0631\u0627\u062a\u06cc \u062f\u0631 \u0645\u0648\u0631\u062f \u063a\u0630\u0627\u06cc \u062d\u06cc\u0648\u0627\u0646\u0627\u062a \u0628\u0627\u0634\u062f \u0632\u06cc\u0631\u0627 \u062d\u0627\u0648\u06cc \u06a9\u0644\u0645\u0627\u062a\u06cc \u0645\u0627\u0646\u0646\u062f &#8220;\u06af\u0631\u0628\u0647&#8221;\u060c &#8220;\u0633\u06af&#8221;\u060c &#8220;\u062a\u0634\u0648\u06cc\u0642\u06cc&#8221; \u0648 \u063a\u06cc\u0631\u0647 \u0627\u0633\u062a.<\/p>\n<p>\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0645\u0648\u0636\u0648\u0639\u0627\u062a \u0631\u0627 \u0628\u0647 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0627\u0636\u0627\u0641\u0647 \u0645\u06cc \u06a9\u0646\u062f \u0648 \u067e\u0646\u062c \u0631\u062f\u06cc\u0641 \u0627\u0648\u0644 \u0631\u0627 \u0646\u0645\u0627\u06cc\u0634 \u0645\u06cc \u062f\u0647\u062f:<\/p>\n<pre><code class=\"hljs\">topic_values = nmf.transform(doc_term_matrix)\nreviews_datasets[<span 
class=\"hljs-string\">'Topic'<\/span>] = topic_values.argmax(axis=<span class=\"hljs-number\">1<\/span>)\nreviews_datasets.head()\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u06a9\u062f \u0628\u0627\u0644\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<p><img decoding=\"async\" class=\"img-responsive\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/python-nlp-topic-modeling-3.png\" alt=\"\" title=\"\"><\/p>\n<p>\u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u0645\u06cc \u0628\u06cc\u0646\u06cc\u062f \u0628\u0647 \u0647\u0631 \u0628\u0631\u0631\u0633\u06cc \u06cc\u06a9 \u0645\u0648\u0636\u0648\u0639 \u0627\u062e\u062a\u0635\u0627\u0635 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a \u06a9\u0647 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0631\u0648\u0634 NMF \u0627\u06cc\u062c\u0627\u062f \u0634\u062f\u0647 \u0627\u0633\u062a.<\/p>\n<h2 id=\"conclusion\"><span class=\"ez-toc-section\" id=\"%d9%86%d8%aa%db%8c%d8%ac%d9%87\"><\/span>\u0646\u062a\u06cc\u062c\u0647<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0645\u062f\u0644\u200c\u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u06cc\u06a9\u06cc \u0627\u0632 \u062d\u0648\u0632\u0647\u200c\u0647\u0627\u06cc \u062a\u062d\u0642\u06cc\u0642\u0627\u062a\u06cc \u0628\u0633\u06cc\u0627\u0631 \u0645\u0648\u0631\u062f \u062a\u0648\u062c\u0647 \u062f\u0631 NLP \u0627\u0633\u062a.  \u0628\u0631\u0627\u06cc \u06af\u0631\u0648\u0647 \u0628\u0646\u062f\u06cc \u062d\u062c\u0645 \u0632\u06cc\u0627\u062f\u06cc \u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u062a\u0646\u06cc \u0628\u062f\u0648\u0646 \u0628\u0631\u0686\u0633\u0628 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f.  
\u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u062f\u0648 \u0631\u0648\u06cc\u06a9\u0631\u062f \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639\u06cc \u062a\u0648\u0636\u06cc\u062d \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a.  \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u062f\u06cc\u062f\u06cc\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 \u062a\u062e\u0635\u06cc\u0635 \u062f\u06cc\u0631\u06cc\u06a9\u0644\u0647 \u0646\u0647\u0641\u062a\u0647 \u0648 \u0641\u0627\u06a9\u062a\u0648\u0631\u0633\u0627\u0632\u06cc \u0645\u0627\u062a\u0631\u06cc\u0633 \u063a\u06cc\u0631 \u0645\u0646\u0641\u06cc \u0628\u0631\u0627\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0628\u0627 \u06a9\u0645\u06a9 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.<\/p>\n<\/div>\n<p><script>\n                        !function(f,b,e,v,n,t,s)\n                        {if(f.fbq)return;n=f.fbq=function(){n.callMethod?\n                        n.callMethod.apply(n,arguments):n.queue.push(arguments)};\n                        if(!f._fbq)f._fbq=n;n.push=n;n.loaded=!0;n.version='2.0';\n                        n.queue=[];t=b.createElement(e);t.async=!0;\n                        t.src=v;s=b.getElementsByTagName(e)[0];\n                        s.parentNode.insertBefore(t,s)}(window, document,'script',\n                        'https:\/\/connect.facebook.net\/en_US\/fbevents.js');\n                        fbq('init', '525232124909042');\n                        fbq('track', 'PageView');\n                    <\/script>    (\u0628\u0631\u0686\u0633\u0628\u200c\u0647\u0627 \u0628\u0647 \u062a\u0631\u062c\u0645\u0647)# python<br \/>\n<br \/><br \/>\n<br \/>\u0645\u0646\u062a\u0634\u0631 
\u0634\u062f\u0647 \u062f\u0631 1403-01-23 18:04:03<br \/>\n<\/p>\n\n\n<div class=\"kk-star-ratings kksr-auto kksr-align-center kksr-valign-bottom\"\n    data-payload='{&quot;align&quot;:&quot;center&quot;,&quot;id&quot;:&quot;16336&quot;,&quot;slug&quot;:&quot;default&quot;,&quot;valign&quot;:&quot;bottom&quot;,&quot;ignore&quot;:&quot;&quot;,&quot;reference&quot;:&quot;auto&quot;,&quot;class&quot;:&quot;&quot;,&quot;count&quot;:&quot;0&quot;,&quot;legendonly&quot;:&quot;&quot;,&quot;readonly&quot;:&quot;&quot;,&quot;score&quot;:&quot;0&quot;,&quot;starsonly&quot;:&quot;&quot;,&quot;best&quot;:&quot;5&quot;,&quot;gap&quot;:&quot;5&quot;,&quot;greet&quot;:&quot;\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628&quot;,&quot;legend&quot;:&quot;0\\\/5 (0 \u0631\u0627\u06cc)&quot;,&quot;size&quot;:&quot;30&quot;,&quot;title&quot;:&quot;\u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP: \u0645\u062f\u0644\u200c\u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639&quot;,&quot;width&quot;:&quot;0&quot;,&quot;_legend&quot;:&quot;{score}\\\/{best} ({count} \u0631\u0627\u06cc)&quot;,&quot;font_factor&quot;:&quot;1.25&quot;}'>\n            \n<div class=\"kksr-stars\">\n    \n<div class=\"kksr-stars-inactive\">\n            <div class=\"kksr-star\" data-star=\"1\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"2\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"3\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"4\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 
30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"5\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n    \n<div class=\"kksr-stars-active\" style=\"width: 0px;\">\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n<\/div>\n                \n\n<div class=\"kksr-legend\" style=\"font-size: 24px;\">\n            <span class=\"kksr-muted\">\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628<\/span>\n    <\/div>\n    <\/div>\n","protected":false},"excerpt":{"rendered":"<p><span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 8<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span>\u0627\u06cc\u0646 \u0634\u0634\u0645\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0632 \u0633\u0631\u06cc \u0645\u0642\u0627\u0644\u0627\u062a 
\u0645\u0646 \u0627\u0633\u062a \u0631\u0648\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP. \u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0642\u0628\u0644\u06cc \u062e\u0648\u062f\u060c \u062f\u0631 \u0645\u0648\u0631\u062f \u0686\u06af\u0648\u0646\u06af\u06cc \u0627\u0646\u062c\u0627\u0645 \u062a\u062c\u0632\u06cc\u0647 \u0648 \u062a\u062d\u0644\u06cc\u0644 \u0627\u062d\u0633\u0627\u0633\u0627\u062a \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062a\u0648\u06cc\u06cc\u062a\u0631 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 Scikit-Learn \u067e\u0627\u06cc\u062a\u0648\u0646 \u0635\u062d\u0628\u062a \u06a9\u0631\u062f\u0645. \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0628\u0647 \u0628\u0631\u0631\u0633\u06cc \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0645\u0648\u0636\u0648\u0639 \u0645\u06cc \u067e\u0631\u062f\u0627\u0632\u06cc\u0645 \u06a9\u0647 \u06cc\u06a9\u06cc \u062f\u06cc\u06af\u0631 \u0627\u0632 \u06a9\u0627\u0631\u0628\u0631\u062f\u0647\u0627\u06cc \u0628\u0633\u06cc\u0627\u0631 \u0645\u0647\u0645 NLP \u0627\u0633\u062a. 
\u062e\u0648\u0627\u0647\u06cc\u0645 [&hellip;]<\/p>\n","protected":false},"author":3,"featured_media":16337,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1743,620],"tags":[],"class_list":["post-16336","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-python","category-programming"],"acf":[],"_links":{"self":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/16336","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/users\/3"}],"replies":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/comments?post=16336"}],"version-history":[{"count":0,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/16336\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media\/16337"}],"wp:attachment":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media?parent=16336"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/categories?post=16336"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/tags?post=16336"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}