{"id":16164,"date":"2024-01-21T15:36:00","date_gmt":"2024-01-21T12:06:00","guid":{"rendered":"https:\/\/rasanegar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d9%88%d8%b3%d8%b9%d9%87-%db%8c%da%a9-%d9%be%d8%b1%da%a9%d9%86%d9%86%d8%af%d9%87-%d9%85%d8%aa%d9%86-%d8%ae%d9%88%d8%af%da%a9\/"},"modified":"2024-01-21T15:36:00","modified_gmt":"2024-01-21T12:06:00","slug":"%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d9%88%d8%b3%d8%b9%d9%87-%db%8c%da%a9-%d9%be%d8%b1%da%a9%d9%86%d9%86%d8%af%d9%87-%d9%85%d8%aa%d9%86-%d8%ae%d9%88%d8%af%da%a9","status":"publish","type":"post","link":"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d9%88%d8%b3%d8%b9%d9%87-%db%8c%da%a9-%d9%be%d8%b1%da%a9%d9%86%d9%86%d8%af%d9%87-%d9%85%d8%aa%d9%86-%d8%ae%d9%88%d8%af%da%a9\/","title":{"rendered":"\u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP: \u062a\u0648\u0633\u0639\u0647 \u06cc\u06a9 \u067e\u0631\u06a9\u0646\u0646\u062f\u0647 \u0645\u062a\u0646 \u062e\u0648\u062f\u06a9\u0627\u0631 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 N-Gram"},"content":{"rendered":"<div id=\"ez-toc-container\" class=\"ez-toc-v2_0_85 counter-hierarchy ez-toc-counter ez-toc-custom ez-toc-container-direction\">\n<div class=\"ez-toc-title-container\"><p class=\"ez-toc-title\" style=\"cursor:inherit\">\u0633\u0631\u0641\u0635\u0644\u0647\u0627\u06cc \u0645\u0637\u0644\u0628<\/p>\n<\/div><nav><ul class='ez-toc-list ez-toc-list-level-1 ' ><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-1\" 
href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d9%88%d8%b3%d8%b9%d9%87-%db%8c%da%a9-%d9%be%d8%b1%da%a9%d9%86%d9%86%d8%af%d9%87-%d9%85%d8%aa%d9%86-%d8%ae%d9%88%d8%af%da%a9\/#%d9%85%d8%b4%da%a9%d9%84%d8%a7%d8%aa_%d8%a8%d8%a7_%d8%b1%d9%88%d8%b4_tf-idf_%d9%88_%da%a9%db%8c%d8%b3%d9%87_%da%a9%d9%84%d9%85%d8%a7%d8%aa\" >\u0645\u0634\u06a9\u0644\u0627\u062a \u0628\u0627 \u0631\u0648\u0634 TF-IDF \u0648 \u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-2\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d9%88%d8%b3%d8%b9%d9%87-%db%8c%da%a9-%d9%be%d8%b1%da%a9%d9%86%d9%86%d8%af%d9%87-%d9%85%d8%aa%d9%86-%d8%ae%d9%88%d8%af%da%a9\/#%d9%86%d8%b8%d8%b1%db%8c%d9%87_%d9%85%d8%af%d9%84_n-grams\" >\u0646\u0638\u0631\u06cc\u0647 \u0645\u062f\u0644 N-Grams<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-3\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d9%88%d8%b3%d8%b9%d9%87-%db%8c%da%a9-%d9%be%d8%b1%da%a9%d9%86%d9%86%d8%af%d9%87-%d9%85%d8%aa%d9%86-%d8%ae%d9%88%d8%af%da%a9\/#%d8%a7%d8%aa%d8%b5%d8%a7%d9%84_n-gram_%d8%a8%d8%a7_%d8%b2%d9%86%d8%ac%db%8c%d8%b1%d9%87_%d9%85%d8%a7%d8%b1%da%a9%d9%88%d9%81\" >\u0627\u062a\u0635\u0627\u0644 N-Gram \u0628\u0627 \u0632\u0646\u062c\u06cc\u0631\u0647 \u0645\u0627\u0631\u06a9\u0648\u0641<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-4\" 
href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d9%88%d8%b3%d8%b9%d9%87-%db%8c%da%a9-%d9%be%d8%b1%da%a9%d9%86%d9%86%d8%af%d9%87-%d9%85%d8%aa%d9%86-%d8%ae%d9%88%d8%af%da%a9\/#n-grams_%d8%a7%d8%b2_%d8%a7%d8%a8%d8%aa%d8%af%d8%a7_%d8%af%d8%b1_%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86\" >N-Grams \u0627\u0632 \u0627\u0628\u062a\u062f\u0627 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-5\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d9%88%d8%b3%d8%b9%d9%87-%db%8c%da%a9-%d9%be%d8%b1%da%a9%d9%86%d9%86%d8%af%d9%87-%d9%85%d8%aa%d9%86-%d8%ae%d9%88%d8%af%da%a9\/#%da%a9%d8%a7%d8%b1%d8%a7%da%a9%d8%aa%d8%b1%d9%87%d8%a7_%d9%85%d8%af%d9%84_n-grams\" >\u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627 \u0645\u062f\u0644 N-Grams<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-6\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d9%88%d8%b3%d8%b9%d9%87-%db%8c%da%a9-%d9%be%d8%b1%da%a9%d9%86%d9%86%d8%af%d9%87-%d9%85%d8%aa%d9%86-%d8%ae%d9%88%d8%af%da%a9\/#%d9%85%d8%af%d9%84_n-grams_%da%a9%d9%84%d9%85%d8%a7%d8%aa\" >\u0645\u062f\u0644 N-Grams \u06a9\u0644\u0645\u0627\u062a<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-7\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d9%88%d8%b3%d8%b9%d9%87-%db%8c%da%a9-%d9%be%d8%b1%da%a9%d9%86%d9%86%d8%af%d9%87-%d9%85%d8%aa%d9%86-%d8%ae%d9%88%d8%af%da%a9\/#%d9%86%d8%aa%db%8c%d8%ac%d9%87\" >\u0646\u062a\u06cc\u062c\u0647<\/a><\/li><\/ul><\/nav><\/div>\n<span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label 
rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 8<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span><p> <br \/>\n<\/p>\n<div><noscript><\/noscript><\/p>\n<p>\u0627\u06cc\u0646 \u067e\u0627\u0646\u0632\u062f\u0647\u0645\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0632 \u0633\u0631\u06cc \u0645\u0642\u0627\u0644\u0627\u062a \u0645\u0646 \u0627\u0633\u062a \u0631\u0648\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP.  \u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0642\u0628\u0644\u06cc \u0627\u0645 \u0631\u0648\u0634 \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc \u0631\u0627 \u062a\u0648\u0636\u06cc\u062d \u062f\u0627\u062f\u0645 <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Tf%E2%80%93idf\">TF-IDF<\/a> \u0631\u0648\u06cc\u06a9\u0631\u062f \u0627\u0632 \u0627\u0628\u062a\u062f\u0627 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646  \u0642\u0628\u0644 \u0627\u0632 \u0622\u0646\u060c \u0631\u0648\u0634 \u067e\u06cc\u0627\u062f\u0647\u200c\u0633\u0627\u0632\u06cc \u0631\u0648\u06cc\u06a9\u0631\u062f \u06a9\u06cc\u0633\u0647\u200c\u0627\u06cc \u06a9\u0644\u0645\u0627\u062a \u0631\u0627 \u0627\u0632 \u0627\u0628\u062a\u062f\u0627 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0645\u0637\u0627\u0644\u0639\u0647 \u06a9\u0631\u062f\u06cc\u0645.<\/p>\n<p>\u0627\u0645\u0631\u0648\u0632\u060c \u0631\u0648\u06cc\u06a9\u0631\u062f N-Grams \u0631\u0627 \u0645\u0637\u0627\u0644\u0639\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f \u0648 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0627\u0632 \u0631\u0648\u06cc\u06a9\u0631\u062f N-Grams \u0628\u0631\u0627\u06cc \u0627\u06cc\u062c\u0627\u062f \u06cc\u06a9 
\u067e\u0631\u06a9\u0646\u0646\u062f\u0647 \u0645\u062a\u0646 \u062e\u0648\u062f\u06a9\u0627\u0631 \u0633\u0627\u062f\u0647 \u06cc\u0627 \u0645\u0648\u062a\u0648\u0631 \u067e\u06cc\u0634\u0646\u0647\u0627\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.  \u067e\u0631\u06a9\u0646\u0646\u062f\u0647 \u0645\u062a\u0646 \u062e\u0648\u062f\u06a9\u0627\u0631 \u06cc\u06a9 \u0628\u0631\u0646\u0627\u0645\u0647 \u0628\u0633\u06cc\u0627\u0631 \u06a9\u0627\u0631\u0628\u0631\u062f\u06cc \u0627\u0633\u062a \u0648 \u0628\u0647 \u0637\u0648\u0631 \u06af\u0633\u062a\u0631\u062f\u0647 \u062a\u0648\u0633\u0637 \u06af\u0648\u06af\u0644 \u0648 \u06af\u0648\u0634\u06cc \u0647\u0627\u06cc \u0647\u0648\u0634\u0645\u0646\u062f \u0645\u062e\u062a\u0644\u0641 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f \u06a9\u0647 \u062f\u0631 \u0622\u0646 \u06a9\u0627\u0631\u0628\u0631 \u0645\u0642\u062f\u0627\u0631\u06cc \u0645\u062a\u0646 \u0631\u0627 \u0648\u0627\u0631\u062f \u0645\u06cc \u06a9\u0646\u062f \u0648 \u0645\u062a\u0646 \u0628\u0627\u0642\u06cc\u0645\u0627\u0646\u062f\u0647 \u0628\u0647 \u0637\u0648\u0631 \u062e\u0648\u062f\u06a9\u0627\u0631 \u062a\u0648\u0633\u0637 \u0628\u0631\u0646\u0627\u0645\u0647 \u062a\u06a9\u0645\u06cc\u0644 \u06cc\u0627 \u067e\u06cc\u0634\u0646\u0647\u0627\u062f \u0645\u06cc \u0634\u0648\u062f.<\/p>\n<h2 id=\"problemswithtfidfandbagofwordsapproach\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%b4%da%a9%d9%84%d8%a7%d8%aa_%d8%a8%d8%a7_%d8%b1%d9%88%d8%b4_tf-idf_%d9%88_%da%a9%db%8c%d8%b3%d9%87_%da%a9%d9%84%d9%85%d8%a7%d8%aa\"><\/span>\u0645\u0634\u06a9\u0644\u0627\u062a \u0628\u0627 \u0631\u0648\u0634 TF-IDF \u0648 \u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0642\u0628\u0644 \u0627\u0632 \u0627\u06cc\u0646\u06a9\u0647 \u0628\u062e\u0648\u0627\u0647\u06cc\u0645 \u0645\u062f\u0644 N-Grams \u0631\u0627 \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc 
\u06a9\u0646\u06cc\u0645\u060c \u0627\u062c\u0627\u0632\u0647 \u062f\u0647\u06cc\u062f \u0627\u0628\u062a\u062f\u0627 \u0627\u0634\u06a9\u0627\u0644\u0627\u062a \u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a \u0648 \u0631\u0648\u06cc\u06a9\u0631\u062f\u0647\u0627\u06cc TF-IDF \u0631\u0627 \u0645\u0648\u0631\u062f \u0628\u062d\u062b \u0642\u0631\u0627\u0631 \u062f\u0647\u06cc\u0645.<\/p>\n<p>\u062f\u0631 \u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a \u0648 \u0631\u0648\u06cc\u06a9\u0631\u062f TF-IDF\u060c \u06a9\u0644\u0645\u0627\u062a \u0628\u0647 \u0635\u0648\u0631\u062a \u062c\u062f\u0627\u06af\u0627\u0646\u0647 \u0628\u0631\u0631\u0633\u06cc \u0645\u06cc \u0634\u0648\u0646\u062f \u0648 \u0647\u0631 \u06a9\u0644\u0645\u0647 \u0628\u0647 \u0647\u0645\u062a\u0627\u06cc \u0639\u062f\u062f\u06cc \u062e\u0648\u062f \u062a\u0628\u062f\u06cc\u0644 \u0645\u06cc \u0634\u0648\u062f.  \u0627\u0637\u0644\u0627\u0639\u0627\u062a \u0645\u062a\u0646 \u06a9\u0644\u0645\u0647 \u062d\u0641\u0638 \u0646\u0645\u06cc \u0634\u0648\u062f.  \u062f\u0648 \u062c\u0645\u0644\u0647 \u00ab\u0645\u0627\u0634\u06cc\u0646 \u0648 \u0641\u0631\u0634 \u0642\u0631\u0645\u0632 \u0628\u0632\u0631\u06af\u00bb \u0648 \u00ab\u0641\u0631\u0634 \u0642\u0631\u0645\u0632 \u0628\u0632\u0631\u06af \u0648 \u0645\u0627\u0634\u06cc\u0646\u00bb \u0631\u0627 \u062f\u0631 \u0646\u0638\u0631 \u0628\u06af\u06cc\u0631\u06cc\u062f.  \u0627\u06af\u0631 \u0627\u0632 \u0631\u0648\u06cc\u06a9\u0631\u062f \u06cc\u06a9 \u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f\u060c \u0628\u0631\u062f\u0627\u0631\u0647\u0627\u06cc \u06cc\u06a9\u0633\u0627\u0646\u06cc \u0631\u0627 \u0628\u0631\u0627\u06cc \u0627\u06cc\u0646 \u062f\u0648 \u062c\u0645\u0644\u0647 \u062f\u0631\u06cc\u0627\u0641\u062a \u062e\u0648\u0627\u0647\u06cc\u062f \u06a9\u0631\u062f.  
\u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u0628\u0647 \u0648\u0636\u0648\u062d \u0645\u06cc \u062a\u0648\u0627\u0646 \u062f\u0631\u06cc\u0627\u0641\u062a \u06a9\u0647 \u062f\u0631 \u062c\u0645\u0644\u0647 \u0627\u0648\u0644 \u0645\u0627 \u062f\u0631 \u0645\u0648\u0631\u062f \u06cc\u06a9 &#8220;\u0645\u0627\u0634\u06cc\u0646 \u0642\u0631\u0645\u0632 \u0628\u0632\u0631\u06af&#8221; \u0635\u062d\u0628\u062a \u0645\u06cc \u06a9\u0646\u06cc\u0645\u060c \u062f\u0631 \u062d\u0627\u0644\u06cc \u06a9\u0647 \u062c\u0645\u0644\u0647 \u062f\u0648\u0645 \u062d\u0627\u0648\u06cc \u0627\u0637\u0644\u0627\u0639\u0627\u062a\u06cc \u062f\u0631 \u0645\u0648\u0631\u062f &#8220;\u0641\u0631\u0634 \u0642\u0631\u0645\u0632 \u0628\u0632\u0631\u06af&#8221; \u0627\u0633\u062a.  \u0627\u0632 \u0627\u06cc\u0646 \u0631\u0648\u060c \u0627\u0637\u0644\u0627\u0639\u0627\u062a \u0632\u0645\u06cc\u0646\u0647 \u0628\u0633\u06cc\u0627\u0631 \u0645\u0647\u0645 \u0627\u0633\u062a.  \u0645\u062f\u0644 N-Grams \u0627\u0633\u0627\u0633\u0627\u064b \u0628\u0647 \u0645\u0627 \u06a9\u0645\u06a9 \u0645\u06cc \u06a9\u0646\u062f \u062a\u0627 \u0627\u0637\u0644\u0627\u0639\u0627\u062a \u0632\u0645\u06cc\u0646\u0647 \u0631\u0627 \u0636\u0628\u0637 \u06a9\u0646\u06cc\u0645.<\/p>\n<h2 id=\"theoryofngramsmodel\"><span class=\"ez-toc-section\" id=\"%d9%86%d8%b8%d8%b1%db%8c%d9%87_%d9%85%d8%af%d9%84_n-grams\"><\/span>\u0646\u0638\u0631\u06cc\u0647 \u0645\u062f\u0644 N-Grams<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0648\u06cc\u06a9\u06cc\u200c\u067e\u062f\u06cc\u0627 N-Gram \u0631\u0627 \u0628\u0647\u200c\u0639\u0646\u0648\u0627\u0646 \u00ab\u062a\u0648\u0627\u0644\u06cc \u067e\u06cc\u0648\u0633\u062a\u0647 \u0627\u0632 N \u0645\u0648\u0631\u062f \u0627\u0632 \u06cc\u06a9 \u0646\u0645\u0648\u0646\u0647 \u0645\u0639\u06cc\u0646 \u0627\u0632 \u0645\u062a\u0646 \u06cc\u0627 \u06af\u0641\u062a\u0627\u0631\u00bb \u062a\u0639\u0631\u06cc\u0641 \u0645\u06cc\u200c\u06a9\u0646\u062f.  
\u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u06cc\u06a9 \u0622\u06cc\u062a\u0645 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u06cc\u06a9 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u060c \u06cc\u06a9 \u06a9\u0644\u0645\u0647 \u06cc\u0627 \u06cc\u06a9 \u062c\u0645\u0644\u0647 \u0628\u0627\u0634\u062f \u0648 N \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0647\u0631 \u0639\u062f\u062f \u0635\u062d\u06cc\u062d\u06cc \u0628\u0627\u0634\u062f.  \u0648\u0642\u062a\u06cc N 2 \u0628\u0627\u0634\u062f\u060c \u062f\u0646\u0628\u0627\u0644\u0647 \u0631\u0627 \u0628\u06cc\u06af\u0631\u0627\u0645 \u0645\u06cc \u0646\u0627\u0645\u06cc\u0645.  \u0628\u0647 \u0637\u0648\u0631 \u0645\u0634\u0627\u0628\u0647\u060c \u062f\u0646\u0628\u0627\u0644\u0647 \u0627\u06cc \u0627\u0632 3 \u0645\u0648\u0631\u062f \u0631\u0627 \u06cc\u06a9 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0645\u06cc \u0646\u0627\u0645\u0646\u062f \u0648 \u0628\u0647 \u0647\u0645\u06cc\u0646 \u062a\u0631\u062a\u06cc\u0628 \u0631\u0648\u06cc.<\/p>\n<p>\u0628\u0631\u0627\u06cc \u062f\u0631\u06a9 \u0645\u062f\u0644 N-Grams\u060c \u0627\u0628\u062a\u062f\u0627 \u0628\u0627\u06cc\u062f \u0628\u0641\u0647\u0645\u06cc\u0645 \u06a9\u0647 \u0632\u0646\u062c\u06cc\u0631\u0647 \u0647\u0627\u06cc \u0645\u0627\u0631\u06a9\u0648\u0641 \u0686\u06af\u0648\u0646\u0647 \u06a9\u0627\u0631 \u0645\u06cc \u06a9\u0646\u0646\u062f.<\/p>\n<h3 id=\"connectionofngramswithmarkovchains\"><span class=\"ez-toc-section\" id=\"%d8%a7%d8%aa%d8%b5%d8%a7%d9%84_n-gram_%d8%a8%d8%a7_%d8%b2%d9%86%d8%ac%db%8c%d8%b1%d9%87_%d9%85%d8%a7%d8%b1%da%a9%d9%88%d9%81\"><\/span>\u0627\u062a\u0635\u0627\u0644 N-Gram \u0628\u0627 \u0632\u0646\u062c\u06cc\u0631\u0647 \u0645\u0627\u0631\u06a9\u0648\u0641<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0622 <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Markov_chain\">\u0632\u0646\u062c\u06cc\u0631 \u0645\u0627\u0631\u06a9\u0648\u0641<\/a> 
\u062f\u0646\u0628\u0627\u0644\u0647 \u0627\u06cc \u0627\u0632 \u062d\u0627\u0644\u0627\u062a \u0627\u0633\u062a.  \u06cc\u06a9 \u0633\u06cc\u0633\u062a\u0645 \u0645\u0627\u0631\u06a9\u0648\u0641 \u0628\u0627 2 \u062d\u0627\u0644\u062a X \u0648 Y \u0631\u0627 \u062f\u0631 \u0646\u0638\u0631 \u0628\u06af\u06cc\u0631\u06cc\u062f. \u062f\u0631 \u0632\u0646\u062c\u06cc\u0631\u0647 \u0645\u0627\u0631\u06a9\u0648\u0641\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u062f\u0631 \u06cc\u06a9 \u062d\u0627\u0644\u062a \u0628\u0645\u0627\u0646\u06cc\u062f \u06cc\u0627 \u0628\u0647 \u062d\u0627\u0644\u062a \u062f\u06cc\u06af\u0631 \u0628\u0631\u0648\u06cc\u062f.  \u062f\u0631 \u0645\u062b\u0627\u0644 \u0645\u0627\u060c \u062d\u0627\u0644\u062a \u0647\u0627\u06cc \u0645\u0627 \u0631\u0641\u062a\u0627\u0631 \u0632\u06cc\u0631 \u0631\u0627 \u062f\u0627\u0631\u0646\u062f:<\/p>\n<ol>\n<li>\u0627\u062d\u062a\u0645\u0627\u0644 \u062c\u0627\u0628\u062c\u0627\u06cc\u06cc \u0627\u0632 X \u0628\u0647 Y 50\u066a \u0648 \u0628\u0647 \u0637\u0648\u0631 \u0645\u0634\u0627\u0628\u0647\u060c \u0627\u062d\u062a\u0645\u0627\u0644 \u0645\u0627\u0646\u062f\u0646 \u062f\u0631 X 50\u066a \u0627\u0633\u062a.<\/li>\n<li>\u0628\u0647 \u0647\u0645\u06cc\u0646 \u062a\u0631\u062a\u06cc\u0628\u060c \u0627\u062d\u062a\u0645\u0627\u0644 \u0645\u0627\u0646\u062f\u0646 \u062f\u0631 Y 50\u066a \u0627\u0633\u062a \u062f\u0631 \u062d\u0627\u0644\u06cc \u06a9\u0647 \u0627\u062d\u062a\u0645\u0627\u0644 \u0628\u0627\u0632\u06af\u0634\u062a \u0628\u0647 X \u0646\u06cc\u0632 50\u066a \u0627\u0633\u062a.<\/li>\n<\/ol>\n<p>\u0628\u0647 \u0627\u06cc\u0646 \u062a\u0631\u062a\u06cc\u0628 \u0645\u06cc \u062a\u0648\u0627\u0646 \u06cc\u06a9 \u062f\u0646\u0628\u0627\u0644\u0647 \u0645\u0627\u0631\u06a9\u0648\u0641 \u0645\u0627\u0646\u0646\u062f XXYX \u0648 \u063a\u06cc\u0631\u0647 \u062a\u0648\u0644\u06cc\u062f \u06a9\u0631\u062f.<\/p>\n<p>\u062f\u0631 \u0645\u062f\u0644 N-Grams\u060c \u06cc\u06a9 
\u0622\u06cc\u062a\u0645 \u062f\u0631 \u06cc\u06a9 \u062f\u0646\u0628\u0627\u0644\u0647 \u0631\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06cc\u06a9 \u062d\u0627\u0644\u062a \u0645\u0627\u0631\u06a9\u0648\u0641 \u062f\u0631 \u0646\u0638\u0631 \u06af\u0631\u0641\u062a.  \u0628\u06cc\u0627\u06cc\u06cc\u062f \u06cc\u06a9 \u0645\u062b\u0627\u0644 \u0633\u0627\u062f\u0647 \u0627\u0632 \u0628\u06cc\u06af\u0631\u0627\u0645 \u0647\u0627\u06cc \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u0645 \u06a9\u0647 \u062f\u0631 \u0622\u0646 \u0647\u0631 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u06cc\u06a9 \u062d\u0627\u0644\u062a \u0645\u0627\u0631\u06a9\u0648\u0641 \u0627\u0633\u062a.<\/p>\n<pre><code class=\"hljs\">Football is a very famous game\n<\/code><\/pre>\n<p>\u0628\u06cc\u06af\u0631\u0627\u0645 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc \u062c\u0645\u0644\u0647 \u0628\u0627\u0644\u0627 \u0628\u0647 \u0635\u0648\u0631\u062a \u0632\u06cc\u0631 \u062e\u0648\u0627\u0647\u062f \u0628\u0648\u062f: <code>fo<\/code>\u060c <code>oo<\/code>\u060c <code>ot<\/code>\u060c <code>tb<\/code>\u060c <code>ba<\/code>\u060c <code>al<\/code>\u060c <code>ll<\/code>\u060c <code>l <\/code>\u060c <code> i<\/code>\u060c <code>is<\/code> \u0648 \u063a\u06cc\u0631\u0647.  
\u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0628\u06cc\u0646\u06cc\u062f \u06a9\u0647 \u0628\u06cc\u06af\u0631\u0627\u0645 \u0647\u0627 \u0627\u0633\u0627\u0633\u0627\u064b \u062f\u0646\u0628\u0627\u0644\u0647 \u0627\u06cc \u0627\u0632 \u062f\u0648 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0645\u062a\u0648\u0627\u0644\u06cc \u0647\u0633\u062a\u0646\u062f.<\/p>\n<p>\u0628\u0647 \u0637\u0648\u0631 \u0645\u0634\u0627\u0628\u0647\u060c \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0647\u0627 \u062f\u0646\u0628\u0627\u0644\u0647 \u0627\u06cc \u0627\u0632 \u0633\u0647 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0628\u0647 \u0647\u0645 \u067e\u06cc\u0648\u0633\u062a\u0647 \u0647\u0633\u062a\u0646\u062f\u060c \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u0631 \u0632\u06cc\u0631 \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a:<\/p>\n<p><code>foo<\/code>\u060c <code>oot<\/code>\u060c <code>otb<\/code>\u060c <code>tba<\/code> \u0648 \u063a\u06cc\u0631\u0647 \u0631\u0648\u06cc.<\/p>\n<p>\u062f\u0631 \u062f\u0648 \u0645\u062b\u0627\u0644 \u0642\u0628\u0644\u06cc\u060c \u0628\u06cc\u06af\u0631\u0627\u0645 \u0648 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627 \u0631\u0627 \u062f\u06cc\u062f\u06cc\u0645.  \u0645\u0627 \u0647\u0645\u0686\u0646\u06cc\u0646 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0628\u06cc\u06af\u0631\u0627\u0645 \u0648 \u0633\u0647 \u0636\u0644\u0639\u06cc \u0627\u0632 <em>\u06a9\u0644\u0645\u0627\u062a<\/em>.<\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0647 \u0645\u062b\u0627\u0644 \u0642\u0628\u0644\u06cc \u062e\u0648\u062f \u06cc\u0639\u0646\u06cc \u00ab\u0645\u0627\u0634\u06cc\u0646 \u0648 \u0641\u0631\u0634 \u0642\u0631\u0645\u0632 \u0628\u0632\u0631\u06af\u00bb \u0628\u0631\u06af\u0631\u062f\u06cc\u0645.  
\u0628\u06cc\u06af\u0631\u0627\u0645 \u0627\u06cc\u0646 \u062c\u0645\u0644\u0647 \u00ab\u0642\u0631\u0645\u0632 \u0628\u0632\u0631\u06af\u00bb\u060c \u00ab\u0645\u0627\u0634\u06cc\u0646 \u0642\u0631\u0645\u0632\u00bb\u060c \u00ab\u0645\u0627\u0634\u06cc\u0646 \u0648\u00bb\u060c \u00ab\u0648 \u0641\u0631\u0634\u00bb \u062e\u0648\u0627\u0647\u062f \u0628\u0648\u062f.  \u0628\u0647 \u0647\u0645\u06cc\u0646 \u062a\u0631\u062a\u06cc\u0628\u060c \u0628\u06cc\u06af\u0631\u0627\u0645 \u0647\u0627\u06cc \u062c\u0645\u0644\u0647 \u00ab\u0641\u0631\u0634 \u0642\u0631\u0645\u0632 \u0628\u0632\u0631\u06af \u0648 \u0645\u0627\u0634\u06cc\u0646\u00bb \u00ab\u0642\u0631\u0645\u0632 \u0628\u0632\u0631\u06af\u00bb\u060c \u00ab\u0641\u0631\u0634 \u0642\u0631\u0645\u0632\u00bb\u060c \u00ab\u0641\u0631\u0634 \u0648\u00bb\u060c \u00ab\u0648 \u0645\u0627\u0634\u06cc\u0646\u00bb \u062e\u0648\u0627\u0647\u062f \u0628\u0648\u062f.<\/p>\n<p>\u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0648\u0631\u062f \u0628\u0627 \u0628\u06cc\u06af\u0631\u0627\u0645 \u0647\u0627\u060c \u06cc\u06a9 \u0646\u0645\u0627\u06cc\u0634 \u0628\u0631\u062f\u0627\u0631\u06cc \u0645\u062a\u0641\u0627\u0648\u062a \u0628\u0631\u0627\u06cc \u0647\u0631 \u062f\u0648 \u062c\u0645\u0644\u0647 \u062f\u0631\u06cc\u0627\u0641\u062a \u0645\u06cc \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u062f\u0631 \u0628\u062e\u0634 \u0628\u0639\u062f\u06cc\u060c \u0645\u062f\u0644 N-Grams \u0631\u0627 \u0627\u0632 \u0627\u0628\u062a\u062f\u0627 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u0648 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 N-Gram \u0645\u0627\u0646\u0646\u062f \u0627\u06cc\u0646 \u06cc\u06a9 
\u067e\u0631\u06a9\u0646\u0646\u062f\u0647 \u0645\u062a\u0646 \u062e\u0648\u062f\u06a9\u0627\u0631 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645.<\/p>\n<h2 id=\"ngramsfromscratchinpython\"><span class=\"ez-toc-section\" id=\"n-grams_%d8%a7%d8%b2_%d8%a7%d8%a8%d8%aa%d8%af%d8%a7_%d8%af%d8%b1_%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86\"><\/span>N-Grams \u0627\u0632 \u0627\u0628\u062a\u062f\u0627 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0645\u0627 \u062f\u0631 \u0627\u06cc\u0646 \u0628\u062e\u0634 \u062f\u0648 \u0646\u0648\u0639 \u0645\u062f\u0644 N-Gram \u0627\u06cc\u062c\u0627\u062f \u0645\u06cc \u06a9\u0646\u06cc\u0645: \u06cc\u06a9 \u0645\u062f\u0644 N-Grams \u0628\u0627 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0648 \u06cc\u06a9 \u0645\u062f\u0644 N-Gram \u06a9\u0644\u0645\u0647.<\/p>\n<h3 id=\"charactersngramsmodel\"><span class=\"ez-toc-section\" id=\"%da%a9%d8%a7%d8%b1%d8%a7%da%a9%d8%aa%d8%b1%d9%87%d8%a7_%d9%85%d8%af%d9%84_n-grams\"><\/span>\u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627 \u0645\u062f\u0644 N-Grams<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u062f\u0631 \u0627\u06cc\u0646 \u0642\u0633\u0645\u062a \u0631\u0648\u0634 \u0627\u06cc\u062c\u0627\u062f \u06cc\u06a9 \u0645\u062f\u0644 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0633\u0627\u062f\u0647 N-Gram \u0631\u0627 \u062a\u0648\u0636\u06cc\u062d \u062e\u0648\u0627\u0647\u0645 \u062f\u0627\u062f.  
\u062f\u0631 \u0642\u0633\u0645\u062a \u0628\u0639\u062f\u06cc \u0631\u0648\u0634 \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc \u0645\u062f\u0644 N-Gram \u0631\u0627 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f.<\/p>\n<p>\u0628\u0631\u0627\u06cc \u0627\u06cc\u062c\u0627\u062f \u0645\u062c\u0645\u0648\u0639\u0647 \u062e\u0648\u062f\u060c \u0645\u0642\u0627\u0644\u0647 \u0648\u06cc\u06a9\u06cc\u200c\u067e\u062f\u06cc\u0627 \u0631\u0627 \u062e\u0631\u0627\u0634 \u0645\u06cc\u200c\u062f\u0647\u06cc\u0645 \u0631\u0648\u06cc \u062a\u0646\u06cc\u0633.  \u0627\u0648\u0644 \u0628\u06cc\u0627\u06cc\u06cc\u062f import \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc\u06cc \u06a9\u0647 \u0628\u0631\u0627\u06cc \u062f\u0627\u0646\u0644\u0648\u062f \u0648 \u062a\u062c\u0632\u06cc\u0647 \u0645\u0642\u0627\u0644\u0647 \u0648\u06cc\u06a9\u06cc \u067e\u062f\u06cc\u0627 \u0646\u06cc\u0627\u0632 \u062f\u0627\u0631\u06cc\u0645.<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> nltk\n<span class=\"hljs-keyword\">import<\/span> numpy <span class=\"hljs-keyword\">as<\/span> np\n<span class=\"hljs-keyword\">import<\/span> random\n<span class=\"hljs-keyword\">import<\/span> string\n\n<span class=\"hljs-keyword\">import<\/span> bs4 <span class=\"hljs-keyword\">as<\/span> bs\n<span class=\"hljs-keyword\">import<\/span> urllib.request\n<span class=\"hljs-keyword\">import<\/span> re\n<\/code><\/pre>\n<p>\u0645\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/www.crummy.com\/software\/BeautifulSoup\/bs4\/doc\/\" class=\"broken_link\">\u0633\u0648\u067e \u0632\u06cc\u0628\u06274<\/a> \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0628\u0631\u0627\u06cc \u062a\u062c\u0632\u06cc\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0648\u06cc\u06a9\u06cc \u067e\u062f\u06cc\u0627.  
\u0639\u0644\u0627\u0648\u0647 \u0628\u0631 \u0627\u06cc\u0646\u060c \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 regex \u067e\u0627\u06cc\u062a\u0648\u0646\u060c <code>re<\/code>\u060c \u0628\u0631\u0627\u06cc \u0628\u0631\u062e\u06cc \u0627\u0632 \u06a9\u0627\u0631\u0647\u0627\u06cc \u067e\u06cc\u0634 \u067e\u0631\u062f\u0627\u0632\u0634 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u062f \u0634\u062f \u0631\u0648\u06cc \u0645\u062a\u0646.<\/p>\n<p>\u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u0642\u0628\u0644\u0627 \u06af\u0641\u062a\u06cc\u0645 \u0627\u0632 \u0645\u0642\u0627\u0644\u0647 \u0648\u06cc\u06a9\u06cc \u067e\u062f\u06cc\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f \u0631\u0648\u06cc \u062a\u0646\u06cc\u0633 \u0628\u0631\u0627\u06cc \u0627\u06cc\u062c\u0627\u062f \u0645\u062c\u0645\u0648\u0639\u0647 \u0645\u0627.  \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0645\u0642\u0627\u0644\u0647 \u0648\u06cc\u06a9\u06cc\u200c\u067e\u062f\u06cc\u0627 \u0631\u0627 \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0645\u06cc\u200c\u06a9\u0646\u062f \u0648 \u062a\u0645\u0627\u0645 \u067e\u0627\u0631\u0627\u06af\u0631\u0627\u0641\u200c\u0647\u0627 \u0631\u0627 \u0627\u0632 \u0645\u062a\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0645\u06cc\u200c\u06a9\u0646\u062f.  
\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0645\u062a\u0646 \u0628\u0631\u0627\u06cc \u067e\u0631\u062f\u0627\u0632\u0634 \u0622\u0633\u0627\u0646 \u062a\u0631 \u0628\u0647 \u062d\u0631\u0648\u0641 \u06a9\u0648\u0686\u06a9 \u062a\u0628\u062f\u06cc\u0644 \u0645\u06cc \u0634\u0648\u062f.<\/p>\n<pre><code class=\"hljs\">raw_html = urllib.request.urlopen(<span class=\"hljs-string\">'https:\/\/en.wikipedia.org\/wiki\/Tennis'<\/span>)\nraw_html = raw_html.read()\n\narticle_html = bs.BeautifulSoup(raw_html, <span class=\"hljs-string\">'lxml'<\/span>)\narticle_paragraphs = article_html.find_all(<span class=\"hljs-string\">'p'<\/span>)\narticle_text = <span class=\"hljs-string\">''<\/span>\n\n<span class=\"hljs-keyword\">for<\/span> para <span class=\"hljs-keyword\">in<\/span> article_paragraphs:\n    article_text += para.text\n\narticle_text = article_text.lower()\n<\/code><\/pre>\n<p>\u0628\u0639\u062f\u060c \u0647\u0645\u0647 \u0686\u06cc\u0632 \u0631\u0627 \u0627\u0632 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u062e\u0648\u062f \u062d\u0630\u0641 \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u0628\u0647 \u062c\u0632 \u062d\u0631\u0648\u0641\u060c \u0646\u0642\u0637\u0647 \u0648 \u0641\u0627\u0635\u0644\u0647:<\/p>\n<pre><code class=\"hljs\">article_text = re.sub(r'[^A-Za-z. ]', '', article_text)\n<\/code><\/pre>\n<p>\u0645\u0627 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u062e\u0648\u062f \u0631\u0627 \u0627\u0632 \u0642\u0628\u0644 \u067e\u0631\u062f\u0627\u0632\u0634 \u06a9\u0631\u062f\u0647 \u0627\u06cc\u0645 \u0648 \u0627\u06a9\u0646\u0648\u0646 \u0632\u0645\u0627\u0646 \u0627\u06cc\u062c\u0627\u062f \u06cc\u06a9 \u0645\u062f\u0644 N-Gram \u0627\u0633\u062a.  \u0645\u0627 \u06cc\u06a9 \u0645\u062f\u0644 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0627\u06cc\u062c\u0627\u062f \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">ngrams = {}\nchars = <span class=\"hljs-number\">3<\/span>\n\n<span class=\"hljs-keyword\">for<\/span> i <span class=\"hljs-keyword\">in<\/span> <span class=\"hljs-built_in\">range<\/span>(<span class=\"hljs-built_in\">len<\/span>(article_text)-chars):\n    seq = article_text[i:i+chars]\n    <span class=\"hljs-built_in\">print<\/span>(seq)\n    <span class=\"hljs-keyword\">if<\/span> seq <span class=\"hljs-keyword\">not<\/span> <span class=\"hljs-keyword\">in<\/span> ngrams.keys():\n        ngrams[seq] = []\n    ngrams[seq].append(article_text[i+chars])\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u06cc\u06a9 \u062f\u06cc\u06a9\u0634\u0646\u0631\u06cc \u0627\u06cc\u062c\u0627\u062f \u0645\u06cc \u06a9\u0646\u06cc\u0645 <code>ngrams<\/code>.  \u06a9\u0644\u06cc\u062f\u0647\u0627\u06cc \u0627\u06cc\u0646 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a\u060c \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0647\u0627\u06cc \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u062f\u0631 \u0645\u062c\u0645\u0648\u0639\u0647 \u0645\u0627 \u0648 \u0645\u0642\u0627\u062f\u06cc\u0631\u060c \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc\u06cc \u062e\u0648\u0627\u0647\u0646\u062f \u0628\u0648\u062f \u06a9\u0647 \u062f\u0631 \u06a9\u0646\u0627\u0631 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0647\u0627 \u0642\u0631\u0627\u0631 \u0645\u06cc \u06af\u06cc\u0631\u0646\u062f.  
\u0628\u0639\u062f\u060c \u0627\u0632 \u0622\u0646\u062c\u0627\u06cc\u06cc \u06a9\u0647 \u0645\u0627 \u06cc\u06a9 N-Gram \u0627\u0632 \u0633\u0647 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0627\u06cc\u062c\u0627\u062f \u0645\u06cc \u06a9\u0646\u06cc\u0645\u060c \u06cc\u06a9 \u0645\u062a\u063a\u06cc\u0631 \u0631\u0627 \u0627\u0639\u0644\u0627\u0645 \u0645\u06cc \u06a9\u0646\u06cc\u0645 <code>chars<\/code>.  \u067e\u0633 \u0627\u0632 \u0622\u0646\u060c \u0627\u0632 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0686\u0647\u0627\u0631\u0645 \u0634\u0631\u0648\u0639 \u0645\u06cc \u06a9\u0646\u06cc\u0645\u060c \u0647\u0645\u0647 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc \u0645\u062c\u0645\u0648\u0639\u0647 \u062e\u0648\u062f \u0631\u0627 \u062a\u06a9\u0631\u0627\u0631 \u0645\u06cc \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u0633\u067e\u0633 \u062f\u0631 \u062f\u0627\u062e\u0644 \u062d\u0644\u0642\u0647\u060c \u0628\u0627 \u0641\u06cc\u0644\u062a\u0631 \u06a9\u0631\u062f\u0646 \u0633\u0647 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0628\u0639\u062f\u06cc\u060c \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0631\u0627 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0645\u06cc \u06a9\u0646\u06cc\u0645.  \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u062f\u0631 \u0630\u062e\u06cc\u0631\u0647 \u0645\u06cc \u0634\u0648\u062f <code>seq<\/code> \u0645\u062a\u063a\u06cc\u0631.  \u0633\u067e\u0633 \u0628\u0631\u0631\u0633\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u06a9\u0647 \u0622\u06cc\u0627 \u0633\u0647 \u062e\u0637 \u062f\u0631 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f \u06cc\u0627 \u062e\u06cc\u0631.  
\u0627\u06af\u0631 \u062f\u0631 \u0622\u0646 \u0648\u062c\u0648\u062f \u0646\u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u062f <code>ngrams<\/code> \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0645\u0627 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0631\u0627 \u0628\u0647 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0627\u0636\u0627\u0641\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645.  \u067e\u0633 \u0627\u0632 \u0622\u0646\u060c \u06cc\u06a9 \u0644\u06cc\u0633\u062a \u062e\u0627\u0644\u06cc \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u0642\u062f\u0627\u0631 \u0628\u0647 trigram \u0627\u062e\u062a\u0635\u0627\u0635 \u0645\u06cc \u062f\u0647\u06cc\u0645.  \u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u06cc \u06a9\u0647 \u0628\u0639\u062f \u0627\u0632 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06cc\u06a9 \u0645\u0642\u062f\u0627\u0631 \u0628\u0647 \u0644\u06cc\u0633\u062a \u0627\u0636\u0627\u0641\u0647 \u0645\u06cc \u0634\u0648\u062f.<\/p>\n<p>\u0627\u06af\u0631 \u062f\u06cc\u06a9\u0634\u0646\u0631\u06cc \u0631\u0627 \u0628\u0627\u0632 \u06a9\u0646\u06cc\u062f <code>ngrams<\/code> \u062f\u0631 \u0627\u06a9\u0633\u067e\u0644\u0648\u0631\u0631 \u0645\u062a\u063a\u06cc\u0631 Spyder.  
\u0634\u0645\u0627 \u0628\u0627\u06cc\u062f \u0686\u06cc\u0632\u06cc \u0634\u0628\u06cc\u0647 \u0628\u0647 \u0627\u06cc\u0646 \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u062f:<\/p>\n<p><img decoding=\"async\" class=\"img-responsive\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/python-nlp-developing-automatic-text-filler-n-grams-1.png\" alt=\"\" title=\"\"><\/p>\n<p>\u0634\u0645\u0627 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u0633\u0647\u200c\u06af\u0631\u0627\u0645\u200c\u0647\u0627 \u0631\u0627 \u0628\u0647\u200c\u0639\u0646\u0648\u0627\u0646 \u06a9\u0644\u06cc\u062f\u060c \u0648 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc \u0645\u0631\u0628\u0648\u0637\u0647 \u0631\u0627 \u06a9\u0647 \u0628\u0639\u062f \u0627\u0632 \u0633\u0647\u200c\u06af\u0648\u0634\u200c\u0647\u0627 \u062f\u0631 \u0645\u062a\u0646 \u0631\u062e \u0645\u06cc\u200c\u062f\u0647\u0646\u062f\u060c \u0628\u0647\u200c\u0639\u0646\u0648\u0627\u0646 \u0645\u0642\u0627\u062f\u06cc\u0631 \u0628\u0628\u06cc\u0646\u06cc\u062f.  \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u06a9\u0644\u06cc\u062f\u0647\u0627\u06cc\u06cc \u0631\u0627 \u0628\u0627 \u062f\u0648 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u062f\u0631 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0628\u0628\u06cc\u0646\u06cc\u062f \u0627\u0645\u0627 \u062f\u0631 \u0648\u0627\u0642\u0639 \u062f\u0648 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0646\u06cc\u0633\u062a\u0646\u062f.  
\u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0633\u0648\u0645 \u062f\u0631 \u0648\u0627\u0642\u0639 \u06cc\u06a9 \u0641\u0627\u0635\u0644\u0647 \u0627\u0633\u062a.<\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u06a9\u0646\u0648\u0646 \u0633\u0639\u06cc \u06a9\u0646\u06cc\u0645 \u0645\u062a\u0646 \u0631\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0633\u0647 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0627\u0648\u0644 \u0645\u062c\u0645\u0648\u0639\u0647 \u062e\u0648\u062f \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0648\u0631\u0648\u062f\u06cc \u062a\u0648\u0644\u06cc\u062f \u06a9\u0646\u06cc\u0645.  \u0633\u0647 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0627\u0648\u0644 \u0645\u062c\u0645\u0648\u0639\u0647 \u0645\u0627 &#8220;ten&#8221; \u0647\u0633\u062a\u0646\u062f.  \u0628\u0647 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u06af\u0627\u0647 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">curr_sequence = article_text[<span class=\"hljs-number\">0<\/span>:chars]\noutput = curr_sequence\n<span class=\"hljs-keyword\">for<\/span> i <span class=\"hljs-keyword\">in<\/span> <span class=\"hljs-built_in\">range<\/span>(<span class=\"hljs-number\">200<\/span>):\n    <span class=\"hljs-keyword\">if<\/span> curr_sequence <span class=\"hljs-keyword\">not<\/span> <span class=\"hljs-keyword\">in<\/span> ngrams.keys():\n        <span class=\"hljs-keyword\">break<\/span>\n    possible_chars = ngrams[curr_sequence]\n    next_char = possible_chars[random.randrange(<span class=\"hljs-built_in\">len<\/span>(possible_chars))]\n    output += next_char\n    curr_sequence = output[<span class=\"hljs-built_in\">len<\/span>(output)-chars:<span class=\"hljs-built_in\">len<\/span>(output)]\n\n<span class=\"hljs-built_in\">print<\/span>(output)\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0645\u0627 \u0627\u0628\u062a\u062f\u0627 \u0627\u0648\u0644\u06cc\u0646 
\u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u06cc\u0639\u0646\u06cc \u0630\u062e\u06cc\u0631\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645 <code>ten<\/code> \u0628\u0647 \u062f\u0631\u0648\u0646 <code>curr_sequence<\/code> \u0645\u062a\u063a\u06cc\u0631.  \u0645\u0627 \u06cc\u06a9 \u0645\u062a\u0646 \u0627\u0632 \u062f\u0648\u06cc\u0633\u062a \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u062a\u0648\u0644\u06cc\u062f \u0645\u06cc \u06a9\u0646\u06cc\u0645\u060c \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u06cc\u06a9 \u062d\u0644\u0642\u0647 \u0631\u0627 \u0631\u0627\u0647 \u0627\u0646\u062f\u0627\u0632\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u06a9\u0647 200 \u0628\u0627\u0631 \u062a\u06a9\u0631\u0627\u0631 \u0645\u06cc \u0634\u0648\u062f.  \u062f\u0631 \u0637\u0648\u0644 \u0647\u0631 \u062a\u06a9\u0631\u0627\u0631\u060c \u0628\u0631\u0631\u0633\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u06a9\u0647 \u0622\u06cc\u0627 <code>curr_sequence<\/code> \u06cc\u0627 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u062f\u0631 <code>ngrams<\/code> \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a.  \u0627\u06af\u0631 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u062f\u0631 \u06cc\u0627\u0641\u062a \u0646\u0634\u062f <code>ngrams<\/code> \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a\u060c \u0645\u0627 \u0628\u0647 \u0633\u0627\u062f\u06af\u06cc \u0627\u0632 \u062d\u0644\u0642\u0647 \u062e\u0627\u0631\u062c \u0645\u06cc \u0634\u0648\u06cc\u0645.<\/p>\n<p>\u0628\u0639\u062f\u060c <code>curr_sequence<\/code> \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06a9\u0644\u06cc\u062f \u0628\u0647 <code>ngrams<\/code> \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a\u060c \u06a9\u0647 \u0644\u06cc\u0633\u062a\u06cc \u0627\u0632 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc \u0627\u062d\u062a\u0645\u0627\u0644\u06cc \u0628\u0639\u062f\u06cc \u0631\u0627 \u0628\u0631\u0645\u06cc \u06af\u0631\u062f\u0627\u0646\u062f.  
\u0627\u0632 \u0644\u06cc\u0633\u062a \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc \u0627\u062d\u062a\u0645\u0627\u0644\u06cc \u0628\u0639\u062f\u06cc\u060c \u06cc\u06a9 \u0634\u0627\u062e\u0635 \u0628\u0647 \u0637\u0648\u0631 \u062a\u0635\u0627\u062f\u0641\u06cc \u0627\u0646\u062a\u062e\u0627\u0628 \u0645\u06cc \u0634\u0648\u062f \u06a9\u0647 \u0628\u0647 \u0622\u0646 \u0627\u0631\u0633\u0627\u0644 \u0645\u06cc \u0634\u0648\u062f <code>possible_chars<\/code> \u0644\u06cc\u0633\u062a\u06cc \u0628\u0631\u0627\u06cc \u0628\u062f\u0633\u062a \u0622\u0648\u0631\u062f\u0646 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0628\u0639\u062f\u06cc \u0628\u0631\u0627\u06cc \u0633\u0647 \u062e\u0637 \u0641\u0639\u0644\u06cc.  \u0633\u067e\u0633 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0628\u0639\u062f\u06cc \u0628\u0647 \u0639\u0644\u0627\u0645\u062a \u0627\u0636\u0627\u0641\u0647 \u0645\u06cc \u0634\u0648\u062f <code>output<\/code> \u0645\u062a\u063a\u06cc\u0631\u06cc \u06a9\u0647 \u062d\u0627\u0648\u06cc \u062e\u0631\u0648\u062c\u06cc \u0646\u0647\u0627\u06cc\u06cc \u0627\u0633\u062a.<\/p>\n<p>\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c <code>curr_sequence<\/code> \u0628\u0627 \u0633\u0647 \u06af\u0631\u0627\u0645 \u0628\u0639\u062f\u06cc \u0627\u0632 \u0645\u062c\u0645\u0648\u0639\u0647 \u0645\u062a\u0646 \u0628\u0647 \u0631\u0648\u0632 \u0645\u06cc \u0634\u0648\u062f.  
\u0627\u06af\u0631 \u0634\u0645\u0627 print \u0631\u0627 <code>output<\/code> \u0645\u062a\u063a\u06cc\u0631\u06cc \u06a9\u0647 \u0634\u0627\u0645\u0644 \u062f\u0648\u06cc\u0633\u062a \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u062a\u0648\u0644\u06cc\u062f \u0634\u062f\u0647 \u0628\u0647 \u0635\u0648\u0631\u062a \u062e\u0648\u062f\u06a9\u0627\u0631 \u0627\u0633\u062a\u060c \u0628\u0627\u06cc\u062f \u0686\u06cc\u0632\u06cc \u0634\u0628\u06cc\u0647 \u0628\u0647 \u0627\u06cc\u0646 \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u062f (\u0644\u0627\u0632\u0645 \u0628\u0647 \u0630\u06a9\u0631 \u0627\u0633\u062a \u06a9\u0647 \u0627\u0632 \u0622\u0646\u062c\u0627\u06cc\u06cc \u06a9\u0647 \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u0628\u0639\u062f\u06cc \u0628\u0647 \u0635\u0648\u0631\u062a \u062a\u0635\u0627\u062f\u0641\u06cc \u0627\u0646\u062a\u062e\u0627\u0628 \u0645\u06cc \u0634\u0648\u062f\u060c \u062e\u0631\u0648\u062c\u06cc \u0634\u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0645\u062a\u0641\u0627\u0648\u062a \u0628\u0627\u0634\u062f):<\/p>\n<p><strong>\u062e\u0631\u0648\u062c\u06cc:<\/strong><\/p>\n<pre><code class=\"hljs\">tent pointo somensiver tournamedal pare the greak in the next peak sweder most begal tennis sport. the be has siders with sidernaments as was that adming up is coach rackhanced ball of ment. a game and\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0648\u0631\u062f \u0686\u0646\u062f\u0627\u0646 \u0645\u0639\u0646\u06cc \u0646\u062f\u0627\u0631\u062f.  \u0627\u06af\u0631 \u0627\u0631\u0632\u0634 \u0622\u0646 \u0631\u0627 \u0627\u0641\u0632\u0627\u06cc\u0634 \u062f\u0647\u06cc\u062f <code>chars<\/code> \u0645\u062a\u063a\u06cc\u0631 \u0628\u0647 4. 
\u0634\u0645\u0627 \u0628\u0627\u06cc\u062f \u0646\u062a\u0627\u06cc\u062c \u0645\u0634\u0627\u0628\u0647 \u062e\u0631\u0648\u062c\u06cc \u0647\u0627\u06cc \u0632\u06cc\u0631 \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">tennis ahead with the club players under.most coaching motion us . the especific at the hit and events first predomination but of ends on the u.s. cyclops have achieved the end or net inches call over age\n<\/code><\/pre>\n<p>\u0645\u06cc \u0628\u06cc\u0646\u06cc\u062f \u06a9\u0647 \u0646\u062a\u0627\u06cc\u062c \u06a9\u0645\u06cc \u0628\u0647\u062a\u0631 \u0627\u0632 \u0646\u062a\u0627\u06cc\u062c\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 3 \u06af\u0631\u0627\u0645 \u0628\u0647 \u062f\u0633\u062a \u0622\u0648\u0631\u062f\u06cc\u0645.  \u0628\u0627 \u0627\u0641\u0632\u0627\u06cc\u0634 \u062a\u0639\u062f\u0627\u062f N-Gram\u060c \u067e\u06cc\u0634\u0646\u0647\u0627\u062f\/\u067e\u0631 \u06a9\u0631\u062f\u0646 \u0645\u062a\u0646 \u0645\u0627 \u0647\u0645\u0686\u0646\u0627\u0646 \u0628\u0647\u0628\u0648\u062f \u0645\u06cc \u06cc\u0627\u0628\u062f.<\/p>\n<p>\u062f\u0631 \u0642\u0633\u0645\u062a \u0628\u0639\u062f\u06cc \u0645\u062f\u0644 Words N-Grams \u0631\u0627 \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645.  
\u062e\u0648\u0627\u0647\u06cc\u062f \u062f\u06cc\u062f \u06a9\u0647 \u0645\u062a\u0646 \u062a\u0648\u0644\u06cc\u062f \u0634\u062f\u0647 \u062f\u0631 \u0645\u0648\u0631\u062f \u0645\u062f\u0644 Words N-Grams \u0628\u0633\u06cc\u0627\u0631 \u0645\u0639\u0646\u0627\u062f\u0627\u0631 \u062e\u0648\u0627\u0647\u062f \u0628\u0648\u062f.<\/p>\n<h3 id=\"wordsngramsmodel\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%af%d9%84_n-grams_%da%a9%d9%84%d9%85%d8%a7%d8%aa\"><\/span>\u0645\u062f\u0644 N-Grams \u06a9\u0644\u0645\u0627\u062a<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u062f\u0631 \u0645\u062f\u0644 Words N-Grams\u060c \u0647\u0631 \u06a9\u0644\u0645\u0647 \u062f\u0631 \u0645\u062a\u0646 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06cc\u06a9 \u0645\u0648\u0631\u062f \u062c\u062f\u0627\u06af\u0627\u0646\u0647 \u062f\u0631 \u0646\u0638\u0631 \u06af\u0631\u0641\u062a\u0647 \u0645\u06cc \u0634\u0648\u062f.  \u062f\u0631 \u0627\u06cc\u0646 \u0642\u0633\u0645\u062a \u0645\u062f\u0644 Words N-Grams \u0631\u0627 \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc \u06a9\u0631\u062f\u0647 \u0648 \u0627\u0632 \u0622\u0646 \u0628\u0631\u0627\u06cc \u0627\u06cc\u062c\u0627\u062f \u067e\u0631\u06a9\u0646\u0646\u062f\u0647 \u0645\u062a\u0646 \u062e\u0648\u062f\u06a9\u0627\u0631 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0627\u06cc \u06a9\u0647 \u0645\u06cc \u062e\u0648\u0627\u0647\u06cc\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645 \u0647\u0645\u0627\u0646 \u0645\u062c\u0645\u0648\u0639\u0647 \u0627\u06cc \u0627\u0633\u062a \u06a9\u0647 \u062f\u0631 \u0628\u062e\u0634 \u06af\u0630\u0634\u062a\u0647 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f\u06cc\u0645.<\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u0628\u062a\u062f\u0627 \u06cc\u06a9 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a 
\u0628\u0633\u0627\u0632\u06cc\u0645 \u06a9\u0647 \u062d\u0627\u0648\u06cc \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0647\u0627\u06cc \u06a9\u0644\u0645\u0647 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06a9\u0644\u06cc\u062f \u0648 \u0644\u06cc\u0633\u062a\u06cc \u0627\u0632 \u06a9\u0644\u0645\u0627\u062a\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0639\u062f \u0627\u0632 \u0633\u0647 \u062e\u0637 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u0642\u0627\u062f\u06cc\u0631 \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f.<\/p>\n<pre><code class=\"hljs\">ngrams = {}\nwords = <span class=\"hljs-number\">3<\/span>\n\nwords_tokens = nltk.word_tokenize(article_text)\n<span class=\"hljs-keyword\">for<\/span> i <span class=\"hljs-keyword\">in<\/span> <span class=\"hljs-built_in\">range<\/span>(<span class=\"hljs-built_in\">len<\/span>(words_tokens)-words):\n    seq = <span class=\"hljs-string\">' '<\/span>.join(words_tokens[i:i+words])\n    <span class=\"hljs-built_in\">print<\/span>(seq)\n    <span class=\"hljs-keyword\">if<\/span>  seq <span class=\"hljs-keyword\">not<\/span> <span class=\"hljs-keyword\">in<\/span> ngrams.keys():\n        ngrams[seq] = []\n    ngrams[seq].append(words_tokens[i+words])\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627\u060c \u06cc\u06a9 \u0645\u062f\u0644 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 Words \u0627\u06cc\u062c\u0627\u062f \u0645\u06cc \u06a9\u0646\u06cc\u0645.  \u0627\u06cc\u0646 process \u0645\u0634\u0627\u0628\u0647 \u0645\u0648\u0631\u062f\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0631\u0627\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0647\u0627\u06cc \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631 \u062f\u0646\u0628\u0627\u0644 \u0645\u06cc \u0634\u0648\u062f.  
\u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627\u060c \u0627\u0628\u062a\u062f\u0627 \u0645\u062c\u0645\u0648\u0639\u0647 \u062e\u0648\u062f \u0631\u0627 \u0628\u0647 \u06a9\u0644\u0645\u0627\u062a \u0646\u0634\u0627\u0646\u0647 \u06af\u0630\u0627\u0631\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u062f\u0631 \u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u060c \u062a\u0645\u0627\u0645 \u06a9\u0644\u0645\u0627\u062a \u0631\u0627 \u062a\u06a9\u0631\u0627\u0631 \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u0648 \u0633\u067e\u0633 \u0633\u0647 \u06a9\u0644\u0645\u0647 \u0641\u0639\u0644\u06cc \u0631\u0627 \u0628\u0647 \u0647\u0645 \u0645\u06cc \u067e\u06cc\u0648\u0646\u062f\u06cc\u0645 \u062a\u0627 \u06cc\u06a9 \u0633\u0647 \u062e\u0637 \u062a\u0634\u06a9\u06cc\u0644 \u062f\u0647\u06cc\u0645.  \u067e\u0633 \u0627\u0632 \u0622\u0646\u060c \u0628\u0631\u0631\u0633\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u06a9\u0647 \u0622\u06cc\u0627 \u06a9\u0644\u0645\u0647 trigram \u062f\u0631 \u0622\u0646 \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f \u06cc\u0627 \u062e\u06cc\u0631 <code>ngrams<\/code> \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a.  
\u0627\u06af\u0631 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0627\u0632 \u0642\u0628\u0644 \u0648\u062c\u0648\u062f \u0646\u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u062f\u060c \u0645\u0627 \u0628\u0647 \u0633\u0627\u062f\u06af\u06cc \u0622\u0646 \u0631\u0627 \u062f\u0631 \u0622\u0646 \u0642\u0631\u0627\u0631 \u0645\u06cc \u062f\u0647\u06cc\u0645 <code>ngrams<\/code> \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06cc\u06a9 \u06a9\u0644\u06cc\u062f<\/p>\n<p>\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0641\u0647\u0631\u0633\u062a\u06cc \u0627\u0632 \u06a9\u0644\u0645\u0627\u062a\u06cc \u0631\u0627 \u06a9\u0647 \u0627\u0632 \u0633\u0647 \u062e\u0637 \u067e\u06cc\u0631\u0648\u06cc \u0645\u06cc \u06a9\u0646\u0646\u062f \u062f\u0631 \u06a9\u0644 \u0645\u062c\u0645\u0648\u0639\u0647 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u0642\u062f\u0627\u0631 \u062f\u0631 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0627\u0636\u0627\u0641\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u062d\u0627\u0644\u0627 \u0627\u06af\u0631 \u0628\u0647 <code>ngrams<\/code> \u062f\u06cc\u06a9\u0634\u0646\u0631\u06cc\u060c \u062f\u0631 \u0627\u06a9\u0633\u067e\u0644\u0648\u0631\u0631 \u0645\u062a\u063a\u06cc\u0631\u060c \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u062e\u0648\u0627\u0647\u062f \u0628\u0648\u062f:<\/p>\n<p><img decoding=\"async\" class=\"img-responsive\" src=\"https:\/\/rasanegar.com\/blog\/wp-content\/uploads\/2024\/01\/python-nlp-developing-automatic-text-filler-n-grams-2.png\" alt=\"\" title=\"\"><\/p>\n<p>\u0634\u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 \u0647\u0627 \u0631\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06a9\u0644\u06cc\u062f\u0647\u0627\u06cc \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0648 \u06a9\u0644\u0645\u0627\u062a \u0645\u0631\u0628\u0648\u0637\u0647 \u0631\u0627 \u0628\u0647 
\u0639\u0646\u0648\u0627\u0646 \u0645\u0642\u0627\u062f\u06cc\u0631 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0646\u06cc\u062f.<\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u06a9\u0646\u0648\u0646 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u06a9\u0644\u0645\u0647 trigrams \u06a9\u0647 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0631\u062f\u06cc\u0645\u060c \u06cc\u06a9 \u067e\u0631\u06a9\u0646\u0646\u062f\u0647 \u0645\u062a\u0646 \u062e\u0648\u062f\u06a9\u0627\u0631 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645.<\/p>\n<pre><code class=\"hljs\">curr_sequence = <span class=\"hljs-string\">' '<\/span>.join(words_tokens[<span class=\"hljs-number\">0<\/span>:words])\noutput = curr_sequence\n<span class=\"hljs-keyword\">for<\/span> i <span class=\"hljs-keyword\">in<\/span> <span class=\"hljs-built_in\">range<\/span>(<span class=\"hljs-number\">50<\/span>):\n    <span class=\"hljs-keyword\">if<\/span> curr_sequence <span class=\"hljs-keyword\">not<\/span> <span class=\"hljs-keyword\">in<\/span> ngrams.keys():\n        <span class=\"hljs-keyword\">break<\/span>\n    possible_words = ngrams[curr_sequence]\n    next_word = possible_words[random.randrange(<span class=\"hljs-built_in\">len<\/span>(possible_words))]\n    output += <span class=\"hljs-string\">' '<\/span> + next_word\n    seq_words = nltk.word_tokenize(output)\n    curr_sequence = <span class=\"hljs-string\">' '<\/span>.join(seq_words[<span class=\"hljs-built_in\">len<\/span>(seq_words)-words:<span class=\"hljs-built_in\">len<\/span>(seq_words)])\n\n<span class=\"hljs-built_in\">print<\/span>(output)\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627\u060c \u0645\u0642\u062f\u0627\u0631 \u0631\u0627 \u0645\u0642\u062f\u0627\u0631\u062f\u0647\u06cc \u0627\u0648\u0644\u06cc\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645 <code>curr_sequence<\/code> 
\u0645\u062a\u063a\u06cc\u0631 \u0628\u0627 \u0633\u0647 \u06af\u0631\u0627\u0645 \u0627\u0648\u0644 \u062f\u0631 \u0628\u062f\u0646\u0647.  \u0627\u0648\u0644\u06cc\u0646 \u062a\u0631\u06cc\u06af\u0631\u0627\u0645 &#8220;tennis is a&#8221; \u0627\u0633\u062a.  \u0645\u0627 50 \u06a9\u0644\u0645\u0647 \u0631\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0633\u0647 \u062e\u0637 \u0627\u0648\u0644 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0648\u0631\u0648\u062f\u06cc \u062a\u0648\u0644\u06cc\u062f \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.  \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0627\u06cc\u0646 \u06a9\u0627\u0631\u060c \u06cc\u06a9 \u062d\u0644\u0642\u0647 for \u0631\u0627 \u0627\u062c\u0631\u0627 \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u06a9\u0647 50 \u0628\u0627\u0631 \u0627\u062c\u0631\u0627 \u0645\u06cc \u0634\u0648\u062f.  \u062f\u0631 \u0637\u0648\u0644 \u0647\u0631 \u062a\u06a9\u0631\u0627\u0631\u060c \u0627\u0628\u062a\u062f\u0627 \u0628\u0631\u0631\u0633\u06cc \u0645\u06cc \u0634\u0648\u062f \u06a9\u0647 \u0622\u06cc\u0627 \u06a9\u0644\u0645\u0647 trigram \u062f\u0631 \u0622\u0646 \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f \u06cc\u0627 \u062e\u06cc\u0631 <code>ngrams<\/code> \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a.  \u0627\u06af\u0631 \u0646\u0647\u060c \u062d\u0644\u0642\u0647 \u0645\u06cc \u0634\u06a9\u0646\u062f.  
\u062f\u0631 \u063a\u06cc\u0631 \u0627\u06cc\u0646 \u0635\u0648\u0631\u062a\u060c \u0641\u0647\u0631\u0633\u062a \u06a9\u0644\u0645\u0627\u062a\u06cc \u06a9\u0647 \u0627\u062d\u062a\u0645\u0627\u0644\u0627\u064b \u067e\u0633 \u0627\u0632 \u0633\u0647\u200c\u06af\u0631\u0627\u0645 \u062f\u0646\u0628\u0627\u0644 \u0645\u06cc\u200c\u0634\u0648\u0646\u062f\u060c \u0627\u0632 \u0642\u0633\u0645\u062a \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0645\u06cc\u200c\u0634\u0648\u0646\u062f <code>ngrams<\/code> \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0628\u0627 \u0639\u0628\u0648\u0631 \u0627\u0632 \u0633\u0647 \u062e\u0637 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u0642\u062f\u0627\u0631.  \u0627\u0632 \u0644\u06cc\u0633\u062a \u06a9\u0644\u0645\u0627\u062a \u0645\u0645\u06a9\u0646\u060c \u06cc\u06a9 \u06a9\u0644\u0645\u0647 \u0628\u0647 \u0635\u0648\u0631\u062a \u062a\u0635\u0627\u062f\u0641\u06cc \u0627\u0646\u062a\u062e\u0627\u0628 \u0634\u062f\u0647 \u0648 \u062f\u0631 \u0627\u0646\u062a\u0647\u0627\u06cc out \u0627\u0636\u0627\u0641\u0647 \u0645\u06cc \u0634\u0648\u062f.  \u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c <code>curr_sequence<\/code> \u0645\u062a\u063a\u06cc\u0631 \u0628\u0627 \u0645\u0642\u062f\u0627\u0631 \u0633\u0647 \u06af\u0631\u0627\u0645 \u0628\u0639\u062f\u06cc \u062f\u0631 \u0641\u0631\u0647\u0646\u06af \u0644\u063a\u062a \u0628\u0647 \u0631\u0648\u0632 \u0645\u06cc \u0634\u0648\u062f.<\/p>\n<p>\u0645\u062a\u0646 \u062a\u0648\u0644\u06cc\u062f \u0634\u062f\u0647 \u0628\u0647 \u0627\u06cc\u0646 \u0634\u06a9\u0644 \u0627\u0633\u062a.  
\u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0628\u06cc\u0646\u06cc\u062f \u06a9\u0647 \u062f\u0631 \u0645\u0648\u0631\u062f \u0633\u0647\u200c\u06af\u0631\u0627\u0645\u200c\u0647\u0627\u06cc \u06a9\u0644\u0645\u0647\u060c \u0645\u062a\u0646\u06cc \u06a9\u0647 \u0628\u0647\u200c\u0637\u0648\u0631 \u062e\u0648\u062f\u06a9\u0627\u0631 \u062a\u0648\u0644\u06cc\u062f \u0645\u06cc\u200c\u0634\u0648\u062f \u0628\u0633\u06cc\u0627\u0631 \u0645\u0639\u0646\u0627\u062f\u0627\u0631\u062a\u0631 \u0627\u0633\u062a.<\/p>\n<p><strong>\u062e\u0631\u0648\u062c\u06cc:<\/strong><\/p>\n<pre><code class=\"hljs\">tennis is a racket sport that can be played individually against a single opponent singles or between two teams of two players each doubles. each player uses a tennis racket include a handle known as the grip connected to a neck which joins a roughly elliptical frame that holds a matrix of\n<\/code><\/pre>\n<p>\u0627\u06af\u0631 \u0645\u0642\u062f\u0627\u0631 \u0645\u062a\u063a\u06cc\u0631 \u06a9\u0644\u0645\u0627\u062a \u0631\u0627 \u0628\u0631 \u0631\u0648\u06cc 4 \u062a\u0646\u0638\u06cc\u0645 \u06a9\u0646\u06cc\u062f (\u0627\u0632 4 \u06af\u0631\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f) \u0628\u0631\u0627\u06cc \u062a\u0648\u0644\u06cc\u062f \u0645\u062a\u0646\u060c \u062e\u0631\u0648\u062c\u06cc \u0634\u0645\u0627 \u0645\u0627\u0646\u0646\u062f \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0642\u0648\u06cc \u062a\u0631 \u0628\u0647 \u0646\u0638\u0631 \u0645\u06cc \u0631\u0633\u062f:<\/p>\n<pre><code class=\"hljs\">tennis is a racket sport that can be played individually against a single opponent singles or between two teams of two players each doubles . 
each player uses a tennis racket that is strung with cord to strike a hollow rubber ball covered with felt over or around a net and into the opponents\n<\/code><\/pre>\n<p>\u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0628\u06cc\u0646\u06cc\u062f \u06a9\u0647 \u062e\u0631\u0648\u062c\u06cc \u0628\u0627 4 \u06af\u0631\u0645 \u0645\u0646\u0637\u0642\u06cc \u062a\u0631 \u0627\u0633\u062a.  \u0627\u06cc\u0646 \u0639\u0645\u062f\u062a\u0627\u064b \u0628\u0647 \u0627\u06cc\u0646 \u062f\u0644\u06cc\u0644 \u0627\u0633\u062a \u06a9\u0647 \u0645\u0648\u0644\u062f \u0645\u0627 \u0639\u0645\u062f\u062a\u0627\u064b \u0647\u0645\u0627\u0646 \u0645\u062a\u0646 \u0631\u0627 \u0627\u0632 \u0645\u0642\u0627\u0644\u0647 \u0648\u06cc\u06a9\u06cc\u200c\u067e\u062f\u06cc\u0627 \u0628\u0627\u0632\u0633\u0627\u0632\u06cc \u0645\u06cc\u200c\u06a9\u0646\u062f\u060c \u0627\u0645\u0627 \u0628\u0627 \u0628\u0631\u062e\u06cc \u067e\u06cc\u0634\u0631\u0641\u062a\u200c\u0647\u0627\u06cc \u062c\u0632\u0626\u06cc \u062f\u0631 \u0645\u0648\u0644\u062f\u060c \u0648 \u0645\u062c\u0645\u0648\u0639\u0647 \u0628\u0632\u0631\u06af\u200c\u062a\u0631\u060c \u0645\u0648\u0644\u062f \u0645\u0627 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u062f \u0628\u0647 \u0631\u0627\u062d\u062a\u06cc \u062c\u0645\u0644\u0627\u062a \u062c\u062f\u06cc\u062f \u0648 \u0645\u0646\u062d\u0635\u0631\u0628\u0647\u200c\u0641\u0631\u062f \u0631\u0627 \u0646\u06cc\u0632 \u062a\u0648\u0644\u06cc\u062f \u06a9\u0646\u062f.<\/p>\n<h2 id=\"conclusion\"><span class=\"ez-toc-section\" id=\"%d9%86%d8%aa%db%8c%d8%ac%d9%87\"><\/span>\u0646\u062a\u06cc\u062c\u0647<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0645\u062f\u0644 N-Grams \u06cc\u06a9\u06cc \u0627\u0632 \u067e\u0631\u06a9\u0627\u0631\u0628\u0631\u062f\u062a\u0631\u06cc\u0646 \u0645\u062f\u0644\u200c\u0647\u0627\u06cc \u062c\u0645\u0644\u0647 \u0628\u0647 \u0628\u0631\u062f\u0627\u0631\u06cc \u0627\u0633\u062a \u0632\u06cc\u0631\u0627 
\u0632\u0645\u06cc\u0646\u0647 \u0628\u06cc\u0646 N-\u06a9\u0644\u0645\u0627\u062a \u0631\u0627 \u062f\u0631 \u06cc\u06a9 \u062c\u0645\u0644\u0647 \u0646\u0634\u0627\u0646 \u0645\u06cc\u200c\u062f\u0647\u062f.  \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0646\u0638\u0631\u06cc\u0647 \u0645\u062f\u0644 N-Grams \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0631\u062f\u06cc\u062f.  \u0647\u0645\u0686\u0646\u06cc\u0646 \u0631\u0648\u0634 \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc \u06a9\u0627\u0631\u0627\u06a9\u062a\u0631\u0647\u0627\u06cc N-Grams \u0648 Words N-Grams \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0631\u062f\u06cc\u062f.  \u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0631\u0648\u0634 \u0627\u06cc\u062c\u0627\u062f \u067e\u0631\u06a9\u0646\u0646\u062f\u0647 \u0645\u062a\u0646 \u062e\u0648\u062f\u06a9\u0627\u0631 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0647\u0631 \u062f\u0648 \u0631\u0648\u0634 \u0631\u0627 \u0645\u0637\u0627\u0644\u0639\u0647 \u06a9\u0631\u062f\u06cc\u062f.<\/p>\n<\/div>\n<p><script>\n                        !function(f,b,e,v,n,t,s)\n                        {if(f.fbq)return;n=f.fbq=function(){n.callMethod?\n                        n.callMethod.apply(n,arguments):n.queue.push(arguments)};\n                        if(!f._fbq)f._fbq=n;n.push=n;n.loaded=!0;n.version='2.0';\n                        n.queue=[];t=b.createElement(e);t.async=!0;\n                        t.src=v;s=b.getElementsByTagName(e)[0];\n                        s.parentNode.insertBefore(t,s)}(window, document,'script',\n                        'https:\/\/connect.facebook.net\/en_US\/fbevents.js');\n                        fbq('init', '525232124909042');\n                        fbq('track', 'PageView');\n                    <\/script>    (\u0628\u0631\u0686\u0633\u0628\u200c\u0647\u0627 \u0628\u0647 \u062a\u0631\u062c\u0645\u0647)# python<br \/>\n<br \/><br \/>\n<br 
\/>\u0645\u0646\u062a\u0634\u0631 \u0634\u062f\u0647 \u062f\u0631 1403-01-21 15:35:50<br \/>\n<\/p>\n\n\n<div class=\"kk-star-ratings kksr-auto kksr-align-center kksr-valign-bottom\"\n    data-payload='{&quot;align&quot;:&quot;center&quot;,&quot;id&quot;:&quot;16164&quot;,&quot;slug&quot;:&quot;default&quot;,&quot;valign&quot;:&quot;bottom&quot;,&quot;ignore&quot;:&quot;&quot;,&quot;reference&quot;:&quot;auto&quot;,&quot;class&quot;:&quot;&quot;,&quot;count&quot;:&quot;0&quot;,&quot;legendonly&quot;:&quot;&quot;,&quot;readonly&quot;:&quot;&quot;,&quot;score&quot;:&quot;0&quot;,&quot;starsonly&quot;:&quot;&quot;,&quot;best&quot;:&quot;5&quot;,&quot;gap&quot;:&quot;5&quot;,&quot;greet&quot;:&quot;\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628&quot;,&quot;legend&quot;:&quot;0\\\/5 (0 \u0631\u0627\u06cc)&quot;,&quot;size&quot;:&quot;30&quot;,&quot;title&quot;:&quot;\u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP: \u062a\u0648\u0633\u0639\u0647 \u06cc\u06a9 \u067e\u0631\u06a9\u0646\u0646\u062f\u0647 \u0645\u062a\u0646 \u062e\u0648\u062f\u06a9\u0627\u0631 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 N-Gram&quot;,&quot;width&quot;:&quot;0&quot;,&quot;_legend&quot;:&quot;{score}\\\/{best} ({count} \u0631\u0627\u06cc)&quot;,&quot;font_factor&quot;:&quot;1.25&quot;}'>\n            \n<div class=\"kksr-stars\">\n    \n<div class=\"kksr-stars-inactive\">\n            <div class=\"kksr-star\" data-star=\"1\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"2\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"3\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 
30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"4\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"5\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n    \n<div class=\"kksr-stars-active\" style=\"width: 0px;\">\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n<\/div>\n                \n\n<div class=\"kksr-legend\" style=\"font-size: 24px;\">\n            <span class=\"kksr-muted\">\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628<\/span>\n    <\/div>\n    <\/div>\n","protected":false},"excerpt":{"rendered":"<p><span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 8<\/span> <span class=\"rt-label 
rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span>\u0627\u06cc\u0646 \u067e\u0627\u0646\u0632\u062f\u0647\u0645\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0632 \u0633\u0631\u06cc \u0645\u0642\u0627\u0644\u0627\u062a \u0645\u0646 \u062f\u0631\u0628\u0627\u0631\u0647 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP \u0627\u0633\u062a. \u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0642\u0628\u0644\u06cc\u200c\u0627\u0645 \u0631\u0648\u0634 \u067e\u06cc\u0627\u062f\u0647\u200c\u0633\u0627\u0632\u06cc \u0631\u0648\u06cc\u06a9\u0631\u062f TF-IDF \u0631\u0627 \u0627\u0632 \u0627\u0628\u062a\u062f\u0627 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u062a\u0648\u0636\u06cc\u062d \u062f\u0627\u062f\u0645. \u0642\u0628\u0644 \u0627\u0632 \u0622\u0646\u060c \u0631\u0648\u0634 \u067e\u06cc\u0627\u062f\u0647\u200c\u0633\u0627\u0632\u06cc \u0631\u0648\u06cc\u06a9\u0631\u062f \u06a9\u06cc\u0633\u0647 \u06a9\u0644\u0645\u0627\u062a \u0631\u0627 \u0627\u0632 \u0627\u0628\u062a\u062f\u0627 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0645\u0637\u0627\u0644\u0639\u0647 \u06a9\u0631\u062f\u06cc\u0645. 
\u0627\u0645\u0631\u0648\u0632\u060c \u0631\u0648\u06cc\u06a9\u0631\u062f N-Grams \u0631\u0627 \u0645\u0637\u0627\u0644\u0639\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f \u0648 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 [&hellip;]<\/p>\n","protected":false},"author":3,"featured_media":16165,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1743,620],"tags":[],"class_list":["post-16164","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-python","category-programming"],"acf":[],"_links":{"self":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/16164","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/users\/3"}],"replies":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/comments?post=16164"}],"version-history":[{"count":0,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/16164\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media\/16165"}],"wp:attachment":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media?parent=16164"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/categories?post=16164"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/tags?post=16164"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}