{"id":16368,"date":"2024-01-24T04:03:12","date_gmt":"2024-01-24T00:33:12","guid":{"rendered":"https:\/\/rasanegar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/"},"modified":"2024-01-24T04:03:12","modified_gmt":"2024-01-24T00:33:12","slug":"%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy","status":"publish","type":"post","link":"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/","title":{"rendered":"\u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP: \u062a\u0637\u0628\u06cc\u0642 \u0648\u0627\u0698\u06af\u0627\u0646 \u0648 \u0639\u0628\u0627\u0631\u062a \u0628\u0627 SpaCy"},"content":{"rendered":"<div id=\"ez-toc-container\" class=\"ez-toc-v2_0_85 counter-hierarchy ez-toc-counter ez-toc-custom ez-toc-container-direction\">\n<div class=\"ez-toc-title-container\"><p class=\"ez-toc-title\" style=\"cursor:inherit\">\u0633\u0631\u0641\u0635\u0644\u0647\u0627\u06cc \u0645\u0637\u0644\u0628<\/p>\n<\/div><nav><ul class='ez-toc-list ez-toc-list-level-1 ' ><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-1\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/#%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d9%85%d8%a8%d8%aa%d9%86%db%8c_%d8%a8%d8%b1_%d9%82%d8%a7%d9%86%d9%88%d9%86\" >\u062a\u0637\u0628\u06cc\u0642 \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u0642\u0627\u0646\u0648\u0646<\/a><ul 
class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-2\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/#%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%d8%b4%db%8c%d8%a1_%d9%85%d8%b7%d8%a7%d8%a8%d9%82%d8%aa\" >\u0627\u06cc\u062c\u0627\u062f \u0634\u06cc\u0621 \u0645\u0637\u0627\u0628\u0642\u062a<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-3\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/#%d8%aa%d8%b9%d8%b1%db%8c%d9%81_%d8%a7%d9%84%da%af%d9%88%d9%87%d8%a7\" >\u062a\u0639\u0631\u06cc\u0641 \u0627\u0644\u06af\u0648\u0647\u0627<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-4\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/#%d8%a7%d8%b9%d9%85%d8%a7%d9%84_%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d8%af%d8%b1_%d8%b3%d9%86%d8%af\" >\u0627\u0639\u0645\u0627\u0644 \u062a\u0637\u0628\u06cc\u0642 \u062f\u0631 \u0633\u0646\u062f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-5\" 
href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/#%da%af%d8%b2%db%8c%d9%86%d9%87_%d9%87%d8%a7%db%8c_%d8%a8%db%8c%d8%b4%d8%aa%d8%b1_%d8%a8%d8%b1%d8%a7%db%8c_%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d9%85%d8%a8%d8%aa%d9%86%db%8c_%d8%a8%d8%b1_%d9%82%d8%a7%d9%86%d9%88%d9%86\" >\u06af\u0632\u06cc\u0646\u0647 \u0647\u0627\u06cc \u0628\u06cc\u0634\u062a\u0631 \u0628\u0631\u0627\u06cc \u062a\u0637\u0628\u06cc\u0642 \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u0642\u0627\u0646\u0648\u0646<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-6\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/#%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d9%85%d8%a8%d8%aa%d9%86%db%8c_%d8%a8%d8%b1_%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa\" >\u062a\u0637\u0628\u06cc\u0642 \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u0639\u0628\u0627\u0631\u062a<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-7\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/#%d8%b4%db%8c%d8%a1_%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa_%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%da%a9%d9%86%db%8c%d8%af\" >\u0634\u06cc\u0621 \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-8\" 
href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/#%d9%81%d9%87%d8%b1%d8%b3%d8%aa_%d8%b9%d8%a8%d8%a7%d8%b1%d8%a7%d8%aa_%d8%b1%d8%a7_%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%da%a9%d9%86%db%8c%d8%af\" >\u0641\u0647\u0631\u0633\u062a \u0639\u0628\u0627\u0631\u0627\u062a \u0631\u0627 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-9\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/#%d8%a7%d8%b9%d9%85%d8%a7%d9%84_%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d8%af%d8%b1_%d8%b3%d9%86%d8%af-2\" >\u0627\u0639\u0645\u0627\u0644 \u062a\u0637\u0628\u06cc\u0642 \u062f\u0631 \u0633\u0646\u062f<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-10\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/#%da%a9%d9%84%d9%85%d8%a7%d8%aa_%d8%b1%d8%a7_%d9%85%d8%aa%d9%88%d9%82%d9%81_%da%a9%d9%86%db%8c%d8%af\" >\u06a9\u0644\u0645\u0627\u062a \u0631\u0627 \u0645\u062a\u0648\u0642\u0641 \u06a9\u0646\u06cc\u062f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-11\" href=\"https:\/\/rasanegaar.com\/blog\/%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86-%d8%a8%d8%b1%d8%a7%db%8c-nlp-%d8%aa%d8%b7%d8%a8%db%8c%d9%82-%d9%88%d8%a7%da%98%da%af%d8%a7%d9%86-%d9%88-%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa-%d8%a8%d8%a7-spacy\/#%d9%86%d8%aa%db%8c%d8%ac%d9%87\" 
>\u0646\u062a\u06cc\u062c\u0647<\/a><\/li><\/ul><\/nav><\/div>\n<span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 8<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span><p> <br \/>\n<\/p>\n<div><noscript><\/noscript><\/p>\n<p>\u0627\u06cc\u0646 \u0633\u0648\u0645\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0632 \u0627\u06cc\u0646 \u0633\u0631\u06cc \u0645\u0642\u0627\u0644\u0627\u062a \u0627\u0633\u062a \u0631\u0648\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc \u067e\u0631\u062f\u0627\u0632\u0634 \u0632\u0628\u0627\u0646 \u0637\u0628\u06cc\u0639\u06cc  \u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0642\u0628\u0644\u06cc \u062f\u06cc\u062f\u06cc\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 NLTK \u067e\u0627\u06cc\u062a\u0648\u0646 \u0648 <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/spacy.io\/\">\u0641\u0636\u0627\u06cc\u06cc<\/a> \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0648\u0638\u0627\u06cc\u0641 \u0633\u0627\u062f\u0647 NLP \u0645\u0627\u0646\u0646\u062f <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/en.wikipedia.org\/wiki\/Lexical_analysis#Tokenization\">\u0646\u0634\u0627\u0646\u0647 \u06af\u0630\u0627\u0631\u06cc<\/a>\u060c <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/nlp.stanford.edu\/IR-book\/html\/htmledition\/stemming-and-lemmatization-1.html\">\u0631\u06cc\u0634\u0647 \u06cc\u0627\u0628\u06cc \u0648 \u0631\u06cc\u0634\u0647 \u06cc\u0627\u0628\u06cc<\/a>.  
\u0645\u0627 \u0647\u0645\u0686\u0646\u06cc\u0646 \u062f\u06cc\u062f\u06cc\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646 \u0628\u062e\u0634\u200c\u0647\u0627\u06cc\u06cc \u0627\u0632 \u0628\u0631\u0686\u0633\u0628\u200c\u06af\u0630\u0627\u0631\u06cc \u06af\u0641\u062a\u0627\u0631\u060c \u0634\u0646\u0627\u0633\u0627\u06cc\u06cc \u0645\u0648\u062c\u0648\u062f\u06cc\u062a \u0646\u0627\u0645\u200c\u06af\u0630\u0627\u0631\u06cc \u0634\u062f\u0647 \u0648 \u062a\u062c\u0632\u06cc\u0647 \u0627\u0633\u0645 \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u062f\u0627\u062f.  \u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u062a\u0645\u0627\u0645 \u0627\u06cc\u0646 \u0639\u0645\u0644\u06cc\u0627\u062a \u0627\u0646\u062c\u0627\u0645 \u0645\u06cc \u0634\u0648\u062f \u0631\u0648\u06cc \u06a9\u0644\u0645\u0627\u062a \u0641\u0631\u062f\u06cc<\/p>\n<p>\u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647\u060c \u06cc\u06a9 \u0642\u062f\u0645 \u062c\u0644\u0648\u062a\u0631 \u0631\u0641\u062a\u0647 \u0648 \u0648\u0627\u0698\u06af\u0627\u0646 \u0648 \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u0627\u062a \u0631\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 spaCy \u0628\u0631\u0631\u0633\u06cc \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.  \u0645\u0627 \u0627\u0644\u06af\u0648\u0647\u0627 \u0631\u0627 \u062a\u0639\u0631\u06cc\u0641 \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u0648 \u0633\u067e\u0633 \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u06cc\u062f \u06a9\u0647 \u06a9\u062f\u0627\u0645 \u0639\u0628\u0627\u0631\u0627\u062a \u0628\u0627 \u0627\u0644\u06af\u0648\u06cc \u062a\u0639\u0631\u06cc\u0641 \u0634\u062f\u0647 \u0645\u0637\u0627\u0628\u0642\u062a \u062f\u0627\u0631\u0646\u062f.  
\u0627\u06cc\u0646 \u0634\u0628\u06cc\u0647 \u0628\u0647 \u062a\u0639\u0631\u06cc\u0641 \u0639\u0628\u0627\u0631\u0627\u062a \u0645\u0646\u0638\u0645 \u0627\u0633\u062a \u06a9\u0647 \u0634\u0627\u0645\u0644 \u0628\u062e\u0634 \u0647\u0627\u06cc\u06cc \u0627\u0632 \u06af\u0641\u062a\u0627\u0631 \u0627\u0633\u062a.<\/p>\n<h2 id=\"rulebasedmatching\"><span class=\"ez-toc-section\" id=\"%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d9%85%d8%a8%d8%aa%d9%86%db%8c_%d8%a8%d8%b1_%d9%82%d8%a7%d9%86%d9%88%d9%86\"><\/span>\u062a\u0637\u0628\u06cc\u0642 \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u0642\u0627\u0646\u0648\u0646<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 spaCy \u0647\u0645\u0631\u0627\u0647 \u0628\u0627 \u06cc\u06a9 <code>Matcher<\/code> \u0627\u0628\u0632\u0627\u0631\u06cc \u06a9\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0628\u0631\u0627\u06cc \u062a\u0639\u06cc\u06cc\u0646 \u0642\u0648\u0627\u0646\u06cc\u0646 \u0633\u0641\u0627\u0631\u0634\u06cc \u0628\u0631\u0627\u06cc \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0634\u0648\u062f.  \u0627\u06cc\u0646 process \u0628\u0631\u0627\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 <code>Matcher<\/code> \u0627\u0628\u0632\u0627\u0631 \u0628\u0633\u06cc\u0627\u0631 \u0645\u0633\u062a\u0642\u06cc\u0645 \u0627\u0633\u062a.  \u0627\u0648\u0644\u06cc\u0646 \u06a9\u0627\u0631\u06cc \u06a9\u0647 \u0628\u0627\u06cc\u062f \u0627\u0646\u062c\u0627\u0645 \u062f\u0647\u06cc\u062f \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 \u0627\u0644\u06af\u0648\u0647\u0627\u06cc\u06cc \u0631\u0627 \u06a9\u0647 \u0645\u06cc \u062e\u0648\u0627\u0647\u06cc\u062f \u0645\u0637\u0627\u0628\u0642\u062a \u062f\u0647\u06cc\u062f\u060c \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u062f.  
\u0628\u0639\u062f\u060c \u0634\u0645\u0627 \u0628\u0627\u06cc\u062f \u0627\u0644\u06af\u0648\u0647\u0627 \u0631\u0627 \u0628\u0647 \u0622\u0646 \u0627\u0636\u0627\u0641\u0647 \u06a9\u0646\u06cc\u062f <code>Matcher<\/code> \u0627\u0628\u0632\u0627\u0631 \u0648 \u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0634\u0645\u0627 \u0628\u0627\u06cc\u062f \u0622\u0646 \u0631\u0627 \u0627\u0639\u0645\u0627\u0644 \u06a9\u0646\u06cc\u062f <code>Matcher<\/code> \u0627\u0628\u0632\u0627\u0631\u06cc \u0628\u0631\u0627\u06cc \u0633\u0646\u062f\u06cc \u06a9\u0647 \u0645\u06cc\u200c\u062e\u0648\u0627\u0647\u06cc\u062f \u0642\u0648\u0627\u0646\u06cc\u0646 \u062e\u0648\u062f \u0631\u0627 \u0628\u0627 \u0622\u0646 \u0645\u0637\u0627\u0628\u0642\u062a \u062f\u0647\u06cc\u062f.  \u0627\u06cc\u0646 \u0628\u0647 \u0628\u0647\u062a\u0631\u06cc\u0646 \u0634\u06a9\u0644 \u0628\u0627 \u06a9\u0645\u06a9 \u06cc\u06a9 \u0645\u062b\u0627\u0644 \u062a\u0648\u0636\u06cc\u062d \u062f\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f.<\/p>\n<p>\u0628\u0631\u0627\u06cc \u062a\u0637\u0628\u06cc\u0642 \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u0642\u0627\u0646\u0648\u0646\u060c \u0628\u0627\u06cc\u062f \u0645\u0631\u0627\u062d\u0644 \u0632\u06cc\u0631 \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u062f\u0647\u06cc\u062f:<\/p>\n<h3 id=\"creatingmatcherobject\"><span class=\"ez-toc-section\" id=\"%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%d8%b4%db%8c%d8%a1_%d9%85%d8%b7%d8%a7%d8%a8%d9%82%d8%aa\"><\/span>\u0627\u06cc\u062c\u0627\u062f \u0634\u06cc\u0621 \u0645\u0637\u0627\u0628\u0642\u062a<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0627\u0648\u0644\u06cc\u0646 \u06af\u0627\u0645 \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 \u0634\u06cc\u0621 \u0645\u0637\u0627\u0628\u0642\u062a \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> spacy\nnlp = spacy.load(<span class=\"hljs-string\">'en_core_web_sm'<\/span>)\n\n<span 
class=\"hljs-keyword\">from<\/span> spacy.matcher <span class=\"hljs-keyword\">import<\/span> Matcher\nm_tool = Matcher(nlp.vocab)\n<\/code><\/pre>\n<h3 id=\"definingpatterns\"><span class=\"ez-toc-section\" id=\"%d8%aa%d8%b9%d8%b1%db%8c%d9%81_%d8%a7%d9%84%da%af%d9%88%d9%87%d8%a7\"><\/span>\u062a\u0639\u0631\u06cc\u0641 \u0627\u0644\u06af\u0648\u0647\u0627<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u06cc \u062a\u0639\u0631\u06cc\u0641 \u0627\u0644\u06af\u0648\u0647\u0627\u06cc\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0631\u0627\u06cc \u0641\u06cc\u0644\u062a\u0631 \u06a9\u0631\u062f\u0646 \u0639\u0628\u0627\u0631\u0627\u062a \u0645\u0634\u0627\u0628\u0647 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f.  \u0641\u0631\u0636 \u06a9\u0646\u06cc\u062f \u0645\u06cc\u200c\u062e\u0648\u0627\u0647\u06cc\u0645 \u0639\u0628\u0627\u0631\u0627\u062a \u00abquick-brown-fox\u00bb\u060c \u00abquick brown fox\u00bb\u060c \u00abquickbrownfox\u00bb \u06cc\u0627 \u00abquick brownfox\u00bb \u0631\u0627 \u067e\u06cc\u062f\u0627 \u06a9\u0646\u06cc\u0645.  
\u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0627\u06cc\u0646 \u06a9\u0627\u0631\u060c \u0628\u0627\u06cc\u062f \u0686\u0647\u0627\u0631 \u0627\u0644\u06af\u0648\u06cc \u0632\u06cc\u0631 \u0631\u0627 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">p1 = [{<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'quickbrownfox'<\/span>}]\np2 = [{<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'quick'<\/span>}, {<span class=\"hljs-string\">'IS_PUNCT'<\/span>: <span class=\"hljs-literal\">True<\/span>}, {<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'brown'<\/span>}, {<span class=\"hljs-string\">'IS_PUNCT'<\/span>: <span class=\"hljs-literal\">True<\/span>}, {<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'fox'<\/span>}]\np3 = [{<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'quick'<\/span>}, {<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'brown'<\/span>}, {<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'fox'<\/span>}]\np4 =  [{<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'quick'<\/span>}, {<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'brownfox'<\/span>}]\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627\u060c<\/p>\n<ul>\n<li>p1 \u0628\u0647 \u062f\u0646\u0628\u0627\u0644 \u0639\u0628\u0627\u0631\u062a &#8220;quickbrownfox&#8221; \u0627\u0633\u062a<\/li>\n<li>p2 \u0628\u0647 \u062f\u0646\u0628\u0627\u0644 \u0639\u0628\u0627\u0631\u062a &#8220;quick-brown-fox&#8221; \u0645\u06cc \u06af\u0631\u062f\u062f.<\/li>\n<li>p3 \u0633\u0639\u06cc \u0645\u06cc \u06a9\u0646\u062f &#8220;quick brown fox&#8221; \u0631\u0627 \u062c\u0633\u062a\u062c\u0648 \u06a9\u0646\u062f.<\/li>\n<li>p4 \u0628\u0647 \u062f\u0646\u0628\u0627\u0644 
\u0639\u0628\u0627\u0631\u062a &#8220;Quick Brownfox&#8221; \u0627\u0633\u062a.<\/li>\n<\/ul>\n<p>\u0648\u06cc\u0698\u06af\u06cc \u0646\u0634\u0627\u0646\u0647 <code>LOWER<\/code> \u062a\u0639\u0631\u06cc\u0641 \u0645\u06cc \u06a9\u0646\u062f \u06a9\u0647 \u0639\u0628\u0627\u0631\u062a \u0628\u0627\u06cc\u062f \u0642\u0628\u0644 \u0627\u0632 \u062a\u0637\u0628\u06cc\u0642 \u0628\u0647 \u062d\u0631\u0648\u0641 \u06a9\u0648\u0686\u06a9 \u062a\u0628\u062f\u06cc\u0644 \u0634\u0648\u062f.<\/p>\n<p>\u067e\u0633 \u0627\u0632 \u062a\u0639\u0631\u06cc\u0641 \u0627\u0644\u06af\u0648\u0647\u0627\u060c \u0628\u0627\u06cc\u062f \u0622\u0646\u0647\u0627 \u0631\u0627 \u0628\u0647 \u0622\u0646 \u0627\u0636\u0627\u0641\u0647 \u06a9\u0646\u06cc\u0645 <code>Matcher<\/code> \u0634\u06cc \u0627\u06cc \u06a9\u0647 \u0642\u0628\u0644\u0627 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0631\u062f\u06cc\u0645.<\/p>\n<pre><code class=\"hljs\">m_tool.add(<span class=\"hljs-string\">'QBF'<\/span>, <span class=\"hljs-literal\">None<\/span>, p1, p2, p3, p4)\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 &#8220;QBF&#8221; \u0646\u0627\u0645 \u0647\u0645\u0633\u0627\u0646 \u0645\u0627 \u0627\u0633\u062a.  \u0647\u0631 \u0627\u0633\u0645\u06cc \u0645\u06cc\u062a\u0648\u0646\u06cc \u0628\u0647\u0634 \u0628\u062f\u06cc<\/p>\n<h3 id=\"applyingmatchertothedocument\"><span class=\"ez-toc-section\" id=\"%d8%a7%d8%b9%d9%85%d8%a7%d9%84_%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d8%af%d8%b1_%d8%b3%d9%86%d8%af\"><\/span>\u0627\u0639\u0645\u0627\u0644 \u062a\u0637\u0628\u06cc\u0642 \u062f\u0631 \u0633\u0646\u062f<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0645\u0627 \u062e\u0648\u062f\u0645\u0627\u0646 \u0631\u0627 \u062f\u0627\u0631\u06cc\u0645 <code>matcher<\/code> \u0622\u0645\u0627\u062f\u0647.  
\u0645\u0631\u062d\u0644\u0647 \u0628\u0639\u062f\u06cc \u0627\u0639\u0645\u0627\u0644 \u062a\u0637\u0628\u06cc\u0642 \u0627\u0633\u062a \u0631\u0648\u06cc \u06cc\u06a9 \u0633\u0646\u062f \u0645\u062a\u0646\u06cc \u0648 \u0628\u0628\u06cc\u0646\u06cc\u0645 \u0622\u06cc\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0645\u0637\u0627\u0628\u0642\u062a \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u0645.  \u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u0628\u062a\u062f\u0627 \u06cc\u06a9 \u0633\u0646\u062f \u0633\u0627\u062f\u0647 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">sentence = nlp(<span class=\"hljs-string\">u'The quick-brown-fox jumps over the lazy dog. The quick brown fox eats well. \\\n               the quickbrownfox is dead. the dog misses the quick brownfox'<\/span>)\n<\/code><\/pre>\n<p>\u0628\u0631\u0627\u06cc \u0627\u0639\u0645\u0627\u0644 \u062a\u0637\u0628\u06cc\u0642 \u0628\u0631 \u06cc\u06a9 \u0633\u0646\u062f.  \u0633\u0646\u062f \u0628\u0627\u06cc\u062f \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06cc\u06a9 \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u0628\u0647 \u0634\u06cc \u062a\u0637\u0628\u06cc\u0642 \u062f\u0627\u062f\u0647 \u0634\u0648\u062f.  \u0646\u062a\u06cc\u062c\u0647\u060c \u062a\u0645\u0627\u0645 \u0634\u0646\u0627\u0633\u0647\u200c\u0647\u0627\u06cc \u0639\u0628\u0627\u0631\u0627\u062a\u06cc \u0627\u0633\u062a \u06a9\u0647 \u062f\u0631 \u0633\u0646\u062f \u062a\u0637\u0628\u06cc\u0642 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647\u200c\u0627\u0646\u062f\u060c \u0647\u0645\u0631\u0627\u0647 \u0628\u0627 \u0645\u0648\u0642\u0639\u06cc\u062a\u200c\u0647\u0627\u06cc \u0634\u0631\u0648\u0639 \u0648 \u067e\u0627\u06cc\u0627\u0646 \u0622\u0646\u0647\u0627 \u062f\u0631 \u0633\u0646\u062f.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">phrase_matches = m_tool(sentence)\n<span class=\"hljs-built_in\">print<\/span>(phrase_matches )\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">[(12825528024649263697, 1, 6), (12825528024649263697, 13, 16), (12825528024649263697, 21, 22), (12825528024649263697, 29, 31)]\n<\/code><\/pre>\n<p>\u0627\u0632 \u062e\u0631\u0648\u062c\u06cc \u0645\u0634\u0627\u0647\u062f\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u062f \u06a9\u0647 \u0686\u0647\u0627\u0631 \u0639\u0628\u0627\u0631\u062a \u0645\u0637\u0627\u0628\u0642\u062a \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0646\u062f.  \u0627\u0648\u0644\u06cc\u0646 \u0639\u062f\u062f \u0637\u0648\u0644\u0627\u0646\u06cc \u062f\u0631 \u0647\u0631 \u062e\u0631\u0648\u062c\u06cc\u060c \u0634\u0646\u0627\u0633\u0647 \u0639\u0628\u0627\u0631\u062a \u0645\u0637\u0627\u0628\u0642\u062a \u0634\u062f\u0647 \u0627\u0633\u062a\u060c \u0639\u062f\u062f \u062f\u0648\u0645 \u0648 \u0633\u0648\u0645 \u0645\u0648\u0642\u0639\u06cc\u062a \u0647\u0627\u06cc \u0634\u0631\u0648\u0639 \u0648 \u067e\u0627\u06cc\u0627\u0646 \u0639\u0628\u0627\u0631\u062a \u0647\u0633\u062a\u0646\u062f.<\/p>\n<p>\u0628\u0631\u0627\u06cc \u0627\u06cc\u0646\u06a9\u0647 \u062f\u0631 \u0648\u0627\u0642\u0639 \u0646\u062a\u06cc\u062c\u0647 \u0631\u0627 \u0628\u0647 \u0631\u0648\u0634\u06cc \u0628\u0647\u062a\u0631 \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0646\u06cc\u0645\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0632 \u0637\u0631\u06cc\u0642 \u0647\u0631 \u0639\u0628\u0627\u0631\u062a \u0645\u0646\u0637\u0628\u0642 \u062a\u06a9\u0631\u0627\u0631 \u06a9\u0646\u06cc\u0645 \u0648 \u0645\u0642\u062f\u0627\u0631 
\u0631\u0634\u062a\u0647 \u0622\u0646 \u0631\u0627 \u0646\u0645\u0627\u06cc\u0634 \u062f\u0647\u06cc\u0645.  \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">for<\/span> match_id, start, end <span class=\"hljs-keyword\">in<\/span> phrase_matches:\n    string_id = nlp.vocab.strings[match_id]  \n    span = sentence[start:end]                   \n    <span class=\"hljs-built_in\">print<\/span>(match_id, string_id, start, end, span.text)\n<\/code><\/pre>\n<p><strong>\u062e\u0631\u0648\u062c\u06cc:<\/strong><\/p>\n<pre><code class=\"hljs\">12825528024649263697 QBF 1 6 quick-brown-fox\n12825528024649263697 QBF 13 16 quick brown fox\n12825528024649263697 QBF 21 22 quickbrownfox\n12825528024649263697 QBF 29 31 quick brownfox\n<\/code><\/pre>\n<p>\u0627\u0632 \u062e\u0631\u0648\u062c\u06cc\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u062a\u0645\u0627\u0645 \u0639\u0628\u0627\u0631\u0627\u062a \u0645\u0646\u0637\u0628\u0642 \u0628\u0647 \u0647\u0645\u0631\u0627\u0647 \u0634\u0646\u0627\u0633\u0647 \u0648\u0627\u0698\u06af\u0627\u0646 \u0648 \u0645\u0648\u0642\u0639\u06cc\u062a \u0634\u0631\u0648\u0639 \u0648 \u067e\u0627\u06cc\u0627\u0646 \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0646\u06cc\u062f.<\/p>\n<h3 id=\"moreoptionsforrulebasedmatching\"><span class=\"ez-toc-section\" id=\"%da%af%d8%b2%db%8c%d9%86%d9%87_%d9%87%d8%a7%db%8c_%d8%a8%db%8c%d8%b4%d8%aa%d8%b1_%d8%a8%d8%b1%d8%a7%db%8c_%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d9%85%d8%a8%d8%aa%d9%86%db%8c_%d8%a8%d8%b1_%d9%82%d8%a7%d9%86%d9%88%d9%86\"><\/span>\u06af\u0632\u06cc\u0646\u0647 \u0647\u0627\u06cc \u0628\u06cc\u0634\u062a\u0631 \u0628\u0631\u0627\u06cc \u062a\u0637\u0628\u06cc\u0642 \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u0642\u0627\u0646\u0648\u0646<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0627\u0633\u0646\u0627\u062f 
\u0631\u0633\u0645\u06cc \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 spaCy \u062d\u0627\u0648\u06cc \u062c\u0632\u0626\u06cc\u0627\u062a \u0647\u0645\u0647 \u0645\u0648\u0627\u0631\u062f \u0627\u0633\u062a <a rel=\"nofollow noopener\" target=\"_blank\" href=\"https:\/\/spacy.io\/usage\/linguistic-features#adding-patterns-attributes\">\u0646\u0634\u0627\u0646\u0647 \u0647\u0627 \u0648 \u0648\u0627\u06cc\u0644\u062f \u06a9\u0627\u0631\u062a \u0647\u0627<\/a> \u06a9\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0628\u0631\u0627\u06cc \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0634\u0648\u062f.<\/p>\n<p>\u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0645\u062b\u0627\u0644\u060c \u0648\u06cc\u0698\u06af\u06cc &#8220;*&#8221; \u0628\u0631\u0627\u06cc \u062c\u0633\u062a\u062c\u0648\u06cc \u0635\u0641\u0631 \u06cc\u0627 \u0686\u0646\u062f \u0646\u0645\u0648\u0646\u0647 \u0627\u0632 \u062a\u0648\u06a9\u0646 \u062a\u0639\u0631\u06cc\u0641 \u0634\u062f\u0647 \u0627\u0633\u062a.<\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u06cc\u06a9 \u0627\u0644\u06af\u0648\u06cc \u0633\u0627\u062f\u0647 \u0628\u0646\u0648\u06cc\u0633\u06cc\u0645 \u06a9\u0647 \u0628\u062a\u0648\u0627\u0646\u062f \u0639\u0628\u0627\u0631\u062a &#8220;quick--brown--fox&#8221; \u06cc\u0627 &#8220;quick-brown---fox&#8221; \u0631\u0627 \u0645\u0634\u062e\u0635 \u06a9\u0646\u062f.<\/p>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u0628\u062a\u062f\u0627 \u062a\u0637\u0628\u06cc\u0642 \u0642\u0628\u0644\u06cc \u0631\u0627 \u062d\u0630\u0641 \u06a9\u0646\u06cc\u0645 <code>QBF<\/code>.<\/p>\n<pre><code class=\"hljs\">m_tool.remove(<span class=\"hljs-string\">'QBF'<\/span>)\n<\/code><\/pre>\n<p>\u0628\u0639\u062f\u060c \u0628\u0627\u06cc\u062f \u0627\u0644\u06af\u0648\u06cc 
\u062c\u062f\u06cc\u062f \u062e\u0648\u062f \u0631\u0627 \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">\np1 = [{<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'quick'<\/span>}, {<span class=\"hljs-string\">'IS_PUNCT'<\/span>: <span class=\"hljs-literal\">True<\/span>, <span class=\"hljs-string\">'OP'<\/span>:<span class=\"hljs-string\">'*'<\/span>}, {<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'brown'<\/span>}, {<span class=\"hljs-string\">'IS_PUNCT'<\/span>: <span class=\"hljs-literal\">True<\/span>, <span class=\"hljs-string\">'OP'<\/span>:<span class=\"hljs-string\">'*'<\/span>}, {<span class=\"hljs-string\">'LOWER'<\/span>: <span class=\"hljs-string\">'fox'<\/span>}]\nm_tool.add(<span class=\"hljs-string\">'QBF'<\/span>, <span class=\"hljs-literal\">None<\/span>, p1)\n<\/code><\/pre>\n<p>\u0627\u0644\u06af\u0648 <code>p1<\/code> \u0628\u0627 \u062a\u0645\u0627\u0645 \u0639\u0628\u0627\u0631\u0627\u062a\u06cc \u06a9\u0647 \u0635\u0641\u0631 \u06cc\u0627 \u0686\u0646\u062f \u0639\u0644\u0627\u0645\u062a \u0646\u06af\u0627\u0631\u0634\u06cc \u062f\u0631 \u0639\u0628\u0627\u0631\u062a \u0648\u062c\u0648\u062f \u062f\u0627\u0631\u062f \u0645\u0637\u0627\u0628\u0642\u062a \u062e\u0648\u0627\u0647\u062f \u062f\u0627\u0634\u062a <code>quick brown fox<\/code>.  
\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0627\u06a9\u0646\u0648\u0646 \u0633\u0646\u062f \u062e\u0648\u062f \u0631\u0627 \u0628\u0631\u0627\u06cc \u0641\u06cc\u0644\u062a\u0631 \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">sentence = nlp(u'The quick--brown--fox jumps over the  quick-brown---fox')\n<\/code><\/pre>\n<p>\u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0628\u06cc\u0646\u06cc\u062f \u0633\u0646\u062f \u0645\u0627 \u062f\u0627\u0631\u0627\u06cc \u062f\u0648 \u0639\u0628\u0627\u0631\u062a quick--brown--fox \u0648 quick-brown---fox \u0627\u0633\u062a \u06a9\u0647 \u0628\u0627\u06cc\u062f \u0628\u0627 \u0627\u0644\u06af\u0648\u06cc \u0645\u0627 \u0645\u0637\u0627\u0628\u0642\u062a \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u062f.  \u0628\u06cc\u0627\u06cc\u06cc\u062f \u062a\u0637\u0628\u06cc\u0642 \u062e\u0648\u062f \u0631\u0627 \u062f\u0631 \u0633\u0646\u062f \u0627\u0639\u0645\u0627\u0644 \u06a9\u0646\u06cc\u0645 \u0648 \u0646\u062a\u0627\u06cc\u062c \u0631\u0627 \u0628\u0628\u06cc\u0646\u06cc\u0645:<\/p>\n<pre><code class=\"hljs\">phrase_matches = m_tool(sentence)\n\n<span class=\"hljs-keyword\">for<\/span> match_id, start, end <span class=\"hljs-keyword\">in<\/span> phrase_matches:\n    string_id = nlp.vocab.strings[match_id]  \n    span = sentence[start:end]                   \n    <span class=\"hljs-built_in\">print<\/span>(match_id, string_id, start, end, span.text)\n<\/code><\/pre>\n<p>\u062e\u0631\u0648\u062c\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0627\u0644\u0627 \u0628\u0647 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">12825528024649263697 QBF 1 6 quick--brown--fox\n12825528024649263697 QBF 10 15 quick-brown---fox\n<\/code><\/pre>\n<p>\u0627\u0632 \u062e\u0631\u0648\u062c\u06cc \u0645\u06cc \u0628\u06cc\u0646\u06cc\u062f \u06a9\u0647 \u062a\u0637\u0628\u06cc\u0642 \u062f\u0647\u0646\u062f\u0647 \u0645\u0627 
\u0628\u0627 \u0645\u0648\u0641\u0642\u06cc\u062a \u0627\u06cc\u0646 \u062f\u0648 \u0639\u0628\u0627\u0631\u062a \u0631\u0627 \u0645\u0637\u0627\u0628\u0642\u062a \u062f\u0627\u062f\u0647 \u0627\u0633\u062a.<\/p>\n<h2 id=\"phrasebasedmatching\"><span class=\"ez-toc-section\" id=\"%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d9%85%d8%a8%d8%aa%d9%86%db%8c_%d8%a8%d8%b1_%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa\"><\/span>\u062a\u0637\u0628\u06cc\u0642 \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u0639\u0628\u0627\u0631\u062a<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u062f\u0631 \u0628\u062e\u0634 \u0622\u062e\u0631\u060c \u062f\u06cc\u062f\u06cc\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0642\u0648\u0627\u0646\u06cc\u0646\u06cc \u0631\u0627 \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u0645 \u06a9\u0647 \u0628\u062a\u0648\u0627\u0646 \u0627\u0632 \u0622\u0646\u0647\u0627 \u0628\u0631\u0627\u06cc \u0634\u0646\u0627\u0633\u0627\u06cc\u06cc \u0639\u0628\u0627\u0631\u0627\u062a \u0627\u0632 \u0633\u0646\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0631\u062f.  
\u0639\u0644\u0627\u0648\u0647 \u0628\u0631 \u062a\u0639\u0631\u06cc\u0641 \u0642\u0648\u0627\u0646\u06cc\u0646\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0645\u0633\u062a\u0642\u06cc\u0645\u0627\u064b \u0639\u0628\u0627\u0631\u0627\u062a\u06cc \u0631\u0627 \u06a9\u0647 \u0628\u0647 \u062f\u0646\u0628\u0627\u0644 \u0622\u0646 \u0647\u0633\u062a\u06cc\u0645\u060c \u0645\u0634\u062e\u0635 \u06a9\u0646\u06cc\u0645.<br \/>\u0627\u06cc\u0646 \u06cc\u06a9 \u0631\u0648\u0634 \u06a9\u0627\u0631\u0622\u0645\u062f\u062a\u0631 \u0628\u0631\u0627\u06cc \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a \u0627\u0633\u062a.<\/p>\n<p>\u062f\u0631 \u0627\u06cc\u0646 \u0628\u062e\u0634\u060c \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a \u0631\u0627 \u062f\u0631 \u06cc\u06a9 \u0645\u0642\u0627\u0644\u0647 \u0648\u06cc\u06a9\u06cc\u200c\u067e\u062f\u06cc\u0627 \u0627\u0646\u062c\u0627\u0645 \u0645\u06cc\u200c\u062f\u0647\u06cc\u0645 \u0631\u0648\u06cc \u0647\u0648\u0634 \u0645\u0635\u0646\u0648\u0639\u06cc.<\/p>\n<p>\u0642\u0628\u0644 \u0627\u0632 \u062f\u06cc\u062f\u0646 \u0645\u0631\u0627\u062d\u0644 \u0627\u0646\u062c\u0627\u0645 \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a\u060c \u0627\u062c\u0627\u0632\u0647 \u062f\u0647\u06cc\u062f \u0627\u0628\u062a\u062f\u0627 \u0645\u0642\u0627\u0644\u0647 \u0648\u06cc\u06a9\u06cc \u067e\u062f\u06cc\u0627 \u0631\u0627 \u06a9\u0647 \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f\u060c \u062a\u062c\u0632\u06cc\u0647 \u06a9\u0646\u06cc\u0645.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> bs4 <span class=\"hljs-keyword\">as<\/span> bs  \n<span class=\"hljs-keyword\">import<\/span> urllib.request  \n<span class=\"hljs-keyword\">import<\/span> re  \n<span class=\"hljs-keyword\">import<\/span> nltk\n\nscrapped_data = urllib.request.urlopen(<span class=\"hljs-string\">'https:\/\/en.wikipedia.org\/wiki\/Artificial_intelligence'<\/span>)  \narticle = scrapped_data .read()\n\nparsed_article = bs.BeautifulSoup(article,<span class=\"hljs-string\">'lxml'<\/span>)\n\nparagraphs = parsed_article.find_all(<span class=\"hljs-string\">'p'<\/span>)\n\narticle_text = <span class=\"hljs-string\">\"\"<\/span>\n\n<span class=\"hljs-keyword\">for<\/span> p <span class=\"hljs-keyword\">in<\/span> paragraphs:  \n    article_text += p.text\n    \n    \nprocessed_article = article_text.lower()  \nprocessed_article = re.sub(<span class=\"hljs-string\">'[^a-zA-Z]'<\/span>, <span class=\"hljs-string\">' '<\/span>, processed_article )  \nprocessed_article = re.sub(<span class=\"hljs-string\">r'\\s+'<\/span>, <span class=\"hljs-string\">' '<\/span>, processed_article)\n\n<\/code><\/pre>\n<p>\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0647 \u0637\u0648\u0631 \u0645\u0641\u0635\u0644 \u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0645\u0646 \u062a\u0648\u0636\u06cc\u062d \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a \u0631\u0648\u06cc \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc Word2Vec \u0628\u0627 <code>gensim<\/code> \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646  \u0627\u06af\u0631 \u0645\u06cc\u200c\u062e\u0648\u0627\u0647\u06cc\u062f \u0628\u0641\u0647\u0645\u06cc\u062f \u062a\u062c\u0632\u06cc\u0647 \u062f\u0631 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0686\u06af\u0648\u0646\u0647 
\u06a9\u0627\u0631 \u0645\u06cc\u200c\u06a9\u0646\u062f\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0631\u0648\u06cc\u062f \u0648 \u0645\u0642\u0627\u0644\u0647 \u0631\u0627 \u0628\u062e\u0648\u0627\u0646\u06cc\u062f.<\/p>\n<p>\u0627\u06cc\u0646 <code>processed_article<\/code> \u062d\u0627\u0648\u06cc \u0633\u0646\u062f\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0631\u0627\u06cc \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.<\/p>\n<p>\u0645\u0631\u0627\u062d\u0644 \u0627\u0646\u062c\u0627\u0645 \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a \u06a9\u0627\u0645\u0644\u0627\u064b \u0634\u0628\u06cc\u0647 \u062a\u0637\u0628\u06cc\u0642 \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u0642\u0627\u0646\u0648\u0646 \u0627\u0633\u062a.<\/p>\n<h3 id=\"createphrasematcherobject\"><span class=\"ez-toc-section\" id=\"%d8%b4%db%8c%d8%a1_%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d8%b9%d8%a8%d8%a7%d8%b1%d8%aa_%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%da%a9%d9%86%db%8c%d8%af\"><\/span>\u0634\u06cc\u0621 \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0627\u0648\u0644\u06cc\u0646 \u06af\u0627\u0645\u060c \u0628\u0627\u06cc\u062f a \u0631\u0627 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f <code>PhraseMatcher<\/code> \u0647\u062f\u0641 &#8211; \u0634\u06cc.  
\u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0631\u0627 \u0627\u0646\u062c\u0627\u0645 \u0645\u06cc \u062f\u0647\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> spacy\nnlp = spacy.load(<span class=\"hljs-string\">'en_core_web_sm'<\/span>)\n\n\n<span class=\"hljs-keyword\">from<\/span> spacy.matcher <span class=\"hljs-keyword\">import<\/span> PhraseMatcher\nphrase_matcher = PhraseMatcher(nlp.vocab)\n<\/code><\/pre>\n<p>\u062a\u0648\u062c\u0647 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f \u06a9\u0647 \u062f\u0631 \u0628\u062e\u0634 \u0642\u0628\u0644\u06cc \u06a9\u0647 a \u0631\u0627 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0631\u062f\u06cc\u0645 <code>Matcher<\/code> \u0647\u062f\u0641 &#8211; \u0634\u06cc.  \u062f\u0631 \u0627\u06cc\u0646\u062c\u0627\u060c \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0648\u0631\u062f\u060c \u0645\u0627 \u062f\u0631 \u062d\u0627\u0644 \u0627\u06cc\u062c\u0627\u062f \u06cc\u06a9 <code>PhraseMatcher<\/code> \u0647\u062f\u0641 &#8211; \u0634\u06cc.<\/p>\n<h3 id=\"createphraselist\"><span class=\"ez-toc-section\" id=\"%d9%81%d9%87%d8%b1%d8%b3%d8%aa_%d8%b9%d8%a8%d8%a7%d8%b1%d8%a7%d8%aa_%d8%b1%d8%a7_%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%da%a9%d9%86%db%8c%d8%af\"><\/span>\u0641\u0647\u0631\u0633\u062a \u0639\u0628\u0627\u0631\u0627\u062a \u0631\u0627 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u062f\u0631 \u0645\u0631\u062d\u0644\u0647 \u062f\u0648\u0645\u060c \u0628\u0627\u06cc\u062f \u0641\u0647\u0631\u0633\u062a\u06cc \u0627\u0632 \u0639\u0628\u0627\u0631\u0627\u062a \u0631\u0627 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f \u062a\u0627 \u0645\u0637\u0627\u0628\u0642\u062a \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u062f \u0648 \u0633\u067e\u0633 \u0644\u06cc\u0633\u062a \u0631\u0627 \u0628\u0647 \u0627\u0633\u0646\u0627\u062f spaCy NLP 
\u062a\u0628\u062f\u06cc\u0644 \u06a9\u0646\u06cc\u062f\u060c \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">phrases = (<span class=\"hljs-string\">'machine learning'<\/span>, <span class=\"hljs-string\">'robots'<\/span>, <span class=\"hljs-string\">'intelligent agents'<\/span>)\n\npatterns = (nlp(text) <span class=\"hljs-keyword\">for<\/span> text <span class=\"hljs-keyword\">in<\/span> phrases)\n<\/code><\/pre>\n<p>\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a \u0628\u0627\u06cc\u062f \u0644\u06cc\u0633\u062a \u0639\u0628\u0627\u0631\u0627\u062a \u062e\u0648\u062f \u0631\u0627 \u0628\u0647 \u0639\u0628\u0627\u0631\u062a matcher \u0627\u0636\u0627\u0641\u0647 \u06a9\u0646\u06cc\u062f.<\/p>\n<pre><code class=\"hljs\">phrase_matcher.add(<span class=\"hljs-string\">'AI'<\/span>, <span class=\"hljs-literal\">None<\/span>, *patterns)\n<\/code><\/pre>\n<p>\u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u0646\u0627\u0645 \u0647\u0645\u0633\u0627\u0646 \u0645\u0627 AI \u0627\u0633\u062a.<\/p>\n<h3 id=\"applyingmatchertothedocument\"><span class=\"ez-toc-section\" id=\"%d8%a7%d8%b9%d9%85%d8%a7%d9%84_%d8%aa%d8%b7%d8%a8%db%8c%d9%82_%d8%af%d8%b1_%d8%b3%d9%86%d8%af-2\"><\/span>\u0627\u0639\u0645\u0627\u0644 \u062a\u0637\u0628\u06cc\u0642 \u062f\u0631 \u0633\u0646\u062f<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0645\u0627\u0646\u0646\u062f \u062a\u0637\u0628\u06cc\u0642 \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u0642\u0627\u0646\u0648\u0646\u060c \u062f\u0648\u0628\u0627\u0631\u0647 \u0628\u0627\u06cc\u062f \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a \u062e\u0648\u062f \u0631\u0627 \u062f\u0631 \u0633\u0646\u062f \u0627\u0639\u0645\u0627\u0644 \u06a9\u0646\u06cc\u0645.  
\u0628\u0627 \u0627\u06cc\u0646 \u062d\u0627\u0644\u060c \u0645\u0642\u0627\u0644\u0647 \u062a\u062c\u0632\u06cc\u0647 \u0634\u062f\u0647 \u0645\u0627 \u062f\u0631 \u0642\u0627\u0644\u0628 \u0633\u0646\u062f spaCy \u0646\u06cc\u0633\u062a.  \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646\u060c \u0645\u0627 \u0645\u0642\u0627\u0644\u0647 \u062e\u0648\u062f \u0631\u0627 \u0628\u0647 \u0642\u0627\u0644\u0628 \u0633\u0646\u062f spaCy \u062a\u0628\u062f\u06cc\u0644 \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u0648 \u0633\u067e\u0633 \u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u062a \u062e\u0648\u062f \u0631\u0627 \u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0627\u0639\u0645\u0627\u0644 \u0645\u06cc \u06a9\u0646\u06cc\u0645.<\/p>\n<pre><code class=\"hljs\">sentence = nlp (processed_article)\n\nmatched_phrases = phrase_matcher(sentence)\n<\/code><\/pre>\n<p>\u062f\u0631 \u062e\u0631\u0648\u062c\u06cc\u060c \u0647\u0645\u0647 \u0634\u0646\u0627\u0633\u0647\u200c\u0647\u0627\u06cc \u062a\u0645\u0627\u0645 \u0639\u0628\u0627\u0631\u0627\u062a \u0645\u0646\u0637\u0628\u0642 \u0631\u0627 \u0628\u0647 \u0647\u0645\u0631\u0627\u0647 \u0646\u0645\u0627\u06cc\u0647\u200c\u0647\u0627\u06cc \u0634\u0631\u0648\u0639 \u0648 \u067e\u0627\u06cc\u0627\u0646 \u0622\u0646\u0647\u0627 \u062f\u0631 \u0633\u0646\u062f \u062e\u0648\u0627\u0647\u06cc\u0645 \u062f\u0627\u0634\u062a\u060c \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u0631 \u0632\u06cc\u0631 \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">[(5530044837203964789, 37, 39),\n (5530044837203964789, 402, 404),\n (5530044837203964789, 693, 694),\n (5530044837203964789, 1284, 1286),\n (5530044837203964789, 3059, 3061),\n (5530044837203964789, 3218, 3220),\n (5530044837203964789, 3753, 3754),\n (5530044837203964789, 5212, 5213),\n (5530044837203964789, 5287, 5288),\n (5530044837203964789, 6769, 6771),\n (5530044837203964789, 6781, 6783),\n 
(5530044837203964789, 7496, 7498),\n (5530044837203964789, 7635, 7637),\n (5530044837203964789, 8002, 8004),\n (5530044837203964789, 9461, 9462),\n (5530044837203964789, 9955, 9957),\n (5530044837203964789, 10784, 10785),\n (5530044837203964789, 11250, 11251),\n (5530044837203964789, 12290, 12291),\n (5530044837203964789, 12411, 12412),\n (5530044837203964789, 12455, 12456)]\n<\/code><\/pre>\n<p>\u0628\u0631\u0627\u06cc \u062f\u06cc\u062f\u0646 \u0645\u0642\u062f\u0627\u0631 \u0631\u0634\u062a\u0647 \u0639\u0628\u0627\u0631\u0627\u062a \u0645\u0637\u0627\u0628\u0642\u062a \u062f\u0627\u062f\u0647 \u0634\u062f\u0647\u060c \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0632\u06cc\u0631 \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">for<\/span> match_id, start, end <span class=\"hljs-keyword\">in<\/span> matched_phrases:\n    string_id = nlp.vocab.strings[match_id]  \n    span = sentence[start:end]                   \n    <span class=\"hljs-built_in\">print<\/span>(match_id, string_id, start, end, span.text)\n<\/code><\/pre>\n<p>\u062f\u0631 \u062e\u0631\u0648\u062c\u06cc\u060c \u0645\u0642\u062f\u0627\u0631 \u0631\u0634\u062a\u0647 \u0639\u0628\u0627\u0631\u0627\u062a \u0645\u0646\u0637\u0628\u0642 \u0631\u0627 \u0645\u0637\u0627\u0628\u0642 \u0634\u06a9\u0644 \u0632\u06cc\u0631 \u0645\u0634\u0627\u0647\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u062f \u06a9\u0631\u062f:<\/p>\n<pre><code class=\"hljs\">5530044837203964789 AI 37 39 intelligent agents\n5530044837203964789 AI 402 404 machine learning\n5530044837203964789 AI 693 694 robots\n5530044837203964789 AI 1284 1286 machine learning\n5530044837203964789 AI 3059 3061 intelligent agents\n5530044837203964789 AI 3218 3220 machine learning\n5530044837203964789 AI 3753 3754 robots\n5530044837203964789 AI 5212 5213 robots\n5530044837203964789 AI 5287 5288 robots\n5530044837203964789 AI 6769 6771 machine learning\n5530044837203964789 AI 6781 6783 
machine learning\n5530044837203964789 AI 7496 7498 machine learning\n5530044837203964789 AI 7635 7637 machine learning\n5530044837203964789 AI 8002 8004 machine learning\n5530044837203964789 AI 9461 9462 robots\n5530044837203964789 AI 9955 9957 machine learning\n5530044837203964789 AI 10784 10785 robots\n5530044837203964789 AI 11250 11251 robots\n5530044837203964789 AI 12290 12291 robots\n5530044837203964789 AI 12411 12412 robots\n5530044837203964789 AI 12455 12456 robots\n<\/code><\/pre>\n<p>\u0627\u0632 \u062e\u0631\u0648\u062c\u06cc \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0647\u0631 \u0633\u0647 \u0639\u0628\u0627\u0631\u062a\u06cc \u0631\u0627 \u06a9\u0647 \u0633\u0639\u06cc \u06a9\u0631\u062f\u06cc\u0645 \u062c\u0633\u062a\u062c\u0648 \u06a9\u0646\u06cc\u0645 \u0628\u0647 \u0647\u0645\u0631\u0627\u0647 \u0641\u0647\u0631\u0633\u062a \u0634\u0631\u0648\u0639 \u0648 \u067e\u0627\u06cc\u0627\u0646 \u0622\u0646\u0647\u0627 \u0648 \u0634\u0646\u0627\u0633\u0647 \u0631\u0634\u062a\u0647 \u0647\u0627 \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0646\u06cc\u062f.<\/p>\n<h2 id=\"stopwords\"><span class=\"ez-toc-section\" id=\"%da%a9%d9%84%d9%85%d8%a7%d8%aa_%d8%b1%d8%a7_%d9%85%d8%aa%d9%88%d9%82%d9%81_%da%a9%d9%86%db%8c%d8%af\"><\/span>\u06a9\u0644\u0645\u0627\u062a \u0631\u0627 \u0645\u062a\u0648\u0642\u0641 \u06a9\u0646\u06cc\u062f<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0642\u0628\u0644 \u0627\u0632 \u0627\u06cc\u0646\u06a9\u0647 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0631\u0627 \u0628\u0647 \u067e\u0627\u06cc\u0627\u0646 \u0628\u0631\u0633\u0627\u0646\u06cc\u0645\u060c \u0641\u0642\u0637 \u0645\u06cc \u062e\u0648\u0627\u0633\u062a\u0645 \u0644\u0645\u0633 \u06a9\u0646\u0645 \u0631\u0648\u06cc \u0645\u0641\u0647\u0648\u0645 \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641  \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641\u060c \u06a9\u0644\u0645\u0627\u062a \u0627\u0646\u06af\u0644\u06cc\u0633\u06cc 
\u0645\u0627\u0646\u0646\u062f &#8220;the&#8221;\u060c &#8220;a&#8221;\u060c &#8220;an&#8221; \u0648 \u063a\u06cc\u0631\u0647 \u0647\u0633\u062a\u0646\u062f \u06a9\u0647 \u0645\u0639\u0646\u0627\u06cc \u062e\u0627\u0635 \u062e\u0648\u062f \u0631\u0627 \u0646\u062f\u0627\u0631\u0646\u062f.  \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641 \u0627\u063a\u0644\u0628 \u0628\u0631\u0627\u06cc \u06a9\u0627\u0631\u0647\u0627\u06cc NLP \u0645\u0627\u0646\u0646\u062f \u0637\u0628\u0642\u0647 \u0628\u0646\u062f\u06cc \u0645\u062a\u0646 \u06cc\u0627 \u0645\u062f\u0644 \u0633\u0627\u0632\u06cc \u0632\u0628\u0627\u0646 \u0686\u0646\u062f\u0627\u0646 \u0645\u0641\u06cc\u062f \u0646\u06cc\u0633\u062a\u0646\u062f.  \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u0627\u063a\u0644\u0628 \u0628\u0647\u062a\u0631 \u0627\u0633\u062a \u0642\u0628\u0644 \u0627\u0632 \u067e\u0631\u062f\u0627\u0632\u0634 \u0628\u06cc\u0634\u062a\u0631 \u0633\u0646\u062f\u060c \u0627\u06cc\u0646 \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641 \u0631\u0627 \u062d\u0630\u0641 \u06a9\u0646\u06cc\u062f.<\/p>\n<p>\u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 spaCy \u0634\u0627\u0645\u0644 305 \u06a9\u0644\u0645\u0647 \u062a\u0648\u0642\u0641 \u0627\u0633\u062a.  
\u0639\u0644\u0627\u0648\u0647 \u0628\u0631 \u0627\u06cc\u0646\u060c \u0628\u0633\u062a\u0647 \u0628\u0647 \u0646\u06cc\u0627\u0632 \u062e\u0648\u062f\u060c \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641 \u0631\u0627 \u0646\u06cc\u0632 \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 spaCy \u0627\u0636\u0627\u0641\u0647 \u06cc\u0627 \u062d\u0630\u0641 \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u0628\u0631\u0627\u06cc \u062f\u06cc\u062f\u0646 \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641 \u067e\u06cc\u0634\u200c\u0641\u0631\u0636 spaCy \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u0645 <code>stop_words<\/code> \u0648\u06cc\u0698\u06af\u06cc \u0645\u062f\u0644 spaCy \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u0631 \u0632\u06cc\u0631 \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\"><span class=\"hljs-keyword\">import<\/span> spacy\nsp = spacy.load(<span class=\"hljs-string\">'en_core_web_sm'<\/span>)\n<span class=\"hljs-built_in\">print<\/span>(sp.Defaults.stop_words)\n<\/code><\/pre>\n<p>\u062f\u0631 \u062e\u0631\u0648\u062c\u06cc\u060c \u062a\u0645\u0627\u0645 \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641 sPacy \u0631\u0627 \u062e\u0648\u0627\u0647\u06cc\u062f \u062f\u06cc\u062f:<\/p>\n<pre><code class=\"hljs\">{'less', 'except', 'top', 'me', 'three', 'fifteen', 'a', 'is', 'those', 'all', 'then', 'everyone', 'without', 'must', 'has', 'any', 'anyhow', 'keep', 'through', 'bottom', 'get', 'indeed', 'it', 'still', 'ten', 'whatever', 'doing', 'though', 'eight', 'various', 'myself', 'across', 'wherever', 'himself', 'always', 'thus', 'am', 'after', 'should', 'perhaps', 'at', 'down', 'own', 'rather', 'regarding', 'which', 'anywhere', 'whence', 'would', 'been', 'how', 'herself', 'now', 'might', 'please', 'behind', 'every', 
'seems', 'alone', 'from', 'via', 'its', 'become', 'hers', 'there', 'front', 'whose', 'before', 'against', 'whereafter', 'up', 'whither', 'two', 'five', 'eleven', 'why', 'below', 'out', 'whereas', 'serious', 'six', 'give', 'also', 'became', 'his', 'anyway', 'none', 'again', 'onto', 'else', 'have', 'few', 'thereby', 'whoever', 'yet', 'part', 'just', 'afterwards', 'mostly', 'see', 'hereby', 'not', 'can', 'once', 'therefore', 'together', 'whom', 'elsewhere', 'beforehand', 'themselves', 'with', 'seem', 'many', 'upon', 'former', 'are', 'who', 'becoming', 'formerly', 'between', 'cannot', 'him', 'that', 'first', 'more', 'although', 'whenever', 'under', 'whereby', 'my', 'whereupon', 'anyone', 'toward', 'by', 'four', 'since', 'amongst', 'move', 'each', 'forty', 'somehow', 'as', 'besides', 'used', 'if', 'name', 'when', 'ever', 'however', 'otherwise', 'hundred', 'moreover', 'your', 'sometimes', 'the', 'empty', 'another', 'where', 'her', 'enough', 'quite', 'throughout', 'anything', 'she', 'and', 'does', 'above', 'within', 'show', 'in', 'this', 'back', 'made', 'nobody', 'off', 're', 'meanwhile', 'than', 'neither', 'twenty', 'call', 'you', 'next', 'thereupon', 'therein', 'go', 'or', 'seemed', 'such', 'latterly', 'already', 'mine', 'yourself', 'an', 'amount', 'hereupon', 'namely', 'same', 'their', 'of', 'yours', 'could', 'be', 'done', 'whole', 'seeming', 'someone', 'these', 'towards', 'among', 'becomes', 'per', 'thru', 'beyond', 'beside', 'both', 'latter', 'ours', 'well', 'make', 'nowhere', 'about', 'were', 'others', 'due', 'yourselves', 'unless', 'thereafter', 'even', 'too', 'most', 'everything', 'our', 'something', 'did', 'using', 'full', 'while', 'will', 'only', 'nor', 'often', 'side', 'being', 'least', 'over', 'some', 'along', 'was', 'very', 'on', 'into', 'nine', 'noone', 'several', 'i', 'one', 'third', 'herein', 'but', 'further', 'here', 'whether', 'because', 'either', 'hereafter', 'really', 'so', 'somewhere', 'we', 'nevertheless', 'last', 'had', 'they', 
'thence', 'almost', 'ca', 'everywhere', 'itself', 'no', 'ourselves', 'may', 'wherein', 'take', 'around', 'never', 'them', 'to', 'until', 'do', 'what', 'say', 'twelve', 'nothing', 'during', 'sixty', 'sometime', 'us', 'fifty', 'much', 'for', 'other', 'hence', 'he', 'put'}\n<\/code><\/pre>\n<p>\u0647\u0645\u0686\u0646\u06cc\u0646 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0631\u0631\u0633\u06cc \u06a9\u0646\u06cc\u062f \u06a9\u0647 \u0622\u06cc\u0627 \u06cc\u06a9 \u06a9\u0644\u0645\u0647 \u06cc\u06a9 \u06a9\u0644\u0645\u0647 \u062a\u0648\u0642\u0641 \u0627\u0633\u062a \u06cc\u0627 \u0646\u0647.  \u0628\u0631\u0627\u06cc \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0632 <code>is_stop<\/code> \u0648\u06cc\u0698\u06af\u06cc \u0645\u0637\u0627\u0628\u0642 \u0634\u06a9\u0644 \u0632\u06cc\u0631:<\/p>\n<pre><code class=\"hljs\">sp.vocab[<span class=\"hljs-string\">'wonder'<\/span>].is_stop\n<\/code><\/pre>\n<p>\u0627\u0632 \u0622\u0646\u062c\u0627\u06cc\u06cc \u06a9\u0647 &#8220;wonder&#8221; \u06cc\u06a9 \u06a9\u0644\u0645\u0647 \u062a\u0648\u0642\u0641 spaCy \u0646\u06cc\u0633\u062a\u060c \u062e\u0648\u0627\u0647\u06cc\u062f \u062f\u06cc\u062f <code>False<\/code> \u062f\u0631 \u062e\u0631\u0648\u062c\u06cc<\/p>\n<p>\u0628\u0631\u0627\u06cc \u0627\u0641\u0632\u0648\u062f\u0646 \u06cc\u0627 \u062d\u0630\u0641 \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641 \u062f\u0631 spaCy\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f <code>sp.Defaults.stop_words.add()<\/code> \u0648 <code>sp.Defaults.stop_words.remove()<\/code> \u0631\u0648\u0634 \u0647\u0627 \u0628\u0647 \u062a\u0631\u062a\u06cc\u0628<\/p>\n<pre><code class=\"hljs\">sp.Defaults.stop_words.add(<span class=\"hljs-string\">'wonder'<\/span>)\n<\/code><\/pre>\n<p>\u0628\u0639\u062f\u060c \u0645\u0627 \u0628\u0627\u06cc\u062f 
\u062a\u0646\u0638\u06cc\u0645 \u06a9\u0646\u06cc\u0645 <code>is_stop<\/code> \u0628\u0631\u0627\u06cc <code>wonder<\/code> \u0628\u0647 &#8220;\u062f\u0631\u0633\u062a&#8221; \u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u062f\u0631 \u0632\u06cc\u0631 \u0646\u0634\u0627\u0646 \u062f\u0627\u062f\u0647 \u0634\u062f\u0647 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"hljs\">sp.vocab[<span class=\"hljs-string\">'wonder'<\/span>].is_stop = <span class=\"hljs-literal\">True<\/span>\n<\/code><\/pre>\n<h2 id=\"conclusion\"><span class=\"ez-toc-section\" id=\"%d9%86%d8%aa%db%8c%d8%ac%d9%87\"><\/span>\u0646\u062a\u06cc\u062c\u0647<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u062a\u0637\u0628\u06cc\u0642 \u0639\u0628\u0627\u0631\u0627\u062a \u0648 \u0648\u0627\u0698\u06af\u0627\u0646 \u06cc\u06a9\u06cc \u0627\u0632 \u0645\u0647\u0645\u062a\u0631\u06cc\u0646 \u0648\u0638\u0627\u06cc\u0641 \u067e\u0631\u062f\u0627\u0632\u0634 \u0632\u0628\u0627\u0646 \u0637\u0628\u06cc\u0639\u06cc \u0627\u0633\u062a.  \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647\u060c \u0628\u062d\u062b \u062e\u0648\u062f \u0631\u0627 \u062f\u0631 \u0645\u0648\u0631\u062f \u0631\u0648\u0634 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u062a\u0637\u0628\u06cc\u0642 \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u0642\u0627\u0646\u0648\u0646 \u0648 \u0639\u0628\u0627\u0631\u062a \u0627\u062f\u0627\u0645\u0647 \u062f\u0627\u062f\u06cc\u0645.  
\u0639\u0644\u0627\u0648\u0647 \u0628\u0631 \u0627\u06cc\u0646\u060c \u06a9\u0644\u0645\u0627\u062a \u062a\u0648\u0642\u0641 spaCy \u0631\u0627 \u0646\u06cc\u0632 \u062f\u06cc\u062f\u06cc\u0645.<\/p>\n<p>\u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0628\u0639\u062f\u06cc \u0628\u062e\u0634 \u0647\u0627\u06cc\u06cc \u0627\u0632 \u0628\u0631\u0686\u0633\u0628 \u06af\u0630\u0627\u0631\u06cc \u06af\u0641\u062a\u0627\u0631 \u0648 \u0634\u0646\u0627\u0633\u0627\u06cc\u06cc \u0645\u0648\u062c\u0648\u062f\u06cc\u062a \u0646\u0627\u0645\u06af\u0630\u0627\u0631\u06cc \u0634\u062f\u0647 \u0631\u0627 \u0628\u0647 \u0637\u0648\u0631 \u06a9\u0627\u0645\u0644 \u0645\u0634\u0627\u0647\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f.<\/p>\n<\/div>\n<p><script>\n                        !function(f,b,e,v,n,t,s)\n                        {if(f.fbq)return;n=f.fbq=function(){n.callMethod?\n                        n.callMethod.apply(n,arguments):n.queue.push(arguments)};\n                        if(!f._fbq)f._fbq=n;n.push=n;n.loaded=!0;n.version='2.0';\n                        n.queue=[];t=b.createElement(e);t.async=!0;\n                        t.src=v;s=b.getElementsByTagName(e)[0];\n                        s.parentNode.insertBefore(t,s)}(window, document,'script',\n                        'https:\/\/connect.facebook.net\/en_US\/fbevents.js');\n                        fbq('init', '525232124909042');\n                        fbq('track', 'PageView');\n                    <\/script>    (\u0628\u0631\u0686\u0633\u0628\u200c\u0647\u0627 \u0628\u0647 \u062a\u0631\u062c\u0645\u0647)# python<br \/>\n<br \/><br \/>\n<br \/>\u0645\u0646\u062a\u0634\u0631 \u0634\u062f\u0647 \u062f\u0631 1403-01-24 04:03:05<br \/>\n<\/p>\n\n\n<div class=\"kk-star-ratings kksr-auto kksr-align-center kksr-valign-bottom\"\n    
data-payload='{&quot;align&quot;:&quot;center&quot;,&quot;id&quot;:&quot;16368&quot;,&quot;slug&quot;:&quot;default&quot;,&quot;valign&quot;:&quot;bottom&quot;,&quot;ignore&quot;:&quot;&quot;,&quot;reference&quot;:&quot;auto&quot;,&quot;class&quot;:&quot;&quot;,&quot;count&quot;:&quot;0&quot;,&quot;legendonly&quot;:&quot;&quot;,&quot;readonly&quot;:&quot;&quot;,&quot;score&quot;:&quot;0&quot;,&quot;starsonly&quot;:&quot;&quot;,&quot;best&quot;:&quot;5&quot;,&quot;gap&quot;:&quot;5&quot;,&quot;greet&quot;:&quot;\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628&quot;,&quot;legend&quot;:&quot;0\\\/5 (0 \u0631\u0627\u06cc)&quot;,&quot;size&quot;:&quot;30&quot;,&quot;title&quot;:&quot;\u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0631\u0627\u06cc NLP: \u062a\u0637\u0628\u06cc\u0642 \u0648\u0627\u0698\u06af\u0627\u0646 \u0648 \u0639\u0628\u0627\u0631\u062a \u0628\u0627 SpaCy&quot;,&quot;width&quot;:&quot;0&quot;,&quot;_legend&quot;:&quot;{score}\\\/{best} ({count} \u0631\u0627\u06cc)&quot;,&quot;font_factor&quot;:&quot;1.25&quot;}'>\n            \n<div class=\"kksr-stars\">\n    \n<div class=\"kksr-stars-inactive\">\n            <div class=\"kksr-star\" data-star=\"1\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"2\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"3\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"4\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"5\" 
style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n    \n<div class=\"kksr-stars-active\" style=\"width: 0px;\">\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n<\/div>\n                \n\n<div class=\"kksr-legend\" style=\"font-size: 24px;\">\n            <span class=\"kksr-muted\">\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628<\/span>\n    <\/div>\n    <\/div>\n","protected":false},"excerpt":{"rendered":"<p><span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 8<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span>\u0627\u06cc\u0646 \u0633\u0648\u0645\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0627\u0632 \u0627\u06cc\u0646 \u0633\u0631\u06cc \u0645\u0642\u0627\u0644\u0627\u062a \u0627\u0633\u062a \u0631\u0648\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 
\u0628\u0631\u0627\u06cc \u067e\u0631\u062f\u0627\u0632\u0634 \u0632\u0628\u0627\u0646 \u0637\u0628\u06cc\u0639\u06cc \u062f\u0631 \u0645\u0642\u0627\u0644\u0647 \u0642\u0628\u0644\u06cc \u062f\u06cc\u062f\u06cc\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 NLTK \u067e\u0627\u06cc\u062a\u0648\u0646 \u0648 \u0641\u0636\u0627\u06cc\u06cc \u0627\u0632 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646 \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0648\u0638\u0627\u06cc\u0641 \u0633\u0627\u062f\u0647 NLP \u0645\u0627\u0646\u0646\u062f \u0646\u0634\u0627\u0646\u0647 \u06af\u0630\u0627\u0631\u06cc\u060c \u0631\u06cc\u0634\u0647 \u06cc\u0627\u0628\u06cc \u0648 \u0631\u06cc\u0634\u0647 \u06cc\u0627\u0628\u06cc. \u0645\u0627 \u0647\u0645\u0686\u0646\u06cc\u0646 \u062f\u06cc\u062f\u06cc\u0645 \u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646 \u0628\u062e\u0634\u200c\u0647\u0627\u06cc\u06cc \u0627\u0632 \u0628\u0631\u0686\u0633\u0628\u200c\u06af\u0630\u0627\u0631\u06cc \u06af\u0641\u062a\u0627\u0631\u060c \u0634\u0646\u0627\u0633\u0627\u06cc\u06cc \u0645\u0648\u062c\u0648\u062f\u06cc\u062a \u0646\u0627\u0645\u200c\u06af\u0630\u0627\u0631\u06cc 
[&hellip;]<\/p>\n","protected":false},"author":3,"featured_media":9162,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1743,620,1686],"tags":[],"class_list":["post-16368","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-python","category-programming","category-ai"],"acf":[],"_links":{"self":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/16368","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/users\/3"}],"replies":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/comments?post=16368"}],"version-history":[{"count":0,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/16368\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media\/9162"}],"wp:attachment":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media?parent=16368"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/categories?post=16368"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/tags?post=16368"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}