{"id":17607,"date":"2024-07-10T19:40:13","date_gmt":"2024-07-10T16:10:13","guid":{"rendered":"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/"},"modified":"2024-07-10T19:40:13","modified_gmt":"2024-07-10T16:10:13","slug":"%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9","status":"publish","type":"post","link":"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/","title":{"rendered":"\u0686\u06af\u0648\u0646\u0647 \u0627\u0632 Python SDK \u0628\u0631\u0627\u06cc \u0633\u0627\u062e\u062a\u0646 \u0648\u0628 Scraper \u062e\u0648\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f"},"content":{"rendered":"<div id=\"ez-toc-container\" class=\"ez-toc-v2_0_85 counter-hierarchy ez-toc-counter ez-toc-custom ez-toc-container-direction\">\n<div class=\"ez-toc-title-container\"><p class=\"ez-toc-title\" style=\"cursor:inherit\">\u0633\u0631\u0641\u0635\u0644\u0647\u0627\u06cc \u0645\u0637\u0644\u0628<\/p>\n<\/div><nav><ul class='ez-toc-list ez-toc-list-level-1 ' ><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-1\" href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#web_scraping_%da%86%db%8c%d8%b3%d8%aa%d8%9f\" >Web scraping \u0686\u06cc\u0633\u062a\u061f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a 
class=\"ez-toc-link ez-toc-heading-2\" href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%d8%a2%d9%86%da%86%d9%87_%d8%af%d8%b1_%d8%a7%db%8c%d9%86%d8%ac%d8%a7_%d8%ae%d9%88%d8%a7%d9%87%db%8c%d8%af_%d8%a2%d9%85%d9%88%d8%ae%d8%aa\" >\u0622\u0646\u0686\u0647 \u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u062e\u0648\u0627\u0647\u06cc\u062f \u0622\u0645\u0648\u062e\u062a<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-3\" href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%da%86%da%af%d9%88%d9%86%d9%87_%d8%b3%d9%88%d9%be_%d8%b2%db%8c%d8%a8%d8%a7_%d9%88_%d8%af%d8%b1%d8%ae%d9%88%d8%a7%d8%b3%d8%aa_%d9%87%d8%a7%db%8c_%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86_%d8%a8%d8%a7_%d9%87%d9%85_%da%a9%d8%a7%d8%b1_%d9%85%db%8c_%da%a9%d9%86%d9%86%d8%af\" >\u0686\u06af\u0648\u0646\u0647 \u0633\u0648\u067e \u0632\u06cc\u0628\u0627 \u0648 \u062f\u0631\u062e\u0648\u0627\u0633\u062a \u0647\u0627\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0627 \u0647\u0645 \u06a9\u0627\u0631 \u0645\u06cc \u06a9\u0646\u0646\u062f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-4\" href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%da%86%da%af%d9%88%d9%86%d9%87_%d8%a8%d8%a7_python_sdk_%db%8c%da%a9_web_scraper_%d8%a8%d8%b3%d8%a7%d8%b2%db%8c%d9%85\" >\u0686\u06af\u0648\u0646\u0647 \u0628\u0627 Python SDK \u06cc\u06a9 Web Scraper 
\u0628\u0633\u0627\u0632\u06cc\u0645<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-5\" href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%d9%85%d8%b1%d8%ad%d9%84%d9%87_1_%d9%88%d8%a7%d8%b1%d8%af_%da%a9%d8%b1%d8%af%d9%86_%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87_%d9%87%d8%a7%db%8c_%d8%b6%d8%b1%d9%88%d8%b1%db%8c\" >\u0645\u0631\u062d\u0644\u0647 1: \u0648\u0627\u0631\u062f \u06a9\u0631\u062f\u0646 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u0636\u0631\u0648\u0631\u06cc<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-6\" href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%d9%85%d8%b1%d8%ad%d9%84%d9%87_2_url_%d9%be%d8%a7%db%8c%d9%87_%d9%88_%d8%b3%d8%b1%d8%b5%d9%81%d8%ad%d9%87_csv_%d8%b1%d8%a7_%d8%aa%d8%b9%d8%b1%db%8c%d9%81_%da%a9%d9%86%db%8c%d8%af\" >\u0645\u0631\u062d\u0644\u0647 2: URL \u067e\u0627\u06cc\u0647 \u0648 \u0633\u0631\u0635\u0641\u062d\u0647 CSV \u0631\u0627 \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u062f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-7\" 
href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%d9%85%d8%b1%d8%ad%d9%84%d9%87_3_%db%8c%da%a9_%d8%aa%d8%a7%d8%a8%d8%b9_%d8%a8%d8%b1%d8%a7%db%8c_%d8%ae%d8%b1%d8%a7%d8%b4_%d8%af%d8%a7%d8%af%d9%86_%d8%ac%d8%b2%d8%a6%db%8c%d8%a7%d8%aa_%d9%85%d8%ac%d9%85%d9%88%d8%b9%d9%87_%d8%af%d8%a7%d8%af%d9%87_%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%da%a9%d9%86%db%8c%d8%af\" >\u0645\u0631\u062d\u0644\u0647 3: \u06cc\u06a9 \u062a\u0627\u0628\u0639 \u0628\u0631\u0627\u06cc \u062e\u0631\u0627\u0634 \u062f\u0627\u062f\u0646 \u062c\u0632\u0626\u06cc\u0627\u062a \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-8\" href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%d9%85%d8%b1%d8%ad%d9%84%d9%87_4_%db%8c%da%a9_%d8%aa%d8%a7%d8%a8%d8%b9_%d8%a8%d8%b1%d8%a7%db%8c_%d8%ae%d8%b1%d8%a7%d8%b4_%d8%af%d8%a7%d8%af%d9%86_%d9%84%db%8c%d8%b3%d8%aa_%d9%87%d8%a7%db%8c_%d9%85%d8%ac%d9%85%d9%88%d8%b9%d9%87_%d8%af%d8%a7%d8%af%d9%87_%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%da%a9%d9%86%db%8c%d8%af\" >\u0645\u0631\u062d\u0644\u0647 4: \u06cc\u06a9 \u062a\u0627\u0628\u0639 \u0628\u0631\u0627\u06cc \u062e\u0631\u0627\u0634 \u062f\u0627\u062f\u0646 \u0644\u06cc\u0633\u062a \u0647\u0627\u06cc \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-9\" 
href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%d9%85%d8%b1%d8%ad%d9%84%d9%87_5_%d8%a8%d8%a7_%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87_%d8%a7%d8%b2_%d9%be%d8%a7%d8%b1%d8%a7%d9%85%d8%aa%d8%b1%d9%87%d8%a7%db%8c_%d8%b5%d9%81%d8%ad%d9%87_%d8%a8%d9%86%d8%af%db%8c%d8%8c_%d8%b5%d9%81%d8%ad%d8%a7%d8%aa_%d8%b1%d8%a7_%d8%ad%d9%84%d9%82%d9%87_%d8%a8%d8%b2%d9%86%db%8c%d8%af\" >\u0645\u0631\u062d\u0644\u0647 5: \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u067e\u0627\u0631\u0627\u0645\u062a\u0631\u0647\u0627\u06cc \u0635\u0641\u062d\u0647 \u0628\u0646\u062f\u06cc\u060c \u0635\u0641\u062d\u0627\u062a \u0631\u0627 \u062d\u0644\u0642\u0647 \u0628\u0632\u0646\u06cc\u062f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-10\" href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%d9%85%d8%b1%d8%ad%d9%84%d9%87_6_%d8%af%d8%a7%d8%af%d9%87_%d9%87%d8%a7%db%8c_%d8%ae%d8%b1%d8%a7%d8%b4%db%8c%d8%af%d9%87_%d8%b4%d8%af%d9%87_%d8%b1%d8%a7_%d8%af%d8%b1_%db%8c%da%a9_%d9%81%d8%a7%db%8c%d9%84_csv_%d8%b0%d8%ae%db%8c%d8%b1%d9%87_%da%a9%d9%86%db%8c%d8%af\" >\u0645\u0631\u062d\u0644\u0647 6: \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062e\u0631\u0627\u0634\u06cc\u062f\u0647 \u0634\u062f\u0647 \u0631\u0627 \u062f\u0631 \u06cc\u06a9 \u0641\u0627\u06cc\u0644 CSV \u0630\u062e\u06cc\u0631\u0647 \u06a9\u0646\u06cc\u062f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-11\" 
href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%d9%85%d8%b1%d8%ad%d9%84%d9%87_7_%d8%b9%d9%85%d9%84%da%a9%d8%b1%d8%af_scraping_%d8%b1%d8%a7_%d8%a7%d8%ac%d8%b1%d8%a7_%da%a9%d9%86%db%8c%d8%af\" >\u0645\u0631\u062d\u0644\u0647 7: \u0639\u0645\u0644\u06a9\u0631\u062f Scraping \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-12\" href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%da%a9%d8%af_%da%a9%d8%a7%d9%85%d9%84\" >\u06a9\u062f \u06a9\u0627\u0645\u0644<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-13\" href=\"https:\/\/rasanegaar.com\/blog\/%da%86%da%af%d9%88%d9%86%d9%87-%d8%a7%d8%b2-python-sdk-%d8%a8%d8%b1%d8%a7%db%8c-%d8%b3%d8%a7%d8%ae%d8%aa%d9%86-%d9%88%d8%a8-scraper-%d8%ae%d9%88%d8%af-%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87-%da%a9\/#%d9%86%d8%aa%db%8c%d8%ac%d9%87\" >\u0646\u062a\u06cc\u062c\u0647<\/a><\/li><\/ul><\/nav><\/div>\n<span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 7<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span><p> <br \/>\n<\/p>\n<section class=\"post-content \" data-test-label=\"post-content\">\n<h2 id=\"what-is-web-scraping\"><span class=\"ez-toc-section\" id=\"web_scraping_%da%86%db%8c%d8%b3%d8%aa%d8%9f\"><\/span><strong>Web scraping 
\u0686\u06cc\u0633\u062a\u061f<\/strong><span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>Web scraping \u062a\u06a9\u0646\u06cc\u06a9\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0631\u0627\u06cc \u062c\u0645\u0639 \u0622\u0648\u0631\u06cc \u0645\u0642\u0627\u062f\u06cc\u0631 \u0632\u06cc\u0627\u062f\u06cc \u062f\u0627\u062f\u0647 \u0628\u0647 \u0635\u0648\u0631\u062a \u062e\u0648\u062f\u06a9\u0627\u0631 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u06cc\u06a9 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0631\u0646\u0627\u0645\u0647 \u0646\u0648\u06cc\u0633\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f.  \u0627\u06cc\u0646 \u0627\u0645\u0631 \u0622\u0646 \u0631\u0627 \u0628\u0631\u0627\u06cc \u0628\u0633\u06cc\u0627\u0631\u06cc \u0627\u0632 \u0645\u062a\u062e\u0635\u0635\u0627\u0646 \u0645\u0627\u0646\u0646\u062f \u062a\u062d\u0644\u06cc\u0644\u06af\u0631\u0627\u0646 \u062f\u0627\u062f\u0647\u060c \u0645\u062d\u0642\u0642\u0627\u0646 \u0628\u0627\u0632\u0627\u0631\u060c \u0645\u062a\u062e\u0635\u0635\u0627\u0646 \u0633\u0626\u0648\u060c \u062a\u062d\u0644\u06cc\u0644\u06af\u0631\u0627\u0646 \u062a\u062c\u0627\u0631\u06cc \u0648 \u0645\u062d\u0642\u0642\u0627\u0646 \u062f\u0627\u0646\u0634\u06af\u0627\u0647\u06cc \u0645\u0641\u06cc\u062f \u0645\u06cc \u06a9\u0646\u062f.<\/p>\n<h2 id=\"what-you-ll-learn-here\"><span class=\"ez-toc-section\" id=\"%d8%a2%d9%86%da%86%d9%87_%d8%af%d8%b1_%d8%a7%db%8c%d9%86%d8%ac%d8%a7_%d8%ae%d9%88%d8%a7%d9%87%db%8c%d8%af_%d8%a2%d9%85%d9%88%d8%ae%d8%aa\"><\/span><strong>\u0622\u0646\u0686\u0647 \u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u062e\u0648\u0627\u0647\u06cc\u062f \u0622\u0645\u0648\u062e\u062a<\/strong><span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u067e\u0627\u06cc\u062a\u0648\u0646 \u062f\u0648 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0628\u0647 \u0646\u0627\u0645\u200c\u0647\u0627\u06cc Requests \u0648 Beautiful Soup 
\u0627\u0631\u0627\u0626\u0647 \u0645\u06cc\u200c\u06a9\u0646\u062f \u06a9\u0647 \u0628\u0647 \u0634\u0645\u0627 \u06a9\u0645\u06a9 \u0645\u06cc\u200c\u06a9\u0646\u062f \u0648\u0628\u200c\u0633\u0627\u06cc\u062a\u200c\u0647\u0627 \u0631\u0627 \u0631\u0627\u062d\u062a\u200c\u062a\u0631 \u062e\u0631\u0627\u0634 \u062f\u0647\u06cc\u062f.  \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062a\u0631\u06a9\u06cc\u0628\u06cc \u0627\u0632 \u062f\u0631\u062e\u0648\u0627\u0633\u062a\u200c\u0647\u0627\u06cc Python \u0648 Beautiful Soup \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u062f \u0645\u062d\u062a\u0648\u0627\u06cc HTML \u0631\u0627 \u0627\u0632 \u06cc\u06a9 \u0648\u0628\u200c\u0633\u0627\u06cc\u062a \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u06a9\u0646\u062f \u0648 \u0633\u067e\u0633 \u0622\u0646 \u0631\u0627 \u0628\u0631\u0627\u06cc \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u062f\u0627\u062f\u0647\u200c\u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632 \u062a\u062c\u0632\u06cc\u0647 \u06a9\u0646\u062f.  \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647 \u0631\u0648\u0634 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0627\u06cc\u0646 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627 \u0631\u0627 \u0628\u0627 \u06cc\u06a9 \u0645\u062b\u0627\u0644 \u0628\u0647 \u0634\u0645\u0627 \u0646\u0634\u0627\u0646 \u0645\u06cc \u062f\u0647\u0645.<\/p>\n<p>\u0627\u06af\u0631 \u0628\u0627 \u0627\u06cc\u0646 \u0645\u0641\u0647\u0648\u0645 \u062a\u0627\u0632\u0647 \u06a9\u0627\u0631 \u0647\u0633\u062a\u06cc\u062f \u0648 \u062f\u0631 \u0633\u0637\u062d \u0645\u062a\u0648\u0633\u0637\u06cc \u0627\u0632 \u062a\u062e\u0635\u0635 \u067e\u0627\u06cc\u062a\u0648\u0646 \u062f\u0627\u0631\u06cc\u062f\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u062f\u0648\u0631\u0647 \u062a\u0648\u0633\u0639\u0647 \u067e\u0627\u06cc\u062a\u0648\u0646 \u0631\u0627 \u0628\u0631\u0631\u0633\u06cc \u06a9\u0646\u06cc\u062f. 
\u0631\u0648\u06cc \u0641\u0648\u0642 \u0645\u0647\u0627\u0631\u062a\u060c \u062c\u0627\u06cc\u06cc \u06a9\u0647 \u0645\u0646 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06cc\u06a9 \u0645\u062a\u062e\u0635\u0635 \u062f\u0631 \u0622\u0646 \u0645\u0634\u0627\u0631\u06a9\u062a \u0645\u06cc \u06a9\u0646\u0645. <\/p>\n<p>\u062f\u0631 \u067e\u0627\u06cc\u0627\u0646 \u0627\u06cc\u0646 \u0631\u0627\u0647\u0646\u0645\u0627\u060c \u0634\u0645\u0627 \u0628\u0631\u0627\u06cc \u0633\u0627\u062e\u062a\u0646 Web Scraper \u062e\u0648\u062f \u0645\u062c\u0647\u0632 \u062e\u0648\u0627\u0647\u06cc\u062f \u0634\u062f \u0648 \u062f\u0631\u06a9 \u0639\u0645\u06cc\u0642 \u062a\u0631\u06cc \u0627\u0632 \u06a9\u0627\u0631 \u0628\u0627 \u062d\u062c\u0645 \u0632\u06cc\u0627\u062f\u06cc \u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0648 \u0631\u0648\u0634 \u0627\u0639\u0645\u0627\u0644 \u0622\u0646 \u0628\u0631\u0627\u06cc \u062a\u0635\u0645\u06cc\u0645 \u06af\u06cc\u0631\u06cc \u0647\u0627\u06cc \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u062f\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u062f \u062f\u0627\u0634\u062a.<\/p>\n<p>\u0644\u0637\u0641\u0627\u064b \u062a\u0648\u062c\u0647 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f \u06a9\u0647 \u0627\u06af\u0631\u0686\u0647 \u0648\u0628 \u0627\u0633\u06a9\u0631\u0627\u067e\u0631 \u0627\u0628\u0632\u0627\u0631 \u0645\u0641\u06cc\u062f\u06cc \u0627\u0633\u062a\u060c \u0645\u0637\u0645\u0626\u0646 \u0634\u0648\u06cc\u062f \u06a9\u0647 \u0628\u0627 \u062a\u0645\u0627\u0645 \u062f\u0633\u062a\u0648\u0631\u0627\u0644\u0639\u0645\u0644\u200c\u0647\u0627\u06cc \u0642\u0627\u0646\u0648\u0646\u06cc \u0645\u0637\u0627\u0628\u0642\u062a \u062f\u0627\u0631\u06cc\u062f.  
\u0627\u06cc\u0646 \u0634\u0627\u0645\u0644 \u0627\u062d\u062a\u0631\u0627\u0645 \u0628\u0647 \u0641\u0627\u06cc\u0644 <code>robots.txt<\/code> \u0648\u0628 \u0633\u0627\u06cc\u062a \u0648 \u0631\u0639\u0627\u06cc\u062a \u0634\u0631\u0627\u06cc\u0637 \u062e\u062f\u0645\u0627\u062a \u0627\u0633\u062a \u062a\u0627 \u0627\u0632 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u063a\u06cc\u0631\u0645\u062c\u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627 \u062c\u0644\u0648\u06af\u06cc\u0631\u06cc \u0634\u0648\u062f. <\/p>\n<p>\u0647\u0645\u0686\u0646\u06cc\u0646 \u0642\u0628\u0644 \u0627\u0632 \u062e\u0631\u0627\u0634 \u062f\u0627\u062f\u0646\u060c \u0645\u0637\u0645\u0626\u0646 \u0634\u0648\u06cc\u062f \u06a9\u0647 \u0641\u0631\u0622\u06cc\u0646\u062f \u062e\u0631\u0627\u0634 \u062f\u0627\u062f\u0646 \u0628\u0647 \u0639\u0645\u0644\u06a9\u0631\u062f \u0648\u0628 \u0633\u0627\u06cc\u062a \u0622\u0633\u06cc\u0628 \u0646\u0645\u06cc \u0631\u0633\u0627\u0646\u062f \u06cc\u0627 \u0633\u0631\u0648\u0631\u0647\u0627\u06cc \u0622\u0646 \u0631\u0627 \u0628\u06cc\u0634 \u0627\u0632 \u062d\u062f \u0628\u0627\u0631\u06af\u0630\u0627\u0631\u06cc \u0646\u0645\u06cc \u06a9\u0646\u062f.  
\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0628\u0627 \u062e\u0631\u0627\u0634 \u0646\u062f\u0627\u062f\u0646 \u0627\u0637\u0644\u0627\u0639\u0627\u062a \u0634\u062e\u0635\u06cc \u06cc\u0627 \u062d\u0633\u0627\u0633 \u0628\u062f\u0648\u0646 \u0631\u0636\u0627\u06cc\u062a \u0645\u0646\u0627\u0633\u0628\u060c \u0628\u0647 \u062d\u0631\u06cc\u0645 \u062e\u0635\u0648\u0635\u06cc \u062f\u0627\u062f\u0647 \u0647\u0627 \u0627\u062d\u062a\u0631\u0627\u0645 \u0628\u06af\u0630\u0627\u0631\u06cc\u062f.<\/p>\n<h2 id=\"how-beautiful-soup-and-python-requests-work-together\"><span class=\"ez-toc-section\" id=\"%da%86%da%af%d9%88%d9%86%d9%87_%d8%b3%d9%88%d9%be_%d8%b2%db%8c%d8%a8%d8%a7_%d9%88_%d8%af%d8%b1%d8%ae%d9%88%d8%a7%d8%b3%d8%aa_%d9%87%d8%a7%db%8c_%d9%be%d8%a7%db%8c%d8%aa%d9%88%d9%86_%d8%a8%d8%a7_%d9%87%d9%85_%da%a9%d8%a7%d8%b1_%d9%85%db%8c_%da%a9%d9%86%d9%86%d8%af\"><\/span><strong>\u0686\u06af\u0648\u0646\u0647 \u0633\u0648\u067e \u0632\u06cc\u0628\u0627 \u0648 \u062f\u0631\u062e\u0648\u0627\u0633\u062a \u0647\u0627\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0628\u0627 \u0647\u0645 \u06a9\u0627\u0631 \u0645\u06cc \u06a9\u0646\u0646\u062f<\/strong><span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0646\u0642\u0634 \u0647\u0631 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0631\u0627 \u062f\u0631\u06a9 \u06a9\u0646\u06cc\u0645. <\/p>\n<p>\u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u062f\u0631\u062e\u0648\u0627\u0633\u062a\u200c\u0647\u0627\u06cc \u067e\u0627\u06cc\u062a\u0648\u0646 \u0645\u0633\u0626\u0648\u0644 \u0648\u0627\u06a9\u0634\u06cc \u0645\u062d\u062a\u0648\u0627\u06cc HTML \u0627\u0632 \u0622\u062f\u0631\u0633 \u0627\u06cc\u0646\u062a\u0631\u0646\u062a\u06cc \u0634\u0645\u0627 \u062f\u0631 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0627\u0633\u062a.  
\u0647\u0646\u06af\u0627\u0645\u06cc \u06a9\u0647 \u0645\u062d\u062a\u0648\u0627 \u0631\u0627 \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0645\u06cc \u06a9\u0646\u062f\u060c \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u062f\u0631 \u06cc\u06a9 \u0634\u06cc \u067e\u0627\u0633\u062e \u0630\u062e\u06cc\u0631\u0647 \u0645\u06cc \u06a9\u0646\u062f. <\/p>\n<p>\u0633\u067e\u0633 Beautiful Soup \u06a9\u0627\u0631 \u0631\u0627 \u0628\u0647 \u062f\u0633\u062a \u0645\u06cc \u06af\u06cc\u0631\u062f \u0648 HTML \u062e\u0627\u0645 \u0631\u0627 \u0627\u0632 \u067e\u0627\u0633\u062e Requests \u0628\u0647 \u0642\u0627\u0644\u0628\u06cc \u0633\u0627\u062e\u062a\u0627\u0631\u06cc\u0627\u0641\u062a\u0647 \u062a\u0628\u062f\u06cc\u0644 \u0645\u06cc \u06a9\u0646\u062f \u0648 \u0622\u0646 \u0631\u0627 \u062a\u062c\u0632\u06cc\u0647 \u0645\u06cc \u06a9\u0646\u062f.  \u0633\u067e\u0633 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0627 \u0645\u0634\u062e\u0635 \u06a9\u0631\u062f\u0646 \u0648\u06cc\u0698\u06af\u06cc\u200c\u0647\u0627\u060c \u062f\u0627\u062f\u0647\u200c\u0647\u0627 \u0631\u0627 \u0627\u0632 HTML \u062a\u062c\u0632\u06cc\u0647\u200c\u0634\u062f\u0647 \u062e\u0631\u0627\u0634 \u062f\u0647\u06cc\u062f\u061b \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u0628\u0647 \u0634\u0645\u0627 \u0627\u06cc\u0646 \u0627\u0645\u06a9\u0627\u0646 \u0631\u0627 \u0645\u06cc\u200c\u062f\u0647\u062f \u06a9\u0647 \u062c\u0645\u0639\u200c\u0622\u0648\u0631\u06cc \u062f\u0627\u062f\u0647\u200c\u0647\u0627\u06cc \u062e\u0627\u0635 \u0627\u0632 \u0648\u0628\u200c\u0633\u0627\u06cc\u062a\u200c\u0647\u0627 \u06cc\u0627 \u0645\u062e\u0627\u0632\u0646 \u0631\u0627 \u062e\u0648\u062f\u06a9\u0627\u0631 \u06a9\u0646\u06cc\u062f.<\/p>\n<p>\u0627\u0645\u0627 \u0627\u06cc\u0646 \u062f\u0648\u062a\u0627\u06cc\u06cc \u0645\u062d\u062f\u0648\u062f\u06cc\u062a \u0647\u0627\u06cc\u06cc \u062f\u0627\u0631\u062f.  
\u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 Requests \u0646\u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0648\u0628 \u0633\u0627\u06cc\u062a \u0647\u0627\u06cc\u06cc \u0628\u0627 \u0645\u062d\u062a\u0648\u0627\u06cc \u062c\u0627\u0648\u0627 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u067e\u0648\u06cc\u0627 \u0631\u0627 \u0645\u062f\u06cc\u0631\u06cc\u062a \u06a9\u0646\u062f.  \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u0634\u0645\u0627 \u0628\u0627\u06cc\u062f \u062f\u0631 \u062f\u0631\u062c\u0647 \u0627\u0648\u0644 \u0627\u0632 \u0622\u0646 \u0628\u0631\u0627\u06cc \u0633\u0627\u06cc\u062a \u0647\u0627\u06cc\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f \u06a9\u0647 \u0645\u062d\u062a\u0648\u0627\u06cc \u0627\u06cc\u0633\u062a\u0627 \u0631\u0627 \u0627\u0632 \u0633\u0631\u0648\u0631\u0647\u0627 \u0627\u0631\u0627\u0626\u0647 \u0645\u06cc \u062f\u0647\u0646\u062f.  \u0627\u06af\u0631 \u0646\u06cc\u0627\u0632 \u0628\u0647 \u062e\u0631\u0627\u0634 \u062f\u0627\u062f\u0646 \u06cc\u06a9 \u0633\u0627\u06cc\u062a \u0628\u0627\u0631\u06af\u0630\u0627\u0631\u06cc \u0634\u062f\u0647 \u067e\u0648\u06cc\u0627 \u062f\u0627\u0631\u06cc\u062f\u060c \u0628\u0627\u06cc\u062f \u0627\u0632 \u0627\u0628\u0632\u0627\u0631\u0647\u0627\u06cc \u0627\u062a\u0648\u0645\u0627\u0633\u06cc\u0648\u0646 \u067e\u06cc\u0634\u0631\u0641\u062a\u0647 \u062a\u0631\u06cc \u0645\u0627\u0646\u0646\u062f \u0633\u0644\u0646\u06cc\u0648\u0645 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f.<\/p>\n<h2 id=\"how-to-build-a-web-scraper-with-python-sdk\"><span class=\"ez-toc-section\" id=\"%da%86%da%af%d9%88%d9%86%d9%87_%d8%a8%d8%a7_python_sdk_%db%8c%da%a9_web_scraper_%d8%a8%d8%b3%d8%a7%d8%b2%db%8c%d9%85\"><\/span><strong>\u0686\u06af\u0648\u0646\u0647 \u0628\u0627 Python SDK \u06cc\u06a9 Web Scraper \u0628\u0633\u0627\u0632\u06cc\u0645<\/strong><span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0627\u06a9\u0646\u0648\u0646 \u06a9\u0647 
\u0641\u0647\u0645\u06cc\u062f\u06cc\u0645 Beautiful Soup \u0648 Python Requests \u0686\u0647 \u06a9\u0627\u0631\u06cc \u0645\u06cc \u062a\u0648\u0627\u0646\u0646\u062f \u0627\u0646\u062c\u0627\u0645 \u062f\u0647\u0646\u062f\u060c \u0628\u06cc\u0627\u06cc\u06cc\u062f \u062f\u0631 \u0645\u0648\u0631\u062f \u0627\u06cc\u0646\u06a9\u0647 \u0686\u06af\u0648\u0646\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0627\u06cc\u0646 \u0627\u0628\u0632\u0627\u0631\u0647\u0627 \u062e\u0631\u0627\u0634 \u062f\u0647\u06cc\u0645\u060c \u0628\u062d\u062b \u06a9\u0646\u06cc\u0645.<\/p>\n<p>\u062f\u0631 \u0645\u062b\u0627\u0644 \u0632\u06cc\u0631\u060c \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u0627\u0632 \u0645\u062e\u0632\u0646 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 UC Irvine \u062c\u0645\u0639 \u0622\u0648\u0631\u06cc \u0645\u06cc \u06a9\u0646\u06cc\u0645. 
<\/p>\n<figure class=\"kg-card kg-image-card kg-width-wide kg-card-hascaption\"><img decoding=\"async\" src=\"https:\/\/rasanegaar.com\/blog\/wp-content\/uploads\/2024\/07\/AD_4nXd2MTmii-KD8tu6AAeHhbr9Sb5vauq3jC3AcYc2Yvd4kcCQLdTdVrBqZuFOpF-vKQ3E012hV7W6bm0iOtqrCsvJx6xsT165.png\" class=\"kg-image\" alt=\"AD_4nXd2MTmii-KD8tu6AAeHhbr9Sb5vauq3jC3AcYc2Yvd4kcCQLdTdVrBqZuFOpF-vKQ3E012hV7W6bm0iOtqrCsvJx6xsT165CV8MKj46T165CV000000000iOtqrCsvJx6xsT165CV8MKj46T165CV0000F 4XLVBuikCJpXTIB6c6JriJtP9MQ?key=f_hrU3B_rjNJFpKZiiV3Pw\" width=\"1600\" height=\"685\" loading=\"lazy\" title=\"\"><figcaption>\u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627 \u062f\u0631 \u0645\u062e\u0632\u0646 \u06cc\u0627\u062f\u06af\u06cc\u0631\u06cc \u0645\u0627\u0634\u06cc\u0646 UC Irvine<\/figcaption><\/figure>\n<p>\u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u0645\u06cc \u0628\u06cc\u0646\u06cc\u062f\u060c \u0634\u0627\u0645\u0644 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0632\u06cc\u0627\u062f\u06cc \u0627\u0633\u062a \u0648 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0627 \u0631\u0641\u062a\u0646 \u0628\u0647 \u06cc\u06a9 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647\u060c \u062c\u0632\u0626\u06cc\u0627\u062a \u0628\u06cc\u0634\u062a\u0631\u06cc \u062f\u0631 \u0645\u0648\u0631\u062f \u0647\u0631 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u067e\u06cc\u062f\u0627 \u06a9\u0646\u06cc\u062f page \u0628\u0631\u0627\u06cc \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647  \u0634\u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0647 \u0627\u062e\u062a\u0635\u0627\u0635\u06cc \u062f\u0633\u062a\u0631\u0633\u06cc \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f page \u0628\u0627 \u06a9\u0644\u06cc\u06a9 \u06a9\u0631\u062f\u0646 \u0631\u0648\u06cc \u0646\u0627\u0645 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 
\u062f\u0631 \u0644\u06cc\u0633\u062a \u0628\u0627\u0644\u0627. <\/p>\n<p>\u0628\u0631\u0627\u06cc \u062f\u0631\u06cc\u0627\u0641\u062a \u0627\u06cc\u062f\u0647 \u0627\u0632 \u0627\u0637\u0644\u0627\u0639\u0627\u062a \u0627\u0631\u0627\u0626\u0647 \u0634\u062f\u0647 \u0628\u0631\u0627\u06cc \u0647\u0631 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647\u060c \u062a\u0635\u0648\u06cc\u0631 \u0632\u06cc\u0631 \u0631\u0627 \u0628\u0631\u0631\u0633\u06cc \u06a9\u0646\u06cc\u062f.<\/p>\n<figure class=\"kg-card kg-image-card kg-width-wide kg-card-hascaption\"><img decoding=\"async\" src=\"https:\/\/rasanegaar.com\/blog\/wp-content\/uploads\/2024\/07\/AD_4nXcb7_BVgpIh1P931U-HHX6BKIPN1ODKRzc6WqjX-n77uA9Uvz_e80wqc2YtJx2-Rq3HzWKtlDE31gV-7jz0UASzKrhq86X4.png\" class=\"kg-image\" alt=\"AD_4nXcb7_BVgpIh1P931U-HHX6BKIPN1ODKRzc6WqjX-n77uA9Uvz_e80wqc2YtJx2-Rq3HzWKtlDE31gV-7jz0UASzKrhq86VXV45KrhqNXV4VR5 k54hpyEetzyuDjMgPYW4KKW-oPhKjh8?key=f_hrU3B_rjNJFpKZiiV3Pw\" width=\"1185\" height=\"363\" loading=\"lazy\" title=\"\"><figcaption>\u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0639\u0646\u0628\u06cc\u0647<\/figcaption><\/figure>\n<p>\u06a9\u062f\u06cc \u06a9\u0647 \u062f\u0631 \u0632\u06cc\u0631 \u0645\u06cc \u0646\u0648\u06cc\u0633\u06cc\u0645 \u0627\u0632 \u0647\u0631 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0639\u0628\u0648\u0631 \u0645\u06cc \u06a9\u0646\u062f\u060c \u062c\u0632\u0626\u06cc\u0627\u062a \u0631\u0627 \u0645\u06cc \u062e\u0631\u0627\u0634\u062f \u0648 \u0622\u0646\u0647\u0627 \u0631\u0627 \u062f\u0631 \u06cc\u06a9 \u0641\u0627\u06cc\u0644 CSV \u0630\u062e\u06cc\u0631\u0647 \u0645\u06cc \u06a9\u0646\u062f.<\/p>\n<h3 id=\"step-1-import-necessary-libraries\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%b1%d8%ad%d9%84%d9%87_1_%d9%88%d8%a7%d8%b1%d8%af_%da%a9%d8%b1%d8%af%d9%86_%da%a9%d8%aa%d8%a7%d8%a8%d8%ae%d8%a7%d9%86%d9%87_%d9%87%d8%a7%db%8c_%d8%b6%d8%b1%d9%88%d8%b1%db%8c\"><\/span>\u0645\u0631\u062d\u0644\u0647 1: 
\u0648\u0627\u0631\u062f \u06a9\u0631\u062f\u0646 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u0636\u0631\u0648\u0631\u06cc<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0627\u0628\u062a\u062f\u0627 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u0644\u0627\u0632\u0645 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f: <code>requests<\/code> \u0628\u0631\u0627\u06cc \u0627\u06cc\u062c\u0627\u062f \u062f\u0631\u062e\u0648\u0627\u0633\u062a \u0647\u0627\u06cc HTTP\u060c BeautifulSoup \u0628\u0631\u0627\u06cc \u062a\u062c\u0632\u06cc\u0647 \u0645\u062d\u062a\u0648\u0627\u06cc HTML\u060c \u0648 <code>csv<\/code> \u0628\u0631\u0627\u06cc \u0630\u062e\u06cc\u0631\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627.<\/p>\n<pre><code class=\"language-python\">import requests\nfrom bs4 import BeautifulSoup\nimport csv<\/code><\/pre>\n<h3 id=\"step-2-define-the-base-url-and-csv-headers\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%b1%d8%ad%d9%84%d9%87_2_url_%d9%be%d8%a7%db%8c%d9%87_%d9%88_%d8%b3%d8%b1%d8%b5%d9%81%d8%ad%d9%87_csv_%d8%b1%d8%a7_%d8%aa%d8%b9%d8%b1%db%8c%d9%81_%da%a9%d9%86%db%8c%d8%af\"><\/span>\u0645\u0631\u062d\u0644\u0647 2: URL \u067e\u0627\u06cc\u0647 \u0648 \u0633\u0631\u0635\u0641\u062d\u0647 CSV \u0631\u0627 \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u062f<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>URL \u067e\u0627\u06cc\u0647 \u0631\u0627 \u0628\u0631\u0627\u06cc \u0641\u0647\u0631\u0633\u062a \u0647\u0627\u06cc \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u062a\u0646\u0638\u06cc\u0645 \u06a9\u0646\u06cc\u062f \u0648 \u0633\u0631\u0635\u0641\u062d\u0647 \u0647\u0627\u06cc \u0641\u0627\u06cc\u0644 CSV \u0631\u0627 \u06a9\u0647 \u062f\u0631 \u0622\u0646 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062e\u0631\u0627\u0634\u06cc\u062f\u0647 \u0634\u062f\u0647 \u0630\u062e\u06cc\u0631\u0647 \u0645\u06cc \u0634\u0648\u062f\u060c \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u062f.<\/p>\n<pre><code 
class=\"language-python\">def scrape_uci_datasets():\n    base_url = \"https:\/\/archive.ics.uci.edu\/datasets\"\n\n\n    headers = [\n        \"Dataset Name\", \"Donated Date\", \"Description\",\n        \"Dataset Characteristics\", \"Subject Area\", \"Associated Tasks\",\n        \"Feature Type\", \"Instances\", \"Features\"\n    ]\n\n\n    data = []\n<\/code><\/pre>\n<h3 id=\"step-3-create-a-function-to-scrape-dataset-details\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%b1%d8%ad%d9%84%d9%87_3_%db%8c%da%a9_%d8%aa%d8%a7%d8%a8%d8%b9_%d8%a8%d8%b1%d8%a7%db%8c_%d8%ae%d8%b1%d8%a7%d8%b4_%d8%af%d8%a7%d8%af%d9%86_%d8%ac%d8%b2%d8%a6%db%8c%d8%a7%d8%aa_%d9%85%d8%ac%d9%85%d9%88%d8%b9%d9%87_%d8%af%d8%a7%d8%af%d9%87_%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%da%a9%d9%86%db%8c%d8%af\"><\/span>\u0645\u0631\u062d\u0644\u0647 3: \u06cc\u06a9 \u062a\u0627\u0628\u0639 \u0628\u0631\u0627\u06cc \u062e\u0631\u0627\u0634 \u062f\u0627\u062f\u0646 \u062c\u0632\u0626\u06cc\u0627\u062a \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u06cc\u06a9 \u062a\u0627\u0628\u0639 \u0631\u0627 \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u062f <code>scrape_dataset_details<\/code> \u06a9\u0647 URL \u06cc\u06a9 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u062c\u062f\u0627\u06af\u0627\u0646\u0647 \u0631\u0627 \u0645\u06cc \u06af\u06cc\u0631\u062f page\u060c \u0645\u062d\u062a\u0648\u0627\u06cc HTML \u0631\u0627 \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0645\u06cc \u06a9\u0646\u062f\u060c \u0622\u0646 \u0631\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 BeautifulSoup \u062a\u062c\u0632\u06cc\u0647 \u0645\u06cc \u06a9\u0646\u062f \u0648 \u0627\u0637\u0644\u0627\u0639\u0627\u062a \u0645\u0631\u0628\u0648\u0637\u0647 \u0631\u0627 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0645\u06cc \u06a9\u0646\u062f.<\/p>\n<pre><code 
class=\"language-python\">\n    def scrape_dataset_details(dataset_url):\n        response = requests.get(dataset_url)\n        soup = BeautifulSoup(response.text, 'html.parser')\n\n\n        dataset_name = soup.find(\n            'h1', class_='text-3xl font-semibold text-primary-content')\n        dataset_name = dataset_name.text.strip() if dataset_name else \"N\/A\"\n\n\n        donated_date = soup.find('h2', class_='text-sm text-primary-content')\n        donated_date = donated_date.text.strip().replace(\n            'Donated on ', '') if donated_date else \"N\/A\"\n\n\n        description = soup.find('p', class_='svelte-17wf9gp')\n        description = description.text.strip() if description else \"N\/A\"\n\n\n        details = soup.find_all('div', class_='col-span-4')\n\n\n        dataset_characteristics = details[0].find('p').text.strip() if len(\n            details) &gt; 0 else \"N\/A\"\n        subject_area = details[1].find('p').text.strip() if len(\n            details) &gt; 1 else \"N\/A\"\n        associated_tasks = details[2].find('p').text.strip() if len(\n            details) &gt; 2 else \"N\/A\"\n        feature_type = details[3].find('p').text.strip() if len(\n            details) &gt; 3 else \"N\/A\"\n        instances = details[4].find('p').text.strip() if len(\n            details) &gt; 4 else \"N\/A\"\n        features = details[5].find('p').text.strip() if len(\n            details) &gt; 5 else \"N\/A\"\n\n\n        return [\n            dataset_name, donated_date, description, dataset_characteristics,\n            subject_area, associated_tasks, feature_type, instances, features\n        ]\n<\/code><\/pre>\n<p>\u0627\u06cc\u0646 <code>scrape_dataset_details<\/code> \u062a\u0627\u0628\u0639 \u0645\u062d\u062a\u0648\u0627\u06cc HTML \u06cc\u06a9 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0631\u0627 \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0645\u06cc \u06a9\u0646\u062f page \u0648 \u0622\u0646 
\u0631\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 BeautifulSoup \u062a\u062c\u0632\u06cc\u0647 \u0645\u06cc \u06a9\u0646\u062f.  \u0627\u06cc\u0646 \u0627\u0637\u0644\u0627\u0639\u0627\u062a \u0631\u0627 \u0628\u0627 \u0647\u062f\u0641 \u0642\u0631\u0627\u0631 \u062f\u0627\u062f\u0646 \u0639\u0646\u0627\u0635\u0631 \u062e\u0627\u0635 HTML \u0628\u0631 \u0627\u0633\u0627\u0633 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0645\u06cc \u06a9\u0646\u062f \u0631\u0648\u06cc \u0628\u0631\u0686\u0633\u0628 \u0647\u0627 \u0648 \u06a9\u0644\u0627\u0633 \u0647\u0627\u06cc \u0622\u0646\u0647\u0627\u060c \u0645\u0627\u0646\u0646\u062f \u0646\u0627\u0645 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u060c \u062a\u0627\u0631\u06cc\u062e \u0627\u0647\u062f\u0627\u060c \u0648 \u062a\u0648\u0636\u06cc\u062d\u0627\u062a. <\/p>\n<p>\u062a\u0627\u0628\u0639 \u0627\u0632 \u0631\u0648\u0634 \u0647\u0627\u06cc\u06cc \u0645\u0627\u0646\u0646\u062f <code>find<\/code> \u0648 <code>find_all<\/code> \u0628\u0631\u0627\u06cc \u0645\u06a9\u0627\u0646 \u06cc\u0627\u0628\u06cc \u0627\u06cc\u0646 \u0639\u0646\u0627\u0635\u0631 \u0648 \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0645\u062d\u062a\u0648\u0627\u06cc \u0645\u062a\u0646\u06cc \u0622\u0646\u0647\u0627\u060c \u0631\u0633\u06cc\u062f\u06af\u06cc \u0628\u0647 \u0645\u0648\u0627\u0631\u062f\u06cc \u06a9\u0647 \u0645\u0645\u06a9\u0646 \u0627\u0633\u062a \u0639\u0646\u0627\u0635\u0631 \u0627\u0632 \u062f\u0633\u062a \u0631\u0641\u062a\u0647 \u0628\u0627 \u0627\u0631\u0627\u0626\u0647 \u0645\u0642\u0627\u062f\u06cc\u0631 \u067e\u06cc\u0634 \u0641\u0631\u0636. 
<\/p>\n<p>\u0627\u06cc\u0646 \u0631\u0648\u06cc\u06a9\u0631\u062f \u0633\u06cc\u0633\u062a\u0645\u0627\u062a\u06cc\u06a9 \u062a\u0636\u0645\u06cc\u0646 \u0645\u06cc \u06a9\u0646\u062f \u06a9\u0647 \u062c\u0632\u0626\u06cc\u0627\u062a \u0645\u0631\u0628\u0648\u0637\u0647 \u0628\u0647 \u0637\u0648\u0631 \u062f\u0642\u06cc\u0642 \u0636\u0628\u0637 \u0634\u062f\u0647 \u0648 \u062f\u0631 \u0642\u0627\u0644\u0628\u06cc \u0633\u0627\u062e\u062a\u0627\u0631\u06cc\u0627\u0641\u062a\u0647 \u0628\u0627\u0632\u06af\u0631\u062f\u0627\u0646\u062f\u0647 \u0645\u06cc \u0634\u0648\u0646\u062f.<\/p>\n<h3 id=\"step-4-create-a-function-to-scrape-dataset-listings\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%b1%d8%ad%d9%84%d9%87_4_%db%8c%da%a9_%d8%aa%d8%a7%d8%a8%d8%b9_%d8%a8%d8%b1%d8%a7%db%8c_%d8%ae%d8%b1%d8%a7%d8%b4_%d8%af%d8%a7%d8%af%d9%86_%d9%84%db%8c%d8%b3%d8%aa_%d9%87%d8%a7%db%8c_%d9%85%d8%ac%d9%85%d9%88%d8%b9%d9%87_%d8%af%d8%a7%d8%af%d9%87_%d8%a7%db%8c%d8%ac%d8%a7%d8%af_%da%a9%d9%86%db%8c%d8%af\"><\/span>\u0645\u0631\u062d\u0644\u0647 4: \u06cc\u06a9 \u062a\u0627\u0628\u0639 \u0628\u0631\u0627\u06cc \u062e\u0631\u0627\u0634 \u062f\u0627\u062f\u0646 \u0644\u06cc\u0633\u062a \u0647\u0627\u06cc \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u06cc\u06a9 \u062a\u0627\u0628\u0639 \u0631\u0627 \u062a\u0639\u0631\u06cc\u0641 \u06a9\u0646\u06cc\u062f <code>scrape_datasets<\/code> \u06a9\u0647 URL \u06cc\u06a9 \u0631\u0627 \u0645\u06cc \u06af\u06cc\u0631\u062f page \u0641\u0647\u0631\u0633\u062a \u06a9\u0631\u062f\u0646 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u062a\u0639\u062f\u062f\u060c \u0645\u062d\u062a\u0648\u0627\u06cc HTML \u0631\u0627 \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u0645\u06cc \u06a9\u0646\u062f \u0648 \u062a\u0645\u0627\u0645 \u067e\u06cc\u0648\u0646\u062f\u0647\u0627\u06cc 
\u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647 \u0631\u0627 \u067e\u06cc\u062f\u0627 \u0645\u06cc \u06a9\u0646\u062f.  \u0628\u0631\u0627\u06cc \u0647\u0631 \u067e\u06cc\u0648\u0646\u062f\u060c \u062a\u0645\u0627\u0633 \u0645\u06cc \u06af\u06cc\u0631\u062f <code>scrape_dataset_details<\/code> \u0628\u0631\u0627\u06cc \u062f\u0631\u06cc\u0627\u0641\u062a \u0627\u0637\u0644\u0627\u0639\u0627\u062a \u062f\u0642\u06cc\u0642<\/p>\n<pre><code class=\"language-python\">    def scrape_datasets(page_url):\n        response = requests.get(page_url)\n        soup = BeautifulSoup(response.text, 'html.parser')\n\n\n        dataset_list = soup.find_all(\n            'a', class_='link-hover link text-xl font-semibold')\n\n\n        if not dataset_list:\n            print(\"No dataset links found\")\n            return\n\n\n        for dataset in dataset_list:\n            dataset_link = \"https:\/\/archive.ics.uci.edu\" + dataset['href']\n            print(f\"Scraping details for {dataset.text.strip()}...\")\n            dataset_details = scrape_dataset_details(dataset_link)\n            data.append(dataset_details)<\/code><\/pre>\n<h3 id=\"step-5-loop-through-pages-using-pagination-parameters\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%b1%d8%ad%d9%84%d9%87_5_%d8%a8%d8%a7_%d8%a7%d8%b3%d8%aa%d9%81%d8%a7%d8%af%d9%87_%d8%a7%d8%b2_%d9%be%d8%a7%d8%b1%d8%a7%d9%85%d8%aa%d8%b1%d9%87%d8%a7%db%8c_%d8%b5%d9%81%d8%ad%d9%87_%d8%a8%d9%86%d8%af%db%8c%d8%8c_%d8%b5%d9%81%d8%ad%d8%a7%d8%aa_%d8%b1%d8%a7_%d8%ad%d9%84%d9%82%d9%87_%d8%a8%d8%b2%d9%86%db%8c%d8%af\"><\/span>\u0645\u0631\u062d\u0644\u0647 5: \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u067e\u0627\u0631\u0627\u0645\u062a\u0631\u0647\u0627\u06cc \u0635\u0641\u062d\u0647 \u0628\u0646\u062f\u06cc\u060c \u0635\u0641\u062d\u0627\u062a \u0631\u0627 \u062d\u0644\u0642\u0647 \u0628\u0632\u0646\u06cc\u062f<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u06cc\u06a9 \u062d\u0644\u0642\u0647 
\u0628\u0631\u0627\u06cc \u067e\u06cc\u0645\u0627\u06cc\u0634 \u062f\u0631 \u0635\u0641\u062d\u0627\u062a \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u067e\u0627\u0631\u0627\u0645\u062a\u0631\u0647\u0627\u06cc \u0635\u0641\u062d\u0647 \u0628\u0646\u062f\u06cc \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc \u06a9\u0646\u06cc\u062f.  \u0627\u06cc\u0646 \u062d\u0644\u0642\u0647 \u062a\u0627 \u0632\u0645\u0627\u0646\u06cc \u0627\u062f\u0627\u0645\u0647 \u0645\u06cc \u06cc\u0627\u0628\u062f \u06a9\u0647 \u0647\u06cc\u0686 \u062f\u0627\u062f\u0647 \u062c\u062f\u06cc\u062f\u06cc \u0627\u0636\u0627\u0641\u0647 \u0646\u0634\u0648\u062f\u060c \u06a9\u0647 \u0646\u0634\u0627\u0646 \u0645\u06cc \u062f\u0647\u062f \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0627\u062a \u062e\u0631\u0627\u0634\u06cc\u062f\u0647 \u0634\u062f\u0647 \u0627\u0646\u062f.<\/p>\n<pre><code class=\"language-python\">    skip = 0\n    take = 10\n    while True:\n        page_url = f\"https:\/\/archive.ics.uci.edu\/datasets?skip={skip}&amp;take={take}&amp;sort=desc&amp;orderBy=NumHits&amp;search=\"\n        print(f\"Scraping page: {page_url}\")\n        initial_data_count = len(data)\n        scrape_datasets(page_url)\n        if len(\n                data\n        ) == initial_data_count:  \n            break\n        skip += take<\/code><\/pre>\n<h3 id=\"step-6-save-the-scraped-data-to-a-csv-file\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%b1%d8%ad%d9%84%d9%87_6_%d8%af%d8%a7%d8%af%d9%87_%d9%87%d8%a7%db%8c_%d8%ae%d8%b1%d8%a7%d8%b4%db%8c%d8%af%d9%87_%d8%b4%d8%af%d9%87_%d8%b1%d8%a7_%d8%af%d8%b1_%db%8c%da%a9_%d9%81%d8%a7%db%8c%d9%84_csv_%d8%b0%d8%ae%db%8c%d8%b1%d9%87_%da%a9%d9%86%db%8c%d8%af\"><\/span>\u0645\u0631\u062d\u0644\u0647 6: \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062e\u0631\u0627\u0634\u06cc\u062f\u0647 \u0634\u062f\u0647 \u0631\u0627 \u062f\u0631 \u06cc\u06a9 \u0641\u0627\u06cc\u0644 CSV \u0630\u062e\u06cc\u0631\u0647 
\u06a9\u0646\u06cc\u062f<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u067e\u0633 \u0627\u0632 \u062e\u0631\u0627\u0634 \u062f\u0627\u062f\u0646 \u062a\u0645\u0627\u0645 \u062f\u0627\u062f\u0647 \u0647\u0627\u060c \u0622\u0646 \u0631\u0627 \u062f\u0631 \u06cc\u06a9 \u0641\u0627\u06cc\u0644 CSV \u0630\u062e\u06cc\u0631\u0647 \u06a9\u0646\u06cc\u062f.<\/p>\n<pre><code class=\"language-python\">    with open('uci_datasets.csv', 'w', newline=\"\", encoding='utf-8') as file:\n        writer = csv.writer(file)\n        writer.writerow(headers)\n        writer.writerows(data)\n\n\n    print(\"Scraping complete. Data saved to 'uci_datasets.csv'.\")<\/code><\/pre>\n<h3 id=\"step-7-run-the-scraping-function\"><span class=\"ez-toc-section\" id=\"%d9%85%d8%b1%d8%ad%d9%84%d9%87_7_%d8%b9%d9%85%d9%84%da%a9%d8%b1%d8%af_scraping_%d8%b1%d8%a7_%d8%a7%d8%ac%d8%b1%d8%a7_%da%a9%d9%86%db%8c%d8%af\"><\/span>\u0645\u0631\u062d\u0644\u0647 7: \u0639\u0645\u0644\u06a9\u0631\u062f Scraping \u0631\u0627 \u0627\u062c\u0631\u0627 \u06a9\u0646\u06cc\u062f<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u062a\u0627\u0628\u0639 <code>scrape_uci_datasets<\/code> \u0631\u0627 \u0628\u0631\u0627\u06cc \u0634\u0631\u0648\u0639 \u0641\u0631\u0627\u06cc\u0646\u062f \u062e\u0631\u0627\u0634\u06cc\u062f\u0646 \u0641\u0631\u0627\u062e\u0648\u0627\u0646\u06cc \u06a9\u0646\u06cc\u062f.<\/p>\n<pre><code class=\"language-python\">scrape_uci_datasets()<\/code><\/pre>\n<h2 id=\"full-code\"><span class=\"ez-toc-section\" id=\"%da%a9%d8%af_%da%a9%d8%a7%d9%85%d9%84\"><\/span><strong>\u06a9\u062f \u06a9\u0627\u0645\u0644<\/strong><span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u06a9\u062f \u06a9\u0627\u0645\u0644 \u0648\u0628 \u0627\u0633\u06a9\u0631\u0627\u067e\u0631 \u0622\u0645\u062f\u0647 \u0627\u0633\u062a:<\/p>\n<pre><code class=\"language-python\">import requests\nfrom bs4 import BeautifulSoup\nimport csv\n\n\ndef scrape_uci_datasets():\n    base_url = 
\"https:\/\/archive.ics.uci.edu\/datasets\"\n\n\n    headers = [\n        \"Dataset Name\", \"Donated Date\", \"Description\",\n        \"Dataset Characteristics\", \"Subject Area\", \"Associated Tasks\",\n        \"Feature Type\", \"Instances\", \"Features\"\n    ]\n\n\n    # List to store the scraped data\n    data = []\n\n\n    def scrape_dataset_details(dataset_url):\n        response = requests.get(dataset_url)\n        soup = BeautifulSoup(response.text, 'html.parser')\n\n\n        dataset_name = soup.find(\n            'h1', class_='text-3xl font-semibold text-primary-content')\n        dataset_name = dataset_name.text.strip() if dataset_name else \"N\/A\"\n\n\n        donated_date = soup.find('h2', class_='text-sm text-primary-content')\n        donated_date = donated_date.text.strip().replace(\n            'Donated on ', '') if donated_date else \"N\/A\"\n\n\n        description = soup.find('p', class_='svelte-17wf9gp')\n        description = description.text.strip() if description else \"N\/A\"\n\n\n        details = soup.find_all('div', class_='col-span-4')\n\n\n        dataset_characteristics = details[0].find('p').text.strip() if len(\n            details) &gt; 0 else \"N\/A\"\n        subject_area = details[1].find('p').text.strip() if len(\n            details) &gt; 1 else \"N\/A\"\n        associated_tasks = details[2].find('p').text.strip() if len(\n            details) &gt; 2 else \"N\/A\"\n        feature_type = details[3].find('p').text.strip() if len(\n            details) &gt; 3 else \"N\/A\"\n        instances = details[4].find('p').text.strip() if len(\n            details) &gt; 4 else \"N\/A\"\n        features = details[5].find('p').text.strip() if len(\n            details) &gt; 5 else \"N\/A\"\n\n\n        return [\n            dataset_name, donated_date, description, dataset_characteristics,\n            subject_area, associated_tasks, feature_type, instances, features\n        ]\n\n\n    def scrape_datasets(page_url):\n 
       response = requests.get(page_url)\n        soup = BeautifulSoup(response.text, 'html.parser')\n\n\n        dataset_list = soup.find_all(\n            'a', class_='link-hover link text-xl font-semibold')\n\n\n        if not dataset_list:\n            print(\"No dataset links found\")\n            return\n\n\n        for dataset in dataset_list:\n            dataset_link = \"https:\/\/archive.ics.uci.edu\" + dataset['href']\n            print(f\"Scraping details for {dataset.text.strip()}...\")\n            dataset_details = scrape_dataset_details(dataset_link)\n            data.append(dataset_details)\n\n\n    # Loop through the pages using the pagination parameters\n    skip = 0\n    take = 10\n    while True:\n        page_url = f\"https:\/\/archive.ics.uci.edu\/datasets?skip={skip}&amp;take={take}&amp;sort=desc&amp;orderBy=NumHits&amp;search=\"\n        print(f\"Scraping page: {page_url}\")\n        initial_data_count = len(data)\n        scrape_datasets(page_url)\n        if len(\n                data\n        ) == initial_data_count: \n            break\n        skip += take\n\n\n    with open('uci_datasets.csv', 'w', newline=\"\", encoding='utf-8') as file:\n        writer = csv.writer(file)\n        writer.writerow(headers)\n        writer.writerows(data)\n\n\n    print(\"Scraping complete. 
Data saved to 'uci_datasets.csv'.\")\n\n\nscrape_uci_datasets()\n<\/code><\/pre>\n<p>\u0647\u0646\u06af\u0627\u0645\u06cc \u06a9\u0647 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0631\u0627 \u0627\u062c\u0631\u0627 \u0645\u06cc \u06a9\u0646\u06cc\u062f\u060c \u0628\u0631\u0627\u06cc \u0645\u062f\u062a\u06cc \u0627\u062c\u0631\u0627 \u0645\u06cc \u0634\u0648\u062f \u062a\u0627 \u0632\u0645\u0627\u0646\u06cc \u06a9\u0647 terminal \u0645\u06cc\u200c\u06af\u0648\u06cc\u062f \u00ab\u0647\u06cc\u0686 \u067e\u06cc\u0648\u0646\u062f \u062f\u0627\u062f\u0647\u200c\u0627\u06cc \u06cc\u0627\u0641\u062a \u0646\u0634\u062f\u00bb \u0648 \u0628\u0647 \u062f\u0646\u0628\u0627\u0644 \u0622\u0646 \u00ab\u062e\u0631\u0627\u0634 \u06a9\u0627\u0645\u0644 \u0634\u062f.  \u062f\u0627\u062f\u0647\u200c\u0647\u0627 \u062f\u0631 &#8220;uci_datasets.csv&#8221; \u0630\u062e\u06cc\u0631\u0647 \u0634\u062f\u0646\u062f\u060c \u06a9\u0647 \u0646\u0634\u0627\u0646 \u0645\u06cc\u200c\u062f\u0647\u062f \u062f\u0627\u062f\u0647\u200c\u0647\u0627\u06cc \u062e\u0631\u0627\u0634\u06cc\u062f\u0647 \u0634\u062f\u0647 \u062f\u0631 \u06cc\u06a9 \u0641\u0627\u06cc\u0644 CSV \u0630\u062e\u06cc\u0631\u0647 \u0634\u062f\u0647\u200c\u0627\u0646\u062f.<\/p>\n<figure class=\"kg-card kg-image-card kg-width-wide\"><img decoding=\"async\" src=\"https:\/\/rasanegaar.com\/blog\/wp-content\/uploads\/2024\/07\/AD_4nXdRUvJJsu32oaxdattur__98CEF9GvqQMDTDQzpqS-NW3I2-haF5tfWH_mIBFwEhAqLhUhURVKCNFJE-b1bRzeZtz2oApWe.png\" class=\"kg-image\" alt=\"AD_4nXdRUvJJsu32oaxdattur__98CEF9GvqQMDTDQzpqS-NW3I2-haF5tfWH_mIBFwEhAqLhUhURVKCNFJE-b1bRzeZtz2oApWePqLZqWahNQW0000 2MdqvoLDhToy-gCj9o?key=f_hrU3B_rjNJFpKZiiV3Pw\" width=\"699\" height=\"75\" loading=\"lazy\" title=\"\"><\/figure>\n<p>\u0628\u0631\u0627\u06cc \u0645\u0634\u0627\u0647\u062f\u0647 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062e\u0631\u0627\u0634\u06cc\u062f\u0647 \u0634\u062f\u0647\u060c &#8220;uci_datasets.csv&#8221; \u0631\u0627 \u0628\u0627\u0632 
\u06a9\u0646\u06cc\u062f\u060c \u0628\u0627\u06cc\u062f \u0628\u062a\u0648\u0627\u0646\u06cc\u062f \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0633\u0627\u0632\u0645\u0627\u0646\u062f\u0647\u06cc \u0634\u062f\u0647 \u0628\u0631 \u0627\u0633\u0627\u0633 \u0646\u0627\u0645 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647\u060c \u062a\u0627\u0631\u06cc\u062e \u0627\u0647\u062f\u0627\u060c \u062a\u0648\u0636\u06cc\u062d\u0627\u062a\u060c \u0648\u06cc\u0698\u06af\u06cc \u0647\u0627\u060c \u0645\u0646\u0637\u0642\u0647 \u0645\u0648\u0636\u0648\u0639\u06cc \u0648 \u063a\u06cc\u0631\u0647 \u0631\u0627 \u0645\u0634\u0627\u0647\u062f\u0647 \u06a9\u0646\u06cc\u062f. \u0631\u0648\u06cc.<\/p>\n<figure class=\"kg-card kg-image-card kg-width-wide kg-card-hascaption\"><img decoding=\"async\" src=\"https:\/\/rasanegaar.com\/blog\/wp-content\/uploads\/2024\/07\/AD_4nXd1ZkPzSyPxZ3KsZklCPPcruSll4xUBxm3KiNdageDzHK-wbTxG7v8HLFpoJ-gMvIpdKPxzoshzRlmNjiPeVcbvse14gdGF.png\" class=\"kg-image\" alt=\"AD_4nXd1ZkPzSyPxZ3KsZklCPPcruSll4xUBxm3KiNdageDzHK-wbTxG7v8HLFpoJ-gMvIpdKPxzoshzRlmNjiPeVcbvse14gdGFHu7Wqm89UGT h1bUO4w0D9sLFC_5Tmy3o?key=f_hrU3B_rjNJFpKZiiV3Pw\" width=\"1600\" height=\"468\" loading=\"lazy\" title=\"\"><figcaption>\u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0633\u0627\u0632\u0645\u0627\u0646\u062f\u0647\u06cc \u0634\u062f\u0647 \u0628\u0631 \u0627\u0633\u0627\u0633 \u0646\u0627\u0645 \u0645\u062c\u0645\u0648\u0639\u0647 \u062f\u0627\u062f\u0647\u060c \u062a\u0627\u0631\u06cc\u062e \u0627\u0647\u062f\u0627\u060c \u062a\u0648\u0636\u06cc\u062d\u0627\u062a\u060c \u0648\u06cc\u0698\u06af\u06cc \u0647\u0627\u060c \u062d\u0648\u0632\u0647 \u0645\u0648\u0636\u0648\u0639\u06cc \u0648 \u063a\u06cc\u0631\u0647 \u0631\u0648\u06cc.<\/figcaption><\/figure>\n<p>\u0627\u06af\u0631 \u0641\u0627\u06cc\u0644 \u0631\u0627 \u0627\u0632 \u0637\u0631\u06cc\u0642 \u0627\u06a9\u0633\u0644 \u0628\u0627\u0632 \u06a9\u0646\u06cc\u062f\u060c \u0645\u06cc 
\u062a\u0648\u0627\u0646\u06cc\u062f \u062f\u06cc\u062f \u0628\u0647\u062a\u0631\u06cc \u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f.<\/p>\n<figure class=\"kg-card kg-image-card kg-width-wide kg-card-hascaption\"><img decoding=\"async\" src=\"https:\/\/rasanegaar.com\/blog\/wp-content\/uploads\/2024\/07\/AD_4nXfdmf621HGzQNHCdgxTJ6cvl2YEpuAq5hfvqpE9KrbZ8kDkGo6R3YIYpCFMmNoY8z29YEfcesZap9hpxiLc3fwHEyzLdo6d.png\" class=\"kg-image\" alt=\"AD_4nXfdmf621HGzQNHCdgxTJ6cvl2YEpuAq5hfvqpE9KrbZ8kDkGo6R3YIYpCFMmNoY8z29YEfcesZap9hpxiLc3fwHEyzLdo6dNQGNExRdamHfvqpE9KrbZ8kDkGo6R3YIYpCFMmNoY8z29YEfcesZap9hpxiLc3fwHEyzLdo6dNQGNExRdamFhKodGTU I5miEUp_UCyNPZo?key=f_hrU3B_rjNJFpKZiiV3Pw\" width=\"1553\" height=\"462\" loading=\"lazy\" title=\"\"><figcaption>\u062f\u0627\u062f\u0647 \u0647\u0627 \u062f\u0631 \u0641\u0627\u06cc\u0644 \u0627\u06a9\u0633\u0644 \u0633\u0627\u0632\u0645\u0627\u0646\u062f\u0647\u06cc \u0634\u062f\u0647 \u0627\u0646\u062f<\/figcaption><\/figure>\n<p>\u0628\u0627 \u067e\u06cc\u0631\u0648\u06cc \u0627\u0632 \u0645\u0646\u0637\u0642 \u0630\u06a9\u0631 \u0634\u062f\u0647 \u062f\u0631 \u0627\u06cc\u0646 \u0645\u0642\u0627\u0644\u0647\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0633\u06cc\u0627\u0631\u06cc \u0627\u0632 \u0633\u0627\u06cc\u062a \u0647\u0627 \u0631\u0627 \u062e\u0631\u0627\u0634 \u062f\u0647\u06cc\u062f.  
\u062a\u0646\u0647\u0627 \u06a9\u0627\u0631\u06cc \u06a9\u0647 \u0628\u0627\u06cc\u062f \u0627\u0646\u062c\u0627\u0645 \u062f\u0647\u06cc\u062f \u0627\u06cc\u0646 \u0627\u0633\u062a \u06a9\u0647 \u0627\u0632 URL \u0627\u0635\u0644\u06cc \u0634\u0631\u0648\u0639 \u06a9\u0646\u06cc\u062f\u060c \u0631\u0648\u0634 \u067e\u06cc\u0645\u0627\u06cc\u0634 \u062f\u0631 \u0644\u06cc\u0633\u062a \u0631\u0627 \u0628\u06cc\u0627\u0628\u06cc\u062f \u0648 \u0628\u0647 \u0622\u062f\u0631\u0633 \u0627\u062e\u062a\u0635\u0627\u0635\u06cc \u0628\u0631\u0648\u06cc\u062f page \u0628\u0631\u0627\u06cc \u0647\u0631 \u0622\u06cc\u062a\u0645 \u0644\u06cc\u0633\u062a  \u0633\u067e\u0633\u060c \u0645\u0646\u0627\u0633\u0628 \u0631\u0627 \u0634\u0646\u0627\u0633\u0627\u06cc\u06cc \u06a9\u0646\u06cc\u062f page \u0639\u0646\u0627\u0635\u0631\u06cc \u0645\u0627\u0646\u0646\u062f \u0634\u0646\u0627\u0633\u0647 \u0647\u0627 \u0648 \u06a9\u0644\u0627\u0633 \u0647\u0627\u06cc\u06cc \u06a9\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0646\u0638\u0631 \u062e\u0648\u062f \u0631\u0627 \u062c\u062f\u0627\u0633\u0627\u0632\u06cc \u0648 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u06a9\u0646\u06cc\u062f. <\/p>\n<p>\u0647\u0645\u0686\u0646\u06cc\u0646 \u0628\u0627\u06cc\u062f \u0645\u0646\u0637\u0642 \u067e\u0634\u062a \u0635\u0641\u062d\u0647 \u0628\u0646\u062f\u06cc \u0631\u0627 \u062f\u0631\u06a9 \u06a9\u0646\u06cc\u062f.  
\u0627\u063a\u0644\u0628\u060c \u0635\u0641\u062d\u0647\u200c\u0628\u0646\u062f\u06cc \u062a\u063a\u06cc\u06cc\u0631\u0627\u062a \u062c\u0632\u0626\u06cc \u062f\u0631 URL \u0627\u06cc\u062c\u0627\u062f \u0645\u06cc\u200c\u06a9\u0646\u062f\u060c \u06a9\u0647 \u0645\u06cc\u200c\u062a\u0648\u0627\u0646\u06cc\u062f \u0627\u0632 \u0622\u0646 \u0628\u0631\u0627\u06cc \u062d\u0644\u0642\u0647\u200c\u0628\u0646\u062f\u06cc \u0627\u0632 \u06cc\u06a9\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f page \u0628\u0647 \u062f\u06cc\u06af\u0631\u06cc. <\/p>\n<p>\u062f\u0631 \u0646\u0647\u0627\u06cc\u062a\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u062f\u0631 \u06cc\u06a9 \u0641\u0627\u06cc\u0644 CSV \u0628\u0646\u0648\u06cc\u0633\u06cc\u062f \u06a9\u0647 \u0628\u0631\u0627\u06cc \u0630\u062e\u06cc\u0631\u0647 \u0633\u0627\u0632\u06cc \u0648 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0648\u0631\u0648\u062f\u06cc \u0628\u0631\u0627\u06cc \u062a\u062c\u0633\u0645 \u0645\u0646\u0627\u0633\u0628 \u0627\u0633\u062a.<\/p>\n<h2 id=\"conclusion\"><span class=\"ez-toc-section\" id=\"%d9%86%d8%aa%db%8c%d8%ac%d9%87\"><\/span><strong>\u0646\u062a\u06cc\u062c\u0647<\/strong><span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 Python SDK \u0647\u0645\u0631\u0627\u0647 \u0628\u0627 Requests \u0648 Beautiful Soup \u0628\u0647 \u0634\u0645\u0627 \u0627\u06cc\u0646 \u0627\u0645\u06a9\u0627\u0646 \u0631\u0627 \u0645\u06cc \u062f\u0647\u062f \u06a9\u0647 \u0648\u0628 \u0627\u0633\u06a9\u0631\u067e\u0631\u0647\u0627\u06cc \u06a9\u0627\u0645\u0644\u0627\u064b \u06a9\u0627\u0631\u0628\u0631\u062f\u06cc \u0628\u0631\u0627\u06cc \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u062f\u0627\u062f\u0647 \u0647\u0627 \u0627\u0632 \u0648\u0628 \u0633\u0627\u06cc\u062a \u0647\u0627 \u0627\u06cc\u062c\u0627\u062f \u06a9\u0646\u06cc\u062f.  
\u062f\u0631 \u062d\u0627\u0644\u06cc \u06a9\u0647 \u0627\u06cc\u0646 \u0639\u0645\u0644\u06a9\u0631\u062f \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0628\u0631\u0627\u06cc \u062a\u0635\u0645\u06cc\u0645 \u06af\u06cc\u0631\u06cc \u0645\u0628\u062a\u0646\u06cc \u0628\u0631 \u062f\u0627\u062f\u0647 \u0628\u0633\u06cc\u0627\u0631 \u0633\u0648\u062f\u0645\u0646\u062f \u0628\u0627\u0634\u062f\u060c \u0645\u0647\u0645 \u0627\u0633\u062a \u06a9\u0647 \u0645\u0644\u0627\u062d\u0638\u0627\u062a \u0627\u062e\u0644\u0627\u0642\u06cc \u0648 \u0642\u0627\u0646\u0648\u0646\u06cc \u0631\u0627 \u062f\u0631 \u0646\u0638\u0631 \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u06cc\u062f.<\/p>\n<p>\u0647\u0646\u06af\u0627\u0645\u06cc \u06a9\u0647 \u0628\u0627 \u0631\u0648\u0634 \u0647\u0627\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0634\u062f\u0647 \u062f\u0631 \u0627\u06cc\u0646 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0622\u0634\u0646\u0627 \u0634\u062f\u06cc\u062f\u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u062a\u06a9\u0646\u06cc\u06a9 \u0647\u0627\u06cc\u06cc \u0645\u0627\u0646\u0646\u062f \u0645\u062f\u06cc\u0631\u06cc\u062a \u067e\u0631\u0648\u06a9\u0633\u06cc \u0648 \u062a\u062f\u0627\u0648\u0645 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u0628\u0631\u0631\u0633\u06cc \u06a9\u0646\u06cc\u062f.  \u0647\u0645\u0686\u0646\u06cc\u0646 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u0628\u0627 \u06a9\u062a\u0627\u0628\u062e\u0627\u0646\u0647 \u0647\u0627\u06cc \u062f\u06cc\u06af\u0631 \u0645\u0627\u0646\u0646\u062f Scrapy\u060c Selenium \u0648 Puppeteer \u0622\u0634\u0646\u0627 \u0634\u0648\u06cc\u062f \u062a\u0627 \u0646\u06cc\u0627\u0632\u0647\u0627\u06cc \u062c\u0645\u0639 \u0622\u0648\u0631\u06cc \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u062e\u0648\u062f \u0631\u0627 \u0628\u0631\u0622\u0648\u0631\u062f\u0647 \u06a9\u0646\u06cc\u062f. 
<\/p>\n<p>\u0628\u0627 \u062a\u0634\u06a9\u0631 \u0627\u0632 \u0634\u0645\u0627 \u0628\u0631\u0627\u06cc \u062e\u0648\u0627\u0646\u062f\u0646!  \u0645\u0646 \u062c\u0633 \u0647\u0633\u062a\u0645 \u0648 \u062f\u0631 Hyperskill \u0645\u062a\u062e\u0635\u0635 \u0647\u0633\u062a\u0645.  \u0634\u0645\u0627 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u062f \u06cc\u06a9 \u0631\u0627 \u0628\u0631\u0631\u0633\u06cc \u06a9\u0646\u06cc\u062f <strong><strong>\u067e\u0627\u06cc\u062a\u0648\u0646 <\/strong>\u062a\u0648\u0633\u0639\u0647 \u062f\u0647\u0646\u062f\u0647<strong><strong><strong> <\/strong><\/strong><\/strong><\/strong>\u062f\u0648\u0631\u0647 \u0631\u0648\u06cc \u067e\u0644\u062a \u0641\u0631\u0645<\/p>\n<\/section>\n<p><br \/>\n<br \/>\u0645\u0646\u062a\u0634\u0631 \u0634\u062f\u0647 \u062f\u0631 1403-07-10 19:40:06<br \/>\n<\/p>\n\n\n<div class=\"kk-star-ratings kksr-auto kksr-align-center kksr-valign-bottom\"\n    data-payload='{&quot;align&quot;:&quot;center&quot;,&quot;id&quot;:&quot;17607&quot;,&quot;slug&quot;:&quot;default&quot;,&quot;valign&quot;:&quot;bottom&quot;,&quot;ignore&quot;:&quot;&quot;,&quot;reference&quot;:&quot;auto&quot;,&quot;class&quot;:&quot;&quot;,&quot;count&quot;:&quot;0&quot;,&quot;legendonly&quot;:&quot;&quot;,&quot;readonly&quot;:&quot;&quot;,&quot;score&quot;:&quot;0&quot;,&quot;starsonly&quot;:&quot;&quot;,&quot;best&quot;:&quot;5&quot;,&quot;gap&quot;:&quot;5&quot;,&quot;greet&quot;:&quot;\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628&quot;,&quot;legend&quot;:&quot;0\\\/5 (0 \u0631\u0627\u06cc)&quot;,&quot;size&quot;:&quot;30&quot;,&quot;title&quot;:&quot;\u0686\u06af\u0648\u0646\u0647 \u0627\u0632 Python SDK \u0628\u0631\u0627\u06cc \u0633\u0627\u062e\u062a\u0646 \u0648\u0628 Scraper \u062e\u0648\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u06cc\u062f&quot;,&quot;width&quot;:&quot;0&quot;,&quot;_legend&quot;:&quot;{score}\\\/{best} ({count} 
\u0631\u0627\u06cc)&quot;,&quot;font_factor&quot;:&quot;1.25&quot;}'>\n            \n<div class=\"kksr-stars\">\n    \n<div class=\"kksr-stars-inactive\">\n            <div class=\"kksr-star\" data-star=\"1\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"2\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"3\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"4\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" data-star=\"5\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n    <\/div>\n    \n<div class=\"kksr-stars-active\" style=\"width: 0px;\">\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 30px;\"><\/div>\n        <\/div>\n            <div class=\"kksr-star\" style=\"padding-left: 5px\">\n            \n\n<div class=\"kksr-icon\" style=\"width: 30px; height: 
30px;\"><\/div>\n        <\/div>\n    <\/div>\n<\/div>\n                \n\n<div class=\"kksr-legend\" style=\"font-size: 24px;\">\n            <span class=\"kksr-muted\">\u0627\u0645\u062a\u06cc\u0627\u0632 \u0634\u0645\u0627 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0637\u0644\u0628<\/span>\n    <\/div>\n    <\/div>\n","protected":false},"excerpt":{"rendered":"<p><span class=\"span-reading-time rt-reading-time\" style=\"display: block;\"><span class=\"rt-label rt-prefix\">\u0632\u0645\u0627\u0646 \u0644\u0627\u0632\u0645 \u0628\u0631\u0627\u06cc \u0645\u0637\u0627\u0644\u0639\u0647: <\/span> <span class=\"rt-time\"> 7<\/span> <span class=\"rt-label rt-postfix\">\u062f\u0642\u06cc\u0642\u0647<\/span><\/span>Web scraping \u0686\u06cc\u0633\u062a\u061f Web scraping \u062a\u06a9\u0646\u06cc\u06a9\u06cc \u0627\u0633\u062a \u06a9\u0647 \u0628\u0631\u0627\u06cc \u062c\u0645\u0639 \u0622\u0648\u0631\u06cc \u0645\u0642\u0627\u062f\u06cc\u0631 \u0632\u06cc\u0627\u062f\u06cc \u062f\u0627\u062f\u0647 \u0628\u0647 \u0635\u0648\u0631\u062a \u062e\u0648\u062f\u06a9\u0627\u0631 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u06cc\u06a9 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u0628\u0631\u0646\u0627\u0645\u0647 \u0646\u0648\u06cc\u0633\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f. 
\u0627\u06cc\u0646 \u0627\u0645\u0631 \u0622\u0646 \u0631\u0627 \u0628\u0631\u0627\u06cc \u0628\u0633\u06cc\u0627\u0631\u06cc \u0627\u0632 \u0645\u062a\u062e\u0635\u0635\u0627\u0646 \u0645\u0627\u0646\u0646\u062f \u062a\u062d\u0644\u06cc\u0644\u06af\u0631\u0627\u0646 \u062f\u0627\u062f\u0647\u060c \u0645\u062d\u0642\u0642\u0627\u0646 \u0628\u0627\u0632\u0627\u0631\u060c \u0645\u062a\u062e\u0635\u0635\u0627\u0646 \u0633\u0626\u0648\u060c \u062a\u062d\u0644\u06cc\u0644\u06af\u0631\u0627\u0646 \u062a\u062c\u0627\u0631\u06cc \u0648 \u0645\u062d\u0642\u0642\u0627\u0646 \u062f\u0627\u0646\u0634\u06af\u0627\u0647\u06cc \u0645\u0641\u06cc\u062f \u0645\u06cc \u06a9\u0646\u062f. \u0622\u0646\u0686\u0647 \u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u062e\u0648\u0627\u0647\u06cc\u062f \u0622\u0645\u0648\u062e\u062a [&hellip;]<\/p>\n","protected":false},"author":6,"featured_media":17608,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1743],"tags":[1749,4752,5273,1917,1844,1926,1776,1919,1786,1814,1744,1822,1802,3656,1755,1806,2829,1927],"class_list":["post-17607","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-python","tag-python","tag-scraper","tag-sdk","tag--python","tag-1844","tag-1926","tag-1776","tag----python","tag-1786","tag-1814","tag-1744","tag-1822","tag-1802","tag-3656","tag-1755","tag-1806","tag-2829","tag-1927"],"acf":[],"_links":{"self":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/17607","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/users\/6"}],"replies":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/comments?post=17607"}],"version-history":[{"count":0,"h
ref":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/posts\/17607\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media\/17608"}],"wp:attachment":[{"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/media?parent=17607"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/categories?post=17607"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/rasanegaar.com\/blog\/wp-json\/wp\/v2\/tags?post=17607"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}