{"id":95767,"date":"2025-02-03T02:22:31","date_gmt":"2025-02-02T22:52:31","guid":{"rendered":"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/"},"modified":"2025-02-03T02:22:31","modified_gmt":"2025-02-02T22:52:31","slug":"playwright-on-cloud-automating-review-data-extraction-9i7","status":"publish","type":"post","link":"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/","title":{"rendered":"\u0646\u0645\u0627\u06cc\u0634\u0646\u0627\u0645\u0647 \u0646\u0648\u06cc\u0633 \u062f\u0631 \u0627\u0628\u0631: \u062e\u0648\u062f\u06a9\u0627\u0631 \u0633\u0627\u0632\u06cc \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0628\u0631\u0631\u0633\u06cc"},"content":{"rendered":"<div data-article-id=\"2255760\" id=\"article-body\">\n<div id=\"ez-toc-container\" class=\"ez-toc-v2_0_84 counter-hierarchy ez-toc-counter-rtl ez-toc-grey ez-toc-container-direction\">\n<div class=\"ez-toc-title-container\">\n<p class=\"ez-toc-title\" style=\"cursor:inherit\">\u0641\u0647\u0631\u0633\u062a \u0645\u0637\u0627\u0644\u0628<\/p>\n<span class=\"ez-toc-title-toggle\"><a href=\"#\" class=\"ez-toc-pull-right ez-toc-btn ez-toc-btn-xs ez-toc-btn-default ez-toc-toggle\" aria-label=\"Toggle Table of Content\"><span class=\"ez-toc-js-icon-con\"><span class=\"\"><span class=\"eztoc-hide\" style=\"display:none;\">Toggle<\/span><span class=\"ez-toc-icon-toggle-span\"><svg style=\"fill: #999;color:#999\" xmlns=\"http:\/\/www.w3.org\/2000\/svg\" class=\"list-377408\" width=\"20px\" height=\"20px\" viewBox=\"0 0 24 24\" fill=\"none\"><path d=\"M6 6H4v2h2V6zm14 0H8v2h12V6zM4 11h2v2H4v-2zm16 0H8v2h12v-2zM4 16h2v2H4v-2zm16 0H8v2h12v-2z\" fill=\"currentColor\"><\/path><\/svg><svg style=\"fill: #999;color:#999\" class=\"arrow-unsorted-368013\" xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"10px\" height=\"10px\" viewBox=\"0 0 24 24\" version=\"1.2\" baseProfile=\"tiny\"><path 
d=\"M18.2 9.3l-6.2-6.3-6.2 6.3c-.2.2-.3.4-.3.7s.1.5.3.7c.2.2.4.3.7.3h11c.3 0 .5-.1.7-.3.2-.2.3-.5.3-.7s-.1-.5-.3-.7zM5.8 14.7l6.2 6.3 6.2-6.3c.2-.2.3-.5.3-.7s-.1-.5-.3-.7c-.2-.2-.4-.3-.7-.3h-11c-.3 0-.5.1-.7.3-.2.2-.3.5-.3.7s.1.5.3.7z\"\/><\/svg><\/span><\/span><\/span><\/a><\/span><\/div>\n<nav><ul class='ez-toc-list ez-toc-list-level-1 ' ><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-1\" href=\"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/#%D8%A8%DB%8C%D8%A7%D9%86%DB%8C%D9%87_%D9%85%D8%B4%DA%A9%D9%84\" >\u0628\u06cc\u0627\u0646\u06cc\u0647 \u0645\u0634\u06a9\u0644<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-2\" href=\"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/#%D8%A7%D8%AC%D8%B1%D8%A7%DB%8C\" >\u0627\u062c\u0631\u0627\u06cc<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-3\" href=\"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/#%D8%AF%D8%B1%D9%88%D8%A7%D8%B2%D9%87_API\" >\u062f\u0631\u0648\u0627\u0632\u0647 API<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-4\" href=\"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/#%D8%B9%D9%85%D9%84%DA%A9%D8%B1%D8%AF_%D9%84%D8%A7%D9%85%D8%A8%D8%AF%D8%A7\" >\u0639\u0645\u0644\u06a9\u0631\u062f \u0644\u0627\u0645\u0628\u062f\u0627<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-5\" href=\"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/#%D9%86%D9%85%D9%88%D9%86%D9%87_EC2\" >\u0646\u0645\u0648\u0646\u0647 EC2<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-6\" 
href=\"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/#%DA%86%D8%A7%D9%84%D8%B4_%D9%87%D8%A7%DB%8C_%D8%B1%D9%88%D8%A8%D8%B1%D9%88\" >\u0686\u0627\u0644\u0634 \u0647\u0627\u06cc \u0631\u0648\u0628\u0631\u0648<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-7\" href=\"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/#%D9%86%D8%B3%D8%AE%D9%87_%D8%A2%D8%B2%D9%85%D8%A7%DB%8C%D8%B4%DB%8C\" >\u0646\u0633\u062e\u0647 \u0622\u0632\u0645\u0627\u06cc\u0634\u06cc<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-8\" href=\"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/#%D9%86%D9%82%D8%A7%D8%B7_%D9%BE%D8%A7%DB%8C%D8%A7%D9%86%DB%8C_API\" >\u0646\u0642\u0627\u0637 \u067e\u0627\u06cc\u0627\u0646\u06cc API<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-9\" href=\"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/#%DA%AF%D8%B1%D8%AF%D8%B4_%DA%A9%D8%A7%D8%B1\" >\u06af\u0631\u062f\u0634 \u06a9\u0627\u0631<\/a><ul class='ez-toc-list-level-4' ><li class='ez-toc-heading-level-4'><ul class='ez-toc-list-level-4' ><li class='ez-toc-heading-level-4'><a class=\"ez-toc-link ez-toc-heading-10\" href=\"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/#%D9%81%D9%86_%D8%A2%D9%88%D8%B1%DB%8C_%D9%87%D8%A7%DB%8C_%D9%85%D9%88%D8%B1%D8%AF_%D8%A7%D8%B3%D8%AA%D9%81%D8%A7%D8%AF%D9%87\" >\u0641\u0646 \u0622\u0648\u0631\u06cc \u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647:<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-4'><a class=\"ez-toc-link ez-toc-heading-11\" 
href=\"https:\/\/nabfollower.com\/blog\/playwright-on-cloud-automating-review-data-extraction-9i7\/#%D9%85%D8%A4%D9%84%D9%81%D9%87_%D9%87%D8%A7\" >\u0645\u0624\u0644\u0641\u0647 \u0647\u0627:<\/a><\/li><\/ul><\/li><\/ul><\/li><\/ul><\/nav><\/div>\n<h2><span class=\"ez-toc-section\" id=\"%D8%A8%DB%8C%D8%A7%D9%86%DB%8C%D9%87_%D9%85%D8%B4%DA%A9%D9%84\"><\/span>\n<p>  \u0628\u06cc\u0627\u0646\u06cc\u0647 \u0645\u0634\u06a9\u0644<br \/>\n<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0627\u0644\u0632\u0627\u0645 \u0627\u06cc\u0646 \u0628\u0631\u0646\u0627\u0645\u0647 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u0631\u0648\u0631 \u0627\u0632 \u0648\u0628 \u0633\u0627\u06cc\u062a \u0647\u0627\u06cc \u0645\u062d\u0635\u0648\u0644 \u0627\u0633\u062a \u06a9\u0647 \u062f\u0631 \u0628\u062e\u0634 \u0628\u0631\u0631\u0633\u06cc \u0635\u0641\u062d\u0647 \u0628\u0646\u062f\u06cc \u062f\u0627\u0631\u0646\u062f \u0648 \u0646\u06cc\u0627\u0632 \u0628\u0647 \u067e\u0634\u062a\u06cc\u0628\u0627\u0646\u06cc \u062c\u0647\u0627\u0646\u06cc \u0628\u0631\u0627\u06cc \u0647\u0645\u0647 \u0646\u0648\u0639 \u0635\u0641\u062d\u0647 \u0628\u0646\u062f\u06cc \u062f\u0627\u0631\u0646\u062f. \u0647\u0645\u0686\u0646\u06cc\u0646 \u0628\u0631\u0627\u06cc \u0628\u0627\u0632\u06af\u0634\u062a \u0628\u0647 \u0628\u0631\u0631\u0633\u06cc \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0634\u062f\u0647 \u060c API GET \u0646\u06cc\u0632 \u0644\u0627\u0632\u0645 \u0627\u0633\u062a.<\/p>\n<h2><span class=\"ez-toc-section\" id=\"%D8%A7%D8%AC%D8%B1%D8%A7%DB%8C\"><\/span>\n<p>  \u0627\u062c\u0631\u0627\u06cc<br \/>\n<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u0627\u06cc\u0646 \u0634\u0627\u0645\u0644 \u0633\u0647 \u0645\u0624\u0644\u0641\u0647 \u0627\u0635\u0644\u06cc \u060c API Gateway \u060c \u0639\u0645\u0644\u06a9\u0631\u062f \u0644\u0627\u0645\u0628\u062f\u0627 \u0648 \u0646\u0645\u0648\u0646\u0647 EC2 \u0627\u0633\u062a. 
\u0628\u06cc\u0627\u06cc\u06cc\u062f \u0628\u0647 \u0635\u0648\u0631\u062a \u062c\u062f\u0627\u06af\u0627\u0646\u0647 \u0628\u0647 \u0647\u0631 \u0645\u0624\u0644\u0641\u0647 \u0634\u06cc\u0631\u062c\u0647 \u0628\u0632\u0646\u06cc\u0645:<\/p>\n<p><\/p>\n<h3><span class=\"ez-toc-section\" id=\"%D8%AF%D8%B1%D9%88%D8%A7%D8%B2%D9%87_API\"><\/span>\n<p>  \u062f\u0631\u0648\u0627\u0632\u0647 API<br \/>\n<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u0627\u0632 \u0646\u0627\u0645 \u0622\u0646 \u067e\u06cc\u062f\u0627\u0633\u062a \u060c \u0631\u0648\u0646\u062f \u0627\u062a\u0648\u0645\u0627\u0633\u06cc\u0648\u0646 \u0645\u0627 \u0631\u0627 \u062f\u0631 \u0645\u0639\u0631\u0636 \u0634\u0628\u06a9\u0647 \u0642\u0631\u0627\u0631 \u0645\u06cc \u062f\u0647\u062f. \u0628\u0631\u0627\u06cc \u0627\u06cc\u0646 \u0645\u0648\u0631\u062f \u060c \u0627\u06cc\u0646 \u06cc\u06a9 API REST \u0628\u0627 \u067e\u0627\u0633\u062e \u0628\u0647 \u0627\u06cc\u0646 \u0635\u0648\u0631\u062a \u0627\u0633\u062a:<\/p>\n<div class=\"highlight js-code-highlight\">\n<pre class=\"highlight json\"><code><span class=\"p\">{<\/span><span class=\"w\">\n  <\/span><span class=\"nl\">\"reviews_count\"<\/span><span class=\"p\">:<\/span><span class=\"w\"> <\/span><span class=\"mi\">100<\/span><span class=\"p\">,<\/span><span class=\"w\">\n  <\/span><span class=\"nl\">\"reviews\"<\/span><span class=\"p\">:<\/span><span class=\"w\"> <\/span><span class=\"p\">[<\/span><span class=\"w\">\n    <\/span><span class=\"p\">{<\/span><span class=\"w\">\n      <\/span><span class=\"nl\">\"title\"<\/span><span class=\"p\">:<\/span><span class=\"w\"> <\/span><span class=\"s2\">\"Review Title\"<\/span><span class=\"p\">,<\/span><span class=\"w\">\n      <\/span><span class=\"nl\">\"body\"<\/span><span class=\"p\">:<\/span><span class=\"w\"> <\/span><span class=\"s2\">\"Review body text\"<\/span><span class=\"p\">,<\/span><span class=\"w\">\n      <\/span><span 
class=\"nl\">\"rating\"<\/span><span class=\"p\">:<\/span><span class=\"w\"> <\/span><span class=\"mi\">5<\/span><span class=\"p\">,<\/span><span class=\"w\">\n      <\/span><span class=\"nl\">\"reviewer\"<\/span><span class=\"p\">:<\/span><span class=\"w\"> <\/span><span class=\"s2\">\"Reviewer Name\"<\/span><span class=\"w\">\n    <\/span><span class=\"p\">},<\/span><span class=\"w\">\n    <\/span><span class=\"err\">...<\/span><span class=\"w\">\n  <\/span><span class=\"p\">]<\/span><span class=\"w\">\n<\/span><span class=\"p\">}<\/span><span class=\"w\">\n<\/span><\/code><\/pre>\n<div class=\"highlight__panel js-actions-panel\">\n<div class=\"highlight__panel-action js-fullscreen-code-action\">\n    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-on\"><title>\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f<\/title>\n    <path d=\"M16 3h6v6h-2V5h-4V3zM2 3h6v2H4v4H2V3zm18 16v-4h2v6h-6v-2h4zM4 19h4v2H2v-6h2v4z\"\/>\n<\/svg><\/p>\n<p>    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-off\"><title>\u0627\u0632 \u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u062e\u0627\u0631\u062c \u0634\u0648\u06cc\u062f<\/title>\n    <path d=\"M18 7h4v2h-6V3h2v4zM8 9H2V7h4V3h2v6zm10 8v4h-2v-6h6v2h-4zM8 15v6H6v-4H2v-2h6z\"\/>\n<\/svg><\/p>\n<\/div>\n<\/div>\n<\/div>\n<p>API \u06a9\u0647 \u0645\u0627 \u0628\u0647 \u062a\u0627\u0632\u06af\u06cc \u0627\u06cc\u062c\u0627\u062f \u06a9\u0631\u062f\u06cc\u0645 \u060c \u0639\u0645\u0644\u06a9\u0631\u062f Lambda \u0631\u0627 \u0627\u06cc\u062c\u0627\u062f \u0645\u06cc \u06a9\u0646\u062f \u06a9\u0647 \u0631\u0648\u0646\u062f \u06a9\u0627\u0631 \u0631\u0627 \u062f\u0631 
\u0646\u0645\u0648\u0646\u0647 EC2 \u0645\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 SSM \u0645\u062f\u06cc\u0631\u06cc\u062a \u0645\u06cc \u06a9\u0646\u062f (\u0628\u0644\u0648\u06a9 \u06a9\u062f \u0628\u0631\u0627\u06cc SSM \u062f\u0631 \u0628\u062e\u0634 \u0628\u0639\u062f\u06cc \u0648\u0635\u0644 \u0634\u062f\u0647 \u0627\u0633\u062a). <br \/>\u0646\u0642\u0637\u0647 \u067e\u0627\u06cc\u0627\u0646\u06cc API \u0628\u0627\u06cc\u062f \u06cc\u06a9 \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u062c\u0633\u062a\u062c\u0648\u06cc \u067e\u0631\u0633 \u0648 \u062c\u0648 \u0628\u0647 \u0646\u0627\u0645 &#8220;\u0635\u0641\u062d\u0647&#8221; \u062f\u0627\u0634\u062a\u0647 \u0628\u0627\u0634\u062f. \u0646\u0642\u0637\u0647 \u067e\u0627\u06cc\u0627\u0646\u06cc \u0646\u0647\u0627\u06cc\u06cc \u0628\u0627\u06cc\u062f \u0645\u0627\u0646\u0646\u062f \u0627\u06cc\u0646 \u0628\u0627\u0634\u062f: <code>\/api\/reviews?page={url}<\/code>\u0628\u0634\u0631 \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u062c\u0633\u062a\u062c\u0648\u06cc \u067e\u0631\u0633 \u0648 \u062c\u0648 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u0631\u0648\u06cc\u062f\u0627\u062f \u0645\u0648\u062c\u0648\u062f \u062f\u0631 \u0639\u0645\u0644\u06a9\u0631\u062f Lambda \u0628\u0647 \u0639\u0645\u0644\u06a9\u0631\u062f Lambda \u0645\u0646\u062a\u0642\u0644 \u0645\u06cc \u0634\u0648\u062f.<br \/>\u0645\u0627 \u0628\u0627\u06cc\u062f \u0627\u0637\u0645\u06cc\u0646\u0627\u0646 \u062d\u0627\u0635\u0644 \u06a9\u0646\u06cc\u0645 \u06a9\u0647 \u0627\u062f\u063a\u0627\u0645 \u067e\u0631\u0648\u06a9\u0633\u06cc Lambda \u0628\u0647 \u062f\u0631\u0633\u062a\u06cc \u062a\u0646\u0638\u06cc\u0645 \u0634\u062f\u0647 \u0627\u0633\u062a \u062a\u0627 \u0628\u062a\u0648\u0627\u0646\u06cc\u062f \u0639\u0645\u0644\u06a9\u0631\u062f Lambda \u0631\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u067e\u0627\u0633\u062e API \u0645\u0627 
\u062f\u0631\u06cc\u0627\u0641\u062a \u06a9\u0646\u06cc\u062f. <\/p>\n<h3><span class=\"ez-toc-section\" id=\"%D8%B9%D9%85%D9%84%DA%A9%D8%B1%D8%AF_%D9%84%D8%A7%D9%85%D8%A8%D8%AF%D8%A7\"><\/span>\n<p>  \u0639\u0645\u0644\u06a9\u0631\u062f \u0644\u0627\u0645\u0628\u062f\u0627<br \/>\n<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0639\u0645\u0644\u06a9\u0631\u062f \u0644\u0627\u0645\u0628\u062f\u0627 \u0645\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0648\u0627\u0633\u0637\u0647 \u0627\u06cc \u06a9\u0627\u0631 \u062e\u0648\u0627\u0647\u062f \u06a9\u0631\u062f \u06a9\u0647 \u0627\u0632 \u062a\u0645\u0627\u0633 API \u0634\u0631\u0648\u0639 \u0645\u06cc \u0634\u0648\u062f \u0648 \u062e\u0637 \u0644\u0648\u0644\u0647 \u0627\u062a\u0648\u0645\u0627\u0633\u06cc\u0648\u0646 \u0631\u0627 \u062f\u0631 EC2 \u0627\u062c\u0631\u0627 \u0645\u06cc \u06a9\u0646\u062f \u0648 \u062a\u0648\u0644\u06cc\u062f \u062e\u0631\u0648\u062c\u06cc \u0631\u0627 \u062a\u0648\u0633\u0637 \u062e\u0637 \u0644\u0648\u0644\u0647 \u0628\u0647 \u067e\u0627\u0633\u062e API \u0645\u0646\u062a\u0642\u0644 \u0645\u06cc \u06a9\u0646\u062f.<br \/>\u0639\u0645\u0644\u06a9\u0631\u062f Lambda \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u0631\u0648\u06cc\u062f\u0627\u062f \u0645\u0646\u062a\u0642\u0644 \u0634\u062f\u0647 \u062f\u0631 \u0639\u0645\u0644\u06a9\u0631\u062f Lambda \u0645\u0627\u0646\u0646\u062f \u0627\u06cc\u0646 \u060c \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u062c\u0633\u062a\u062c\u0648\u06cc \u067e\u0631\u0633 \u0648 \u062c\u0648 \u0631\u0627 \u062f\u0631\u06cc\u0627\u0641\u062a \u0645\u06cc \u06a9\u0646\u062f:<\/p>\n<div class=\"highlight js-code-highlight\">\n<pre class=\"highlight python\"><code><span class=\"n\">url<\/span> <span class=\"o\">=<\/span> <span class=\"n\">event<\/span><span class=\"p\">[<\/span><span class=\"sh\">'<\/span><span class=\"s\">queryStringParameters<\/span><span 
class=\"sh\">'<\/span><span class=\"p\">][<\/span><span class=\"sh\">'<\/span><span class=\"s\">page<\/span><span class=\"sh\">'<\/span><span class=\"p\">]<\/span>\n<\/code><\/pre>\n<div class=\"highlight__panel js-actions-panel\">\n<div class=\"highlight__panel-action js-fullscreen-code-action\">\n    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-on\"><title>\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f<\/title>\n    <path d=\"M16 3h6v6h-2V5h-4V3zM2 3h6v2H4v4H2V3zm18 16v-4h2v6h-6v-2h4zM4 19h4v2H2v-6h2v4z\"\/>\n<\/svg><\/p>\n<p>    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-off\"><title>\u0627\u0632 \u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u062e\u0627\u0631\u062c \u0634\u0648\u06cc\u062f<\/title>\n    <path d=\"M18 7h4v2h-6V3h2v4zM8 9H2V7h4V3h2v6zm10 8v4h-2v-6h6v2h-4zM8 15v6H6v-4H2v-2h6z\"\/>\n<\/svg><\/p>\n<\/div>\n<\/div>\n<\/div>\n<p>\u0647\u0645\u0627\u0646\u0637\u0648\u0631 \u06a9\u0647 \u0642\u0628\u0644\u0627\u064b \u0630\u06a9\u0631 \u0634\u062f \u060c \u0627\u0632 SSM \u0628\u0631\u0627\u06cc \u0645\u062f\u06cc\u0631\u06cc\u062a \u0641\u0631\u0622\u06cc\u0646\u062f \u0627\u062c\u0631\u0627 \u0634\u062f\u0647 \u062a\u0648\u0633\u0637 \u0646\u0645\u0648\u0646\u0647 EC2 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u062f \u060c \u062f\u0631 \u0627\u06cc\u0646\u062c\u0627 \u0628\u0644\u0648\u06a9 \u06a9\u062f \u0627\u0633\u062a \u06a9\u0647 \u0645\u0633\u0626\u0648\u0644 \u0622\u0646 \u0627\u0633\u062a<\/p>\n<div class=\"highlight js-code-highlight\">\n<pre class=\"highlight python\"><code><span class=\"n\">ssm<\/span> <span class=\"o\">=<\/span> <span 
class=\"n\">boto3<\/span><span class=\"p\">.<\/span><span class=\"nf\">client<\/span><span class=\"p\">(<\/span><span class=\"sh\">'<\/span><span class=\"s\">ssm<\/span><span class=\"sh\">'<\/span><span class=\"p\">,<\/span> <span class=\"n\">region_name<\/span><span class=\"o\">=<\/span><span class=\"sh\">'<\/span><span class=\"s\">ap-south-1<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>\n<span class=\"n\">unique_id<\/span> <span class=\"o\">=<\/span> <span class=\"nf\">str<\/span><span class=\"p\">(<\/span><span class=\"n\">uuid<\/span><span class=\"p\">.<\/span><span class=\"nf\">uuid4<\/span><span class=\"p\">())<\/span>\n\n<span class=\"c1\"># Send command to EC2 instance\n<\/span><span class=\"n\">response<\/span> <span class=\"o\">=<\/span> <span class=\"n\">ssm<\/span><span class=\"p\">.<\/span><span class=\"nf\">send_command<\/span><span class=\"p\">(<\/span>\n    <span class=\"n\">InstanceIds<\/span><span class=\"o\">=<\/span><span class=\"p\">[<\/span><span class=\"sh\">'<\/span><span class=\"s\">i-instanceIdOfTheEc2VM<\/span><span class=\"sh\">'<\/span><span class=\"p\">],<\/span>\n    <span class=\"n\">DocumentName<\/span><span class=\"o\">=<\/span><span class=\"sh\">'<\/span><span class=\"s\">AWS-RunPowerShellScript<\/span><span class=\"sh\">'<\/span><span class=\"p\">,<\/span>\n    <span class=\"n\">Parameters<\/span><span class=\"o\">=<\/span><span class=\"p\">{<\/span>\n        <span class=\"sh\">'<\/span><span class=\"s\">commands<\/span><span class=\"sh\">'<\/span><span class=\"p\">:<\/span> <span class=\"p\">[<\/span><span class=\"sa\">f<\/span><span class=\"sh\">'<\/span><span class=\"s\">C:<\/span><span class=\"se\">\\\\<\/span><span class=\"s\">Users<\/span><span class=\"se\">\\\\<\/span><span class=\"s\">Administrator<\/span><span class=\"se\">\\\\<\/span><span class=\"s\">AppData<\/span><span class=\"se\">\\\\<\/span><span class=\"s\">Local<\/span><span class=\"se\">\\\\<\/span><span class=\"s\">Programs<\/span><span 
class=\"se\">\\\\<\/span><span class=\"s\">Python<\/span><span class=\"se\">\\\\<\/span><span class=\"s\">Python311<\/span><span class=\"se\">\\\\<\/span><span class=\"s\">python.exe C:<\/span><span class=\"se\">\\\\<\/span><span class=\"s\">final-automation-w-rating.py <\/span><span class=\"sh\">\"<\/span><span class=\"si\">{<\/span><span class=\"n\">url<\/span><span class=\"si\">}<\/span><span class=\"sh\">\"<\/span><span class=\"s\"> <\/span><span class=\"sh\">\"<\/span><span class=\"si\">{<\/span><span class=\"n\">unique_id<\/span><span class=\"si\">}<\/span><span class=\"sh\">\"'<\/span><span class=\"p\">]<\/span>\n    <span class=\"p\">}<\/span>\n<span class=\"p\">)<\/span>\n\n<span class=\"n\">command_id<\/span> <span class=\"o\">=<\/span> <span class=\"n\">response<\/span><span class=\"p\">[<\/span><span class=\"sh\">'<\/span><span class=\"s\">Command<\/span><span class=\"sh\">'<\/span><span class=\"p\">][<\/span><span class=\"sh\">'<\/span><span class=\"s\">CommandId<\/span><span class=\"sh\">'<\/span><span class=\"p\">]<\/span>\n<\/code><\/pre>\n<div class=\"highlight__panel js-actions-panel\">\n<div class=\"highlight__panel-action js-fullscreen-code-action\">\n    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-on\"><title>\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f<\/title>\n    <path d=\"M16 3h6v6h-2V5h-4V3zM2 3h6v2H4v4H2V3zm18 16v-4h2v6h-6v-2h4zM4 19h4v2H2v-6h2v4z\"\/>\n<\/svg><\/p>\n<p>    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-off\"><title>\u0627\u0632 \u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u062e\u0627\u0631\u062c \u0634\u0648\u06cc\u062f<\/title>\n    <path d=\"M18 
7h4v2h-6V3h2v4zM8 9H2V7h4V3h2v6zm10 8v4h-2v-6h6v2h-4zM8 15v6H6v-4H2v-2h6z\"\/>\n<\/svg><\/p>\n<\/div>\n<\/div>\n<\/div>\n<p>\u0627\u06cc\u0646 \u0628\u0644\u0648\u06a9 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a Python \u0645\u0648\u062c\u0648\u062f \u062f\u0631 \u0646\u0645\u0648\u0646\u0647 EC2 \u0631\u0627 \u0627\u062c\u0631\u0627 \u0645\u06cc \u06a9\u0646\u062f. \u0645\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0622\u0631\u06af\u0648\u0645\u0627\u0646 \u062e\u0637 \u0641\u0631\u0645\u0627\u0646 \u0628\u0631\u0627\u06cc \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u067e\u0627\u06cc\u062a\u0648\u0646 \u062f\u0631 \u062d\u0627\u0644 \u0639\u0628\u0648\u0631 \u0627\u0632 &#8220;\u0645\u0646\u062d\u0635\u0631 \u0628\u0647 \u0641\u0631\u062f&#8221; \u0648 &#8220;url&#8221; \u0647\u0633\u062a\u06cc\u0645. <br \/>\u0633\u067e\u0633 \u06cc\u06a9 \u0628\u0644\u0648\u06a9 \u0647\u0645\u0632\u0645\u0627\u0646 \u0631\u0627 \u0627\u062c\u0631\u0627 \u0645\u06cc \u06a9\u0646\u062f \u06a9\u0647 \u0648\u0636\u0639\u06cc\u062a \u0627\u06cc\u0646 \u0631\u0648\u0646\u062f \u0631\u0627 \u0628\u0647 \u067e\u0627\u06cc\u0627\u0646 \u0631\u0633\u0627\u0646\u062f \u06cc\u0627 \u0647\u0631 8 \u062b\u0627\u0646\u06cc\u0647 \u0628\u0647 \u067e\u0627\u06cc\u0627\u0646 \u0628\u0631\u0633\u062f.<\/p>\n<div class=\"highlight js-code-highlight\">\n<pre class=\"highlight python\"><code><span class=\"k\">while<\/span> <span class=\"bp\">True<\/span><span class=\"p\">:<\/span>\n    <span class=\"k\">try<\/span><span class=\"p\">:<\/span>\n        <span class=\"n\">invocation_response<\/span> <span class=\"o\">=<\/span> <span class=\"n\">ssm<\/span><span class=\"p\">.<\/span><span class=\"nf\">get_command_invocation<\/span><span class=\"p\">(<\/span>\n            <span class=\"n\">CommandId<\/span><span class=\"o\">=<\/span><span class=\"n\">command_id<\/span><span class=\"p\">,<\/span>\n            <span class=\"n\">InstanceId<\/span><span class=\"o\">=<\/span><span 
class=\"sh\">'<\/span><span class=\"s\">i-07b0999d978efd1fb<\/span><span class=\"sh\">'<\/span>\n        <span class=\"p\">)<\/span>\n\n        <span class=\"n\">status<\/span> <span class=\"o\">=<\/span> <span class=\"n\">invocation_response<\/span><span class=\"p\">[<\/span><span class=\"sh\">'<\/span><span class=\"s\">Status<\/span><span class=\"sh\">'<\/span><span class=\"p\">]<\/span>\n\n        <span class=\"k\">if<\/span> <span class=\"n\">status<\/span> <span class=\"ow\">in<\/span> <span class=\"p\">[<\/span><span class=\"sh\">'<\/span><span class=\"s\">Success<\/span><span class=\"sh\">'<\/span><span class=\"p\">,<\/span> <span class=\"sh\">'<\/span><span class=\"s\">Failed<\/span><span class=\"sh\">'<\/span><span class=\"p\">,<\/span> <span class=\"sh\">'<\/span><span class=\"s\">Cancelled<\/span><span class=\"sh\">'<\/span><span class=\"p\">,<\/span> <span class=\"sh\">'<\/span><span class=\"s\">TimedOut<\/span><span class=\"sh\">'<\/span><span class=\"p\">]:<\/span>\n            <span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"sa\">f<\/span><span class=\"sh\">\"<\/span><span class=\"s\">Command finished with status: <\/span><span class=\"si\">{<\/span><span class=\"n\">status<\/span><span class=\"si\">}<\/span><span class=\"sh\">\"<\/span><span class=\"p\">)<\/span>\n            <span class=\"k\">break<\/span>\n\n        <span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"sa\">f<\/span><span class=\"sh\">\"<\/span><span class=\"s\">Current status: <\/span><span class=\"si\">{<\/span><span class=\"n\">status<\/span><span class=\"si\">}<\/span><span class=\"s\">. 
Waiting for completion...<\/span><span class=\"sh\">\"<\/span><span class=\"p\">)<\/span>\n        <span class=\"n\">time<\/span><span class=\"p\">.<\/span><span class=\"nf\">sleep<\/span><span class=\"p\">(<\/span><span class=\"mi\">8<\/span><span class=\"p\">)<\/span>\n\n    <span class=\"k\">except<\/span> <span class=\"n\">ssm<\/span><span class=\"p\">.<\/span><span class=\"n\">exceptions<\/span><span class=\"p\">.<\/span><span class=\"n\">InvocationDoesNotExist<\/span><span class=\"p\">:<\/span>\n        <span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"sh\">\"<\/span><span class=\"s\">Invocation does not exist yet. Retrying...<\/span><span class=\"sh\">\"<\/span><span class=\"p\">)<\/span>\n        <span class=\"n\">time<\/span><span class=\"p\">.<\/span><span class=\"nf\">sleep<\/span><span class=\"p\">(<\/span><span class=\"mi\">2<\/span><span class=\"p\">)<\/span>\n<\/code><\/pre>\n<div class=\"highlight__panel js-actions-panel\">\n<div class=\"highlight__panel-action js-fullscreen-code-action\">\n    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-on\"><title>\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f<\/title>\n    <path d=\"M16 3h6v6h-2V5h-4V3zM2 3h6v2H4v4H2V3zm18 16v-4h2v6h-6v-2h4zM4 19h4v2H2v-6h2v4z\"\/>\n<\/svg><\/p>\n<p>    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-off\"><title>\u0627\u0632 \u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u062e\u0627\u0631\u062c \u0634\u0648\u06cc\u062f<\/title>\n    <path d=\"M18 7h4v2h-6V3h2v4zM8 9H2V7h4V3h2v6zm10 8v4h-2v-6h6v2h-4zM8 
15v6H6v-4H2v-2h6z\"\/>\n<\/svg><\/p>\n<\/div>\n<\/div>\n<\/div>\n<p>\u0641\u0631\u0622\u06cc\u0646\u062f \u0646\u0647\u0627\u06cc\u06cc \u060c \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0634\u062f\u0647 \u0631\u0627 \u0627\u0632 \u0646\u0645\u0648\u0646\u0647 EC2 \u0628\u062f\u0633\u062a \u0622\u0648\u0631\u06cc\u062f. \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u060c \u0645\u0627 \u0627\u0632 \u0633\u0637\u0644 S3 \u0628\u0631\u0627\u06cc \u0627\u0646\u062a\u0642\u0627\u0644 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0628\u06cc\u0646 \u0639\u0645\u0644\u06a9\u0631\u062f EC2 \u0648 Lambda \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u062e\u0648\u0627\u0647\u06cc\u0645 \u06a9\u0631\u062f. \u067e\u06cc\u0634 \u0627\u0632 \u0627\u06cc\u0646 \u0645\u0627 &#8220;\u0645\u0646\u062d\u0635\u0631 \u0628\u0647 \u0641\u0631\u062f&#8221; \u0631\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0622\u0631\u06af\u0648\u0645\u0627\u0646 \u062e\u0637 \u0641\u0631\u0645\u0627\u0646 \u0628\u0647 \u0627\u0633\u06a9\u0631\u06cc\u067e\u062a \u067e\u0627\u06cc\u062a\u0648\u0646 \u0645\u0646\u062a\u0642\u0644 \u06a9\u0631\u062f\u06cc\u0645 \u060c \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0646\u0627\u0645 \u067e\u0631\u0648\u0646\u062f\u0647 \u0628\u0631\u0627\u06cc \u067e\u0631\u0648\u0646\u062f\u0647 JSON \u06a9\u0647 \u0633\u067e\u0633 \u062f\u0631 \u0633\u0637\u0644 S3 \u0628\u0627\u0631\u06af\u0630\u0627\u0631\u06cc \u0645\u06cc \u0634\u0648\u062f \u060c \u062e\u062f\u0645\u062a \u0645\u06cc \u06a9\u0646\u062f. 
\u0627\u0632 \u0622\u0646\u062c\u0627 \u06a9\u0647 \u0645\u0627 \u0627\u0632 \u0639\u0645\u0644\u06a9\u0631\u062f Lambda \u0645\u0646\u062d\u0635\u0631 \u0628\u0647 \u0641\u0631\u062f \u0639\u0628\u0648\u0631 \u0645\u06cc \u06a9\u0646\u06cc\u0645 \u062a\u0627 \u067e\u0633 \u0627\u0632 \u0627\u062a\u0645\u0627\u0645 \u0641\u0631\u0622\u06cc\u0646\u062f EC2 \u060c \u0628\u062a\u0648\u0627\u0646\u06cc\u0645 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u0627\u0632 \u0633\u0637\u0644 S3 \u0628\u062f\u0633\u062a \u0622\u0648\u0631\u06cc\u0645 \u0648 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0631\u0627 \u062f\u0631 \u0628\u06cc\u0627\u0646\u06cc\u0647 \u0628\u0631\u06af\u0634\u062a\u06cc \u06a9\u0647 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u067e\u0627\u0633\u062e API \u0639\u0645\u0644 \u0645\u06cc \u06a9\u0646\u062f \u060c \u0631\u06cc\u062e\u062a\u0647 \u06a9\u0646\u06cc\u0645.<\/p>\n<div class=\"highlight js-code-highlight\">\n<pre class=\"highlight python\"><code><span class=\"n\">s3_client<\/span> <span class=\"o\">=<\/span> <span class=\"n\">boto3<\/span><span class=\"p\">.<\/span><span class=\"nf\">client<\/span><span class=\"p\">(<\/span><span class=\"sh\">'<\/span><span class=\"s\">s3<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>\n<span class=\"n\">bucket_name<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">'<\/span><span class=\"s\">extracted-reviews<\/span><span class=\"sh\">'<\/span>\n<span class=\"n\">file_name<\/span> <span class=\"o\">=<\/span> <span class=\"sa\">f<\/span><span class=\"sh\">'<\/span><span class=\"si\">{<\/span><span class=\"n\">unique_id<\/span><span class=\"si\">}<\/span><span class=\"s\">.json<\/span><span class=\"sh\">'<\/span>\n\n<span class=\"k\">try<\/span><span class=\"p\">:<\/span>\n    <span class=\"n\">s3_response<\/span> <span class=\"o\">=<\/span> <span class=\"n\">s3_client<\/span><span class=\"p\">.<\/span><span class=\"nf\">get_object<\/span><span class=\"p\">(<\/span><span 
class=\"n\">Bucket<\/span><span class=\"o\">=<\/span><span class=\"n\">bucket_name<\/span><span class=\"p\">,<\/span> <span class=\"n\">Key<\/span><span class=\"o\">=<\/span><span class=\"n\">file_name<\/span><span class=\"p\">)<\/span>\n    <span class=\"n\">file_data<\/span> <span class=\"o\">=<\/span> <span class=\"n\">s3_response<\/span><span class=\"p\">[<\/span><span class=\"sh\">'<\/span><span class=\"s\">Body<\/span><span class=\"sh\">'<\/span><span class=\"p\">].<\/span><span class=\"nf\">read<\/span><span class=\"p\">().<\/span><span class=\"nf\">decode<\/span><span class=\"p\">(<\/span><span class=\"sh\">'<\/span><span class=\"s\">utf-8<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>\n    <span class=\"n\">json_data<\/span> <span class=\"o\">=<\/span> <span class=\"n\">json<\/span><span class=\"p\">.<\/span><span class=\"nf\">loads<\/span><span class=\"p\">(<\/span><span class=\"n\">file_data<\/span><span class=\"p\">)<\/span>\n\n    <span class=\"k\">return<\/span> <span class=\"p\">{<\/span>\n        <span class=\"sh\">'<\/span><span class=\"s\">statusCode<\/span><span class=\"sh\">'<\/span><span class=\"p\">:<\/span> <span class=\"mi\">200<\/span><span class=\"p\">,<\/span>\n        <span class=\"sh\">\"<\/span><span class=\"s\">headers<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">{<\/span>\n            <span class=\"sh\">'<\/span><span class=\"s\">Content-Type<\/span><span class=\"sh\">'<\/span><span class=\"p\">:<\/span> <span class=\"sh\">'<\/span><span class=\"s\">application\/json<\/span><span class=\"sh\">'<\/span><span class=\"p\">,<\/span>\n            <span class=\"sh\">\"<\/span><span class=\"s\">Access-Control-Allow-Origin<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">*<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span>\n            <span class=\"sh\">\"<\/span><span 
class=\"s\">Access-Control-Allow-Methods<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">GET, POST, OPTIONS<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span>\n            <span class=\"sh\">\"<\/span><span class=\"s\">Access-Control-Allow-Headers<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">Content-Type<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span>\n        <span class=\"p\">},<\/span>\n        <span class=\"sh\">'<\/span><span class=\"s\">body<\/span><span class=\"sh\">'<\/span><span class=\"p\">:<\/span> <span class=\"n\">json<\/span><span class=\"p\">.<\/span><span class=\"nf\">dumps<\/span><span class=\"p\">(<\/span><span class=\"n\">json_data<\/span><span class=\"p\">)<\/span>\n    <span class=\"p\">}<\/span>\n\n<span class=\"k\">except<\/span> <span class=\"nb\">Exception<\/span> <span class=\"k\">as<\/span> <span class=\"n\">e<\/span><span class=\"p\">:<\/span>\n    <span class=\"k\">return<\/span> <span class=\"p\">{<\/span>\n        <span class=\"sh\">'<\/span><span class=\"s\">statusCode<\/span><span class=\"sh\">'<\/span><span class=\"p\">:<\/span> <span class=\"mi\">500<\/span><span class=\"p\">,<\/span>\n        <span class=\"sh\">\"<\/span><span class=\"s\">headers<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">{<\/span>\n            <span class=\"sh\">'<\/span><span class=\"s\">Content-Type<\/span><span class=\"sh\">'<\/span><span class=\"p\">:<\/span> <span class=\"sh\">'<\/span><span class=\"s\">application\/json<\/span><span class=\"sh\">'<\/span><span class=\"p\">,<\/span>\n            <span class=\"sh\">\"<\/span><span class=\"s\">Access-Control-Allow-Origin<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">*<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span>\n            <span 
class=\"sh\">\"<\/span><span class=\"s\">Access-Control-Allow-Methods<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">GET, POST, OPTIONS<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span>\n            <span class=\"sh\">\"<\/span><span class=\"s\">Access-Control-Allow-Headers<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">Content-Type<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span>\n        <span class=\"p\">},<\/span>\n        <span class=\"sh\">'<\/span><span class=\"s\">body<\/span><span class=\"sh\">'<\/span><span class=\"p\">:<\/span> <span class=\"n\">json<\/span><span class=\"p\">.<\/span><span class=\"nf\">dumps<\/span><span class=\"p\">({<\/span><span class=\"sh\">'<\/span><span class=\"s\">error<\/span><span class=\"sh\">'<\/span><span class=\"p\">:<\/span> <span class=\"nf\">str<\/span><span class=\"p\">(<\/span><span class=\"n\">e<\/span><span class=\"p\">)})<\/span>\n    <span class=\"p\">}<\/span>\n<\/code><\/pre>\n<div class=\"highlight__panel js-actions-panel\">\n<div class=\"highlight__panel-action js-fullscreen-code-action\">\n    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-on\"><title>\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f<\/title>\n    <path d=\"M16 3h6v6h-2V5h-4V3zM2 3h6v2H4v4H2V3zm18 16v-4h2v6h-6v-2h4zM4 19h4v2H2v-6h2v4z\"\/>\n<\/svg><\/p>\n<p>    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-off\"><title>\u0627\u0632 \u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u062e\u0627\u0631\u062c \u0634\u0648\u06cc\u062f<\/title>\n    
<path d=\"M18 7h4v2h-6V3h2v4zM8 9H2V7h4V3h2v6zm10 8v4h-2v-6h6v2h-4zM8 15v6H6v-4H2v-2h6z\"\/>\n<\/svg><\/p>\n<\/div>\n<\/div>\n<\/div>\n<h3><span class=\"ez-toc-section\" id=\"%D9%86%D9%85%D9%88%D9%86%D9%87_EC2\"><\/span>\n<p>  \u0646\u0645\u0648\u0646\u0647 EC2<br \/>\n<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u0627\u0648\u0644 \u060c \u0645\u0627 \u0628\u0627\u06cc\u062f \u062a\u0627 \u062d\u062f \u0627\u0645\u06a9\u0627\u0646 \u06a9\u062f \u0631\u0627 \u0627\u0632 \u06a9\u062f \u0645\u0646\u0628\u0639 \u067e\u0627\u06cc\u06cc\u0646 \u0628\u06cc\u0627\u0648\u0631\u06cc\u0645 \u062a\u0627 \u0627\u0646\u062f\u0627\u0632\u0647 \u062a\u0648\u06a9\u0646 \u0628\u0631\u0627\u06cc LLM \u06a9\u0627\u0647\u0634 \u06cc\u0627\u0628\u062f \u060c \u06a9\u0647 \u0628\u0627\u0639\u062b \u06a9\u0627\u0647\u0634 \u0647\u0632\u06cc\u0646\u0647 \u0647\u0627\u06cc API \u060c \u0628\u0647\u0628\u0648\u062f \u0639\u0645\u0644\u06a9\u0631\u062f \u0648 \u0627\u0641\u0632\u0627\u06cc\u0634 \u062f\u0642\u062a \u0645\u06cc \u0634\u0648\u062f. 
\u0628\u0631\u0627\u06cc \u0627\u06cc\u0646 \u0645\u0646\u0638\u0648\u0631 \u060c \u0627\u0632 BeautifulSoup \u0628\u0631\u0627\u06cc \u062d\u0630\u0641 \u0647\u0645\u0647 \u0686\u06cc\u0632 \u062f\u0631 \u0628\u0631\u0686\u0633\u0628 \u0647\u0627\u06cc \u0632\u06cc\u0631 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u0634\u0648\u062f: script \u060c style \u060c img \u060c nav \u060c header \u060c footer \u060c picture \u060c svg \u060c path \u0648 form.<\/p>\n<div class=\"highlight js-code-highlight\">\n<pre class=\"highlight python\"><code><span class=\"k\">def<\/span> <span class=\"nf\">filter_source<\/span><span class=\"p\">(<\/span><span class=\"n\">source<\/span><span class=\"p\">):<\/span>\n  <span class=\"n\">soup<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">BeautifulSoup<\/span><span class=\"p\">(<\/span><span class=\"n\">source<\/span><span class=\"p\">,<\/span> <span class=\"sh\">'<\/span><span class=\"s\">html.parser<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>\n\n  <span class=\"k\">for<\/span> <span class=\"n\">script<\/span> <span class=\"ow\">in<\/span> <span class=\"nf\">soup<\/span><span class=\"p\">([<\/span><span class=\"sh\">\"<\/span><span class=\"s\">script<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">style<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">img<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">nav<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">header<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">footer<\/span><span 
class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">picture<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">svg<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">path<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">form<\/span><span class=\"sh\">\"<\/span><span class=\"p\">]):<\/span>\n      <span class=\"n\">script<\/span><span class=\"p\">.<\/span><span class=\"nf\">decompose<\/span><span class=\"p\">()<\/span>\n\n  <span class=\"n\">cleaned_body_content<\/span> <span class=\"o\">=<\/span> <span class=\"nf\">str<\/span><span class=\"p\">(<\/span><span class=\"n\">soup<\/span><span class=\"p\">.<\/span><span class=\"n\">body<\/span><span class=\"p\">)<\/span>\n  <span class=\"k\">return<\/span> <span class=\"n\">cleaned_body_content<\/span>\n<\/code><\/pre>\n<div class=\"highlight__panel js-actions-panel\">\n<div class=\"highlight__panel-action js-fullscreen-code-action\">\n    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-on\"><title>\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f<\/title>\n    <path d=\"M16 3h6v6h-2V5h-4V3zM2 3h6v2H4v4H2V3zm18 16v-4h2v6h-6v-2h4zM4 19h4v2H2v-6h2v4z\"\/>\n<\/svg><\/p>\n<p>    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-off\"><title>\u0627\u0632 \u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u062e\u0627\u0631\u062c \u0634\u0648\u06cc\u062f<\/title>\n    <path d=\"M18 7h4v2h-6V3h2v4zM8 9H2V7h4V3h2v6zm10 8v4h-2v-6h6v2h-4zM8 
15v6H6v-4H2v-2h6z\"\/>\n<\/svg><\/p>\n<\/div>\n<\/div>\n<\/div>\n<p>\u0627\u06a9\u0646\u0648\u0646 \u060c \u0628\u0631\u0627\u06cc \u0631\u0641\u062a\u0646 \u0628\u0647 \u0635\u0641\u062d\u0647 \u0628\u0631\u0631\u0633\u06cc \u0628\u0639\u062f\u06cc \u060c \u0628\u0631\u0646\u0627\u0645\u0647 \u0628\u0627\u06cc\u062f \u0631\u0648\u06cc \u062f\u06a9\u0645\u0647 &#8220;Next&#8221; \u06a9\u0644\u06cc\u06a9 \u06a9\u0646\u062f. \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u060c \u0628\u0647 \u0646\u0627\u0645 \u06a9\u0644\u0627\u0633 \u062f\u06a9\u0645\u0647 \u0646\u06cc\u0627\u0632 \u062f\u0627\u0631\u062f. \u0627\u0632 \u0622\u0646\u062c\u0627 \u06a9\u0647 \u0647\u0631 \u0648\u0628 \u0633\u0627\u06cc\u062a \u062f\u0627\u0631\u0627\u06cc \u06cc\u06a9 \u0646\u0627\u0645 \u06a9\u0644\u0627\u0633 \u0645\u0646\u062d\u0635\u0631 \u0628\u0647 \u0641\u0631\u062f \u0628\u0631\u0627\u06cc \u062f\u06a9\u0645\u0647 \u0627\u0633\u062a \u060c \u0645\u0627 \u0646\u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0646\u0627\u0645 \u06a9\u0644\u0627\u0633 \u0631\u0627 \u0628\u0647 \u0635\u0648\u0631\u062a \u062b\u0627\u0628\u062a \u062f\u0631 \u06a9\u062f \u0628\u0646\u0648\u06cc\u0633\u06cc\u0645 (hard-code). \u0628\u0631\u0627\u06cc \u067e\u0631\u062f\u0627\u062e\u062a\u0646 \u0628\u0647 \u0627\u06cc\u0646 \u0645\u0648\u0636\u0648\u0639 \u060c \u0645\u0646 \u0627\u0632 LLM \u0628\u0631\u0627\u06cc \u062a\u0639\u06cc\u06cc\u0646 \u0646\u0627\u0645 \u06a9\u0644\u0627\u0633 \u0627\u0632 \u06a9\u062f \u0645\u0646\u0628\u0639 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u0645. 
\u0627\u06cc\u0646 \u0628\u0631\u0646\u0627\u0645\u0647 \u0647\u0645\u0686\u0646\u06cc\u0646 \u0646\u06cc\u0627\u0632 \u0628\u0647 \u0628\u0627\u0632\u06cc\u0627\u0628\u06cc \u062c\u0632\u0626\u06cc\u0627\u062a \u0628\u0631\u0631\u0633\u06cc \u062f\u0627\u0631\u062f \u060c \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u0645\u0646 \u06a9\u062f \u0631\u0627 \u0628\u0631\u0627\u06cc \u0634\u0646\u0627\u0633\u0627\u06cc\u06cc \u0646\u0627\u0645 \u06a9\u0644\u0627\u0633 \u0639\u0646\u0627\u0635\u0631 \u0628\u0631\u0631\u0633\u06cc \u0646\u06cc\u0632 \u0627\u0636\u0627\u0641\u0647 \u06a9\u0631\u062f\u0647 \u0627\u0645. \u0645\u0646 \u0627\u0632 Google AI Studio API (Gemini 1.5 Flash) \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u0645 \u0632\u06cc\u0631\u0627 \u0627\u06cc\u0646 \u0628\u0631\u0646\u0627\u0645\u0647 \u0631\u0627\u06cc\u06af\u0627\u0646 \u0627\u0633\u062a \u0648 \u0627\u0632 \u0627\u0646\u062f\u0627\u0632\u0647 \u0648\u0631\u0648\u062f\u06cc 1 \u0645\u06cc\u0644\u06cc\u0648\u0646 \u0646\u0634\u0627\u0646\u0647 \u067e\u0634\u062a\u06cc\u0628\u0627\u0646\u06cc \u0645\u06cc \u06a9\u0646\u062f \u060c \u06a9\u0647 \u062a\u0642\u0631\u06cc\u0628\u0627\u064b \u062a\u0636\u0645\u06cc\u0646 \u0645\u06cc \u06a9\u0646\u062f \u06a9\u0647 \u06a9\u062f \u0645\u0646\u0628\u0639 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u0648\u0631\u0648\u062f\u06cc \u0645\u062a\u0646\u0627\u0633\u0628 \u0628\u0627\u0634\u062f.<\/p>\n<div class=\"highlight js-code-highlight\">\n<pre class=\"highlight python\"><code><span class=\"c1\">#global variable\n<\/span><span class=\"n\">review_paginate_next<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">\"\"<\/span>\n<span class=\"n\">review_author<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">\"\"<\/span>\n<span class=\"n\">review_title<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">\"\"<\/span>\n<span class=\"n\">review_text<\/span> <span class=\"o\">=<\/span> <span 
class=\"sh\">\"\"<\/span>\n<span class=\"n\">review_rating<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">\"\"<\/span>\n\n<span class=\"n\">prompt<\/span> <span class=\"o\">=<\/span> <span class=\"sh\">\"\"\"<\/span><span class=\"s\">extract the following class name for each of the following elements:\n- pagination <\/span><span class=\"sh\">\"<\/span><span class=\"s\">next page<\/span><span class=\"sh\">\"<\/span><span class=\"s\"> button of review section\n- name of reviewer\n- title of review\n- text of review\n- rating classname\nfrom the provided codebase.\nJust return a comma seperated value of classnames, if multiple class name is found for the same section, use the most relevant one which is unique.\nDon<\/span><span class=\"sh\">'<\/span><span class=\"s\">t trim the values, return the value as it is in source code.\nDon<\/span><span class=\"sh\">'<\/span><span class=\"s\">t return any other text than mentioned. Here is the code: <\/span><span class=\"sh\">\"\"\"<\/span>\n\n<span class=\"n\">google_api_key<\/span> <span class=\"o\">=<\/span> <span class=\"n\">os<\/span><span class=\"p\">.<\/span><span class=\"nf\">getenv<\/span><span class=\"p\">(<\/span><span class=\"sh\">'<\/span><span class=\"s\">GOOGLE_API_KEY<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>\n\n<span class=\"k\">def<\/span> <span class=\"nf\">filter_css_selector<\/span><span class=\"p\">(<\/span><span class=\"n\">source_text<\/span><span class=\"p\">,<\/span> <span class=\"n\">max_retries<\/span> <span class=\"o\">=<\/span> <span class=\"mi\">3<\/span><span class=\"p\">):<\/span>\n    <span class=\"n\">response<\/span> <span class=\"o\">=<\/span> <span class=\"n\">requests<\/span><span class=\"p\">.<\/span><span class=\"nf\">post<\/span><span class=\"p\">(<\/span>\n        <span class=\"n\">url<\/span><span class=\"o\">=<\/span><span class=\"sa\">f<\/span><span class=\"sh\">\"<\/span><span 
class=\"s\">https:\/\/generativelanguage.googleapis.com\/v1beta\/models\/gemini-1.5-flash:generateContent?key=<\/span><span class=\"si\">{<\/span><span class=\"n\">google_api_key<\/span><span class=\"si\">}<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span>\n        <span class=\"n\">headers<\/span><span class=\"o\">=<\/span><span class=\"p\">{<\/span>\n            <span class=\"sh\">\"<\/span><span class=\"s\">Content-Type<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">application\/json<\/span><span class=\"sh\">\"<\/span>\n        <span class=\"p\">},<\/span>\n        <span class=\"n\">json<\/span><span class=\"o\">=<\/span><span class=\"p\">{<\/span>\n            <span class=\"sh\">\"<\/span><span class=\"s\">contents<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">[<\/span>\n                <span class=\"p\">{<\/span>\n                    <span class=\"sh\">\"<\/span><span class=\"s\">parts<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"p\">[<\/span>\n                        <span class=\"p\">{<\/span>\n                            <span class=\"sh\">\"<\/span><span class=\"s\">text<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">prompt<\/span> <span class=\"o\">+<\/span> <span class=\"n\">source_text<\/span>\n                        <span class=\"p\">}<\/span>\n                    <span class=\"p\">]<\/span>\n                <span class=\"p\">}<\/span>\n            <span class=\"p\">]<\/span>\n        <span class=\"p\">}<\/span>\n    <span class=\"p\">)<\/span>\n\n    <span class=\"k\">if<\/span> <span class=\"n\">response<\/span><span class=\"p\">.<\/span><span class=\"n\">status_code<\/span> <span class=\"o\">==<\/span> <span class=\"mi\">200<\/span><span class=\"p\">:<\/span>\n        <span class=\"n\">data<\/span> <span class=\"o\">=<\/span> <span class=\"n\">response<\/span><span 
class=\"p\">.<\/span><span class=\"nf\">json<\/span><span class=\"p\">()<\/span>\n        <span class=\"n\">message_content<\/span> <span class=\"o\">=<\/span> <span class=\"n\">data<\/span><span class=\"p\">[<\/span><span class=\"sh\">'<\/span><span class=\"s\">candidates<\/span><span class=\"sh\">'<\/span><span class=\"p\">][<\/span><span class=\"mi\">0<\/span><span class=\"p\">][<\/span><span class=\"sh\">'<\/span><span class=\"s\">content<\/span><span class=\"sh\">'<\/span><span class=\"p\">][<\/span><span class=\"sh\">'<\/span><span class=\"s\">parts<\/span><span class=\"sh\">'<\/span><span class=\"p\">][<\/span><span class=\"mi\">0<\/span><span class=\"p\">][<\/span><span class=\"sh\">'<\/span><span class=\"s\">text<\/span><span class=\"sh\">'<\/span><span class=\"p\">]<\/span>\n        <span class=\"n\">message_content<\/span> <span class=\"o\">=<\/span> <span class=\"n\">message_content<\/span><span class=\"p\">.<\/span><span class=\"nf\">strip<\/span><span class=\"p\">(<\/span><span class=\"sh\">\"<\/span><span class=\"se\">\\n<\/span><span class=\"sh\">\"<\/span><span class=\"p\">)<\/span>\n        <span class=\"k\">try<\/span><span class=\"p\">:<\/span>\n          <span class=\"k\">global<\/span> <span class=\"n\">review_paginate_next<\/span><span class=\"p\">,<\/span> <span class=\"n\">review_author<\/span><span class=\"p\">,<\/span> <span class=\"n\">review_title<\/span><span class=\"p\">,<\/span> <span class=\"n\">review_text<\/span><span class=\"p\">,<\/span> <span class=\"n\">review_rating<\/span>\n          <span class=\"n\">review_paginate_next<\/span><span class=\"p\">,<\/span> <span class=\"n\">review_author<\/span><span class=\"p\">,<\/span> <span class=\"n\">review_title<\/span><span class=\"p\">,<\/span> <span class=\"n\">review_text<\/span><span class=\"p\">,<\/span> <span class=\"n\">review_rating<\/span> <span class=\"o\">=<\/span> <span class=\"n\">message_content<\/span><span class=\"p\">.<\/span><span class=\"nf\">split<\/span><span 
class=\"p\">(<\/span><span class=\"sh\">\"<\/span><span class=\"s\">,<\/span><span class=\"sh\">\"<\/span><span class=\"p\">)<\/span>\n          <span class=\"n\">next_buttons<\/span><span class=\"p\">.<\/span><span class=\"nf\">append<\/span><span class=\"p\">(<\/span><span class=\"sa\">f<\/span><span class=\"sh\">'<\/span><span class=\"s\">.<\/span><span class=\"si\">{<\/span><span class=\"n\">review_paginate_next<\/span><span class=\"si\">}<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>\n          <span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"n\">review_paginate_next<\/span><span class=\"p\">)<\/span>\n          <span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"n\">review_author<\/span><span class=\"p\">)<\/span>\n          <span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"n\">review_title<\/span><span class=\"p\">)<\/span>\n          <span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"n\">review_text<\/span><span class=\"p\">)<\/span>\n          <span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"n\">review_rating<\/span><span class=\"p\">)<\/span>\n\n        <span class=\"k\">except<\/span><span class=\"p\">:<\/span>\n          <span class=\"c1\"># also try with some other model\n<\/span>          <span class=\"nf\">if <\/span><span class=\"p\">(<\/span><span class=\"n\">max_retries<\/span> <span class=\"o\">&gt;<\/span> <span class=\"mi\">0<\/span><span class=\"p\">):<\/span>\n            <span class=\"n\">time<\/span><span class=\"p\">.<\/span><span class=\"nf\">sleep<\/span><span class=\"p\">(<\/span><span class=\"mi\">2<\/span><span class=\"p\">)<\/span>\n            <span class=\"nf\">filter_css_selector<\/span><span class=\"p\">(<\/span><span class=\"n\">source_text<\/span><span class=\"p\">,<\/span> <span class=\"n\">max_retries<\/span> <span class=\"o\">-<\/span> <span class=\"mi\">1<\/span><span class=\"p\">)<\/span>\n    
<span class=\"k\">else<\/span><span class=\"p\">:<\/span>\n        <span class=\"c1\"># handles model overload error or any other error encountered by LLM API\n<\/span>        <span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"n\">response<\/span><span class=\"p\">.<\/span><span class=\"nf\">json<\/span><span class=\"p\">())<\/span>\n        <span class=\"nf\">if <\/span><span class=\"p\">(<\/span><span class=\"n\">max_retries<\/span> <span class=\"o\">&gt;<\/span> <span class=\"mi\">0<\/span><span class=\"p\">):<\/span>\n          <span class=\"n\">time<\/span><span class=\"p\">.<\/span><span class=\"nf\">sleep<\/span><span class=\"p\">(<\/span><span class=\"mi\">2<\/span><span class=\"p\">)<\/span>\n          <span class=\"nf\">filter_css_selector<\/span><span class=\"p\">(<\/span><span class=\"n\">source_text<\/span><span class=\"p\">,<\/span> <span class=\"n\">max_retries<\/span> <span class=\"o\">-<\/span> <span class=\"mi\">1<\/span><span class=\"p\">)<\/span>\n<\/code><\/pre>\n<div class=\"highlight__panel js-actions-panel\">\n<div class=\"highlight__panel-action js-fullscreen-code-action\">\n    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-on\"><title>\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f<\/title>\n    <path d=\"M16 3h6v6h-2V5h-4V3zM2 3h6v2H4v4H2V3zm18 16v-4h2v6h-6v-2h4zM4 19h4v2H2v-6h2v4z\"\/>\n<\/svg><\/p>\n<p>    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-off\"><title>\u0627\u0632 \u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u062e\u0627\u0631\u062c \u0634\u0648\u06cc\u062f<\/title>\n    <path d=\"M18 7h4v2h-6V3h2v4zM8 9H2V7h4V3h2v6zm10 8v4h-2v-6h6v2h-4zM8 
15v6H6v-4H2v-2h6z\"\/>\n<\/svg><\/p>\n<\/div>\n<\/div>\n<\/div>\n<p>\u0647\u0646\u06af\u0627\u0645\u06cc \u06a9\u0647 \u0645\u0627 \u0646\u0627\u0645 \u06a9\u0644\u0627\u0633 \u0631\u0627 \u0645\u06cc \u062f\u0627\u0646\u06cc\u0645 \u060c \u0628\u0631\u0646\u0627\u0645\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0635\u0641\u062d\u0647 \u0628\u0631\u0631\u0633\u06cc \u0631\u0627 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 BeautifulSoup \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u06a9\u0646\u062f. \u0686\u0631\u0627 \u0628\u0647 \u062c\u0627\u06cc LLM \u0627\u0632 BeautifulSoup \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u06cc\u0645\u061f \u0627\u0632 \u0622\u0646\u062c\u0627 \u06a9\u0647 \u0627\u06cc\u0646 \u0627\u0628\u0632\u0627\u0631 \u0628\u0633\u06cc\u0627\u0631 \u0633\u0631\u06cc\u0639 \u0627\u0633\u062a \u060c \u0645\u0642\u0627\u062f\u06cc\u0631 \u0645\u062b\u0628\u062a \u06a9\u0627\u0630\u0628 \u0645\u0627\u0646\u0646\u062f LLM \u0631\u0627 \u062a\u0648\u0644\u06cc\u062f \u0646\u0645\u06cc \u06a9\u0646\u062f (\u0627\u06af\u0631\u0686\u0647 \u0627\u06af\u0631 \u0646\u0627\u0645 \u06a9\u0644\u0627\u0633 \u0646\u0627\u062f\u0631\u0633\u062a \u0628\u0627\u0634\u062f \u060c \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0645\u0642\u0627\u062f\u06cc\u0631 \u0631\u0627 \u06a9\u0627\u0645\u0644\u0627\u064b \u0627\u0632 \u062f\u0633\u062a \u0628\u062f\u0647\u062f) \u060c \u0648 \u0645\u062d\u062f\u0648\u062f\u06cc\u062a \u0647\u0627\u06cc \u0646\u0631\u062e \u0622\u0646 \u0631\u0627 \u0646\u062f\u0627\u0631\u062f \u060c \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u0645\u06cc \u062a\u0648\u0627\u0646\u06cc\u0645 \u0647\u0631 \u062a\u0639\u062f\u0627\u062f \u0635\u0641\u062d\u0647 \u0645\u0648\u0631\u062f \u0646\u06cc\u0627\u0632 \u0631\u0627 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u06a9\u0646\u06cc\u0645 
\u0628\u0634\u0631<\/p>\n<div class=\"highlight js-code-highlight\">\n<pre class=\"highlight python\"><code><span class=\"k\">def<\/span> <span class=\"nf\">extract_reviews<\/span><span class=\"p\">(<\/span><span class=\"n\">source<\/span><span class=\"p\">):<\/span>\n\n  <span class=\"n\">body_strainer<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">SoupStrainer<\/span><span class=\"p\">(<\/span><span class=\"sh\">'<\/span><span class=\"s\">body<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>\n  <span class=\"n\">soup<\/span> <span class=\"o\">=<\/span> <span class=\"nc\">BeautifulSoup<\/span><span class=\"p\">(<\/span><span class=\"n\">source<\/span><span class=\"p\">,<\/span> <span class=\"sh\">'<\/span><span class=\"s\">html.parser<\/span><span class=\"sh\">'<\/span><span class=\"p\">,<\/span> <span class=\"n\">parse_only<\/span><span class=\"o\">=<\/span><span class=\"n\">body_strainer<\/span><span class=\"p\">)<\/span>\n\n  <span class=\"n\">titles<\/span> <span class=\"o\">=<\/span> <span class=\"n\">soup<\/span><span class=\"p\">.<\/span><span class=\"nf\">find_all<\/span><span class=\"p\">(<\/span><span class=\"n\">class_<\/span><span class=\"o\">=<\/span><span class=\"n\">review_title<\/span><span class=\"p\">)<\/span>\n  <span class=\"n\">bodies<\/span> <span class=\"o\">=<\/span> <span class=\"n\">soup<\/span><span class=\"p\">.<\/span><span class=\"nf\">find_all<\/span><span class=\"p\">(<\/span><span class=\"n\">class_<\/span><span class=\"o\">=<\/span><span class=\"n\">review_text<\/span><span class=\"p\">)<\/span>\n  <span class=\"n\">authors<\/span> <span class=\"o\">=<\/span> <span class=\"n\">soup<\/span><span class=\"p\">.<\/span><span class=\"nf\">find_all<\/span><span class=\"p\">(<\/span><span class=\"n\">class_<\/span><span class=\"o\">=<\/span><span class=\"n\">review_author<\/span><span class=\"p\">)<\/span>\n  <span class=\"n\">ratings<\/span> <span class=\"o\">=<\/span> <span class=\"n\">soup<\/span><span 
class=\"p\">.<\/span><span class=\"nf\">find_all<\/span><span class=\"p\">(<\/span><span class=\"n\">class_<\/span><span class=\"o\">=<\/span><span class=\"n\">review_rating<\/span><span class=\"p\">)<\/span>\n\n  <span class=\"k\">for<\/span> <span class=\"n\">i<\/span> <span class=\"ow\">in<\/span> <span class=\"nf\">range<\/span><span class=\"p\">(<\/span><span class=\"nf\">max<\/span><span class=\"p\">(<\/span><span class=\"nf\">len<\/span><span class=\"p\">(<\/span><span class=\"n\">titles<\/span><span class=\"p\">),<\/span> <span class=\"nf\">len<\/span><span class=\"p\">(<\/span><span class=\"n\">bodies<\/span><span class=\"p\">),<\/span> <span class=\"nf\">len<\/span><span class=\"p\">(<\/span><span class=\"n\">authors<\/span><span class=\"p\">),<\/span> <span class=\"nf\">len<\/span><span class=\"p\">(<\/span><span class=\"n\">ratings<\/span><span class=\"p\">))):<\/span>\n      <span class=\"n\">review<\/span> <span class=\"o\">=<\/span> <span class=\"p\">{<\/span>\n          <span class=\"sh\">\"<\/span><span class=\"s\">title<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">titles<\/span><span class=\"p\">[<\/span><span class=\"n\">i<\/span><span class=\"p\">].<\/span><span class=\"nf\">get_text<\/span><span class=\"p\">(<\/span><span class=\"n\">strip<\/span><span class=\"o\">=<\/span><span class=\"bp\">True<\/span><span class=\"p\">)<\/span> <span class=\"k\">if<\/span> <span class=\"n\">i<\/span> <span class=\"o\">&lt;<\/span> <span class=\"nf\">len<\/span><span class=\"p\">(<\/span><span class=\"n\">titles<\/span><span class=\"p\">)<\/span> <span class=\"k\">else<\/span> <span class=\"sh\">\"\"<\/span><span class=\"p\">,<\/span>\n          <span class=\"sh\">\"<\/span><span class=\"s\">body<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">bodies<\/span><span class=\"p\">[<\/span><span class=\"n\">i<\/span><span class=\"p\">].<\/span><span class=\"nf\">get_text<\/span><span 
class=\"p\">(<\/span><span class=\"n\">strip<\/span><span class=\"o\">=<\/span><span class=\"bp\">True<\/span><span class=\"p\">)<\/span> <span class=\"k\">if<\/span> <span class=\"n\">i<\/span> <span class=\"o\">&lt;<\/span> <span class=\"nf\">len<\/span><span class=\"p\">(<\/span><span class=\"n\">bodies<\/span><span class=\"p\">)<\/span> <span class=\"k\">else<\/span> <span class=\"sh\">\"\"<\/span><span class=\"p\">,<\/span>\n          <span class=\"sh\">\"<\/span><span class=\"s\">author<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">authors<\/span><span class=\"p\">[<\/span><span class=\"n\">i<\/span><span class=\"p\">].<\/span><span class=\"nf\">get_text<\/span><span class=\"p\">(<\/span><span class=\"n\">strip<\/span><span class=\"o\">=<\/span><span class=\"bp\">True<\/span><span class=\"p\">)<\/span> <span class=\"k\">if<\/span> <span class=\"n\">i<\/span> <span class=\"o\">&lt;<\/span> <span class=\"nf\">len<\/span><span class=\"p\">(<\/span><span class=\"n\">authors<\/span><span class=\"p\">)<\/span> <span class=\"k\">else<\/span> <span class=\"sh\">\"\"<\/span><span class=\"p\">,<\/span>\n          <span class=\"sh\">\"<\/span><span class=\"s\">rating<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">ratings<\/span><span class=\"p\">[<\/span><span class=\"n\">i<\/span><span class=\"p\">].<\/span><span class=\"nf\">get_text<\/span><span class=\"p\">(<\/span><span class=\"n\">strip<\/span><span class=\"o\">=<\/span><span class=\"bp\">True<\/span><span class=\"p\">)<\/span> <span class=\"k\">if<\/span> <span class=\"n\">i<\/span> <span class=\"o\">&lt;<\/span> <span class=\"nf\">len<\/span><span class=\"p\">(<\/span><span class=\"n\">ratings<\/span><span class=\"p\">)<\/span> <span class=\"k\">else<\/span> <span class=\"sh\">\"\"<\/span>\n      <span class=\"p\">}<\/span>\n      <span class=\"n\">reviews<\/span><span class=\"p\">.<\/span><span class=\"nf\">append<\/span><span 
class=\"p\">(<\/span><span class=\"n\">review<\/span><span class=\"p\">)<\/span>\n<\/code><\/pre>\n<div class=\"highlight__panel js-actions-panel\">\n<div class=\"highlight__panel-action js-fullscreen-code-action\">\n    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-on\"><title>\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f<\/title>\n    <path d=\"M16 3h6v6h-2V5h-4V3zM2 3h6v2H4v4H2V3zm18 16v-4h2v6h-6v-2h4zM4 19h4v2H2v-6h2v4z\"\/>\n<\/svg><\/p>\n<p>    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-off\"><title>\u0627\u0632 \u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u062e\u0627\u0631\u062c \u0634\u0648\u06cc\u062f<\/title>\n    <path d=\"M18 7h4v2h-6V3h2v4zM8 9H2V7h4V3h2v6zm10 8v4h-2v-6h6v2h-4zM8 15v6H6v-4H2v-2h6z\"\/>\n<\/svg><\/p>\n<\/div>\n<\/div>\n<\/div>\n<p>\u0627\u06a9\u0646\u0648\u0646 \u060c \u062f\u0627\u062f\u0647 \u0647\u0627 \u0628\u0627\u06cc\u062f \u0627\u0632 \u0646\u0645\u0648\u0646\u0647 EC2 \u0628\u0647 \u0639\u0645\u0644\u06a9\u0631\u062f Lambda \u0645\u0646\u062a\u0642\u0644 \u0634\u0648\u0646\u062f \u062a\u0627 \u0628\u062a\u0648\u0627\u0646 \u0627\u0632 \u0637\u0631\u06cc\u0642 \u062f\u0631\u0648\u0627\u0632\u0647 API \u0628\u0627\u0632\u06af\u0631\u062f\u06cc\u062f. \u0628\u0631\u0627\u06cc \u0627\u0646\u062c\u0627\u0645 \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u060c \u0645\u0646 \u0627\u0632 \u06cc\u06a9 \u0633\u0637\u0644 S3 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u0645. 
\u0627\u06cc\u0646 \u0631\u0648\u06cc\u06a9\u0631\u062f \u0647\u0645\u0686\u0646\u06cc\u0646 \u0628\u0647 \u0622\u0646 \u0627\u062c\u0627\u0632\u0647 \u0645\u06cc \u062f\u0647\u062f \u062a\u0627 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06cc\u06a9 \u0641\u0631\u0648\u0634\u06af\u0627\u0647 \u062d\u0627\u0641\u0638\u0647 \u0646\u0647\u0627\u0646 \u0628\u0631\u0627\u06cc \u0628\u0631\u0631\u0633\u06cc \u0647\u0627\u06cc \u0642\u0628\u0644\u0627\u064b \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0634\u062f\u0647 \u0639\u0645\u0644 \u06a9\u0646\u062f.<br \/>def upload_to_s3(data, unique_file_name):<br \/>s3_client = boto3.client(&#39;s3&#39;) # \u0627\u06cc\u062c\u0627\u062f \u0645\u0634\u062a\u0631\u06cc S3<\/p>\n<div class=\"highlight js-code-highlight\">\n<pre class=\"highlight plaintext\"><code>bucket_name=\"extracted-reviews\"  # Replace with your bucket name\n\ns3_client.put_object(\n    Bucket=bucket_name,\n    Key=unique_file_name,\n    Body=json.dumps(data),  # Convert list to JSON string\n    ContentType=\"application\/json\"\n)\n\nprint(f\"Responses uploaded to s3:\/\/{bucket_name}\/{unique_file_name}\")\n<\/code><\/pre>\n<div class=\"highlight__panel js-actions-panel\">\n<div class=\"highlight__panel-action js-fullscreen-code-action\">\n    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-on\"><title>\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f<\/title>\n    <path d=\"M16 3h6v6h-2V5h-4V3zM2 3h6v2H4v4H2V3zm18 16v-4h2v6h-6v-2h4zM4 19h4v2H2v-6h2v4z\"\/>\n<\/svg><\/p>\n<p>    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-off\"><title>\u0627\u0632 
\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u062e\u0627\u0631\u062c \u0634\u0648\u06cc\u062f<\/title>\n    <path d=\"M18 7h4v2h-6V3h2v4zM8 9H2V7h4V3h2v6zm10 8v4h-2v-6h6v2h-4zM8 15v6H6v-4H2v-2h6z\"\/>\n<\/svg><\/p>\n<\/div>\n<\/div>\n<\/div>\n<p>\u0627\u06a9\u0646\u0648\u0646 \u060c \u0628\u0631\u0627\u06cc \u062a\u0631\u06a9\u06cc\u0628 \u0647\u0645\u0647 \u0686\u06cc\u0632 \u0648 \u062e\u0648\u062f\u06a9\u0627\u0631 \u06a9\u0631\u062f\u0646 \u0631\u0648\u0646\u062f \u060c \u0645\u0646 \u0627\u0632 \u0646\u0645\u0627\u06cc\u0634\u0646\u0627\u0645\u0647 \u0646\u0648\u06cc\u0633 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u0645. \u0631\u0648\u06cc \u062f\u06a9\u0645\u0647 \u06a9\u0644\u06cc\u06a9 \u0645\u06cc \u06a9\u0646\u062f \u060c \u0645\u0646\u0628\u0639 \u0635\u0641\u062d\u0647 \u0631\u0627 \u062f\u0631\u06cc\u0627\u0641\u062a \u0645\u06cc \u06a9\u0646\u062f \u060c \u0628\u0631\u0631\u0633\u06cc \u0647\u0627 \u0631\u0627 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0645\u06cc \u06a9\u0646\u062f \u0648 \u0631\u0648\u0646\u062f \u06a9\u0627\u0631 \u0631\u0627 \u062a\u06a9\u0631\u0627\u0631 \u0645\u06cc \u06a9\u0646\u062f \u062a\u0627 \u062a\u0645\u0627\u0645 \u0628\u0631\u0631\u0633\u06cc \u0647\u0627 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0634\u0648\u062f (\u0628\u0627 \u0645\u062d\u062f\u0648\u062f\u06cc\u062a \u0633\u062e\u062a 20 \u0635\u0641\u062d\u0647 \u0628\u0631\u0627\u06cc \u0627\u0637\u0645\u06cc\u0646\u0627\u0646 \u0627\u0632 \u0627\u06cc\u0646\u06a9\u0647 \u06a9\u0627\u0631\u0628\u0631 \u0645\u062c\u0628\u0648\u0631 \u0646\u06cc\u0633\u062a \u0628\u0647 \u0637\u0648\u0631 \u0646\u0627\u0645\u062d\u062f\u0648\u062f \u0645\u0646\u062a\u0638\u0631 \u0628\u0645\u0627\u0646\u062f \u060c \u0632\u06cc\u0631\u0627 \u0645\u0627 \u0627\u0632 \u062c\u0631\u06cc\u0627\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0646\u0645\u06cc \u06a9\u0646\u06cc\u0645 \u0628\u0631\u0627\u06cc 
\u062e\u0631\u0648\u062c\u06cc \u062f\u0627\u062f\u0647 \u0647\u0627 \u062f\u0631 \u067e\u0631\u0648\u0627\u0632). \u0639\u0644\u0627\u0648\u0647 \u0628\u0631 \u0627\u06cc\u0646 \u060c \u0627\u06af\u0631 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0628\u0631\u0631\u0633\u06cc \u0628\u0647 \u0647\u0631 \u062f\u0644\u06cc\u0644\u06cc \u0646\u062a\u0648\u0627\u0646\u062f \u060c \u0645\u0646 \u06cc\u06a9 \u0639\u0645\u0644\u06a9\u0631\u062f \u0628\u0631\u06af\u0634\u062a\u06cc \u0631\u0627 \u067e\u06cc\u0627\u062f\u0647 \u0633\u0627\u0632\u06cc \u06a9\u0631\u062f\u0647 \u0627\u0645 \u062a\u0627 \u0627\u0637\u0645\u06cc\u0646\u0627\u0646 \u062d\u0627\u0635\u0644 \u0634\u0648\u062f \u06a9\u0647 \u062d\u062f\u0627\u0642\u0644 \u0628\u0631\u062e\u06cc \u0627\u0632 \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0628\u0631\u0631\u0633\u06cc \u0631\u0627 \u062f\u0631 \u067e\u0627\u0633\u062e \u0628\u0627\u0632 \u0645\u06cc \u06af\u0631\u062f\u0627\u0646\u062f.<\/p>\n<div class=\"highlight js-code-highlight\">\n<pre class=\"highlight python\"><code><span class=\"k\">async<\/span> <span class=\"k\">def<\/span> <span class=\"nf\">scrape<\/span><span class=\"p\">(<\/span><span class=\"n\">url<\/span><span class=\"p\">,<\/span> <span class=\"n\">file_name<\/span><span class=\"p\">):<\/span>\n    <span class=\"k\">async<\/span> <span class=\"k\">with<\/span> <span class=\"nf\">async_playwright<\/span><span class=\"p\">()<\/span> <span class=\"k\">as<\/span> <span class=\"n\">p<\/span><span class=\"p\">:<\/span>\n        <span class=\"n\">browser<\/span> <span class=\"o\">=<\/span> <span class=\"k\">await<\/span> <span class=\"n\">p<\/span><span class=\"p\">.<\/span><span class=\"n\">chromium<\/span><span class=\"p\">.<\/span><span class=\"nf\">launch<\/span><span class=\"p\">(<\/span><span class=\"n\">headless<\/span><span class=\"o\">=<\/span><span class=\"bp\">True<\/span><span class=\"p\">)<\/span>\n        <span class=\"n\">page<\/span> <span class=\"o\">=<\/span> <span 
class=\"k\">await<\/span> <span class=\"n\">browser<\/span><span class=\"p\">.<\/span><span class=\"nf\">new_page<\/span><span class=\"p\">()<\/span>\n        <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">goto<\/span><span class=\"p\">(<\/span><span class=\"n\">url<\/span><span class=\"p\">)<\/span>\n\n        <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">wait_for_selector<\/span><span class=\"p\">(<\/span><span class=\"sh\">'<\/span><span class=\"s\">body<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>\n        <span class=\"n\">page_source<\/span> <span class=\"o\">=<\/span> <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">content<\/span><span class=\"p\">()<\/span>\n\n        <span class=\"n\">cleaned_body_content<\/span> <span class=\"o\">=<\/span> <span class=\"nf\">filter_source<\/span><span class=\"p\">(<\/span><span class=\"n\">page_source<\/span><span class=\"p\">)<\/span>\n        <span class=\"nf\">filter_css_selector<\/span><span class=\"p\">(<\/span><span class=\"n\">cleaned_body_content<\/span><span class=\"p\">)<\/span>\n\n        <span class=\"n\">dialog_close_attempt<\/span> <span class=\"o\">=<\/span> <span class=\"mi\">1<\/span>\n        <span class=\"k\">for<\/span> <span class=\"n\">elm<\/span> <span class=\"ow\">in<\/span> <span class=\"n\">next_buttons<\/span><span class=\"p\">:<\/span>\n          <span class=\"n\">count<\/span> <span class=\"o\">=<\/span> <span class=\"mi\">0<\/span>\n          <span class=\"k\">while<\/span> <span class=\"bp\">True<\/span><span class=\"p\">:<\/span>\n              <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">wait_for_selector<\/span><span class=\"p\">(<\/span><span class=\"sh\">'<\/span><span class=\"s\">body<\/span><span class=\"sh\">'<\/span><span 
class=\"p\">)<\/span>\n              <span class=\"n\">page_source<\/span> <span class=\"o\">=<\/span> <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">content<\/span><span class=\"p\">()<\/span>\n\n              <span class=\"nf\">extract_reviews<\/span><span class=\"p\">(<\/span><span class=\"n\">page_source<\/span><span class=\"p\">)<\/span>\n\n              <span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"n\">count<\/span><span class=\"p\">)<\/span>\n              <span class=\"n\">count<\/span> <span class=\"o\">+=<\/span> <span class=\"mi\">1<\/span>\n              <span class=\"nf\">if <\/span><span class=\"p\">(<\/span><span class=\"n\">count<\/span> <span class=\"o\">&gt;<\/span> <span class=\"mi\">20<\/span><span class=\"p\">):<\/span> <span class=\"k\">break<\/span>\n\n              <span class=\"k\">try<\/span><span class=\"p\">:<\/span>\n                  <span class=\"n\">next_button<\/span> <span class=\"o\">=<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">locator<\/span><span class=\"p\">(<\/span><span class=\"n\">elm<\/span><span class=\"p\">)<\/span>\n\n                  <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"n\">mouse<\/span><span class=\"p\">.<\/span><span class=\"nf\">click<\/span><span class=\"p\">(<\/span><span class=\"n\">x<\/span><span class=\"o\">=<\/span><span class=\"mi\">0<\/span><span class=\"p\">,<\/span> <span class=\"n\">y<\/span><span class=\"o\">=<\/span><span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"n\">viewport_size<\/span><span class=\"p\">[<\/span><span class=\"sh\">'<\/span><span class=\"s\">height<\/span><span class=\"sh\">'<\/span><span class=\"p\">]<\/span> <span class=\"o\">\/\/<\/span> <span class=\"mi\">2<\/span><span class=\"p\">)<\/span>\n\n                  <span class=\"k\">await<\/span> <span 
class=\"n\">asyncio<\/span><span class=\"p\">.<\/span><span class=\"nf\">wait_for<\/span><span class=\"p\">(<\/span><span class=\"n\">next_button<\/span><span class=\"p\">.<\/span><span class=\"nf\">click<\/span><span class=\"p\">(),<\/span> <span class=\"n\">timeout<\/span><span class=\"o\">=<\/span><span class=\"mi\">5<\/span><span class=\"p\">)<\/span>\n\n                  <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">wait_for_load_state<\/span><span class=\"p\">(<\/span><span class=\"sh\">'<\/span><span class=\"s\">networkidle<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>  \n                  <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">wait_for_selector<\/span><span class=\"p\">(<\/span><span class=\"sh\">'<\/span><span class=\"s\">body<\/span><span class=\"sh\">'<\/span><span class=\"p\">)<\/span>  \n\n              <span class=\"k\">except<\/span> <span class=\"n\">asyncio<\/span><span class=\"p\">.<\/span><span class=\"nb\">TimeoutError<\/span><span class=\"p\">:<\/span>\n                  <span class=\"k\">break<\/span>\n              <span class=\"k\">except<\/span> <span class=\"nb\">Exception<\/span> <span class=\"k\">as<\/span> <span class=\"n\">e<\/span><span class=\"p\">:<\/span>\n                <span class=\"nf\">print<\/span><span class=\"p\">(<\/span><span class=\"sh\">\"<\/span><span class=\"s\">Bro, error with pagination? 
<\/span><span class=\"sh\">\"<\/span><span class=\"p\">,<\/span> <span class=\"n\">e<\/span><span class=\"p\">)<\/span>\n                <span class=\"k\">break<\/span>\n\n        <span class=\"c1\">#Handle infinite scroll\n<\/span>        <span class=\"n\">prev_height<\/span> <span class=\"o\">=<\/span> <span class=\"o\">-<\/span><span class=\"mi\">1<\/span>\n        <span class=\"n\">max_scrolls<\/span> <span class=\"o\">=<\/span> <span class=\"mi\">20<\/span>  <span class=\"c1\"># Set a maximum number of scrolls to prevent infinite loops\n<\/span>        <span class=\"n\">scroll_count<\/span> <span class=\"o\">=<\/span> <span class=\"mi\">0<\/span>\n\n        <span class=\"k\">while<\/span> <span class=\"n\">scroll_count<\/span> <span class=\"o\">&lt;<\/span> <span class=\"n\">max_scrolls<\/span><span class=\"p\">:<\/span>\n            <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">evaluate<\/span><span class=\"p\">(<\/span><span class=\"sh\">\"<\/span><span class=\"s\">window.scrollTo(0, document.body.scrollHeight)<\/span><span class=\"sh\">\"<\/span><span class=\"p\">)<\/span>\n            <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">wait_for_timeout<\/span><span class=\"p\">(<\/span><span class=\"mi\">200<\/span><span class=\"p\">)<\/span>\n            <span class=\"n\">new_height<\/span> <span class=\"o\">=<\/span> <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">evaluate<\/span><span class=\"p\">(<\/span><span class=\"sh\">\"<\/span><span class=\"s\">document.body.scrollHeight<\/span><span class=\"sh\">\"<\/span><span class=\"p\">)<\/span>\n\n            <span class=\"k\">if<\/span> <span class=\"n\">new_height<\/span> <span class=\"o\">==<\/span> <span class=\"n\">prev_height<\/span><span class=\"p\">:<\/span>\n                <span class=\"k\">break<\/span> \n\n            
<span class=\"n\">prev_height<\/span> <span class=\"o\">=<\/span> <span class=\"n\">new_height<\/span>  \n            <span class=\"n\">scroll_count<\/span> <span class=\"o\">+=<\/span> <span class=\"mi\">1<\/span>  \n\n        <span class=\"n\">page_source<\/span> <span class=\"o\">=<\/span> <span class=\"k\">await<\/span> <span class=\"n\">page<\/span><span class=\"p\">.<\/span><span class=\"nf\">content<\/span><span class=\"p\">()<\/span>\n        <span class=\"nf\">extract_reviews<\/span><span class=\"p\">(<\/span><span class=\"n\">page_source<\/span><span class=\"p\">)<\/span>\n\n        <span class=\"nf\">if <\/span><span class=\"p\">(<\/span><span class=\"nf\">len<\/span><span class=\"p\">(<\/span><span class=\"n\">reviews<\/span><span class=\"p\">)<\/span> <span class=\"o\">==<\/span> <span class=\"mi\">0<\/span><span class=\"p\">):<\/span>\n          <span class=\"nf\">fallback_review_extraction<\/span><span class=\"p\">(<\/span><span class=\"n\">cleaned_body_content<\/span><span class=\"p\">)<\/span>\n          <span class=\"n\">fallback_reviews<\/span><span class=\"p\">[<\/span><span class=\"sh\">\"<\/span><span class=\"s\">reviews_count<\/span><span class=\"sh\">\"<\/span><span class=\"p\">]<\/span> <span class=\"o\">=<\/span> <span class=\"nf\">len<\/span><span class=\"p\">(<\/span><span class=\"n\">fallback_reviews<\/span><span class=\"p\">[<\/span><span class=\"sh\">\"<\/span><span class=\"s\">reviews<\/span><span class=\"sh\">\"<\/span><span class=\"p\">])<\/span>\n          <span class=\"nf\">upload_to_s3<\/span><span class=\"p\">(<\/span><span class=\"n\">fallback_reviews<\/span><span class=\"p\">,<\/span> <span class=\"n\">file_name<\/span><span class=\"p\">)<\/span>\n          <span class=\"c1\"># print(fallback_reviews)\n<\/span>        <span class=\"k\">else<\/span><span class=\"p\">:<\/span>\n          <span class=\"n\">reviews_dict<\/span> <span class=\"o\">=<\/span> <span class=\"p\">{<\/span><span class=\"sh\">\"<\/span><span 
class=\"s\">reviews_count<\/span><span class=\"sh\">\"<\/span> <span class=\"p\">:<\/span> <span class=\"nf\">len<\/span><span class=\"p\">(<\/span><span class=\"n\">reviews<\/span><span class=\"p\">),<\/span> <span class=\"sh\">\"<\/span><span class=\"s\">reviews<\/span><span class=\"sh\">\"<\/span><span class=\"p\">:<\/span> <span class=\"n\">reviews<\/span><span class=\"p\">}<\/span>\n          <span class=\"c1\"># print(reviews_dict)\n<\/span>          <span class=\"nf\">upload_to_s3<\/span><span class=\"p\">(<\/span><span class=\"n\">reviews_dict<\/span><span class=\"p\">,<\/span> <span class=\"n\">file_name<\/span><span class=\"p\">)<\/span>\n<\/code><\/pre>\n<div class=\"highlight__panel js-actions-panel\">\n<div class=\"highlight__panel-action js-fullscreen-code-action\">\n    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-on\"><title>\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f<\/title>\n    <path d=\"M16 3h6v6h-2V5h-4V3zM2 3h6v2H4v4H2V3zm18 16v-4h2v6h-6v-2h4zM4 19h4v2H2v-6h2v4z\"\/>\n<\/svg><\/p>\n<p>    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-off\"><title>\u0627\u0632 \u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u062e\u0627\u0631\u062c \u0634\u0648\u06cc\u062f<\/title>\n    <path d=\"M18 7h4v2h-6V3h2v4zM8 9H2V7h4V3h2v6zm10 8v4h-2v-6h6v2h-4zM8 15v6H6v-4H2v-2h6z\"\/>\n<\/svg><\/p>\n<\/div>\n<\/div>\n<\/div>\n<h2><span class=\"ez-toc-section\" id=\"%DA%86%D8%A7%D9%84%D8%B4_%D9%87%D8%A7%DB%8C_%D8%B1%D9%88%D8%A8%D8%B1%D9%88\"><\/span>\n<p>  \u0686\u0627\u0644\u0634 \u0647\u0627\u06cc \u0631\u0648\u0628\u0631\u0648<br \/>\n<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<ul>\n<li>\u0633\u0647 
\u0686\u0627\u0644\u0634 \u0645\u0646 \u0647\u0646\u06af\u0627\u0645 \u0627\u0646\u062a\u062e\u0627\u0628 LLM \u0628\u0627 \u0622\u0646 \u0631\u0648\u0628\u0631\u0648 \u0634\u062f\u0645: \u0627\u0648\u0644 \u060c \u0627\u06cc\u0646 \u0645\u0642\u0627\u062f\u06cc\u0631 \u0645\u062b\u0628\u062a \u06a9\u0627\u0630\u0628 \u0631\u0627 \u0628\u0631\u0645\u06cc \u06af\u0631\u062f\u0627\u0646\u062f \u060c \u0648 \u062f\u0648\u0645 \u060c \u06a9\u062f \u0645\u0646\u0628\u0639 \u062f\u0631 \u0645\u062a\u0646 \u0648\u0631\u0648\u062f\u06cc \u0648 \u0633\u0648\u0645 \u060c \u0639\u0645\u0644\u06a9\u0631\u062f \u0642\u0631\u0627\u0631 \u0646\u0645\u06cc \u06af\u0631\u0641\u062a. \u0645\u0646 \u0686\u0646\u062f\u06cc\u0646 \u0645\u062f\u0644 \u0631\u0627\u06cc\u06af\u0627\u0646 \u06cc\u0639\u0646\u06cc Llama \u060c Mistral \u0648 Qwen \u0631\u0627 \u0627\u0645\u062a\u062d\u0627\u0646 \u06a9\u0631\u062f\u0645 \u060c \u0627\u0645\u0627 \u0647\u0631\u06a9\u062f\u0627\u0645 \u06a9\u0627\u0633\u062a\u06cc \u0647\u0627\u06cc \u062e\u0648\u062f \u0631\u0627 \u062f\u0627\u0634\u062a\u0646\u062f. \u0628\u0631\u062e\u06cc \u0627\u0632 \u0622\u0646\u0647\u0627 \u0627\u0646\u062f\u0627\u0632\u0647 \u062a\u0648\u06a9\u0646 \u0648\u0631\u0648\u062f\u06cc \u0628\u0633\u06cc\u0627\u0631 \u06a9\u0645\u06cc \u062f\u0627\u0634\u062a\u0646\u062f \u060c \u0628\u0631\u062e\u06cc \u0627\u0632 \u0622\u0646\u0647\u0627 \u062a\u0648\u0644\u06cc\u062f \u062a\u0635\u0627\u062f\u0641\u06cc (\u0645\u062b\u0628\u062a \u06a9\u0627\u0630\u0628) \u062a\u0648\u0644\u06cc\u062f \u0645\u06cc \u06a9\u0631\u062f\u0646\u062f \u0648 \u0628\u0631\u062e\u06cc \u062f\u06cc\u06af\u0631 \u0647\u0646\u06af\u0627\u0645 \u067e\u062e\u062a \u0648 \u067e\u0632 \u0645\u0648\u0627\u062f \u063a\u0630\u0627\u06cc\u06cc \u0628\u0647 \u0627\u0646\u062f\u0627\u0632\u0647 \u0645\u0646 \u06a9\u0646\u062f \u0628\u0648\u062f\u0646\u062f. 
&#8220;Gemini 1.5 Flash&#8221; \u0628\u0647\u062a\u0631\u06cc\u0646 \u0628\u0647 \u0646\u0638\u0631 \u0645\u06cc \u0631\u0633\u062f \u060c \u0628\u0627 \u0632\u0645\u0627\u0646 \u067e\u0627\u0633\u062e \u0627\u0632 1.5 \u062b\u0627\u0646\u06cc\u0647 \u062a\u0627 10 \u062b\u0627\u0646\u06cc\u0647 (\u0628\u0631\u0627\u06cc \u0628\u06cc\u0634\u062a\u0631 \u0645\u0648\u0627\u0631\u062f) \u060c \u062a\u0648\u0644\u06cc\u062f \u0645\u0642\u0627\u062f\u06cc\u0631 \u062f\u0642\u06cc\u0642 (\u0646\u0647 \u0647\u0645\u06cc\u0634\u0647 \u0628\u0644\u06a9\u0647 \u0628\u0647\u062a\u0631 \u0627\u0632 \u0633\u0627\u06cc\u0631\u06cc\u0646) \u060c \u06cc\u06a9 \u0627\u0646\u062f\u0627\u0632\u0647 \u0648\u0631\u0648\u062f\u06cc \u0639\u0638\u06cc\u0645 \u062a\u0627 1 \u0645\u06cc\u0644\u06cc\u0648\u0646 (PS: \u0645\u0646 \u062f\u0631 \u0622\u0646 \u0632\u0645\u0627\u0646 \u062f\u0631 \u0647\u0646\u06af\u0627\u0645 \u0633\u0627\u062e\u062a \u067e\u0631\u0648\u0698\u0647 \u0647\u06cc\u0686 \u0627\u06cc\u062f\u0647 \u0627\u06cc \u062f\u0631 \u0645\u0648\u0631\u062f Deepseek \u0646\u062f\u0627\u0634\u062a\u0645.)<\/li>\n<li>\u06cc\u06a9 \u06a9\u0627\u062f\u0631 \u06af\u0641\u062a\u06af\u0648 \u0628\u0647 \u0637\u0648\u0631 \u062a\u0635\u0627\u062f\u0641\u06cc \u0638\u0627\u0647\u0631 \u0645\u06cc \u0634\u0648\u062f \u0648 \u062f\u06a9\u0645\u0647 &#8220;\u0628\u0639\u062f\u06cc&#8221; \u0631\u0627 \u0645\u0633\u062f\u0648\u062f \u0645\u06cc \u06a9\u0646\u062f. 
\u0628\u0631\u0627\u06cc \u062c\u0644\u0648\u06af\u06cc\u0631\u06cc \u0627\u0632 \u0627\u06cc\u0646 \u06a9\u0627\u0631 \u060c \u0642\u0628\u0644 \u0627\u0632 \u06a9\u0644\u06cc\u06a9 \u0628\u0631 \u0631\u0648\u06cc \u0647\u0631 \u062f\u06a9\u0645\u0647 \u060c \u0645\u0646 \u0627\u0637\u0645\u06cc\u0646\u0627\u0646 \u062d\u0627\u0635\u0644 \u0645\u06cc \u06a9\u0646\u0645 \u06a9\u0647 \u0628\u0631 \u0631\u0648\u06cc \u0645\u062e\u062a\u0635\u0627\u062a x = 0 \u060c y = 50 \u06a9\u0644\u06cc\u06a9 \u06a9\u0646\u06cc\u062f \u062a\u0627 \u0645\u0637\u0645\u0626\u0646 \u0634\u0648\u06cc\u062f \u06a9\u0647 \u06a9\u0627\u062f\u0631 \u06af\u0641\u062a\u06af\u0648 \u0642\u0628\u0644 \u0627\u0632 \u06a9\u0644\u06cc\u06a9 \u0628\u0631 \u0631\u0648\u06cc \u062f\u06a9\u0645\u0647 &#8220;\u0628\u0639\u062f\u06cc&#8221; \u0646\u0627\u067e\u062f\u06cc\u062f \u0645\u06cc \u0634\u0648\u062f.<\/li>\n<li>\u0627\u0632 \u0622\u0646\u062c\u0627 \u06a9\u0647 \u0646\u0645\u0627\u06cc\u0634\u0646\u0627\u0645\u0647 \u0646\u0648\u06cc\u0633 \u0631\u0648\u06cc \u06a9\u0631\u0648\u0645 \u06a9\u0627\u0631 \u0645\u06cc \u06a9\u0646\u062f \u060c \u0628\u0647 \u0637\u0648\u0631 \u0628\u0648\u0645\u06cc \u062a\u0648\u0633\u0637 \u062a\u0648\u0627\u0628\u0639 \u0644\u0627\u0645\u0628\u062f\u0627 \u067e\u0634\u062a\u06cc\u0628\u0627\u0646\u06cc \u0646\u0645\u06cc \u0634\u0648\u062f. \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u060c EC2 \u0628\u0647 \u0639\u0646\u0648\u0627\u0646 \u06cc\u06a9 \u0631\u0627\u0647 \u062d\u0644 \u062f\u0633\u062a\u06cc \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0634\u062f. 
\u062e\u062f\u0645\u0627\u062a \u0634\u062e\u0635 \u062b\u0627\u0644\u062b \u062f\u06cc\u06af\u0631\u06cc \u0628\u0631\u0627\u06cc \u0627\u062c\u0631\u0627\u06cc \u0645\u0634\u0627\u063a\u0644 \u0627\u062a\u0648\u0645\u0627\u0633\u06cc\u0648\u0646 \u062f\u0631 \u062f\u0633\u062a\u0631\u0633 \u0627\u0633\u062a \u060c \u0627\u0645\u0627 \u0622\u0646\u0647\u0627 \u0628\u0647 \u0647\u0632\u06cc\u0646\u0647 \u0647\u0627\u06cc \u0627\u0636\u0627\u0641\u06cc \u0646\u06cc\u0627\u0632 \u062f\u0627\u0631\u0646\u062f.<\/li>\n<li>\u0627\u0646\u062a\u0642\u0627\u0644 \u062f\u0627\u062f\u0647 \u0647\u0627 \u0627\u0632 EC2 \u0628\u0647 Lambda \u0628\u0647 \u0637\u0648\u0631 \u0645\u0633\u062a\u0642\u06cc\u0645 \u067e\u0634\u062a\u06cc\u0628\u0627\u0646\u06cc \u0646\u0645\u06cc \u0634\u0648\u062f \u060c \u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u0645\u062c\u0628\u0648\u0631 \u0634\u062f\u0645 \u0627\u0632 S3 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u0645 (\u0627\u06af\u0631\u0686\u0647 \u0628\u0647 \u062f\u0644\u06cc\u0644 \u062e\u0648\u0627\u0646\u062f\u0646 \u0648 \u0646\u0648\u0634\u062a\u0646 \u0639\u0645\u0644\u06cc\u0627\u062a \u0631\u0648\u06cc \u0633\u0637\u0644 S3 \u0628\u0647 \u0647\u0632\u06cc\u0646\u0647 \u0627\u0636\u0627\u0641\u0647 \u0645\u06cc \u06a9\u0646\u062f).<\/li>\n<li>AWS API Gateway 29 \u062b\u0627\u0646\u06cc\u0647 \u067e\u06cc\u0634 \u0641\u0631\u0636 \u062f\u0627\u0631\u062f \u0648 \u0632\u0645\u0627\u0646 \u0627\u062c\u0631\u0627 \u062e\u0637 \u0644\u0648\u0644\u0647 \u0645\u06cc \u062a\u0648\u0627\u0646\u062f \u0627\u0632 29 \u062b\u0627\u0646\u06cc\u0647 \u0641\u0631\u0627\u062a\u0631 \u0631\u0648\u062f. 
\u0628\u0646\u0627\u0628\u0631\u0627\u06cc\u0646 \u060c \u0645\u0646 \u0628\u0627\u06cc\u062f \u0627\u0632 \u0637\u0631\u06cc\u0642 &#8220;\u0633\u0647\u0645\u06cc\u0647 \u062e\u062f\u0645\u0627\u062a&#8221; \u062f\u0631 AWS \u060c \u0632\u0645\u0627\u0646 \u0631\u0627 \u0628\u0647 2 \u062f\u0642\u06cc\u0642\u0647 \u0627\u0641\u0632\u0627\u06cc\u0634 \u062f\u0647\u0645.<\/li>\n<\/ul>\n<div class=\"ltag-github-readme-tag\">\n<div class=\"ltag-github-body\">\n<div id=\"readme\" class=\"md\" data-path=\"README.md\">\n<article class=\"markdown-body entry-content container-lg\" itemprop=\"text\">\n<p><h2 class=\"heading-element\" dir=\"auto\"><span class=\"ez-toc-section\" id=\"%D9%86%D8%B3%D8%AE%D9%87_%D8%A2%D8%B2%D9%85%D8%A7%DB%8C%D8%B4%DB%8C\"><\/span>\u0646\u0633\u062e\u0647 \u0622\u0632\u0645\u0627\u06cc\u0634\u06cc<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<\/p>\n<p dir=\"auto\">\u0648\u0628 \u0633\u0627\u06cc\u062a \u0632\u0646\u062f\u0647: https:\/\/serene-kitten-5a66fb.netlify.app\/<\/p>\n<details open=\"\" class=\"details-reset border rounded-2\">\n<summary class=\"px-3 py-2\">\n    <svg aria-hidden=\"true\" height=\"16\" viewbox=\"0 0 16 16\" version=\"1.1\" width=\"16\" data-view-component=\"true\" class=\"octicon octicon-device-camera-video\">\n<\/svg><br \/>\n    <span aria-label=\"Video description demo.mp4\" class=\"m-1\">demo.mp4<\/span><br \/>\n  <\/summary>\n<p>  <video 
src=\"https:\/\/private-user-images.githubusercontent.com\/27368177\/404730752-94e735fe-738e-42c1-89b4-a41e1063a14c.mp4?jwt=eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJpc3MiOiJnaXRodWIuY29tIiwiYXVkIjoicmF3LmdpdGh1YnVzZXJjb250ZW50LmNvbSIsImtleSI6ImtleTUiLCJleHAiOjE3Mzg1MzQ0NjUsIm5iZiI6MTczODUzNDE2NSwicGF0aCI6Ii8yNzM2ODE3Ny80MDQ3MzA3NTItOTRlNzM1ZmUtNzM4ZS00MmMxLTg5YjQtYTQxZTEwNjNhMTRjLm1wND9YLUFtei1BbGdvcml0aG09QVdTNC1ITUFDLVNIQTI1NiZYLUFtei1DcmVkZW50aWFsPUFLSUFWQ09EWUxTQTUzUFFLNFpBJTJGMjAyNTAyMDIlMkZ1cy1lYXN0LTElMkZzMyUyRmF3czRfcmVxdWVzdCZYLUFtei1EYXRlPTIwMjUwMjAyVDIyMDkyNVomWC1BbXotRXhwaXJlcz0zMDAmWC1BbXotU2lnbmF0dXJlPWVhYTZkYmRlODgzYjA0MmRkOGRmNTg3MWIzNmRmYzNmODg3ZDk0MjM2YjJmMzQ3NDM1MTlhODRiNzdjZTExZDEmWC1BbXotU2lnbmVkSGVhZGVycz1ob3N0In0.PRCX19ivNRXUp9QRUZ_wYzajGPLI4OBJ-Hetta9LBrw\" data-canonical-src=\"https:\/\/private-user-images.githubusercontent.com\/27368177\/404730752-94e735fe-738e-42c1-89b4-a41e1063a14c.mp4?jwt=eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJpc3MiOiJnaXRodWIuY29tIiwiYXVkIjoicmF3LmdpdGh1YnVzZXJjb250ZW50LmNvbSIsImtleSI6ImtleTUiLCJleHAiOjE3Mzg1MzQ0NjUsIm5iZiI6MTczODUzNDE2NSwicGF0aCI6Ii8yNzM2ODE3Ny80MDQ3MzA3NTItOTRlNzM1ZmUtNzM4ZS00MmMxLTg5YjQtYTQxZTEwNjNhMTRjLm1wND9YLUFtei1BbGdvcml0aG09QVdTNC1ITUFDLVNIQTI1NiZYLUFtei1DcmVkZW50aWFsPUFLSUFWQ09EWUxTQTUzUFFLNFpBJTJGMjAyNTAyMDIlMkZ1cy1lYXN0LTElMkZzMyUyRmF3czRfcmVxdWVzdCZYLUFtei1EYXRlPTIwMjUwMjAyVDIyMDkyNVomWC1BbXotRXhwaXJlcz0zMDAmWC1BbXotU2lnbmF0dXJlPWVhYTZkYmRlODgzYjA0MmRkOGRmNTg3MWIzNmRmYzNmODg3ZDk0MjM2YjJmMzQ3NDM1MTlhODRiNzdjZTExZDEmWC1BbXotU2lnbmVkSGVhZGVycz1ob3N0In0.PRCX19ivNRXUp9QRUZ_wYzajGPLI4OBJ-Hetta9LBrw\" controls=\"controls\" muted=\"muted\" class=\"d-block rounded-bottom-2 border-top width-fit\" style=\"max-height:640px; min-height: 200px\"><\/p>\n<p>  <\/video><br \/>\n<\/details>\n<hr\/>\n<p><h2 class=\"heading-element\" dir=\"auto\"><span class=\"ez-toc-section\" id=\"%D9%86%D9%82%D8%A7%D8%B7_%D9%BE%D8%A7%DB%8C%D8%A7%D9%86%DB%8C_API\"><\/span>\u0646\u0642\u0627\u0637 
\u067e\u0627\u06cc\u0627\u0646\u06cc API<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<\/p>\n<p dir=\"auto\">https:\/\/wb6nvu1fl1.execute-api.ap-south-1.amazonaws.com\/dev\/api\/reviews?page={product_url}<\/p>\n<div class=\"markdown-alert markdown-alert-note\" dir=\"auto\">\n<p class=\"markdown-alert-title\" dir=\"auto\">\u06cc\u0627\u062f\u062f\u0627\u0634\u062a<\/p>\n<p dir=\"auto\">\u062d\u062a\u0645\u0627\u064b URL \u06a9\u0627\u0645\u0644 \u0631\u0627 \u062f\u0631 \u067e\u0627\u0631\u0627\u0645\u062a\u0631 \u067e\u0631\u0633 \u0648 \u062c\u0648 \u0645\u0627\u0646\u0646\u062f \u0627\u06cc\u0646 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f: <code>?page=https:\/\/www.example.com<\/code><\/p>\n<\/div>\n<p dir=\"auto\">\u067e\u0627\u0633\u062e:<\/p>\n<div class=\"highlight highlight-source-json notranslate position-relative overflow-auto js-code-highlight\" dir=\"auto\" data-snippet-clipboard-copy-content=\"{&#10;    \" statuscode=\"\">\n<pre>{\n    <span class=\"pl-ent\">\"statusCode\"<\/span>: \n    <span class=\"pl-ent\">\"reviews_count\"<\/span>: ,\n    <span class=\"pl-ent\">\"reviews\"<\/span>: [\n        {\n            <span class=\"pl-ent\">\"title\"<\/span>: <span class=\"pl-s\"><span class=\"pl-pds\">\"<\/span><span class=\"pl-pds\">\"<\/span><\/span>,\n            <span class=\"pl-ent\">\"body\"<\/span>: <span class=\"pl-s\"><span class=\"pl-pds\">\"<\/span><span class=\"pl-pds\">\"<\/span><\/span>,\n            <span class=\"pl-ent\">\"author\"<\/span>: <span class=\"pl-s\"><span class=\"pl-pds\">\"<\/span><span class=\"pl-pds\">\"<\/span><\/span>,\n            <span class=\"pl-ent\">\"rating\"<\/span>: <span class=\"pl-s\"><span class=\"pl-pds\">\"<\/span><span class=\"pl-pds\">\"<\/span><\/span>\n        },\n    ]\n}<\/pre>\n<div class=\"highlight__panel js-actions-panel\">\n<div class=\"highlight__panel-action js-fullscreen-code-action\">\n    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 
24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-on\"><title>\u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u0631\u0627 \u0648\u0627\u0631\u062f \u06a9\u0646\u06cc\u062f<\/title>\n    <path d=\"M16 3h6v6h-2V5h-4V3zM2 3h6v2H4v4H2V3zm18 16v-4h2v6h-6v-2h4zM4 19h4v2H2v-6h2v4z\"\/>\n<\/svg><\/p>\n<p>    <svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"20px\" height=\"20px\" viewbox=\"0 0 24 24\" class=\"highlight-action crayons-icon highlight-action--fullscreen-off\"><title>\u0627\u0632 \u062d\u0627\u0644\u062a \u062a\u0645\u0627\u0645 \u0635\u0641\u062d\u0647 \u062e\u0627\u0631\u062c \u0634\u0648\u06cc\u062f<\/title>\n    <path d=\"M18 7h4v2h-6V3h2v4zM8 9H2V7h4V3h2v6zm10 8v4h-2v-6h6v2h-4zM8 15v6H6v-4H2v-2h6z\"\/>\n<\/svg><\/p>\n<\/div>\n<\/div>\n<\/div>\n<hr\/>\n<p><h2 class=\"heading-element\" dir=\"auto\"><span class=\"ez-toc-section\" id=\"%DA%AF%D8%B1%D8%AF%D8%B4_%DA%A9%D8%A7%D8%B1\"><\/span>\u06af\u0631\u062f\u0634 \u06a9\u0627\u0631<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<\/p>\n<p><markdown-accessiblity-table><\/p>\n<div class=\"table-wrapper-paragraph\">\n<table>\n<\/p>\n<thead>\n<\/p>\n<tr>\n<\/p>\n<th align=\"center\"><img decoding=\"async\" alt=\"\u062c\u0631\u06cc\u0627\u0646 -2\" src=\"max-width: 100%;\" loading=\"lazy\" title=\"\"><\/th>\n<p><\/tr>\n<p><\/thead>\n<p><\/p>\n<tbody>\n<\/p>\n<tr>\n<\/p>\n<td align=\"center\"><em>\u062e\u0637 \u0644\u0648\u0644\u0647 V2 (\u062c\u0631\u06cc\u0627\u0646)<\/em><\/td>\n<p><\/tr>\n<p><\/tbody>\n<p><\/table>\n<\/div>\n<p><\/markdown-accessiblity-table><br \/><markdown-accessiblity-table><\/p>\n<div class=\"table-wrapper-paragraph\">\n<table>\n<\/p>\n<thead>\n<\/p>\n<tr>\n<\/p>\n<th align=\"center\"><img decoding=\"async\" alt=\"\u062c\u0631\u06cc\u0627\u0646\" src=\"max-width: 100%;\" loading=\"lazy\" title=\"\"><\/th>\n<p><\/tr>\n<p><\/thead>\n<p><\/p>\n<tbody>\n<\/p>\n<tr>\n<\/p>\n<td align=\"center\"><em>\u062e\u0637 \u0644\u0648\u0644\u0647 
\u062a\u0627\u062e\u06cc\u0631<\/em><\/td>\n<p><\/tr>\n<p><\/tbody>\n<p><\/table>\n<\/div>\n<p><\/markdown-accessiblity-table><\/p>\n<p><h4 class=\"heading-element\" dir=\"auto\"><span class=\"ez-toc-section\" id=\"%D9%81%D9%86_%D8%A2%D9%88%D8%B1%DB%8C_%D9%87%D8%A7%DB%8C_%D9%85%D9%88%D8%B1%D8%AF_%D8%A7%D8%B3%D8%AA%D9%81%D8%A7%D8%AF%D9%87\"><\/span>\u0641\u0646 \u0622\u0648\u0631\u06cc \u0647\u0627\u06cc \u0645\u0648\u0631\u062f \u0627\u0633\u062a\u0641\u0627\u062f\u0647:<span class=\"ez-toc-section-end\"><\/span><\/h4>\n<\/p>\n<ul dir=\"auto\">\n<li>Backend: AWS Lambda \u060c EC2 \u060c API Gateway \u060c S3<\/li>\n<li>\u0641\u06cc\u0644\u0645\u0646\u0627\u0645\u0647: \u067e\u0627\u06cc\u062a\u0648\u0646 (\u0633\u0648\u067e \u0632\u06cc\u0628\u0627 \u060c \u0646\u0645\u0627\u06cc\u0634\u0646\u0627\u0645\u0647 \u0646\u0648\u06cc\u0633)<\/li>\n<li>LLM: GEMINI-1.5-FLASH<\/li>\n<li>Frontend: Next.js<\/li>\n<\/ul>\n<p><h4 class=\"heading-element\" dir=\"auto\"><span class=\"ez-toc-section\" id=\"%D9%85%D8%A4%D9%84%D9%81%D9%87_%D9%87%D8%A7\"><\/span>\u0645\u0624\u0644\u0641\u0647 \u0647\u0627:<span class=\"ez-toc-section-end\"><\/span><\/h4>\n<\/p>\n<ul dir=\"auto\">\n<li>\n<p><em>\u0641\u06cc\u0644\u062a\u0631 \u0645\u062d\u062a\u0648\u0627\u06cc HTML:<\/em> \u0627\u06cc\u0646 \u0641\u0631\u0627\u06cc\u0646\u062f \u0628\u0627 \u067e\u0630\u06cc\u0631\u0634 URL \u0635\u0641\u062d\u0647 \u0648\u0628 \u060c \u0641\u06cc\u0644\u062a\u0631 \u06a9\u0631\u062f\u0646 \u06a9\u062f \u0645\u0646\u0628\u0639 \u0622\u0646 \u0628\u0627 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0627\u0632 \u0622\u0646 \u0622\u063a\u0627\u0632 \u0645\u06cc \u0634\u0648\u062f <code>Beautiful Soup<\/code> \u0628\u0631\u0627\u06cc \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0645\u062d\u062a\u0648\u0627\u06cc \u0645\u0639\u0646\u06cc \u062f\u0627\u0631 \u062f\u0631 \u062d\u0627\u0644\u06cc \u06a9\u0647 \u0639\u0646\u0627\u0635\u0631 \u0628\u06cc \u0631\u0628\u0637 \u0631\u0627 \u062f\u0648\u0631 
\u0645\u06cc \u0632\u0646\u06cc\u062f \u062a\u0627 \u0642\u0628\u0644 \u0627\u0632 \u0627\u0646\u062a\u0642\u0627\u0644 \u0622\u0646 \u0628\u0647 LLM \u060c \u0627\u0646\u062f\u0627\u0632\u0647 \u0646\u0634\u0627\u0646\u0647 \u0631\u0627 \u06a9\u0627\u0647\u0634 \u062f\u0647\u06cc\u062f.<\/li>\n<li>\n<p><em>\u0627\u0633\u062a\u062e\u0631\u0627\u062c \u06a9\u0644\u0627\u0633 \u0631\u0627 \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u06a9\u0646\u06cc\u062f:<\/em> \u0628\u0631\u0627\u06cc \u062e\u0648\u062f\u06a9\u0627\u0631 \u0633\u0627\u0632\u06cc \u0627\u0642\u062f\u0627\u0645\u0627\u062a\u06cc \u0645\u0627\u0646\u0646\u062f \u0635\u0641\u062d\u0647 \u0628\u0646\u062f\u06cc \u060c \u0628\u0631\u0631\u0633\u06cc \u0647\u0627\u06cc \u062e\u0627\u0631\u062c \u0627\u0632 \u06a9\u0634\u0648\u0631 \u060c \u0645\u0627 \u0628\u0647 \u0627\u0646\u062a\u062e\u0627\u0628 \u06a9\u0644\u0627\u0633 \u0646\u06cc\u0627\u0632 \u062f\u0627\u0631\u06cc\u0645 \u062a\u0627 \u0628\u0627 \u0628\u0631\u0646\u0627\u0645\u0647 \u0647\u0627\u06cc \u0635\u0641\u062d\u0647 \u0628\u0647 \u0635\u0648\u0631\u062a \u0628\u0631\u0646\u0627\u0645\u0647 \u0627\u06cc \u062f\u0631 \u062a\u0639\u0627\u0645\u0644 \u0628\u0627\u0634\u062f \u0648 \u0627\u0632 \u0622\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u06a9\u0646\u062f \u060c \u0627\u0632 \u0622\u0646 \u0627\u0633\u062a\u0641\u0627\u062f\u0647 \u0645\u06cc \u06a9\u0646\u062f <code>Gemini-1.5-flash<\/code> \u0645\u062f\u0644.<\/li>\n<li>\n<p><em>\u0627\u062a\u0648\u0645\u0627\u0633\u06cc\u0648\u0646 \u0645\u0631\u0648\u0631\u06af\u0631:<\/em> \u2026<\/li>\n<\/ul>\n<\/article>\n<\/div>\n<p>\n  <\/div>\n<\/div>\n<p>\u0628\u0627 \u062a\u0634\u06a9\u0631 \u0627\u0632 \u062e\u0648\u0627\u0646\u062f\u0646<\/p>\n<\/p><\/div>\n","protected":false},"excerpt":{"rendered":"<p>\u0628\u06cc\u0627\u0646\u06cc\u0647 \u0645\u0634\u06a9\u0644 \u0627\u0644\u0632\u0627\u0645 \u0627\u06cc\u0646 \u0628\u0631\u0646\u0627\u0645\u0647 
\u0627\u0633\u062a\u062e\u0631\u0627\u062c \u062f\u0627\u062f\u0647 \u0647\u0627\u06cc \u0645\u0631\u0648\u0631 \u0627\u0632 \u0648\u0628 \u0633\u0627\u06cc\u062a \u0647\u0627\u06cc \u0645\u062d\u0635\u0648\u0644 \u0627\u0633\u062a \u06a9\u0647 \u062f\u0631 \u0628\u062e\u0634 \u0628\u0631\u0631\u0633\u06cc \u0635\u0641\u062d\u0647 \u0628\u0646\u062f\u06cc \u062f\u0627\u0631\u0646\u062f \u0648 \u0646\u06cc\u0627\u0632 \u0628\u0647 \u067e\u0634\u062a\u06cc\u0628\u0627\u0646\u06cc \u062c\u0647\u0627\u0646\u06cc \u0628\u0631\u0627\u06cc \u0647\u0645\u0647 \u0646\u0648\u0639 \u0635\u0641\u062d\u0647 \u0628\u0646\u062f\u06cc \u062f\u0627\u0631\u0646\u062f. \u0647\u0645\u0686\u0646\u06cc\u0646 \u0628\u0631\u0627\u06cc \u0628\u0627\u0632\u06af\u0634\u062a \u0628\u0647 \u0628\u0631\u0631\u0633\u06cc \u0627\u0633\u062a\u062e\u0631\u0627\u062c \u0634\u062f\u0647 \u060c API GET \u0646\u06cc\u0632 \u0644\u0627\u0632\u0645 \u0627\u0633\u062a. \u0627\u062c\u0631\u0627\u06cc \u0627\u06cc\u0646 \u0634\u0627\u0645\u0644 \u0633\u0647 \u0645\u0624\u0644\u0641\u0647 \u0627\u0635\u0644\u06cc \u060c API Gateway 
&hellip;<\/p>\n","protected":false},"author":2,"featured_media":95768,"comment_status":"open","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"fifu_image_url":"","fifu_image_alt":"","footnotes":""},"categories":[339],"tags":[],"class_list":["post-95767","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-dev"],"_links":{"self":[{"href":"https:\/\/nabfollower.com\/blog\/wp-json\/wp\/v2\/posts\/95767","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/nabfollower.com\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/nabfollower.com\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/nabfollower.com\/blog\/wp-json\/wp\/v2\/users\/2"}],"replies":[{"embeddable":true,"href":"https:\/\/nabfollower.com\/blog\/wp-json\/wp\/v2\/comments?post=95767"}],"version-history":[{"count":0,"href":"https:\/\/nabfollower.com\/blog\/wp-json\/wp\/v2\/posts\/95767\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/nabfollower.com\/blog\/wp-json\/wp\/v2\/media\/95768"}],"wp:attachment":[{"href":"https:\/\/nabfollower.com\/blog\/wp-json\/wp\/v2\/media?parent=95767"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/nabfollower.com\/blog\/wp-json\/wp\/v2\/categories?post=95767"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/nabfollower.com\/blog\/wp-json\/wp\/v2\/tags?post=95767"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}