{"id":467,"date":"2022-08-15T09:00:57","date_gmt":"2022-08-15T00:00:57","guid":{"rendered":"https:\/\/is-ai.jp\/?p=467"},"modified":"2022-08-02T17:29:49","modified_gmt":"2022-08-02T08:29:49","slug":"pythonfilmarks%e3%81%ae%e3%83%ac%e3%83%93%e3%83%a5%e3%83%bc%e3%82%92%e3%82%b9%e3%82%af%e3%83%ac%e3%82%a4%e3%83%94%e3%83%b3%e3%82%b0%e3%81%99%e3%82%8b","status":"publish","type":"post","link":"https:\/\/is-ai.jp\/?p=467","title":{"rendered":"[python]Filmarks\u306e\u30ec\u30d3\u30e5\u30fc\u3092\u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u3059\u308b"},"content":{"rendered":"\n<h2 class=\"wp-block-heading\">\u306f\u3058\u3081\u306b<\/h2>\n\n\n\n<p>\u30bf\u30a4\u30c8\u30eb\u306e\u901a\u308a\u3001\u4eca\u56de\u306fFilmarks\u306e\u30ec\u30d3\u30e5\u30fc\u7d50\u679c\u3092\u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u3057\u3066\u3044\u304f\u3068\u3044\u3046\u5185\u5bb9\u3067\u3059\u3002<\/p>\n\n\n\n<p>\u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u3059\u308b\u3068\u3044\u3046\u30bf\u30a4\u30c8\u30eb\u3067\u306f\u3042\u308a\u307e\u3059\u304c\u3001\u81ea\u5206\u306e\u5834\u5408\u306f\u3069\u3046\u3057\u3066\u3082\u60f3\u5b9a\u901a\u308a\u306e\u6319\u52d5\u3092\u8d77\u3053\u305b\u306a\u304b\u3063\u305f\u306e\u3067\u3001\u4e00\u65e6\u8ae6\u3081\u307e\u3057\u305f\u3002\u305f\u3060\u73fe\u6642\u70b9\u3067\u3082\u5341\u5206\u5229\u7528\u4fa1\u5024\u306e\u3042\u308b\u30b3\u30fc\u30c9\u3060\u3068\u601d\u3046\u306e\u3067\u8a18\u4e8b\u306b\u307e\u3068\u3081\u307e\u3059\u3002<\/p>\n\n\n\n<p>\u305d\u3046\u3044\u3063\u305f\u72b6\u6cc1\u3092\u52a0\u5473\u3057\u305f\u4e0a\u3067\u8aac\u660e\u3057\u3066\u3044\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<p><\/p>\n\n\n\n<p><strong>[\u6ce8\u610f]<\/strong>\u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u3057\u305f\u30c7\u30fc\u30bf\u306e\u4f7f\u7528\u306b\u95a2\u3057\u3066\u306f\u81ea\u5df1\u8cac\u4efb\u3067\u304a\u9858\u3044\u3057\u307e\u3059\u3002<\/p>\n\n\n\n<p>\u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u306e\u9055\u6cd5\u6027\u306b\u3064\u3044\u3066\u306f\u3053\u3061\u3089\u306e\u8a18\u4e8b\u3067\u307e\u3068\u3081\u3066\u3044\u308b\u306e\u3067\u3001\u8208\u5473\u304c\u3042\u308b\u65b9\u306f\u662f\u975e\u3054\u89a7\u306b\u306a\u3063\u3066\u304f\u3060\u3055\u3044\u3002\u7d50\u69cb\u6c17\u5408\u3092\u5165\u308c\u3066\u8abf\u67fb\u3057\u307e\u3057\u305f!!<\/p>\n\n\n\n<figure class=\"wp-block-embed\"><div class=\"wp-block-embed__wrapper\">\n<div class=\"sc_getpost\"><a class=\"clearfix\" href=\"https:\/\/is-ai.jp\/?p=483\"><div><div class=\"sc_getpost_thumb post-box-thumbnail__wrap\"><img src=\"https:\/\/is-ai.jp\/wp-content\/uploads\/2022\/08\/email-4284157.png\" width=\"1920\" height=\"1298\" alt=\"[python]Filmarks\u306e\u30ec\u30d3\u30e5\u30fc\u3092\u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u3059\u308b\"><\/div><div class=\"title\">\u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u306f\u9055\u6cd5\uff1f\uff1f\u9055\u6cd5\u6027\u306b\u3064\u3044\u3066\u8abf\u3079\u3066\u307f\u305f<\/div><div class=\"date\">2022.8.8<\/div><div class=\"substr\">\u306f\u3058\u3081\u306b \u81ea\u5206\u306e\u30b5\u30a4\u30c8\u3067\u306f\u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u306b\u95a2\u3059\u308b\u5185\u5bb9\u306e\u8a18\u4e8b\u3092\u3044\u304f\u3064\u304b\u53d6\u308a\u4e0a\u3052\u3066\u304a\u308a\u3001\u307e\u305f\u4eca\u5f8c\u3082\u5b9a\u671f\u7684\u306b\u30a2\u30c3\u30d7\u30ed\u30fc\u30c9\u3059\u308b\u4e88\u5b9a\u306a\u306e\u3067\u3001\u4e00\u5ea6\u3057\u3063\u304b\u308a\u8abf\u3079\u3066\u307f\u305f\u3044\u3068\u601d\u3044\u7e8f\u3081\u308b\u3053\u3068\u306b\u3057\u307e\u3057\u305f...<\/div><\/div><\/a><\/div>\n<\/div><\/figure>\n\n\n\n<p><\/p>\n\n\n\n<p><\/p>\n\n\n\n<h2 class=\"wp-block-heading\">\u554f\u984c\u70b9<\/h2>\n\n\n\n<p>\u3067\u306f\u3001\u672c\u984c\u3067\u3059\u3002\u4eca\u56de\u81ea\u5206\u304c\u3076\u3064\u304b\u3063\u305f\u58c1\u304c\u5927\u304d\u304f<strong>\u4e8c\u3064<\/strong>\u3042\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<p><strong>\u30fb\u30b5\u30fc\u30d0\u304b\u3089\u306e\u30ec\u30b9\u30dd\u30f3\u30b9\u304c\u9045\u304f\u3001\u8981\u7d20\u304c\u53d6\u308c\u305a\u306b\u30a8\u30e9\u30fc\u3067\u505c\u6b62<\/strong><\/p>\n\n\n\n<p><strong>\u30fb\u30bf\u30a4\u30c8\u30eb\u691c\u7d22\u3067\u98db\u3073\u305f\u3044\u30bf\u30a4\u30c8\u30eb\u30da\u30fc\u30b8\u306b\u98db\u3079\u306a\u3044<\/strong><\/p>\n\n\n\n<p>\u4e00\u3064\u76ee\u306b\u95a2\u3057\u3066\u306f\u4f8b\u5916\u51e6\u7406\u306a\u3069\u3092\u4f7f\u3063\u3066\u5bfe\u51e6\u3067\u304d\u3066\u3044\u305f\u306e\u3067\u3059\u304c\u3001\u554f\u984c\u306f\u4e8c\u3064\u76ee\u3067\u3059\u3002<\/p>\n\n\n\n<p>\u4eca\u56de\u81ea\u5206\u306e\u4f7f\u3044\u65b9\u3067\u306f\u3001<\/p>\n\n\n\n<ol><li>\u691c\u7d22\u30bf\u30a4\u30c8\u30eb\u306b\u30bf\u30a4\u30c8\u30eb\u3092\u5165\u529b  <\/li><li>\u4e00\u756a\u4e0a\u306e\u5019\u88dc\u3092\u9078\u629e<\/li><li>\u98db\u3093\u3060\u5148\u306e\u30da\u30fc\u30b8\u3067\u30ec\u30d3\u30e5\u30fc\u3092\u62fe\u3046<\/li><\/ol>\n\n\n\n<p>\u3068\u3044\u3046\u3001\u4e0a\u8a18\u306e\u30d1\u30bf\u30fc\u30f3\u3092\u7e70\u308a\u8fd4\u3059\u3053\u3068\u3067\u30ec\u30d3\u30e5\u30fc\u3092\u53d6\u5f97\u3057\u3066\u3044\u307e\u3057\u305f\u3002\u3053\u306e\u53d6\u5f97\u65b9\u6cd5\u3060\u3068\u4e00\u756a\u4e0a\u306e\u5019\u88dc\u3068\u30bf\u30a4\u30c8\u30eb\u304c\u565b\u307f\u5408\u308f\u306a\u3044\u3053\u3068\u304c\u305f\u307e\u306b\u767a\u751f\u3057\u305f\u305f\u3081\u30c7\u30fc\u30bf\u306e\u4fe1\u983c\u6027\u304c\u4e0b\u304c\u3063\u3066\u3057\u307e\u3044\u307e\u3057\u305f\u3002<\/p>\n\n\n\n<p>\u4f8b\u3048\u3070\u3001\"\u30bd\u30a6\"\u3068\u3044\u3046\u6620\u753b\u304c\u3042\u308a\u307e\u3059\u304c\u3001\u691c\u7d22\u7d50\u679c\u306e\u4e00\u756a\u4e0a\u306b\u304f\u308b\u30bf\u30a4\u30c8\u30eb\u306f\"\u30bd\u30a6\u30eb\u30d5\u30eb\u30fb\u30ef\u30fc\u30eb\u30c9\"\u3068\u3044\u3046\u5225\u306e\u30bf\u30a4\u30c8\u30eb\u304c\u6700\u4e0a\u4f4d\u306b\u304d\u3066\u3057\u307e\u3044\u307e\u3059\u3002<\/p>\n\n\n\n<p>\u3053\u3046\u3044\u3063\u305f\u73fe\u8c61\u304c\u7a00\u306b\u767a\u751f\u3059\u308b\u3053\u3068\u304c\u4e00\u756a\u306e\u554f\u984c\u70b9\u3067\u3057\u305f\u3002<\/p>\n\n\n\n<figure class=\"wp-block-image size-large is-resized\"><img decoding=\"async\" loading=\"lazy\" data-src=\"https:\/\/is-ai.jp\/wp-content\/uploads\/2022\/07\/8746697579d034a3a5c7c1a595ce73aa-1024x438.png\" alt=\"\" class=\"wp-image-468 lazyload\" width=\"634\" height=\"271\" data-srcset=\"https:\/\/is-ai.jp\/wp-content\/uploads\/2022\/07\/8746697579d034a3a5c7c1a595ce73aa-1024x438.png 1024w, https:\/\/is-ai.jp\/wp-content\/uploads\/2022\/07\/8746697579d034a3a5c7c1a595ce73aa-300x128.png 300w, https:\/\/is-ai.jp\/wp-content\/uploads\/2022\/07\/8746697579d034a3a5c7c1a595ce73aa-768x328.png 768w, https:\/\/is-ai.jp\/wp-content\/uploads\/2022\/07\/8746697579d034a3a5c7c1a595ce73aa-1536x657.png 1536w, https:\/\/is-ai.jp\/wp-content\/uploads\/2022\/07\/8746697579d034a3a5c7c1a595ce73aa-2048x876.png 2048w\" data-sizes=\"(max-width: 634px) 100vw, 634px\" \/><\/figure>\n\n\n\n<p><\/p>\n\n\n\n<p class=\"has-red-color has-text-color has-small-font-size\">*\u8ffd\u8a18 <\/p>\n\n\n\n<p class=\"has-red-color has-text-color has-small-font-size\">\u691c\u7d22\u5019\u88dc\u3068\u5165\u529b\u6587\u5b57\u306e\u30bf\u30a4\u30c8\u30eb\u304c\u5b8c\u5168\u4e00\u81f4\u3057\u3066\u3044\u308b\u304b\u3092\u30c1\u30a7\u30c3\u30af\u3059\u308c\u3070\u5b9f\u88c5\u3067\u304d\u305d\u3046\u3067\u3059\u306d\u3002\u3002<\/p>\n\n\n\n<p><\/p>\n\n\n\n<h2 class=\"wp-block-heading\">\u30b3\u30fc\u30c9<\/h2>\n\n\n\n<p>\u4eca\u56de\u306f\u4f5c\u6210\u3057\u305f\u95a2\u6570\u306e\u7d39\u4ecb\u3092\u3057\u307e\u3059\u3002<\/p>\n\n\n\n<p>get_page_review\u95a2\u6570\u306b\u30bf\u30a4\u30c8\u30eb\u3092\u6e21\u3057\u3066\u3042\u3052\u308c\u3070\u30ec\u30d3\u30e5\u30fc\u304c\u53d6\u5f97\u3067\u304d\u308b\u3088\u3046\u306b\u306a\u3063\u3066\u3044\u307e\u3059\u3002<\/p>\n\n\n\n<div class=\"hcb_wrap\"><pre class=\"prism line-numbers lang-python\" data-lang=\"Python\"><code># import & \u30d1\u30e9\u30e1\u30fc\u30bf\u5b9a\u7fa9\nfrom time import sleep, time\nfrom selenium import webdriver\nfrom selenium.webdriver.chrome.service import Service\nfrom selenium.webdriver.common.by import By\nfrom selenium.webdriver.chrome.options import Options \n\nCONNECTION_RETRY = 10\n\noptions = Options()\noptions.binary_location = &#39;\/Applications\/Google Chrome Beta.app\/Contents\/MacOS\/Google Chrome Beta&#39;\ndriver = webdriver.Chrome(service=Service(&#39;.\/chromedriver-bata&#39;), options=options)\n\n# \u30bf\u30a4\u30c8\u30eb\u3092\u5165\u308c\u3066\u305d\u306e\u30bf\u30a4\u30c8\u30eb\u30da\u30fc\u30b8\u306e\u6620\u753b\u30ec\u30d3\u30e5\u30fc\u3092\u53d6\u5f97\ndef get_page_review(film_title, i=1):\n  if not select_movie_item_with_retry(film_title):\n    exit()\n  else:\n    basepath = driver.current_url \n    \n  while True:\n    access_url = basepath + f&#39;?page={i}&#39;\n    print(access_url)\n    try:\n      driver.get(access_url)\n    except:\n      break\n\n    sleep(0.2)\n    try:\n      reviews = driver.find_elements(by=By.CLASS_NAME, value=&#39;p-mark__review&#39;)\n      goods = driver.find_elements(by=By.CLASS_NAME, value=&#39;c-reactions__count&#39;)\n      scores = driver.find_elements(by=By.CLASS_NAME, value=&#39;c-rating__score&#39;)\n    except:\n      print(&#39;continue&#39;)\n      i += 1\n      continue\n    \n    # no review\n    if len(reviews)==0 and len(goods)==0 and len(scores)==0:\n      break\n\n    for review, good, score in zip(reviews, goods, scores):\n      print(review.text, good.text, score.text)\n    i += 1\n    \n    # 100\u30da\u30fc\u30b8\u5206\u53d6\u5f97\u3057\u305f\u3089\u7d42\u4e86\n    if i &gt;= 100:\n      break\n    \ndef select_movie_item_with_retry(film_title):\n  print(f&#39;https:\/\/filmarks.com\/search\/movies?q=&quot;{film_title}&quot;&#39;)\n  driver.get(f&#39;https:\/\/filmarks.com\/search\/movies?q=&quot;{film_title}&quot;&#39;)\n  \n  for i in range(1, CONNECTION_RETRY + 1):\n    try:\n      driver.find_elements(by=By.CLASS_NAME, value=&quot;p-content-cassette__jacket&quot;)[0].click()\n    except Exception as e:\n      print(&quot;error:{e} retry:{i}\/{max}&quot;.format(e=e, i=i, max=CONNECTION_RETRY))\n      sleep(1)\n    else:\n      return True\n  return False\n\nget_page_review(&#39;Joker&#39;)<\/code><\/pre><\/div>\n\n\n\n<p><\/p>\n\n\n\n<p>\u307e\u305f\u3001\u4eca\u56de\u7d39\u4ecb\u3057\u305f\u8a18\u4e8b\u3067\u306fchrome\u306ebeta\u30d0\u30fc\u30b8\u30e7\u30f3\u3092\u5229\u7528\u3057\u3066\u3044\u307e\u3059\u3002<\/p>\n\n\n\n<p>\u4f7f\u3044\u65b9\u306f\u3053\u3061\u3089\u306e\u8a18\u4e8b\u3067\u307e\u3068\u3081\u3066\u3044\u308b\u306e\u3067\u3001beta\u7248\u3092\u5229\u7528\u3059\u308b\u5834\u5408\u306f\u53c2\u8003\u306b\u3057\u3066\u307f\u3066\u304f\u3060\u3055\u3044\u3002<\/p>\n\n\n\n<figure class=\"wp-block-embed is-type-wp-embed is-provider-is-blog wp-block-embed-is-blog\"><div class=\"wp-block-embed__wrapper\">\n<div class=\"sc_getpost\"><a class=\"clearfix\" href=\"https:\/\/is-ai.jp\/?p=457\"><div><div class=\"sc_getpost_thumb post-box-thumbnail__wrap\"><img data-src=\"https:\/\/is-ai.jp\/wp-content\/uploads\/2022\/07\/44c23b6b15d70994d766716b66bcaf1c.jpeg\" width=\"322\" height=\"157\" alt=\"[python]Filmarks\u306e\u30ec\u30d3\u30e5\u30fc\u3092\u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u3059\u308b\" class=\"lazyload\" \/><\/div><div class=\"title\">Chrome<var.103>Selenium\u306e\u30a8\u30e9\u30fc\u5bfe\u51e6\ufffc<\/div><div class=\"date\">2022.7.13<\/div><div class=\"substr\">\u306f\u3058\u3081\u306b \u6700\u8fd1\u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u3092\u56de\u3057\u3066\u3044\u308b\u3053\u3068\u304c\u591a\u3044\u306e\u3067\u3059\u304c\u3001\u8b0e\u306e\u30a8\u30e9\u30fc\u306b\u3088\u304f\u963b\u307e\u308c\u3066\u3044\u305f\u306e\u3067\u3059\u304c\u3001\u3053\u308c\u304cchrome\u5074\u306e\u554f\u984c\u3067\u3042\u308b\u3053\u3068\u3092\u77e5\u3063\u305f\u306e\u3067\u5171\u6709\uff06\u307e\u3068\u3081\u3092\u3057\u307e\u3059\u3002 \u81ea\u5206\u306e\u74b0\u5883...<\/div><\/div><\/a><\/div>\n<\/div><\/figure>\n\n\n\n<p><\/p>\n\n\n\n<h2 class=\"wp-block-heading\">\u304a\u308f\u308a\u306b<\/h2>\n\n\n\n<p>\u4eca\u56de\u3001\u6620\u753b\u30bf\u30a4\u30c8\u30eb\u3068\u5bfe\u5fdc\u3059\u308b\u30ec\u30d3\u30e5\u30fc\u30c7\u30fc\u30bf\u304c\u6b32\u3057\u304b\u3063\u305f\u306e\u3067\u3059\u304c\u3001\u65ad\u5ff5\u3057\u307e\u3057\u305f\u3002\u3002<\/p>\n\n\n\n<p>\u4ed6\u306b\u3082\u65b9\u6cd5\u306a\u3069\u306f\u8003\u3048\u3089\u308c\u308b\u3068\u601d\u3046\u306e\u3067\u3001\u307e\u305f\u5225\u306e\u65b9\u6cd5\u3092\u8a66\u3057\u3066\u3044\u3053\u3046\u3068\u601d\u3044\u307e\u3059\u3002<\/p>\n\n\n\n<p>\u4ee5\u4e0a!!<\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u306f\u3058\u3081\u306b \u30bf\u30a4\u30c8\u30eb\u306e\u901a\u308a\u3001\u4eca\u56de\u306fFilmarks\u306e\u30ec\u30d3\u30e5\u30fc\u7d50\u679c\u3092\u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u3057\u3066\u3044\u304f\u3068\u3044\u3046\u5185\u5bb9\u3067\u3059\u3002 \u30b9\u30af\u30ec\u30a4\u30d4\u30f3\u30b0\u3059\u308b\u3068\u3044\u3046\u30bf\u30a4\u30c8\u30eb\u3067\u306f\u3042\u308a\u307e\u3059\u304c\u3001\u81ea\u5206\u306e\u5834\u5408\u306f\u3069\u3046\u3057\u3066\u3082\u60f3\u5b9a\u901a\u308a\u306e\u6319\u52d5\u3092\u8d77\u3053\u305b\u306a\u304b\u3063\u305f\u306e\u3067\u3001\u4e00\u65e6\u8ae6\u3081\u307e\u2026<\/p>\n","protected":false},"author":1,"featured_media":471,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":[],"categories":[10,1],"tags":[7,38],"_links":{"self":[{"href":"https:\/\/is-ai.jp\/index.php?rest_route=\/wp\/v2\/posts\/467"}],"collection":[{"href":"https:\/\/is-ai.jp\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/is-ai.jp\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/is-ai.jp\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/is-ai.jp\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=467"}],"version-history":[{"count":5,"href":"https:\/\/is-ai.jp\/index.php?rest_route=\/wp\/v2\/posts\/467\/revisions"}],"predecessor-version":[{"id":491,"href":"https:\/\/is-ai.jp\/index.php?rest_route=\/wp\/v2\/posts\/467\/revisions\/491"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/is-ai.jp\/index.php?rest_route=\/wp\/v2\/media\/471"}],"wp:attachment":[{"href":"https:\/\/is-ai.jp\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=467"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/is-ai.jp\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=467"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/is-ai.jp\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=467"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}