Explorar o código

修改time sleep

zooeytsai hai 3 anos
pai
achega
34686b387a
Modificouse 1 ficheiro con 11 adicións e 8 borrados
  1. 11 8
      ig_tags/ig_selenium.py

+ 11 - 8
ig_tags/ig_selenium.py

@@ -20,13 +20,13 @@ account = ['liftwotsai','chenlinrain','enjoylisteningswift']
 pd = ['obl787iviate634','weareyoung12']
 
 path = '/Users/zooeytsai/Downloads/chromedriver'
-sbaccount = account[2]
+sbaccount = account[1]
 sbpd = pd[1]
 options = Options()
 options.add_argument("--headless")
 
 def download_post():
-    hashtag = '寵物'
+    hashtag = '寵物零食'
     url = f"https://www.instagram.com/explore/tags/{hashtag}/"
     s = Service(path)
     driver = webdriver.Chrome(service=s)
@@ -46,13 +46,14 @@ def download_post():
         jar.set(i['name'], i['value'])
     driver.get(url)
     time.sleep(3)
-    limit_of_posts = 100
+    limit_of_posts = 10
     c = 0
     wait = WebDriverWait(driver, 10)
     last_height = driver.execute_script(
         "window.scrollTo(0, document.body.scrollHeight);var scrolldown=document.body.scrollHeight;return scrolldown;")
     link = []
     while True:
+        print(c)
         href_element = wait.until(ec.visibility_of_all_elements_located((By.XPATH, "//a[@href]")))
         for i in href_element:
             link.append(i.get_attribute('href'))
@@ -63,9 +64,10 @@ def download_post():
         driver.implicitly_wait(3)
         c+=1
         if c > limit_of_posts:
-            time.sleep(randint(180,300))
             print('中場休息')
-        if len(link)>10000:
+            time.sleep(randint(180,300))
+            c=0
+        if len(link)>5000:
             break
 
     driver.close()
@@ -77,7 +79,8 @@ def download_post():
 def hashtag():
     hashtag = []
     c=0
-    for url in download_post():
+    result = download_post()
+    for url in result:
         s = Service(path)
         driver = webdriver.Chrome(service=s)
         driver.implicitly_wait(3)
@@ -92,7 +95,7 @@ def hashtag():
             time.sleep(3)
             c=0
     driver.close()
-
+    print(hashtag)
     db = pymysql.connect(host='localhost',
                          user='root',
                          password='jondae350',
@@ -106,5 +109,5 @@ def hashtag():
     return hashtag
 
 
-download_post()
+
 hashtag()