"""save_search_result.py

Run a Google search for every keyword listed in ``c:/tmp/food.csv`` and store
each returned result row in the ``save_result`` database table.

Keywords that already appear in ``save_result`` are skipped, so the script can
be re-run after an interruption without repeating finished searches.  The
script stops as soon as the browser shows Google's "unusual traffic" page.

NOTE(review): the block structure below was reconstructed from a paste that
had lost its indentation; the ban check is assumed to run once per keyword,
after that keyword's results have been inserted -- confirm against the
original file.
"""
import codecs
import datetime
import sys
import time  # noqa: F401 -- not used below; kept for ad-hoc debugging pauses

import dataset

import gsearch_general


def _strip_eol(text):
    """Return *text* with every carriage return and line feed removed."""
    return text.replace('\r', '').replace('\n', '')


# NOTE(review): the credentials are hard-coded in the connection URL; they
# should be moved to an environment variable or an untracked config file.
db = dataset.connect('mysql://choozmo:pAssw0rd@db.ptt.cx:3306/seo?charset=utf8mb4')
table = db['save_result']
driver = gsearch_general.restart_browser()

# codecs.open() performs no newline translation, so '\r' and '\n' are removed
# explicitly from every line further down.
with codecs.open('c:/tmp/food.csv', 'r', 'utf-8') as fr:
    lines = fr.readlines()

# Keywords that already have stored results.  Both '\r' and '\n' are stripped
# so the stored values compare equal to the cleaned keywords read from the CSV.
cursor = db.query('select distinct(keyword) as kw from save_result')
done_keywords = {_strip_eol(c['kw']) for c in cursor}
print(done_keywords)
print(lines)

# For a quick manual run, replace `lines` with a hand-written list here,
# e.g. lines = ['芋頭 外帶'].

for raw_line in lines:
    keyword = _strip_eol(raw_line)
    # Skip blank lines (nothing to search for) and keywords already collected.
    if not keyword or keyword in done_keywords:
        continue
    print(keyword)
    idx = gsearch_general.process_query(
        driver,
        keyword,
        number_results=100,
        language_code='zh-TW',
        enable_next=False,
    )
    print(idx)
    # Presumably process_query can return None when the search fails (TODO
    # confirm); treat that as "no results" so the ban check below still runs.
    for rank, x in enumerate(idx or [], start=1):
        x['keyword'] = keyword
        x['dt'] = datetime.datetime.now()
        x['num'] = str(rank)  # 1-based position in the result list, stored as text
        table.insert(x)
    # The literal is Google's "our systems have detected unusual traffic from
    # your computer network" notice: once it shows up, further queries are
    # pointless, so stop the whole run.
    if '我們的系統偵測到您的電腦網路送出的流量有異常情況' in driver.page_source:
        print('baned.....')
        sys.exit()