googlenews.py 1.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748
  1. from newspaper import Article
  2. from GoogleNews import GoogleNews
  3. def news(title_and_link):
  4. for i in title_and_link:
  5. try:
  6. article = Article(i['link'])
  7. article.download()
  8. article.parse()
  9. text = article.text
  10. title = i['title']
  11. try:
  12. print(title)
  13. with open(f'/Users/zooeytsai/ig_tags/googlenews/{title}.txt','x') as f:
  14. f.write(text)
  15. except FileExistsError:
  16. print('已有同樣新聞文章','title')
  17. pass
  18. except:
  19. print('403')
  20. pass
  21. return text
  22. def google_news(keyword,page):
  23. g = GoogleNews()
  24. g.setlang('cn')
  25. g.setencode('utf-8')
  26. g.search(keyword)
  27. g.clear()
  28. news_link = []
  29. for i in range(page):
  30. g.get_page(page)
  31. result = g.result()
  32. for j in result:
  33. d ={'title':j['title'],'link':j['link']}
  34. news_link.append(d)
  35. g.clear()
  36. print(len(news_link))
  37. print(news_link)
  38. return news_link
  39. k = ['寵物蛋糕','寵物住宿','寵物餐廳','寵物用品','寵物美容','寵物友善']
  40. for i in k:
  41. result = google_news(i,5)
  42. news(result)