12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849 |
- #!/usr/bin/python3
- import sys
- import codecs
- import traceback
- import requests
- import re
- import pandas as pd
- import random
- import urllib
- import dataset
- import json
- import gspread
- import datetime
- from gspread_pandas import Spread, Client
- from oauth2client.service_account import ServiceAccountCredentials
- import os
- import threading
def save_sheet(df, filename, tabname, startpos='A1'):
    """Write a DataFrame into one tab of a Google spreadsheet.

    Service-account credentials are loaded from a fixed key file on disk
    and handed to ``gspread_pandas.Spread``, which performs the upload.

    Args:
        df: The DataFrame to upload; its index is not written
            (``index=False``).
        filename: Spreadsheet identifier passed to ``Spread``.
        tabname: Passed as the ``sheet`` argument of ``df_to_sheet``.
        startpos: Passed as the ``start`` argument of ``df_to_sheet``;
            defaults to ``'A1'``.
    """
    oauth_scopes = [
        'https://spreadsheets.google.com/feeds',
        'https://www.googleapis.com/auth/drive',
    ]
    # An alternative key location, '/var/keys/spread2.json', was left
    # commented out in the original script.
    credentials = ServiceAccountCredentials.from_json_keyfile_name(
        'c:\\keys\\spread2.json', oauth_scopes
    )
    # The client returned here is not used below; the call itself is kept.
    gspread.authorize(credentials)
    Spread(filename, creds=credentials).df_to_sheet(
        df, index=False, sheet=tabname, start=startpos, replace=False
    )
def do_jobs():
    """Export the rows of ``hhh.gap20v7`` to a Google Sheets tab.

    Selects the ``id``, ``title``, ``href`` and ``kw`` columns from the
    MySQL table, collects them into a DataFrame, and passes that frame to
    ``save_sheet`` for the ``'2021_DEC_P1'`` tab of ``'Content_Gap_URLs'``.
    """
    columns = ('id', 'title', 'href', 'kw')
    # NOTE(review): the database user and password are embedded in this
    # URL; consider loading them from the environment or a config file.
    db = dataset.connect('mysql://choozmo:pAssw0rd@db.ptt.cx:3306/hhh?charset=utf8mb4')
    cursor = db.query('SELECT id,title,href,kw FROM hhh.gap20v7;')
    # Collect every row first and build the frame once: appending with
    # df.loc[idx] = ... grows the frame on each insert, which gets slow
    # as the result set grows.
    records = [[row[name] for name in columns] for row in cursor]
    df = pd.DataFrame(records, columns=columns)
    save_sheet(df, 'Content_Gap_URLs', '2021_DEC_P1')
# Run the export on a worker thread and block until it has finished.
t = threading.Thread(target=do_jobs)
t.start()
t.join()
|