123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127 |
- #!/usr/bin/python3
- import sys
- import codecs
- import traceback
- import requests
- import re
- import pandas as pd
- import random
- import urllib
- import dataset
- import json
- import gspread
- import datetime
- from gspread_pandas import Spread, Client
- from oauth2client.service_account import ServiceAccountCredentials
- import os
- import threading
- from apiclient.discovery import build
- from oauth2client.service_account import ServiceAccountCredentials
- import dataset
# --- Google Analytics Reporting API settings -------------------------------
# Read-only Analytics scope, the service-account key file, and the GA view
# whose data is queried.
SCOPES = ['https://www.googleapis.com/auth/analytics.readonly']
KEY_FILE_LOCATION = 'c:\\keys\\choozmo-ga-beee24b7a4c1.json'
VIEW_ID = '188916214'

# --- Database setup (runs at import time) ----------------------------------
# NOTE(review): the connection URL embeds a user name and password in source;
# consider loading it from configuration or the environment.
db = dataset.connect('mysql://choozmo:pAssw0rd@db.ptt.cx:3306/hhh?charset=utf8mb4')

# The delete is issued before db.begin(), i.e. outside the transaction that
# main() later commits.
# NOTE(review): this clears `ga_pagepath`, while rows are inserted into
# `ga_pagepath_yearly` below — confirm the intended table.
db.query('delete from ga_pagepath')

# Open the transaction that main() commits after inserting all rows.
db.begin()
table = db['ga_pagepath_yearly']
def initialize_analyticsreporting():
    """Create the Analytics Reporting API V4 service object.

    Credentials are loaded from the service-account key file at
    KEY_FILE_LOCATION and restricted to SCOPES.

    Returns:
        An authorized Analytics Reporting API V4 service object.
    """
    service_credentials = ServiceAccountCredentials.from_json_keyfile_name(
        KEY_FILE_LOCATION, SCOPES)
    # Hand the credentials to the discovery client for 'analyticsreporting' v4.
    return build('analyticsreporting', 'v4', credentials=service_credentials)
def get_report(analytics, body):
    """Run a batchGet query against the Analytics Reporting API V4.

    Args:
        analytics: An authorized Analytics Reporting API V4 service object.
        body: The report request definitions; sent as the value of the
            'reportRequests' key of the batchGet request body.

    Returns:
        The Analytics Reporting API V4 response.
    """
    request_payload = {'reportRequests': body}
    batch_request = analytics.reports().batchGet(body=request_payload)
    return batch_request.execute()
def print_response(response):
    """Flatten an Analytics Reporting API V4 response into row dictionaries.

    Despite its name, this function prints nothing: it collects every data
    row of every report into a list and returns it.

    Args:
        response: An Analytics Reporting API V4 response (a dict-like object
            with an optional 'reports' list).

    Returns:
        A list with one dict per data row. Each dict maps the report's
        dimension headers to the row's dimension values and each metric
        name to the row's metric value, exactly as found in the response.
        When a row carries several date-range entries, values from later
        entries overwrite earlier ones under the same metric name.
    """
    result = []
    for report in response.get('reports', []):
        column_header = report.get('columnHeader', {})
        dimension_headers = column_header.get('dimensions', [])
        metric_headers = column_header.get('metricHeader', {}).get('metricHeaderEntries', [])
        # Metric names are the same for every row of a report; resolve once.
        metric_names = [entry.get('name') for entry in metric_headers]

        for row in report.get('data', {}).get('rows', []):
            ga_dict = dict(zip(dimension_headers, row.get('dimensions', [])))
            for date_range_values in row.get('metrics', []):
                # Default to an empty list so an entry without 'values'
                # is skipped instead of raising TypeError in zip().
                ga_dict.update(zip(metric_names, date_range_values.get('values', [])))
            result.append(ga_dict)
    return result
def main(start_date='2020-06-30', end_date='2021-06-29'):
    """Fetch per-page GA metrics for a date range and store them in the DB.

    Queries users, new users, sessions, pageviews, bounce rate and pageviews
    per session by ga:pagePath (sorted by pageviews, descending), prefixes
    each page path with the site origin, inserts every row into `table`,
    and commits the transaction opened at module level.

    Args:
        start_date: First day of the report range, 'YYYY-MM-DD'.
        end_date: Last day of the report range, 'YYYY-MM-DD'.
    """
    analytics = initialize_analyticsreporting()
    # NOTE(review): only a single batchGet call is made, so at most
    # `pageSize` rows are stored; further pages are not requested.
    body = [{
        'viewId': VIEW_ID,
        'dateRanges': [{'startDate': start_date, 'endDate': end_date}],
        'metrics': [
            {'expression': 'ga:users'},
            {'expression': 'ga:newusers'},
            {'expression': 'ga:sessions'},
            {'expression': 'ga:pageviews'},
            {'expression': 'ga:bounceRate'},
            {'expression': 'ga:pageviewsPerSession'},
        ],
        'dimensions': [{'name': 'ga:pagePath'}],
        'orderBys': [{"fieldName": "ga:pageviews", "sortOrder": "DESCENDING"}],
        'pageSize': '20000',
    }]
    response = get_report(analytics, body)
    rows = print_response(response)

    # Turn the site-relative page path into an absolute URL.
    for row in rows:
        row['ga:pagePath'] = 'https://hhh.com.tw' + row['ga:pagePath']

    print('inserting.....')
    for row in rows:
        try:
            table.insert(row)
        except Exception:
            # Best effort: keep inserting the remaining rows, but show what
            # went wrong instead of hiding it. Catching Exception (not a
            # bare except) lets Ctrl-C / SystemExit still stop the run.
            print('exception')
            traceback.print_exc()
    db.commit()


if __name__ == '__main__':
    main()
|