GA_Path.py 4.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135
  1. """Hello Analytics Reporting API V4."""
  2. #!/usr/bin/python3
  3. import sys
  4. import codecs
  5. import traceback
  6. import requests
  7. import re
  8. import pandas as pd
  9. import random
  10. import urllib
  11. import dataset
  12. import json
  13. import gspread
  14. import datetime
  15. from gspread_pandas import Spread, Client
  16. from oauth2client.service_account import ServiceAccountCredentials
  17. import os
  18. import threading
  19. from apiclient.discovery import build
  20. from oauth2client.service_account import ServiceAccountCredentials
  21. import dataset
  22. db = dataset.connect('mysql://choozmo:pAssw0rd@db.ptt.cx:3306/hhh?charset=utf8mb4')
  23. #db.query('delete from hhh_weekly_affinity')
  24. table=db['hhh_weekly_pagetitle']
  25. SCOPES = ['https://www.googleapis.com/auth/analytics.readonly']
  26. KEY_FILE_LOCATION = 'c:\\keys\\choozmo-ga-beee24b7a4c1.json'
  27. VIEW_ID = '188916214'
  28. def initialize_analyticsreporting():
  29. """Initializes an Analytics Reporting API V4 service object.
  30. Returns:
  31. An authorized Analytics Reporting API V4 service object.
  32. """
  33. credentials = ServiceAccountCredentials.from_json_keyfile_name(
  34. KEY_FILE_LOCATION, SCOPES)
  35. # Build the service object.
  36. analytics = build('analyticsreporting', 'v4', credentials=credentials)
  37. return analytics
  38. def get_report(analytics,body):
  39. """Queries the Analytics Reporting API V4.
  40. Args:
  41. analytics: An authorized Analytics Reporting API V4 service object.
  42. Returns:
  43. The Analytics Reporting API V4 response.
  44. """
  45. return analytics.reports().batchGet(
  46. body={
  47. 'reportRequests':body
  48. # [
  49. #{
  50. # 'viewId': VIEW_ID,
  51. # 'dateRanges': [{'startDate': '14daysAgo', 'endDate': 'today'}],
  52. # 'dateRanges': [{'startDate': '2021-05-30', 'endDate': '2021-06-05'}],
  53. # 'metrics': [{'expression': 'ga:users'}],
  54. # 'dimensions': [{'name': 'ga:sourceMedium'}]
  55. # 'dimensions': [{'name': 'ga:date'},{'name': 'ga:sourceMedium'}]
  56. # }]
  57. }
  58. ).execute()
  59. def print_response(response):
  60. """Parses and prints the Analytics Reporting API V4 response.
  61. Args:
  62. response: An Analytics Reporting API V4 response.
  63. """
  64. result=[]
  65. for report in response.get('reports', []):
  66. columnHeader = report.get('columnHeader', {})
  67. dimensionHeaders = columnHeader.get('dimensions', [])
  68. metricHeaders = columnHeader.get('metricHeader', {}).get('metricHeaderEntries', [])
  69. for row in report.get('data', {}).get('rows', []):
  70. dimensions = row.get('dimensions', [])
  71. dateRangeValues = row.get('metrics', [])
  72. ga_dict={}
  73. for header, dimension in zip(dimensionHeaders, dimensions):
  74. print(header + ': ', dimension)
  75. ga_dict[header]=dimension
  76. for i, values in enumerate(dateRangeValues):
  77. print('Date range:', str(i))
  78. for metricHeader, value in zip(metricHeaders, values.get('values')):
  79. ga_dict[metricHeader.get('name')]=value
  80. # print(metricHeader.get('name') + ':', value)
  81. result.append(ga_dict)
  82. return result
  83. # print(ga_dict)
  84. def main():
  85. analytics = initialize_analyticsreporting()
  86. body=[{ 'viewId': VIEW_ID,
  87. # 'dateRanges': [{'startDate': '2021-05-30', 'endDate': '2021-06-05'}],
  88. 'dateRanges': [{'startDate': '2021-05-28', 'endDate': '2021-06-11'}],
  89. 'metrics': [{'expression': 'ga:users'}],
  90. # 'metrics': [{'expression': 'ga:users'},{'expression': 'ga:newusers'},{'expression': 'ga:sessions'},{'expression': 'ga:pageviews'},{'expression': 'ga:bounceRate'},{'expression': 'ga:pageviewsPerSession'}],
  91. # 'metrics': [{'expression': 'ga:users'},{'expression': 'ga:newusers'},{'expression': 'ga:sessions'},{'expression': 'ga:pageviews'},{'expression': 'ga:bounceRate'},{'expression': 'ga:pageviewsPerSession'}],
  92. # 'dimensions': [{'name': 'ga:date'},{'name': 'ga:sourceMedium'}]
  93. # 'dimensions': [{'name': 'ga:date'}]
  94. 'dimensions': [{'name': 'ga:pageTitle'},{'name': 'ga:isoWeek'},]
  95. }]
  96. response = get_report(analytics,body)
  97. ga_dict=print_response(response)
  98. # print(ga_dict)
  99. # print(ga_dict)
  100. for elmt in ga_dict:
  101. # elmt['ga:users']=int(elmt['ga:users'])
  102. if int(elmt['ga:users']) > 2:
  103. # print(elmt['ga:interestAffinityCategory'])
  104. table.insert(elmt)
  105. # print(elmt['ga:sourceMedium'])
  106. if __name__ == '__main__':
  107. main()