get_order_dairly_wending.py 7.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240
  1. import hashlib
  2. import time
  3. import datetime
  4. from concurrent.futures import ProcessPoolExecutor
  5. import requests
  6. from util import date_util
  7. from util import platform_config_util
  8. from util import robust_util
  9. from util.MySQLConnection import MySQLConnection
  def md5(s):
      """Return the hexadecimal MD5 digest of the text ``s``.

      ``s`` is encoded as UTF-8 before it is hashed.
      """
      return hashlib.md5(s.encode("utf-8")).hexdigest()
  def getSelfDateStr(times=None, date_format='%Y%m%d'):
      """Format a Unix timestamp as a local-time date string.

      Added 2020-10-28 for the Yangguang and Wending APIs, whose date
      parameters use the ``20201028`` style (data is pulled once per day).

      Args:
          times: Unix timestamp in seconds. ``None`` (the default) means the
              current time, evaluated on every call rather than once when the
              function is defined.
          date_format: ``time.strftime`` format string.

      Returns:
          The timestamp rendered with ``date_format`` in the process's local
          time zone, e.g. ``'20201028'``. No day offset is applied: the
          result is the date of ``times`` itself.
      """
      if times is None:
          times = time.time()
      return time.strftime(date_format, time.localtime(times))
  def get_wending_account_list():
      """Load the Wending account records stored in ``order_account_text``.

      Every row's ``text`` column has its newline characters removed and is
      then split on commas. Other functions in this file read the resulting
      fields by position: 0 = consumer key, 1 = secret key, 2 = site id,
      3 = stage.

      Returns:
          A list holding one list of string fields per row of the query result.
      """
      query = "select text from order_account_text where platform='文鼎'"
      # NOTE(review): the connection is never closed here -- confirm whether
      # MySQLConnection.query() releases it on its own.
      rows = MySQLConnection().query(query)
      return [row['text'].replace('\n', '').split(',') for row in rows]
  def get_wending_order(st, et, account_list):
      """Gather the Wending orders of every account into a single tuple.

      Accounts are fetched one after another in the calling process. Each
      non-empty per-account result is placed in front of what has been
      gathered so far, so the orders of the last account come first.

      Args:
          st: Start of the time window, handed to ``get_wending_order_task``.
          et: End of the time window, handed to ``get_wending_order_task``.
          account_list: Iterable of account records.

      Returns:
          A tuple containing the order rows of all accounts.
      """
      collected = ()
      began_at = date_util.getCurrentSecondTime()

      # Fetch everything first, merge afterwards.
      per_account = [get_wending_order_task(st, et, acct) for acct in account_list]
      for batch in per_account:
          if not len(batch):
              continue
          collected = batch + collected

      print('文鼎订单数量:', len(collected), '执行时长(秒):', date_util.getCurrentSecondTime() - began_at)
      return collected
  def get_wd_account_siteid_list(account):
      """Fetch the ``mpId`` of every site listed for a Wending account.

      Args:
          account: Sequence whose items 0, 1 and 3 are the consumer key, the
              secret key and the stage label.

      Returns:
          A list of ``mpId`` values. The list is empty when the response body
          is not JSON or has no usable ``data`` entry. If an entry cannot be
          read, the ids collected up to that point are returned.
      """
      url = 'https://bi.reading.163.com/dist-api/siteList'
      consumerkey = account[0]
      secretkey = account[1]
      stage = account[3]
      timestamp = int(time.time() * 1000)

      # The signature is the MD5 of the "key=value" pairs, sorted by key and
      # concatenated without a separator. The secret key is signed but is not
      # sent in the query string.
      signed_fields = {
          'consumerkey': consumerkey,
          'secretkey': secretkey,
          'timestamp': timestamp,
      }
      sign = md5("".join(f"{k}={v}" for k, v in sorted(signed_fields.items()))).lower()
      get_url = f"{url}?consumerkey={consumerkey}&timestamp={timestamp}&sign={sign}"

      while True:
          r = requests.get(url=get_url)
          if r.status_code == 200:
              break
          # Pause between attempts, as get_wending_json_object does, instead
          # of re-requesting in a tight loop.
          time.sleep(1)
          print("请求连接出错,等待1s...")

      # Parse the body once; it is reused for the diagnostic print below.
      try:
          payload = r.json()
          id_key_list = payload['data']
      except (ValueError, KeyError, TypeError):
          # Not JSON, or no "data" member: treat as "no sites".
          return []

      mpid_list = []
      try:
          for id_key_val in id_key_list:
              mpid_list.append(dict(id_key_val)["mpId"])
      except Exception:
          # Best effort: report the unexpected payload and keep what was read.
          print(stage, '站点查询返回结果:', payload)
      return mpid_list
  def get_wending_json_object(url, params):
      """Sign ``params``, GET ``url`` with them and return the decoded JSON body.

      ``params`` is modified in place: ``timestamp`` is overwritten with the
      current time in milliseconds (and stays that way), and ``sign`` is added
      for the duration of the call and removed again before returning.

      The request is repeated, with a one-second pause, until the server
      answers with status 200. The final request URL is also stored in the
      module-level name ``get_url``.

      Args:
          url: Endpoint URL without a query string.
          params: Dict that must contain consumerkey, secretkey, siteid,
              pageSize, starttime, endtime, page and paystatus.

      Returns:
          The parsed JSON response.
      """
      params['timestamp'] = int(time.time() * 1000)

      # Signature: MD5 over the "key=value" pairs sorted by key, joined
      # without any separator.
      pieces = []
      for key, value in sorted(params.items(), reverse=False):
          pieces.append(str(key) + "=" + str(value))
      params['sign'] = md5("".join(pieces)).lower()

      # Every required key is looked up (a missing one raises KeyError), but
      # the secret key only takes part in the signature, not in the query.
      required = ('consumerkey', 'secretkey', 'timestamp', 'siteid', 'pageSize',
                  'starttime', 'endtime', 'page', 'paystatus')
      values = {name: params[name] for name in required}
      values['sign'] = params['sign']
      sent = ('consumerkey', 'timestamp', 'siteid', 'pageSize',
              'starttime', 'endtime', 'page', 'paystatus', 'sign')
      query = "&".join(name + "=" + str(values[name]) for name in sent)

      global get_url
      get_url = url + "?" + query

      r = requests.get(url=get_url)
      while r.status_code != 200:
          time.sleep(1)
          print("请求连接出错,等待1s...")
          r = requests.get(url=get_url)

      body = r.json()
      del params['sign']
      return body
  def _wending_order_row(x, stage):
      """Turn one ``rechargeList`` item into the value tuple of an order row.

      The values are ordered alphabetically by column name, matching the column
      list of the INSERT statement in ``batch_save_order``:
      (amount, channel, channel_id, date, from_novel, order_id, order_time,
      platform, reg_time, stage, user_id).
      """
      def _fmt_ms(ms):
          # The API delivers 13-digit (millisecond) timestamps.
          return time.strftime("%Y-%m-%d %H:%M:%S", time.localtime(ms // 1000))

      # Epoch seconds of 00:00 (UTC+8) on the day of payment.
      pay_day = (int(x['payTime'] // 1000) + 8 * 3600) // 86400 * 86400 - 8 * 3600
      return (
          x['money'] / 100,                # amount; source unit is fen (1/100)
          x['wx_mpName'],                  # channel: official-account name
          x['wx_originalId'],              # channel_id: official-account id
          pay_day,                         # date
          x['bookTitle'],                  # from_novel: novel title
          x['ewTradeId'],                  # order_id
          _fmt_ms(x['createTime']),        # order_time: order creation time
          '文鼎',                           # platform
          _fmt_ms(x['userRegisterTime']),  # reg_time: user registration time
          stage,                           # stage
          x['userId'],                     # user_id: paying user's uid
      )


  def get_wending_order_task(st, et, account):
      """Download all recharge orders of one Wending account for a time window.

      The account's sites are looked up with ``get_wd_account_siteid_list``.
      When that yields nothing, the site id stored in the account record is
      used instead. Each site is read page by page (1000 items per page) until
      a page comes back with fewer than 1000 items.

      Args:
          st: Window start as a Unix timestamp in seconds.
          et: Window end as a Unix timestamp in seconds.
          account: Sequence of (consumer key, secret key, site id, stage).

      Returns:
          A tuple of order rows, each itself a tuple as produced by
          ``_wending_order_row``.

      Raises:
          KeyError / TypeError: if a response lacks ``data.rechargeList`` or an
              item lacks one of the expected fields.
      """
      url = 'https://bi.reading.163.com/dist-api/rechargeList'
      page_size = 1000
      consumerkey = account[0]
      secretkey = account[1]
      siteid = account[2]
      stage = account[3]

      siteid_list = get_wd_account_siteid_list(account)
      print(siteid_list)
      if len(siteid_list) == 0:
          siteid_list = [siteid]

      starttime = getSelfDateStr(st, '%Y%m%d%H%M')
      endtime = getSelfDateStr(et, '%Y%m%d%H%M')

      # Accumulate in a list; growing a tuple by concatenation copies every
      # earlier row again for each new one.
      rows = []
      for siteid in siteid_list:
          page = 1
          while True:
              params = {
                  'consumerkey': consumerkey,
                  'secretkey': secretkey,
                  # Placeholder only: get_wending_json_object overwrites it
                  # with the current time before signing.
                  'timestamp': 1601481600,
                  'siteid': siteid,
                  'pageSize': page_size,
                  'starttime': starttime,
                  'endtime': endtime,
                  'page': page,
                  'paystatus': 1,  # presumably "paid orders only" -- TODO confirm
              }
              response_result_json = get_wending_json_object(url, params)
              order_item_list = response_result_json['data']['rechargeList']
              rows.extend(_wending_order_row(x, stage) for x in order_item_list)
              # A short page means there is nothing further to fetch.
              if len(order_item_list) < page_size:
                  break
              page += 1

      # NOTE(review): logged once per account after all of its sites were read;
      # confirm this matches the intended placement of the summary line.
      print(f"文鼎数据日期-{starttime}到{endtime}-期数-{stage}-获取数据-{len(rows)}条")
      return tuple(rows)
  def batch_save_order(data):
      """Insert order rows into ``quchen_text.order`` with INSERT IGNORE.

      Nothing is written when ``data`` is ``None`` or empty. A failure during
      the insert or commit is printed, not raised. The connection is closed
      in either case.

      Args:
          data: Sequence of 11-value rows ordered as (amount, channel,
              channel_id, date, from_novel, order_id, order_time, platform,
              reg_time, stage, user_id).
      """
      if data is None or not len(data):
          print('数据为空,不执行数据库操作!')
          return

      insert_sql = 'INSERT IGNORE INTO quchen_text.order(amount,channel,channel_id,date,from_novel,order_id,order_time,platform,reg_time,stage,user_id) VALUES (%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s);'
      db = MySQLConnection()
      try:
          inserted = db.batch(insert_sql, data)
          # Commit the batch before reporting the count.
          db.commit()
          print('订单数据最终入库【{num}】条'.format(num=inserted))
      except Exception as err:
          print('订单数据入库失败:', err)
      finally:
          db.close()
  def start_order_job_wending(st, et):
      """Run the Wending order job for the window ``st``..``et``.

      Loads the account records, fetches the orders of all accounts and hands
      the result to ``batch_save_order``.
      """
      batch_save_order(get_wending_order(st, et, get_wending_account_list()))
  if __name__ == '__main__':
      # Script entry point: run the job for the window between the values that
      # date_util.get_n_day returns for n=-1 and n=0 (presumably yesterday and
      # today as timestamps -- confirm against date_util).
      st, et = (date_util.get_n_day(n=-1, is_timestamp=1),
                date_util.get_n_day(n=0, is_timestamp=1))
      start_order_job_wending(st, et)
  188. start_order_job_wending(st,et)