get_wechat_info.py 9.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196
  1. from selenium import webdriver
  2. from selenium.webdriver import ActionChains
  3. from selenium.webdriver.common.by import By
  4. from selenium.webdriver.support import expected_conditions as EC
  5. from selenium.webdriver.support.wait import WebDriverWait
  6. from wechat_action.create_ad_plan_idea import IdeaAction
  7. from wechat_action.human_ad import HumanAd
  8. from selenium.webdriver import ChromeOptions
  9. from selenium.webdriver.common.keys import Keys
  10. from functools import wraps
  11. from wechat_action import login_ad
  12. import logging
  13. import json
  14. import time
  15. import re
  16. import requests
  17. import random
  18. class WechatApi():
  19. def __init__(self, log_ad):
  20. self.log_ad = log_ad
  21. self.driver = self.log_ad.driver
  22. self.human_info_list = []
  23. def api_get_name(self):
  24. # 微信公众号相关内容获取,现在基本不使用,用get_human_info为主
  25. def _api_get_name(self, service_name):
  26. WebDriverWait(self.driver, 100).until(
  27. lambda driver: True if service_name in self.driver.page_source and len(
  28. re.findall('g_tk=(\d+)', self.driver.page_source)) else False)
  29. cookie_dict = self.log_ad.get_cookie(self.driver)
  30. url_token = re.findall('g_tk=(\d+)', self.driver.page_source)
  31. url_token = url_token[0]
  32. # 得到公众号
  33. wechat_names_url = 'https://a.weixin.qq.com/cgi-bin/agency/get_delivery_metrics?page=1&page_size=10&search_key=&order_by=&ascending=1&only_collect=0&g_tk={token}&_={time_}'.format(
  34. token=url_token, time_=int(time.time()))
  35. rsp = requests.get(url=wechat_names_url, cookies=cookie_dict)
  36. print(service_name, rsp.text)
  37. WebDriverWait(self.driver, 100).until(
  38. lambda driver: True if len(
  39. re.findall('g_tk=(\d+)', self.driver.page_source)) else False)
  40. url_token = re.findall('g_tk=(\d+)', self.driver.page_source)
  41. url_token = url_token[0]
  42. wechat_names_url = 'https://a.weixin.qq.com/cgi-bin/agency/get_delivery_metrics?page=1&page_size=10&search_key=&order_by=&ascending=1&only_collect=0&g_tk={token}&_={time_}'.format(
  43. token=url_token, time_=int(time.time()))
  44. cookie_dict = self.log_ad.get_cookie(self.driver)
  45. rsp = requests.get(url=wechat_names_url, cookies=cookie_dict)
  46. service_name = self.driver.find_element_by_xpath('//*[@id="root"]/div/header/div/div[3]/div/div[1]').text
  47. print(service_name, rsp.text)
  48. service_name = ''
  49. self.service_loop(_api_get_name, {'self': self, 'service_name': service_name})
  50. def get_human_info(self, err_num=0):
  51. try:
  52. def _get_human_info(self, service_name):
  53. # 耗时一秒以内
  54. # self.driver.get('https://a.weixin.qq.com/client')
  55. WebDriverWait(self.driver, 100).until(
  56. lambda driver: True if service_name in self.driver.page_source and len(
  57. re.findall('g_tk=(\d+)', self.driver.page_source)) else False)
  58. cookie_dict = self.log_ad.get_cookie(self.driver)
  59. url_token = re.findall('g_tk=(\d+)', self.driver.page_source)[0]
  60. # 得到各个appid
  61. wechat_names_url = 'https://a.weixin.qq.com/cgi-bin/agency/get_delivery_metrics?page=1&page_size=10&search_key=&order_by=&ascending=1&only_collect=0&g_tk={token}&_={time_}'.format(
  62. token=url_token, time_=int(time.time()))
  63. rsp = requests.get(url=wechat_names_url, cookies=cookie_dict)
  64. print(wechat_names_url)
  65. print(rsp.text)
  66. # 普通用户的需要在1s内获取到
  67. # 得到wechat_token
  68. for i in rsp.json()['list']:
  69. wechat_wxname = i['wxname']
  70. wechat_name = i['nickname']
  71. wechat_id = i['appid']
  72. wechat_tran_url = 'http://a.weixin.qq.com/cgi-bin/agency/redirect_mp?appid={wechat_id}&g_tk={token}&mgr_type=1'.format(
  73. token=url_token, wechat_id=wechat_id)
  74. session = requests.session()
  75. rsp = session.get(wechat_tran_url, cookies=cookie_dict)
  76. print(rsp.url)
  77. token_id = re.findall('token=(\d+)', rsp.url)[0]
  78. print(token_id)
  79. # 得到人群包
  80. human_url = 'https://mp.weixin.qq.com/promotion/dmpmgr?action=readlist&page=1&page_size=100&token={wechat_token}&appid=&spid=&_={time_}'.format(
  81. wechat_token=token_id, time_=int(time.time()))
  82. print(human_url)
  83. rsp = session.get(url=human_url)
  84. print(rsp.text)
  85. res_json = rsp.json()
  86. res_json['service_name'] = service_name
  87. res_json['wechat_name'] = wechat_name
  88. res_json['wxname'] = wechat_wxname
  89. res_json['appid'] = wechat_id
  90. self.human_info_list.append(res_json)
  91. print(self.human_info_list)
  92. print(json.dumps(self.human_info_list))
  93. time.sleep(random.uniform(3, 5))
  94. service_name = self.driver.find_element_by_xpath('//*[@id="root"]/div/header/div/div[3]/div/div[1]').text
  95. _get_human_info(self, service_name=service_name)
  96. self.service_loop(_get_human_info, {'self': self, 'service_name': service_name})
  97. self.log_ad.cookies_save(self.log_ad)
  98. return {'sucess': True, 'result_info': '', "result_list": self.human_info_list}
  99. except Exception as e:
  100. logging.error(str(e))
  101. if err_num < 3:
  102. self.human_info_list = []
  103. return self.get_human_info(err_num=err_num + 1)
  104. return {'sucess': False, 'result_info': str(e)}
  105. def service_loop(self, function, kwargs):
  106. def click_service_change():
  107. # self.driver.switch_to.window(self.driver.window_handles[-1])
  108. WebDriverWait(self.driver, 10).until(
  109. lambda x: self.driver.find_element_by_css_selector(
  110. '#root > div > header > div > div.CoreLayout__account-2lIr0 > div'))
  111. service_name_button = self.driver.find_element_by_css_selector(
  112. '#root > div > header > div > div.CoreLayout__account-2lIr0 > div')
  113. WebDriverWait(self.driver, 10).until(
  114. lambda x: (service_name_button.is_displayed() and service_name_button.is_enabled()))
  115. server_button = self.driver.find_element_by_css_selector(
  116. '#root > div > header > div > div.CoreLayout__account-2lIr0 > div')
  117. ActionChains(self.driver).move_to_element(server_button).click().perform()
  118. # server_button.click()
  119. time.sleep(random.uniform(0.1, 0.2))
  120. self.driver.find_element_by_css_selector(
  121. '#root > div > div.CoreLayout__headerDropdown-3xWkD > div > div:nth-child(1) > button').click()
  122. time.sleep(random.uniform(0.1, 0.2))
  123. # 得到所有service name
  124. service_name_all = set()
  125. service_name_used = set()
  126. self.driver.execute_script('''
  127. window.scroll(0,1000000);
  128. ''')
  129. # time.sleep(random.uniform(3, 5))
  130. click_service_change()
  131. # WebDriverWait(self.driver, 10).until(
  132. # lambda x: self.driver.find_element_by_xpath('//*[@id="root"]/div/span/div/main/div/div[1]/div/h3'))
  133. # self.driver.find_element_by_xpath('//*[@id="root"]/div/span/div/main/div/div[1]/div/h3').click()
  134. # time.sleep(random.uniform(0.1,0.2))
  135. service_names = self.driver.find_elements_by_class_name('CoreLayout__headerDropdownItem-X4S98')
  136. for _ in service_names:
  137. service_name_all.add(_.text)
  138. # 第一个service_name
  139. service_name = self.driver.find_element_by_xpath('//*[@id="root"]/div/header/div/div[3]/div/div[1]').text
  140. service_name_used.add(service_name)
  141. # 循环使用完service_name为止
  142. for i in range(len(service_name_all) - 1):
  143. service_names = self.driver.find_elements_by_xpath('//*[@class="CoreLayout__headerDropdownItem-X4S98"]/p')
  144. for _ in service_names:
  145. print(_.text)
  146. for service_num in range(len(service_names)):
  147. _ = service_names[service_num]
  148. if _.text not in service_name_used:
  149. choice_service = _
  150. choice_service_name = _.text
  151. service_name_used.add(_.text)
  152. # self.driver.execute_script('''
  153. # var e_one=document.getElementsByClassName('CoreLayout__headerDropdown-3xWkD')[0]; e_one.scroll(10000,100000);
  154. # e_one.scroll(0,{y_localtion});
  155. # '''.format(y_localtion=service_num * 45))
  156. ActionChains(self.driver).move_to_element(choice_service).click().perform()
  157. # choice_service.click()
  158. if 'service_name' in kwargs.keys():
  159. kwargs['service_name'] = choice_service_name
  160. function(**kwargs)
  161. break
  162. # time.sleep(random.uniform(3, 5))
  163. click_service_change()
  164. if __name__ == "__main__":
  165. pass