# dw_channel_daily.py
  1. """
  2. @desc 公众号维度的数据处理
  3. @auth ck
  4. """
  5. from model.DateUtils import DateUtils
  6. from model.DataBaseUtils import MysqlUtils, CkUtils
  7. import logging
# Module-level helper instances shared by the jobs in this file.
du = DateUtils()  # date helper; not referenced by any job visible in this section
db = MysqlUtils()  # write side: jobs call db.dm.execute / db.dm.executeMany on the dw_* tables
ck = CkUtils()  # read side: jobs call ck.execute with aggregate queries over game_data.*
  11. def dw_channel():
  12. sql = """
  13. select
  14. dt1,channel1,pitcher,stage,platform,book,
  15. if(stage ='趣程15期' or stage ='趣程26期' or stage ='趣程30期','GDT','MP'),
  16. order_count,create_user_num,reg_num,order_user,order_amount,
  17. first_order_count,first_order_user,first_order_amount,
  18. view_count,click_count,follow_user,
  19. cost,reg_order_count,reg_order_user,reg_order_amount,
  20. web_view_count,platform_view_count,web_order_count,
  21. reg_order_user_again,
  22. reg_order_user_again3,
  23. reg_order_user_again4,
  24. reg_order_user_again5,
  25. reg_order_user_again6
  26. from (
  27. select
  28. if(dt4='1970-01-01',dt,dt4) dt1,if(channel4='',channel,channel4) channel1,
  29. create_user_num,reg_num,pitcher,stage,platform,book,cost,view_count,click_count, ---基础属性和消耗数据
  30. follow_user,web_view_count,platform_view_count,web_order_count,type,
  31. require_roi,require_mult,order_count,order_user,order_amount from
  32. (select * from game_data.dw_daily_platform_cost) aa
  33. full outer join
  34. (select date as dt4,channel as channel4,count(1) as order_count, ---账面充值
  35. count(distinct user_id) as order_user,sum(amount) as order_amount
  36. from game_data.order
  37. where status=2
  38. and channel in (select DISTINCT (channel) from game_data.dw_daily_channel_cost ddcc)
  39. group by date,channel) dd
  40. on dt=dt4 and channel=channel4) a
  41. left outer join (
  42. select sum(if(user_order_count>=2,1,0)) reg_order_user_again,channel channel6,toDate(reg_date) dt6, ---复冲人数
  43. sum(if(user_order_count>=3,1,0)) reg_order_user_again3,
  44. sum(if(user_order_count>=4,1,0)) reg_order_user_again4,
  45. sum(if(user_order_count>=5,1,0)) reg_order_user_again5,
  46. sum(if(user_order_count>=6,1,0)) reg_order_user_again6
  47. from (select formatDateTime(reg_time,'%Y-%m-%d') reg_date,channel,count(1) user_order_count
  48. from game_data.order where status=2 group by formatDateTime(reg_time,'%Y-%m-%d') ,user_id,channel) x
  49. group by reg_date,channel
  50. ) f on dt1=dt6 and channel1=channel6
  51. left outer join
  52. (
  53. select toDate(formatDateTime(reg_time,'%Y-%m-%d')) as dt2, ---新用户累计充值数据
  54. channel as channel2,
  55. sum(amount) as reg_order_amount,
  56. count(distinct user_id) as reg_order_user,
  57. count(1) as reg_order_count
  58. from game_data.order where status=2 and reg_time>'2019-03-18 00:00:00'
  59. group by toDate(formatDateTime(reg_time,'%Y-%m-%d')),channel) b
  60. on dt1=dt2 and channel1=channel2
  61. left outer join
  62. (select date as dt3,channel as channel3,count(1) as first_order_count, ---新用户首日充值
  63. count(distinct user_id) as first_order_user,sum(amount) as first_order_amount
  64. from game_data.order where status=2 and toDate(reg_time)=date group by date,channel) c
  65. on dt1=dt3 and channel1=channel3
  66. having order_amount+cost+reg_order_amount>0"""
  67. data = ck.execute(sql)
  68. isql = "replace into dw_channel values (%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s)"
  69. # db.dm.execute("truncate table dw_channel")
  70. db.dm.executeMany(isql, data)
  71. def dw_channel_user_daily():
  72. sql = """
  73. select toDate(formatDateTime(reg_time,'%Y-%m-%d')) as dt,
  74. channel,
  75. count(distinct if(subtractDays(date, 1)>=toDate(reg_time),null,user_id)) dc1,
  76. count(distinct if(subtractDays(date, 2)>=toDate(reg_time),null,user_id)) dc2,
  77. count(distinct if(subtractDays(date, 3)>=toDate(reg_time),null,user_id)) dc3,
  78. count(distinct if(subtractDays(date, 4)>=toDate(reg_time),null,user_id)) dc4,
  79. count(distinct if(subtractDays(date, 5)>=toDate(reg_time),null,user_id)) dc5,
  80. count(distinct if(subtractDays(date, 6)>=toDate(reg_time),null,user_id)) dc6,
  81. count(distinct if(subtractDays(date, 7)>=toDate(reg_time),null,user_id)) dc7,
  82. count(distinct if(subtractDays(date, 8)>=toDate(reg_time),null,user_id)) dc8,
  83. count(distinct if(subtractDays(date, 9)>=toDate(reg_time),null,user_id)) dc9,
  84. count(distinct if(subtractDays(date, 10)>=toDate(reg_time),null,user_id)) dc10,
  85. count(distinct if(subtractDays(date, 11)>=toDate(reg_time),null,user_id)) dc11,
  86. count(distinct if(subtractDays(date, 12)>=toDate(reg_time),null,user_id)) dc12,
  87. count(distinct if(subtractDays(date, 13)>=toDate(reg_time),null,user_id)) dc13,
  88. count(distinct if(subtractDays(date, 14)>=toDate(reg_time),null,user_id)) dc14,
  89. count(distinct if(subtractDays(date, 15)>=toDate(reg_time),null,user_id)) dc15,
  90. count(distinct if(subtractDays(date, 16)>=toDate(reg_time),null,user_id)) dc16,
  91. count(distinct if(subtractDays(date, 17)>=toDate(reg_time),null,user_id)) dc17,
  92. count(distinct if(subtractDays(date, 18)>=toDate(reg_time),null,user_id)) dc18,
  93. count(distinct if(subtractDays(date, 19)>=toDate(reg_time),null,user_id)) dc19,
  94. count(distinct if(subtractDays(date, 20)>=toDate(reg_time),null,user_id)) dc20,
  95. count(distinct if(subtractDays(date, 21)>=toDate(reg_time),null,user_id)) dc21,
  96. count(distinct if(subtractDays(date, 22)>=toDate(reg_time),null,user_id)) dc22,
  97. count(distinct if(subtractDays(date, 23)>=toDate(reg_time),null,user_id)) dc23,
  98. count(distinct if(subtractDays(date, 24)>=toDate(reg_time),null,user_id)) dc24,
  99. count(distinct if(subtractDays(date, 25)>=toDate(reg_time),null,user_id)) dc25,
  100. count(distinct if(subtractDays(date, 26)>=toDate(reg_time),null,user_id)) dc26,
  101. count(distinct if(subtractDays(date, 27)>=toDate(reg_time),null,user_id)) dc27,
  102. count(distinct if(subtractDays(date, 28)>=toDate(reg_time),null,user_id)) dc28,
  103. count(distinct if(subtractDays(date, 29)>=toDate(reg_time),null,user_id)) dc29,
  104. count(distinct if(subtractDays(date, 30)>=toDate(reg_time),null,user_id)) dc30
  105. from game_data.order where status=2 and reg_time>'2019-03-18 00:00:00' group by toDate(formatDateTime(reg_time,'%Y-%m-%d')),channel"""
  106. data = ck.execute(sql)
  107. isql = "insert into dw_channel_user_daily values " \
  108. "(%s,%s,%s,%s,%s,%s,%s,%s,%s,%s," \
  109. "%s,%s,%s,%s,%s,%s,%s,%s,%s,%s," \
  110. "%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s)"
  111. db.dm.execute("truncate table dw_channel_user_daily")
  112. db.dm.executeMany(isql, data)
  113. def dw_channel_amount_daily():
  114. sql = """
  115. select toDate(formatDateTime(reg_time,'%Y-%m-%d')) as dt,
  116. channel as channel,
  117. sum(if(subtractDays(date, 1)>=toDate(reg_time),0,amount)) as da1,
  118. if (dt<today(),sum(if(subtractDays(date, 2)>=toDate(reg_time),0,amount)),null) as da2,
  119. if(dt<subtractDays(today(), 1), sum(if(subtractDays(date, 3)>=toDate(reg_time),0,amount)),null) as da3,
  120. if(dt<subtractDays(today(), 2),sum(if(subtractDays(date, 4)>=toDate(reg_time),0,amount)),null) as da4,
  121. if(dt<subtractDays(today(), 3),sum(if(subtractDays(date, 5)>=toDate(reg_time),0,amount)),null) as da5,
  122. if(dt<subtractDays(today(), 4),sum(if(subtractDays(date, 6)>=toDate(reg_time),0,amount)),null) as da6,
  123. if(dt<subtractDays(today(), 5),sum(if(subtractDays(date, 7)>=toDate(reg_time),0,amount)),null) as da7,
  124. if(dt<subtractDays(today(), 6),sum(if(subtractDays(date, 8)>=toDate(reg_time),0,amount)),null) as da8,
  125. if(dt<subtractDays(today(), 7),sum(if(subtractDays(date, 9)>=toDate(reg_time),0,amount)),null) as da9,
  126. if(dt<subtractDays(today(), 8),sum(if(subtractDays(date, 10)>=toDate(reg_time),0,amount)),null) as da10,
  127. if(dt<subtractDays(today(), 9),sum(if(subtractDays(date, 11)>=toDate(reg_time),0,amount)),null) as da11,
  128. if(dt<subtractDays(today(), 10),sum(if(subtractDays(date, 12)>=toDate(reg_time),0,amount)),null) as da12,
  129. if(dt<subtractDays(today(), 11),sum(if(subtractDays(date, 13)>=toDate(reg_time),0,amount)),null) as da13,
  130. if(dt<subtractDays(today(), 12),sum(if(subtractDays(date, 14)>=toDate(reg_time),0,amount)),null) as da14,
  131. if(dt<subtractDays(today(), 13),sum(if(subtractDays(date, 15)>=toDate(reg_time),0,amount)),null) as da15,
  132. if(dt<subtractDays(today(), 14),sum(if(subtractDays(date, 16)>=toDate(reg_time),0,amount)),null) as da16,
  133. if(dt<subtractDays(today(), 15),sum(if(subtractDays(date, 17)>=toDate(reg_time),0,amount)),null) as da17,
  134. if(dt<subtractDays(today(), 16),sum(if(subtractDays(date, 18)>=toDate(reg_time),0,amount)),null) as da18,
  135. if(dt<subtractDays(today(), 17),sum(if(subtractDays(date, 19)>=toDate(reg_time),0,amount)),null) as da19,
  136. if(dt<subtractDays(today(), 18),sum(if(subtractDays(date, 20)>=toDate(reg_time),0,amount)),null) as da20,
  137. if(dt<subtractDays(today(), 19),sum(if(subtractDays(date, 21)>=toDate(reg_time),0,amount)),null) as da21,
  138. if(dt<subtractDays(today(), 20),sum(if(subtractDays(date, 22)>=toDate(reg_time),0,amount)),null) as da22,
  139. if(dt<subtractDays(today(), 21),sum(if(subtractDays(date, 23)>=toDate(reg_time),0,amount)),null) as da23,
  140. if(dt<subtractDays(today(), 22),sum(if(subtractDays(date, 24)>=toDate(reg_time),0,amount)),null) as da24,
  141. if(dt<subtractDays(today(), 23),sum(if(subtractDays(date, 25)>=toDate(reg_time),0,amount)),null) as da25,
  142. if(dt<subtractDays(today(), 24),sum(if(subtractDays(date, 26)>=toDate(reg_time),0,amount)),null) as da26,
  143. if(dt<subtractDays(today(), 25),sum(if(subtractDays(date, 27)>=toDate(reg_time),0,amount)),null) as da27,
  144. if(dt<subtractDays(today(), 26),sum(if(subtractDays(date, 28)>=toDate(reg_time),0,amount)),null) as da28,
  145. if(dt<subtractDays(today(), 27),sum(if(subtractDays(date, 29)>=toDate(reg_time),0,amount)),null) as da29,
  146. if(dt<subtractDays(today(), 28),sum(if(subtractDays(date, 30)>=toDate(reg_time),0,amount)),null) as da30,
  147. if(dt<subtractDays(today(), 29),sum(if(subtractDays(date, 31)>=toDate(reg_time),0,amount)),null) as da31,
  148. if(dt<subtractDays(today(), 30),sum(if(subtractDays(date, 32)>=toDate(reg_time),0,amount)),null) as da32,
  149. if(dt<subtractDays(today(), 31),sum(if(subtractDays(date, 33)>=toDate(reg_time),0,amount)),null) as da33,
  150. if(dt<subtractDays(today(), 32),sum(if(subtractDays(date, 34)>=toDate(reg_time),0,amount)),null) as da34,
  151. if(dt<subtractDays(today(), 33),sum(if(subtractDays(date, 35)>=toDate(reg_time),0,amount)),null) as da35,
  152. if(dt<subtractDays(today(), 34),sum(if(subtractDays(date, 36)>=toDate(reg_time),0,amount)),null) as da36,
  153. if(dt<subtractDays(today(), 35),sum(if(subtractDays(date, 37)>=toDate(reg_time),0,amount)),null) as da37,
  154. if(dt<subtractDays(today(), 36),sum(if(subtractDays(date, 38)>=toDate(reg_time),0,amount)),null) as da38,
  155. if(dt<subtractDays(today(), 37),sum(if(subtractDays(date, 39)>=toDate(reg_time),0,amount)),null) as da39,
  156. if(dt<subtractDays(today(), 38),sum(if(subtractDays(date, 40)>=toDate(reg_time),0,amount)),null) as da40,
  157. if(dt<subtractDays(today(), 39),sum(if(subtractDays(date, 41)>=toDate(reg_time),0,amount)),null) as da41,
  158. if(dt<subtractDays(today(), 40),sum(if(subtractDays(date, 42)>=toDate(reg_time),0,amount)),null) as da42,
  159. if(dt<subtractDays(today(), 41),sum(if(subtractDays(date, 43)>=toDate(reg_time),0,amount)),null) as da43,
  160. if(dt<subtractDays(today(), 42),sum(if(subtractDays(date, 44)>=toDate(reg_time),0,amount)),null) as da44,
  161. if(dt<subtractDays(today(), 43),sum(if(subtractDays(date, 45)>=toDate(reg_time),0,amount)),null) as da45,
  162. if(dt<subtractDays(today(), 44),sum(if(subtractDays(date, 46)>=toDate(reg_time),0,amount)),null) as da46,
  163. if(dt<subtractDays(today(), 45),sum(if(subtractDays(date, 47)>=toDate(reg_time),0,amount)),null) as da47,
  164. if(dt<subtractDays(today(), 46),sum(if(subtractDays(date, 48)>=toDate(reg_time),0,amount)),null) as da48,
  165. if(dt<subtractDays(today(), 47),sum(if(subtractDays(date, 49)>=toDate(reg_time),0,amount)),null) as da49,
  166. if(dt<subtractDays(today(), 48),sum(if(subtractDays(date, 50)>=toDate(reg_time),0,amount)),null) as da50,
  167. if(dt<subtractDays(today(), 49),sum(if(subtractDays(date, 51)>=toDate(reg_time),0,amount)),null) as da51,
  168. if(dt<subtractDays(today(), 50),sum(if(subtractDays(date, 52)>=toDate(reg_time),0,amount)),null) as da52,
  169. if(dt<subtractDays(today(), 51),sum(if(subtractDays(date, 53)>=toDate(reg_time),0,amount)),null) as da53,
  170. if(dt<subtractDays(today(), 52),sum(if(subtractDays(date, 54)>=toDate(reg_time),0,amount)),null) as da54,
  171. if(dt<subtractDays(today(), 53),sum(if(subtractDays(date, 55)>=toDate(reg_time),0,amount)),null) as da55,
  172. if(dt<subtractDays(today(), 54),sum(if(subtractDays(date, 56)>=toDate(reg_time),0,amount)),null) as da56,
  173. if(dt<subtractDays(today(), 55),sum(if(subtractDays(date, 57)>=toDate(reg_time),0,amount)),null) as da57,
  174. if(dt<subtractDays(today(), 56),sum(if(subtractDays(date, 58)>=toDate(reg_time),0,amount)),null) as da58,
  175. if(dt<subtractDays(today(), 57), sum(if(subtractDays(date, 59)>=toDate(reg_time),0,amount)),null) as da59,
  176. if(dt<subtractDays(today(),58),sum(if(subtractDays(date, 60)>=toDate(reg_time),0,amount)),null) as da60,
  177. if(dt<subtractDays(today(), 88),sum(if(subtractDays(date, 90)>=toDate(reg_time),0,amount)),null) as dm3,
  178. if(dt<subtractDays(today(), 118),sum(if(subtractDays(date, 120)>=toDate(reg_time),0,amount)),null) as dm4,
  179. if(dt<subtractDays(today(), 148),sum(if(subtractDays(date, 150)>=toDate(reg_time),0,amount)),null) as dm5
  180. from game_data.order where status=2 and reg_time>'2019-03-18 00:00:00' group by toDate(formatDateTime(reg_time,'%Y-%m-%d')),channel """
  181. data = ck.execute(sql)
  182. isql = "insert into dw_channel_amount_daily values (%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s," \
  183. "%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s,%s)"
  184. db.dm.execute("truncate table dw_channel_amount_daily")
  185. db.dm.executeMany(isql, data)
  186. def dw_channel_amount_daily_reverse():
  187. sql = """
  188. select toDate(formatDateTime(reg_time,'%Y-%m-%d')) as dt,
  189. channel as channel,
  190. sum(if(date=today(),amount,0)) ba1,
  191. sum(if(addDays(date,1)=today(),amount,0)) ba2,
  192. sum(if(addDays(date,2)=today(),amount,0)) ba3,
  193. sum(if(addDays(date,3)=today(),amount,0)) ba4,
  194. sum(if(addDays(date,4)=today(),amount,0)) ba5,
  195. sum(if(addDays(date,6)=today(),amount,0)) ba6,
  196. sum(if(addDays(date,7)=today(),amount,0)) ba7
  197. from game_data.order where status=2 and reg_time>'2019-03-18 00:00:00' and date>=subtractDays(today(),7) group by toDate(formatDateTime(reg_time,'%Y-%m-%d')),channel"""
  198. data = ck.execute(sql)
  199. isql = "replace into dw_channel_amount_daily_reverse values (%s,%s,%s,%s,%s,%s,%s,%s,%s)"
  200. db.dm.execute("truncate table dw_channel_amount_daily_reverse")
  201. db.dm.executeMany(isql, data)
  202. def del_channel():
  203. sql = 'delete from dw_channel where channel in ("腾云文渊", "青渊文学", "玉竹文渊", "赤瞳伴读","扶摇阅文")'
  204. db.dm.execute(sql)
  205. def dw_channel_daily():
  206. logging.info('公众号数据处理,开始')
  207. logging.info('run> dw_channel')
  208. logging.info('公众号基本数据处理,开始')
  209. dw_channel() # 公众号基本数据
  210. logging.info('公众号基本数据处理,结束')
  211. logging.info('用户激活数据处理,开始')
  212. dw_channel_user_daily() # 用户激活
  213. logging.info('用户激活数据处理,结束')
  214. logging.info('用户充值数据处理,开始')
  215. dw_channel_amount_daily() # 用户充值
  216. logging.info('用户充值数据处理,结束')
  217. logging.info('用户充值数据倒序处理,开始')
  218. dw_channel_amount_daily_reverse() # 用户充值倒序
  219. logging.info('用户充值数据倒序处理,结束')
  220. logging.info('删除代投,开始')
  221. del_channel() # 删除代投的号
  222. logging.info('删除代投,结束')
  223. logging.info('公众号数据处理,开始')
  224. if __name__ == '__main__':
  225. # dw_channel_daily()
  226. # dw_daily_channel()
  227. dw_channel()
  228. # dw_channel_amount_daily()
  229. # dw_channel_user_daily()
  230. # dw_channel_amount_daily_reverse()
  231. # dw_channel()
  232. # del_channel()