饿了么(同行门店榜单).py 8.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170
  1. # -*- coding: utf-8 -*-
  2. # @Time : 2023/3/7 11:03
  3. # @Author : Clown
  4. # @File : 饿了么(同行门店榜单).py
  5. # @Software : PyCharm
  6. from time import sleep
  7. import requests
  8. import random
  9. import os
  10. import sys
  11. from datetime import datetime,timedelta
  12. import json
  13. import pymysql
  14. import pandas as pd
  15. def linkTomySql(host, passwd, db_name, port):
  16. '''连接至数据库返回【db】,v2新增local_infile=1 打开文件导入权限'''
  17. try:
  18. # 本地连接为:localhost 服务器连接为:124.222.188.59
  19. db = pymysql.connect (
  20. host=host, user="root",
  21. passwd=passwd,
  22. db=db_name,
  23. charset='utf8mb4',
  24. local_infile=1,
  25. port=port)
  26. # print ('\nconnect to mysql server 成功')
  27. # print ('---------------------------------------')
  28. except:
  29. print ("\ncould not connect to mysql server")
  30. db = "连接失败"
  31. return db
  32. def read_key_value_pair(db, brand_name, wm_plate, owner):
  33. '''按条件读取,数据库中all_key_table表里的key_value_pair字段中的值,以键值对的形式输出
  34. db:数据库,
  35. brand_name:品牌名,
  36. wm_plate:外卖平台MEITUAN或ELEME,
  37. owner:账号权限all或one
  38. '''
  39. cursor = db.cursor ()
  40. sql = f'SELECT key_value_pair FROM all_key_table WHERE brand_name = "{brand_name}" AND wm_plate = "{wm_plate}" AND owner = "{owner}";'
  41. cursor.execute (sql)
  42. pair = json.loads (cursor.fetchall ()[0][0])
  43. return pair
  44. def get_shops_info_to_list(db, brand_name, wm_plate, key_name):
  45. '''获取门店信息表【shops_info_to_list】中的信息,
  46. 并返回表单shops_info_df【shop_id,shop_name,update_datetime,info_for_script】
  47. db:数据库信息
  48. brand_name:品牌
  49. wm_plate:外卖平台
  50. key_name:关键信息字段名,如无填‘’,如有填对应键值对的key
  51. '''
  52. cursor = db.cursor ()
  53. if key_name == '':
  54. sql = f'SELECT shop_id,shop_name,update_datetime FROM shops_info_for_script WHERE brand_name = "{brand_name}" AND wm_plate = "{wm_plate}";'
  55. cursor.execute (sql)
  56. shops_info = cursor.fetchall ()
  57. shops_info_df = []
  58. for shop_info in shops_info:
  59. shop_info_dict = {'shop_id': shop_info[0],
  60. 'shop_name': shop_info[1]}
  61. shops_info_df.append (shop_info_dict)
  62. return shops_info_df
  63. else:
  64. sql = f'SELECT shop_id,shop_name,update_datetime,info_for_script -> "$.{key_name}" FROM shops_info_for_script WHERE brand_name = "{brand_name}" AND wm_plate = "{wm_plate}";'
  65. cursor.execute (sql)
  66. shops_info = cursor.fetchall ()
  67. shops_info_df = []
  68. for shop_info in shops_info:
  69. shop_info_dict = {'shop_id': shop_info[0],
  70. 'shop_name': shop_info[1],
  71. 'update_datetime': shop_info[2],
  72. f'{key_name}': shop_info[3]}
  73. shops_info_df.append (shop_info_dict)
  74. return shops_info_df
  75. def rankDecs(dict_in):
  76. return dict_in['同行门店月售top10']
  77. if __name__ == '__main__':
  78. host = '124.222.188.59'
  79. passwd = '111...Clown'
  80. db_name = 'zuzu_data'
  81. port = 63306
  82. db = linkTomySql(host, passwd, db_name, port)
  83. brand_name = '浆小白'
  84. owner = 'all'
  85. keys_dict = {'elm':'',
  86. 'elm_shops':'',
  87. 'mt':'',
  88. 'mt_shops':''}
  89. keys_dict['elm'] = read_key_value_pair(db, brand_name, 'ELEME', owner)
  90. keys_dict['elm_shops'] = get_shops_info_to_list(db,brand_name,'ELEME','')
  91. keys_dict['mt'] = read_key_value_pair (db, brand_name, 'MEITUAN', owner)
  92. keys_dict['mt_shops'] = get_shops_info_to_list (db, brand_name, 'MEITUAN', '')
  93. try:
  94. ksid = keys_dict['elm'] ['data']['session']['ksid']
  95. elm_shops = keys_dict['elm_shops']
  96. # elm_shops = [{'shop_id':173858169,'shop_name':''},{'shop_id':507932892,'shop_name':''}]
  97. script_name = os.path.basename(sys.argv[0])
  98. beginTime = (datetime.today () + timedelta (days=-1)).strftime ('%Y-%m-%d') # 2022-06-23
  99. endTime = (datetime.today () + timedelta (days=-1)).strftime ('%Y-%m-%d') # 2022-06-23
  100. beginTime_int = int ((datetime.today () + timedelta (days=-1)).strftime ('%Y%m%d')) # 20220623
  101. endTime_int = int ((datetime.today () + timedelta (days=-1)).strftime ('%Y%m%d')) # 20220623
  102. downloadPath = f'F:/cppc/cppc_数据表/3每日爬虫数据/饿了么同行门店榜单/{beginTime_int}饿了么同行门店榜单.xlsx'
  103. df_out = []
  104. for shop in elm_shops:
  105. shop_id = shop['shop_id']
  106. shop_name = shop['shop_name']
  107. # print(ksid,shop_id)
  108. # # print(shop_name)
  109. sleep (random.uniform (0.5, 1.5))
  110. try:
  111. url = 'https://app-api.shop.ele.me/stats/invoke/?method=OrderStatsService.getIndustryShop'
  112. cookie = 'cna=sk9kGMYYSlkCAd9o1MY603L4; ubt_ssid=z4djmg7vis0sclouzk4dag3r05s2jj30_2021-03-04; perf_ssid=or3iygctea950e0ujr03rhb1lxtke9ms_2021-03-07; nrksid=MZZMNDMTA1MjU4MzA1NTA3NDAxT1Y1aXdxVzhQ; xlly_s=1; shopId='+str(shop_id)+'; ksid='+ksid+'; AEM_TAG_ID_CATCH_DATA_ES00000044={%22tagId%22:%22ES00000044%22%2C%22data%22:%22%E5%BF%AB%E9%A4%90%E4%BE%BF%E5%BD%93%22%2C%22userId%22:173858169%2C%22time%22:1678159125600}; AEM_TAG_ID_CATCH_DATA_ES00000069={%22tagId%22:%22ES00000069%22%2C%22data%22:%22%E8%80%81%E5%BA%97%22%2C%22userId%22:173858169%2C%22time%22:1678159125601}; AEM_TAG_ID_CATCH_DATA_ES00000035={%22tagId%22:%22ES00000035%22%2C%22data%22:%22%E8%80%81%E5%BA%97-%E4%B8%80%E8%88%AC%E5%93%81%E8%B4%A8%22%2C%22userId%22:173858169%2C%22time%22:1678159125601}; AEM_TAG_ID_CATCH_DATA_ES00000021={%22tagId%22:%22ES00000021%22%2C%22data%22:%22%E5%85%A8%E5%9B%BD%E8%BF%9E%E9%94%81%22%2C%22userId%22:173858169%2C%22time%22:1678159125601}; AEM_TAG_ID_CATCH_DATA_ES00000019={%22tagId%22:%22ES00000019%22%2C%22data%22:%22%E4%B8%8A%E6%B5%B7%22%2C%22userId%22:173858169%2C%22time%22:1678159125601}; tfstk=cptRBeO4vjcoG8ch0g308V_N3JOdaSGdG813vhyNM1b04jEbDsxkjhdxD46C__HA.; l=fBOyel_7jbqeT6mSBO5Ihurza779eIOb8oVzaNbMiIEGa6gCNFDj5OCsaGqeldtjgTCxnetrl5ZFzd3HkeUdaxDDBec6LmhInxv9xESPN; isg=BOHh1uRzIbZCUYn7wQVzgEex8K37jlWAM3q0MUO37-hVqgB8i9ilUBWoDN4sZu24'
  113. headers = {
  114. 'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/110.0.0.0 Safari/537.36',
  115. 'content-type': 'application/json',
  116. 'Cookie':cookie}
  117. params = {"id":"89F28423BA7B4882900E677683EA56E7|1678159334618",
  118. "metas":{"appName":"melody",
  119. "appVersion":"4.4.0",
  120. "ksid":ksid,
  121. "shopId":shop_id},
  122. "service":"OrderStatsService",
  123. "method":"getIndustryShop",
  124. "params":{"shopId":shop_id},"ncp":"2.0.0"}
  125. resp = requests.post(url,headers=headers,json=params).json()
  126. recentOrderNum_list = []
  127. for shop_rank_info in resp['result']:
  128. shop_dict = {'门店id':shop_id,
  129. '门店名称':shop_name,
  130. '商圈同行门店id':shop_rank_info['mShopId'],
  131. '商圈同行门店名称':shop_rank_info['mShopName'],
  132. '同行门店月售top10':shop_rank_info['recentOrderNum'],
  133. '同行门店评分':shop_rank_info['score']}
  134. recentOrderNum_list.append(shop_dict)
  135. recentOrderNum_list.sort(key=rankDecs,reverse=True)
  136. df_out.extend(recentOrderNum_list[:10])
  137. code = '成功'
  138. except Exception as e:
  139. shop_dict = {'门店id': shop_id,
  140. '门店名称': shop_name,
  141. '商圈同行门店id': '无数据',
  142. '商圈同行门店名称': '无数据',
  143. '同行门店月售top10': '无数据',
  144. '同行门店评分': '无数据'}
  145. df_out.append(shop_dict)
  146. code = e
  147. print(script_name,shop_id,shop_name,code)
  148. df_out = pd.DataFrame(df_out)
  149. df_out.to_excel(downloadPath)
  150. except Exception as e:
  151. print(e)