roll_bangqiu.py 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238
  1. #!/usr/bin/env python
  2. # -*- coding: utf-8 -*-
  3. import datetime
  4. import jsonpath
  5. __author__ = 'ethereal'
  6. __mtime__ = '2019/4/16'
  7. # -*- coding: utf-8 -*-
  8. import json
  9. import scrapy
  10. from scrapy.http import Request
  11. from ..items import Roll_Bangqiu
  12. class BqrangqiuSpider(scrapy.Spider):
  13. name = 'roll_bangqiu'
  14. to_day = datetime.datetime.now()
  15. allowed_domains = ['hg3535z.com']
  16. custom_settings = {
  17. "ITEM_PIPELINES": {
  18. "hg3535.pipeline.Roll_Banqiupipeline": 300,
  19. },
  20. # 'LOG_LEVEL': 'DEBUG',
  21. # 'LOG_FILE': "../hg3535/log/roll_bangqiu_{}_{}_{}.log".format(to_day.year, to_day.month, to_day.day)
  22. }
  23. start_urls = ['https://hg3535z.com/odds2/d/getodds?sid=4&pt=4&ubt=am&pn=0&sb=2&dc=null&pid=0'] # 滚球菜单 棒球滚球列url
  24. # start_urls = ['http://hg3535z.com/odds2/d/getodds?sid=3&pt=4&ubt=am&pn=0&sb=2&dc=null&pid=0'] # 滚球菜单 网球测试滚球列url
  25. # start_urls = ['https://www.baidu.com']
  26. def parse(self, response):
  27. datas = json.loads(response.text)
  28. # urls = "https://www.baidu.com"
  29. # yield Request(url=urls,callback=self.parse_each)
  30. # datas ={"i": ["true", 4, 3110520, 2, 1, "sh", 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, "14 / 04", "", "", "false", "true", "\u68d2\u7403", 0], "eg": {"c": {"k": 29400, "n": "\u7f8e\u56fd\u804c\u4e1a\u68d2\u7403"}, "es": [{"dbg": "false", "egid": 0, "g": "", "i": ["\u4e9a\u7279\u5170\u5927\u52c7\u58eb\u961f", "\u7ebd\u7ea6\u5927\u90fd\u4f1a\u961f", "9", "True", "14 / 04", "", "9", "False", "0", "0", "2", "1", "", "", "", "", 0, "", "", 16, "True"], "ibs": "true", "ibsc": "false", "k": 3110520, "o": {"ah": {"s": 1, "v": ["h3164784133", "-1.5", "h3164784134", "+1.5", "o3164784133", "1.33", "o3164784134", "0.55"], "n": "\u6eda\u7403 \u8ba9\u7403"}, "ou": {"s": 2, "v": ["h3164784135", "6.5", "h3164784136", "6.5", "o3164784135", "0.70", "o3164784136", "1.04"], "n": "\u603b\u5f97\u5206:\u6eda\u7403 \u5927 / \u5c0f"}, "oe": {"s": 6, "v": ["o3164784137", "0.51", "o3164784138", "1.58"], "n": "\u603b\u5f97\u5206:\u6eda\u7403 \u5355 / \u53cc"}, "ml": {"s": 5, "v": ["o3164784139", "0.00", "o3164784140", "0.00"], "n": "\u6eda\u7403 \u72ec\u8d62\u76d8"}}, "p-o": [{"n": "\u51c0\u80dc\u7403\u6570", "st": "ha", "mgk": 9, "s": 7, "k": 301, "o": [["\u4e9a\u7279\u5170\u5927\u52c7\u58eb\u961f-\u8d62\u5f971\u5206", "o3164784186", "3.15", "0"], ["\u4e9a\u7279\u5170\u5927\u52c7\u58eb\u961f-\u8d62\u5f972\u5206", "o3164784187", "5.5", "3"], ["\u4e9a\u7279\u5170\u5927\u52c7\u58eb\u961f-\u8d62\u5f973\u5206", "o3164784188", "9.5", "6"], ["\u4e9a\u7279\u5170\u5927\u52c7\u58eb\u961f-\u8d62\u5f974\u5206\u6216\u66f4\u591a", "o3164784189", "7.5", "9"], ["\u7ebd\u7ea6\u5927\u90fd\u4f1a\u961f-\u8d62\u5f971\u5206", "o3164784190", "5.0", "2"], ["\u7ebd\u7ea6\u5927\u90fd\u4f1a\u961f-\u8d62\u5f972\u5206", "o3164784191", "7.5", "5"], ["\u7ebd\u7ea6\u5927\u90fd\u4f1a\u961f-\u8d62\u5f973\u5206", "o3164784192", "11.5", "8"], ["\u7ebd\u7ea6\u5927\u90fd\u4f1a\u961f-\u8d62\u5f974\u5206\u6216\u66f4\u591a", "o3164784193", "10.0", "11"]]}, {"n": "\u7b2c6\u5c40\u83b7\u80dc\u8005", "st": "ha", "mgk": 0, "s": 3000, "k": 4000, "o": [["\u548c\u5c40", "o3164784213", "1.50"], ["\u4e9a\u7279\u5170\u5927\u52c7\u58eb\u961f", "o3164784214", "5.5"], ["\u7ebd\u7ea6\u5927\u90fd\u4f1a\u961f", "o3164784215", "3.80"]]}, {"n": "\u52a0\u65f6", "st": "ha", "mgk": 312, "s": 8, "k": 13520, "o": [["\u662f", "o3164784228", "6.0"], ["\u4e0d\u662f", "o3164784229", "1.09"]]}], "pci": {"ctid": 0}, "sb": {"fb": "false", "sb": "false", "tb": "false", "ot": 0, "ps": [{"adv": -1, "a": 1.0, "e": 3110520, "h": 2.0, "p": "ft"}, {"adv": -1, "a": 0.0, "e": 3110520, "h": 0.0, "p": "ot"}, {"adv": -1, "a": 0.0, "e": 3110520, "h": 0.0, "p": "i1"}, {"adv": -1, "a": 1.0, "e": 3110520, "h": 1.0, "p": "i2"}, {"adv": -1, "a": 0.0, "e": 3110520, "h": 1.0, "p": "i3"}, {"adv": -1, "a": 0.0, "e": 3110520, "h": 0.0, "p": "i4"}, {"adv": -1, "a": 0.0, "e": 3110520, "h": 0.0, "p": "i5"}, {"adv": -1, "a": 0.0, "e": 3110520, "h": 0.0, "p": "i6"}, {"adv": -1, "a": 0.0, "e": 3110520, "h": 0.0, "p": "i7"}, {"adv": -1, "a": 0.0, "e": 3110520, "h": 0.0, "p": "i8"}, {"adv": -1, "a": 0.0, "e": 3110520, "h": 0.0, "p": "i9"}], "a": 1, "h": 2, "k": 3110520, "iwd": "false", "ls": -1, "s": 1, "ts": 0, "tt": 0, "ct": "00:00", "cp": "i5"}, "egn": ""}, {"dbg": "false", "egid": 0, "g": "", "i": ["ATL Braves - Team Runs - Over", "ATL Braves - Team Runs - Under", "9", "True", "14 / 04", "", "9", "False", "0", "0", "2", "0", "", "", "", "", 0, "", "", 16, "True"], "ibs": "true", "ibsc": "false", "k": 3110522, "o": {"ou": {"s": 3, "v": ["h3164784242", "3.5", "h3164784243", "3.5", "o3164784242", "1.12", "o3164784243", "0.63"], "n": "\u7403\u961f\u5f97\u5206:\u4e9a\u7279\u5170\u5927\u52c7\u58eb\u961f-\u6eda\u7403 \u5927 / \u5c0f"}}, "pci": {"ctid": 208, "ctn": "\u7403\u961f\u5f97\u5206"}, "egn": ""}, {"dbg": "false", "egid": 0, "g": "", "i": ["NY Mets - Team Runs - Over", "NY Mets - Team Runs - Under", "9", "True", "14 / 04", "", "9", "False", "0", "0", "1", "0", "", "", "", "", 0, "", "", 16, "True"], "ibs": "true", "ibsc": "false", "k": 3110524, "o": {"ou": {"s": 4, "v": ["h3164784261", "2.5", "h3164784263", "2.5", "o3164784261", "0.55", "o3164784263", "1.23"], "n": "\u7403\u961f\u5f97\u5206:\u7ebd\u7ea6\u5927\u90fd\u4f1a\u961f-\u6eda\u7403 \u5927 / \u5c0f"}}, "pci": {"ctid": 209, "ctn": "\u7403\u961f\u5f97\u5206"}, "egn": ""}]}, "ot": 2, "sc": {"3110520": {"a": 1, "h": 2}, "3110522": {"a": 0, "h": 2}, "3110524": {"a": 0, "h": 1}}, "v": 40576}
  31. # item = Today_all()
  32. ids = jsonpath.jsonpath(datas, '$..i-ot[0]..egs..es..i[16]') # ids新列表
  33. print(ids)
  34. if ids:
  35. ids = set(ids)
  36. for i in ids:
  37. urls = 'https://hg3535z.com/odds2/d/getamodds?eid={}&iip=true&ubt=am&isp=false'.format(i)
  38. print(urls)
  39. yield Request(url=urls, callback=self.parse_each, dont_filter=True)
  40. def parse_each(self, response):
  41. datas = json.loads(response.text)
  42. # 倒三角形 sa向下,sh向上
  43. triangle = datas['i'][5]
  44. try:
  45. # new_datas = json.loads(response.text)['eg']
  46. new_datas = datas['eg']
  47. except:
  48. new_datas = ""
  49. try:
  50. pt = response.meta['pt']
  51. except:
  52. pt = 0
  53. if new_datas:
  54. # 联赛id
  55. league_id = new_datas["c"]["k"]
  56. # 联赛名
  57. league_name = new_datas["c"]["n"]
  58. new_data = new_datas["es"]
  59. for result in new_data:
  60. if result['pci']["ctid"] == 0:
  61. item = Roll_Bangqiu()
  62. # 比赛id
  63. game_id = str(result['k'])
  64. # 球队1
  65. team_home = result['i'][0]
  66. # 球队2
  67. team_guest = result['i'][1]
  68. # 数量(97>)
  69. number = result['i'][2]
  70. # 比赛状态
  71. zhuangtai = result['i'][3]
  72. # 日期
  73. data_game = result['i'][4]
  74. # 开赛时间
  75. time_game = result['i'][5]
  76. # 队1分数
  77. score_home1 = result['i'][10]
  78. # 队2分数
  79. score_guest1 = result['i'][11]
  80. # 第几盘
  81. # jijie = result['i'][12]
  82. # 球队得分
  83. qiudui = result['pci'].get('ctn', "")
  84. # 是否出局 不一定存在
  85. ot = result['sb'].get("ot", "")
  86. ps_list = result['sb']['ps']
  87. # 右菱形bool值
  88. fb = result['sb']['fb']
  89. # 左菱形bool值
  90. tb = result['sb']['tb']
  91. # 上菱形bool值
  92. sb = result['sb']['tb']
  93. # 局数或者节或者分
  94. cp = result['sb']['cp']
  95. # 第一个队伍
  96. a = result['sb']['a']
  97. # 第二个队伍
  98. h = result['sb']['h']
  99. d = {}
  100. d['ps'] = ps_list
  101. d['cp'] = cp
  102. d['ot'] = ot
  103. d['triangle'] = triangle
  104. d['fb'] = fb
  105. d['tb'] = tb
  106. d['sb'] = sb
  107. # --------------------------------------------------让球分割线-----------------------------------------------------------
  108. concedes_dict = {}
  109. concedes_dict_rule = {}
  110. try:
  111. concedes = result['o']["ah"]["v"]
  112. concedes_dict_rule['concede_home'] = concedes[1]
  113. concedes_dict['concede_home'] = concedes[5]
  114. concedes_dict_rule['concede_guest'] = concedes[3]
  115. concedes_dict['concede_guest'] = concedes[7]
  116. except:
  117. concedes_dict_rule['concede_home'] = ""
  118. concedes_dict['concede_home'] = ""
  119. concedes_dict_rule['concede_guest'] = ""
  120. concedes_dict['concede_guest'] = ""
  121. # 让球 前5局-------------------------------------------------------------------------------------------------------------
  122. try:
  123. concedes = result['o']["ahf5in"]["v"]
  124. concedes_dict_rule['five_concede_home'] = concedes[1]
  125. concedes_dict['five_concede_home'] = concedes[5]
  126. concedes_dict_rule['five_concede_guest'] = concedes[3]
  127. concedes_dict['five_concede_guest'] = concedes[7]
  128. except:
  129. concedes_dict_rule['five_concede_home'] = ""
  130. concedes_dict['five_concede_home'] = ""
  131. concedes_dict_rule['five_concede_guest'] = ""
  132. concedes_dict['five_concede_guest'] = ""
  133. # ---------------------------------------------------独赢----------------------------------------------------------------
  134. capots_dict = {}
  135. try:
  136. capots = result['o']["ml"]["v"]
  137. capots_dict['capot_home'] = capots[1]
  138. capots_dict['capot_guest'] = capots[3]
  139. except:
  140. capots_dict['capot_home'] = ""
  141. capots_dict['capot_guest'] = ""
  142. # ---------------------------------------------------总得分:大/小--------------------------------------------------------
  143. total_size_dict = {}
  144. total_size_dict_rule = {}
  145. try:
  146. total_sizes = result['o']["ou"]["v"]
  147. total_size_dict_rule['total_size_big'] = total_sizes[1]
  148. total_size_dict['total_size_big'] = total_sizes[5]
  149. total_size_dict_rule['total_size_small'] = total_sizes[3]
  150. total_size_dict['total_size_small'] = total_sizes[7]
  151. except:
  152. total_size_dict_rule['total_size_big'] = ""
  153. total_size_dict['total_size_big'] = ""
  154. total_size_dict_rule['total_size_small'] = ""
  155. total_size_dict['total_size_small'] = ""
  156. # 总得分: 大/小 前5局-----------------------------------------------------------------------------------------------------
  157. try:
  158. total_sizes = result['o']["ouf5in"]["v"]
  159. total_size_dict_rule['five_total_size_big'] = total_sizes[1]
  160. total_size_dict['five_total_size_big'] = total_sizes[5]
  161. total_size_dict_rule['five_total_size_small'] = total_sizes[3]
  162. total_size_dict['five_total_size_small'] = total_sizes[7]
  163. except:
  164. total_size_dict_rule['five_total_size_big'] = ""
  165. total_size_dict['five_total_size_big'] = ""
  166. total_size_dict_rule['five_total_size_small'] = ""
  167. total_size_dict['five_total_size_small'] = ""
  168. # ------------------------------------------------------总得分:单/双-----------------------------------------------------
  169. odd_evens_dict = {}
  170. odd_evens_dict_rule = {}
  171. try:
  172. odd_evens = result['o']["oe"]["v"]
  173. # 上半场 主队让球条件
  174. odd_evens_dict['two_sides_single'] = odd_evens[1]
  175. odd_evens_dict_rule['two_sides_single'] = "单"
  176. odd_evens_dict['two_sides_double'] = odd_evens[3]
  177. odd_evens_dict_rule['two_sides_double'] = "双"
  178. except:
  179. odd_evens_dict['two_sides_single'] = ""
  180. odd_evens_dict['two_sides_double'] = ""
  181. odd_evens_dict_rule['two_sides_single'] = ""
  182. odd_evens_dict_rule['two_sides_double'] = ""
  183. # 联赛id
  184. item['league_id'] = league_id
  185. # 联赛名
  186. item['league_name'] = league_name
  187. # 比赛id
  188. item['game_id'] = game_id
  189. # 球队1
  190. item['team_home'] = team_home
  191. # 球队2
  192. item['team_guest'] = team_guest
  193. # 数量(97>)
  194. item['number'] = number
  195. # 比赛状态
  196. item['zhuangtai'] = zhuangtai
  197. # 日期
  198. item['data_game'] = data_game
  199. # 开赛时间
  200. item['time_game'] = time_game
  201. # 队1分数
  202. item['score_home'] = score_home1
  203. # 队2分数
  204. item['score_guest'] = score_guest1
  205. # 第几节
  206. item['jijie'] = cp
  207. item['pt'] = pt
  208. # 球队得分
  209. item['qiudui'] = "{}:{}".format(a, h)
  210. # 让球
  211. item['concedes_dict'] = concedes_dict
  212. item['concedes_dict_rule'] = concedes_dict_rule
  213. # 独赢
  214. item['capots_dict'] = capots_dict
  215. # 总得分:大/小
  216. item['total_size_dict'] = total_size_dict
  217. item['total_size_dict_rule'] = total_size_dict_rule
  218. # 总得分:单/双
  219. item['odd_evens_dict'] = odd_evens_dict
  220. item['odd_evens_dict_rule'] = odd_evens_dict_rule
  221. item['match_score_dict'] = d
  222. yield item