sports.py 1.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142
  1. # -*- coding: utf-8 -*-
  2. import scrapy
  3. import lxml.etree
  4. import pycomm
  5. class SportsSpider(scrapy.Spider):
  6. name = 'sports'
  7. allowed_domains = ['hg0088.com']
  8. # start_urls = ['http://hg0088.com/']
  9. custom_settings = {
  10. "Accept":"text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8",
  11. "Accept-Encoding":"gzip, deflate",
  12. "Accept-Language":"zh-CN,zh;q=0.8",
  13. "Cache-Control":"max-age=0",
  14. "Connection":"keep-alive",
  15. "Cookie":"OddType@21627573=H; protocolstr=http; gamePoint_21627573=2019-05-10%2A0%2A0; _ga=GA1.4.601418716.1557495256; _gid=GA1.4.1118061739.1557495256",
  16. "Host":"199.26.100.178",
  17. "USER_AGENT": "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 UBrowser/6.2.4098.3 Safari/537.36",
  18. }
  19. start_url= 'http://199.26.100.178/app/member/get_game_allbets.php'
  20. def start_requests(self):
  21. url=self.start_url
  22. form_data={
  23. "uid":"x5cx6y9fm21627573l266800",
  24. "langx":"zh-cn",
  25. "gtype":"FT",
  26. "showtype":"FT",
  27. "gid":"3701122",
  28. "ltype":"4",
  29. "date":pycomm.gmdate()
  30. }
  31. request = scrapy.FormRequest(url, formdata=form_data, callback=self.parse)
  32. yield request
  33. def parse(self, response):
  34. doc = lxml.etree.fromstring(response.body)
  35. print(doc.xpath('/serverresponse/game/gid//text()'))
  36. print(pycomm.getCache('conf'))
  37. pass