在Scrapy中向ASMX Webservice发送Ajax请求

import json

import scrapy
from scrapy.http import FormRequest, Request
from scrapy.selector import Selector
from scrapy.utils.response import open_in_browser


class TestSpider(scrapy.Spider):
    """Query the Videcom flight-availability ASMX web service.

    Flow:
      1. ``parse``        - load the requirements page and re-submit its
                            ``frmChangePage`` form.
      2. ``after_parse``  - read the session id from the returned page and
                            POST a JSON search to the ASMX endpoint.
      3. ``after_search`` - dump the headers and open the result in a browser.
    """

    name = "test"
    allowed_domains = ['customer2.videcom.com']

    # Page that hosts the ASP.NET form; also used as the form's POST target.
    PANEL_URL = ('http://customer2.videcom.com/med-view/VARS/Public/'
                 'CustomerPanels/requirements.aspx?country=ng&lang=en')
    # JSON endpoint; the session id is appended as a query parameter.
    SEARCH_URL = ('http://customer2.videcom.com/med-view/VARS/Public/'
                  'WebServices/AvailabilityWS.asmx/GetFlightAvailability'
                  '?VarsSessionID=')

    start_urls = [PANEL_URL]

    @staticmethod
    def _hidden_value(response, field_id):
        """Return the ``value`` attribute of the element with id *field_id*.

        Returns ``None`` when the element is not present in *response*.
        """
        query = "//*[@id='%s']/@value" % field_id
        return Selector(response=response).xpath(query).extract_first()

    def parse(self, response):
        """Re-submit the page's ``frmChangePage`` form.

        The ``__VIEWSTATE`` value is read from the response that was just
        received rather than hard-coded, because ASP.NET rejects a view
        state that is stale.
        """
        # The original request posted an empty session id; keep doing so.
        form_data = {'VarsSessionID': ''}

        fresh_viewstate = self._hidden_value(response, '__VIEWSTATE')
        if fresh_viewstate is not None:
            # Set it explicitly in case from_response() fails to pick it up.
            form_data['__VIEWSTATE'] = fresh_viewstate

        yield FormRequest.from_response(
            response,
            formid='frmChangePage',
            formdata=form_data,
            method='POST',
            callback=self.after_parse,
            url=self.PANEL_URL,
        )

    def after_parse(self, response):
        """Extract the session id and POST the availability search as JSON."""
        print("====RESPONSE===")
        print(response.headers)
        print("==========")
        print(response.request.headers)
        print("==========")

        session_id = self._hidden_value(response, 'VarsSessionID')
        viewstate = self._hidden_value(response, '__VIEWSTATE')
        if session_id is None:
            # Without a session id the search URL cannot be built.
            self.logger.error("VarsSessionID not found in %s", response.url)
            return

        print("VarsSessionID: " + session_id)
        print("__VIEWSTATE: " + (viewstate or ''))

        payload = {
            "FormData": {
                'Origin': ['LOS'],
                'VarsSessionID': session_id,
                'Destination': ['ABV'],
                'DepartureDate': ['05-May-2017'],
                'ReturnDate': '',
                'Adults': '1',
                'Children': '0',
                'SmallChildren': '0',
                "Seniors": '0',
                "Students": '0',
                "Infants": '0',
                "Youths": '0',
                "Teachers": '0',
                "SeatedInfants": '0',
                "EVoucher": '',
                "recaptcha": 'SHOW',
                "SearchUser": 'PUBLIC',
                "SearchSource": "requirements",
            },
            "IsMMBChangeFlightMode": 'false',
        }
        headers = {
            'Accept': 'application/json, text/javascript, */*',
            'Accept-Encoding': 'gzip, deflate, br',
            'accept-language': 'en_US',
            'Connection': 'keep-alive',
            'content-type': 'application/json',
            'User-Agent': ("Mozilla/5.0 (Macintosh; Intel Mac OS X 10_12_3) "
                           "AppleWebKit/537.36 (KHTML, like Gecko) "
                           "Chrome/57.0.2987.133 Safari/537.36"),
        }

        # A header value must be a string, so the cookie is passed through
        # the dedicated ``cookies`` argument instead of a dict-valued
        # 'Cookie' header.
        # NOTE(review): confirm the service actually expects this cookie.
        yield Request(
            self.SEARCH_URL + session_id,
            callback=self.after_search,
            method='POST',
            body=json.dumps(payload),
            headers=headers,
            cookies={'VarsSessionID': session_id},
        )

    def after_search(self, response):
        """Print response/request headers and open the result in a browser."""
        print("========SEARCH HEADERS========")
        print(response.headers)
        print(response.request.headers)
        open_in_browser(response)

1条回答

网友

1楼 · 发布于 2024-10-01 11:19:51

将请求中硬编码的__VIEWSTATE参数替换为从当前响应中提取的最新（“fresh”）值。

__VIEWSTATE在获取一段时间之后就会失效。

有时在ASP网站上，FormRequest.from_response无法正确捕获此参数，因此您可能需要检查response.body，以了解如何提取__VIEWSTATE。

下面是一个很好的例子：https://blog.scrapinghub.com/2016/04/20/scrapy-tips-from-the-pros-april-2016-edition/

相关问题更多 >

编程相关推荐

热门问题

热门文章