Note that there are some explanatory texts on larger screens.

plurals
  1. PO
    text
    copied!<p>Check this out; here is an exact solution.</p> <p>The parse method selects 50 products per page.</p> <p>The page_rs_50 method handles pagination.</p> <pre><code>start_urls = ['http://www.e3050.com/Items.aspx?cat=SON'] pro_urls = [] # all product Urls def parse(self, response): # select 50 products on each page yield FormRequest.from_response(response, formdata={'ctl00$ctl00$ContentPlaceHolder1$ItemListPlaceHolder$pagesddl': '50', 'ctl00$ctl00$ContentPlaceHolder1$ItemListPlaceHolder$sortddl': 'Price(ASC)'}, meta={'curr': 1, 'total': 0, 'flag': True}, dont_click=True, callback=self.page_rs_50) def page_rs_50(self, response): # paginate the pages hxs = HtmlXPathSelector(response) curr = int(response.request.meta['curr']) total = int(response.request.meta['total']) flag = response.request.meta['flag'] self.pro_urls.extend(hxs.select( "//td[@class='name']//a[contains(@id,'ctl00_ctl00_ContentPlaceHolder1_ItemListPlaceHolder_itemslv_ctrl')]/@href" ).extract()) if flag: total = hxs.select( "//span[@id='ctl00_ctl00_ContentPlaceHolder1_ItemListPlaceHolder_lbl_pagesizeBtm']/text()").re('\d+')[0] if curr &lt; total: curr += 1 yield FormRequest.from_response(response, formdata={'ctl00$ctl00$ContentPlaceHolder1$ItemListPlaceHolder$pagesddl': '50', 'ctl00$ctl00$ContentPlaceHolder1$ItemListPlaceHolder$sortddl': 'Price(ASC)', 'ctl00$ctl00$ScriptManager1': 'ctl00$ctl00$ScriptManager1|ctl00$ctl00$ContentPlaceHolder1$ItemListPlaceHolder$pager1$ctl00$ctl01' , '__EVENTTARGET': 'ctl00$ctl00$ContentPlaceHolder1$ItemListPlaceHolder$pager1$ctl00$ctl01', 'ctl00$ctl00$ContentPlaceHolder1$ItemListPlaceHolder$hfVSFileName': hxs.select( ".//input[@id='ctl00_ctl00_ContentPlaceHolder1_ItemListPlaceHolder_hfVSFileName']/@value").extract()[ 0]}, meta={'curr': curr, 'total': total, 'flag': False}, dont_click=True, callback=self.page_rs_50 ) else: for pro in self.pro_urls: yield Request("http://www.e3050.com/%s" % pro, callback=self.parse_product) def parse_product(self, response): pass #TODO 
Implementation Required For Parsing </code></pre>
 

Querying!

 
Guidance

SQuiL has stopped working due to an internal error.

If you are curious, you may find further information in the browser console, which is accessible through the devtools (F12).

Reload