# -*- coding: utf-8 -*-
import requests
from lxml import etree#抽取数据,只写了爬前页,章节页没写
'''oop例子
class Pig:#大写
def eat(self):
print('Hello World')
t=Pig()
t.eat()
'''
class Spider(object):
def start_request(self):
response=requests.get('https://www.qidian.com/all')
html=response.content.decode()
dom=etree.HTML(html)
#标题xpath
Bigtit_list=dom.xpath('//div[@class="book-mid-info"]/h4/a/text()')
#print(Bigtit_list)
Bighref_list=dom.xpath('//div[@class="book-mid-info"]/h4/a/@href')
#print(Bighref_list)
#代码管理 一一对应zip
for Bigtit_list,Bighref_list in zip (Bigtit_list,Bighref_list):
print(Bigtit_list,Bighref_list)
def start_chapter(self,url):
response=requests.get(url)
html=response.content.decode()
dom=etree.HTML(html)
print(dom)
spider=Spider()
spider.start_request()
#spider.start_chapter('https://book.qidian.com/info/1009480992')