资源简介
修改用户名和密码后即可直接使用。爬取 VIP 章节需要账号已开通 VIP,免费章节可以随意爬取。
代码片段和文件信息
# -*- coding: utf-8 -*-
# @Time : 2019/5/19 17:53
# @Author : LM
import requests
from bs4 import BeautifulSoup
import json
import os
import datetime
class Spider(object):
def __init__(self, novel_name=None, login_name='17623609183', password='liangqi520'):
    """Set up the request headers, the target novel and the login credentials.

    Args:
        novel_name: Title of the novel to look up. When ``None`` (the
            default) a prompt is printed and the title is read from stdin.
        login_name: Account name stored in ``self.loginName``.
        password: Account password stored in ``self.password``.
    """
    # NOTE(review): the default credentials are kept only so existing
    # ``Spider()`` callers behave as before; prefer passing them explicitly
    # instead of keeping real account data in source.
    self.headers = {
        # Standard Chrome UA string; the comma in "KHTML, like Gecko" had
        # been lost together with the other commas in this file.
        'user-agent': (
            'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 '
            '(KHTML, like Gecko) Chrome/73.0.3683.86 Safari/537.36'
        ),
    }
    if novel_name is None:
        print('请输入要爬取的小说名')
        novel_name = input()
    self.novel_name = novel_name
    # Filled in by catalogue() once the novel has been found.
    self.chapters_url = ''
    self.download_url_ls = {}
    self.loginName = login_name
    self.password = password
def verify(self, now=None):
    """Exit the program when the hard-coded time limit has passed.

    The elapsed time is measured from 2019-05-20 01:00:00. If more than ten
    minutes have elapsed the process is terminated; otherwise a success
    message is printed. A clock reading earlier than the start time gives a
    negative elapsed time and therefore passes.

    Args:
        now: Naive ``datetime.datetime`` to check. Defaults to
            ``datetime.datetime.now()``.

    Raises:
        SystemExit: when more than ten minutes have elapsed.
    """
    if now is None:
        now = datetime.datetime.now()
    start_time = datetime.datetime.strptime('2019-05-20 01:00:00', '%Y-%m-%d %H:%M:%S')
    # total_seconds() includes whole days. ``timedelta.seconds`` is only the
    # sub-day remainder, which made the check pass again every 24 hours.
    elapsed_minutes = (now - start_time).total_seconds() / 60
    if elapsed_minutes > 10:
        # Same exception quit() raises, without relying on the helper that
        # the ``site`` module injects for interactive sessions.
        raise SystemExit
    print('验证成功')
def login(self):
    """Log in with ``self.loginName`` / ``self.password``.

    Posts the credentials to the passport endpoint and parses the reply as
    JSON.

    Returns:
        The ``requests.Session`` the login request was sent on when the
        reply's ``status.msg`` equals ``'succ'``; otherwise ``None`` after
        printing an error message.
    """
    payload = {
        'loginName': self.loginName,
        'password': self.password,
    }
    login_url = 'https://passport.17k.com/ck/user/login'
    session = requests.Session()
    try:
        html = session.post(url=login_url, data=payload, headers=self.headers).text
        json_data = json.loads(html)
        logged_in = json_data['status']['msg'] == 'succ'
    except Exception:
        # Do not leave the session's connections open when the request or
        # the reply parsing fails; the error itself still propagates.
        session.close()
        raise
    if logged_in:
        print('登陆成功,当前账户:{}'.format(self.loginName))
        return session
    # The session is useless without a successful login, so release it.
    session.close()
    print('用户名或者密码错误')
    return None
def catalogue(self):
    """Search for ``self.novel_name`` and record its chapter-list URL.

    Fetches the search page and scans every element with class
    ``textmiddle``. On the first result whose link text equals the requested
    title, a success message is printed and ``self.chapters_url`` is set.
    If no result matches, a failure message is printed and
    ``self.chapters_url`` is left unchanged.
    """
    url = 'https://search.17k.com/search.xhtml?c.st=0&c.q=' + self.novel_name
    html = requests.get(url=url, headers=self.headers).text
    soup = BeautifulSoup(html, 'lxml')
    for entry in soup.find_all(attrs={'class': 'textmiddle'}):
        links = entry.select(' dl > dt > a')
        if not links:
            # A result block without a title link cannot match; skip it
            # rather than failing with IndexError.
            continue
        info = links[0]
        if info.get_text().strip() != self.novel_name:
            continue
        print('{}:查找成功'.format(self.novel_name))
        # Presumably the href is protocol-relative ("//host/book/..."): the
        # first two characters are dropped and "https://" is prepended, then
        # "book" is swapped for "list" to reach the chapter listing.
        self.chapters_url = 'https://' + info.get('href')[2:].replace('book', 'list')
        break
    else:
        # Runs only when the loop finished without a match, so the failure
        # message no longer appears alongside a successful lookup.
        print('查找失败,不存在该小说或拼写错误')
def get_download_url(self):
html = requests.get(url=self.chapters_url headers=self.headers)
html.encoding = ‘utf-8‘
soup = BeautifulSoup(html.text ‘lxml‘)
volume = soup.find_all(‘dl‘ c 相关资源
- Python-BDD100K大规模多样化驾驶视频数据
- Instant Pygame for Python Game Development How
- Biopython Tutorial
- Think Python 2nd
- 一个小小的表白程序(python)
- Python课堂笔记(高淇400集第一季)
- 二级考试python试题12套(包括选择题和
- pywin32_python3.6_64位
- python+ selenium教程
- PycURL(Windows7/Win32)Python2.7安装包 P
- 英文原版-Scientific Computing with Python
- 7.图像风格迁移 基于深度学习 pyt
- 基于Python的学生管理系统
- A Byte of Python(简明Python教程)(第
- Python实例174946
- Python 人脸识别
- Python 人事管理系统
- 一个多线程智能爬虫,爬取网站小说
- 基于python-flask的个人博客系统
- 计算机视觉应用开发流程
- python 调用sftp断点续传文件
- python socket游戏
- 基于Python爬虫爬取天气预报信息
- python函数编程和讲解
- 顶点小说单本书爬虫.py
- Python开发的个人博客
- 基于python的三层神经网络模型搭建
- python实现自动操作windows应用
- python人脸识别(opencv)
- python 绘图(方形、线条、圆形)
川公网安备 51152502000135号
评论
共有 条评论