import requests import os import time from bs4 import BeautifulSoup import lxml import re import io import sys #import json #sys.getdefaultencoding('utf8') #url = 'http://www.jmrgs.com/showinfo-121-65372-0.html#001' #url1 = 'http://www.jmrgs.com/showinfo-116-616650-0.html' fout = open('tongchuangjiaoqi.txt', 'w') url_li = [] ''' content = requests.get(url).text soup = BeautifulSoup(content,'lxml') print(content) ''' def get_chapter_url(): with open('xiaoshuo.txt') as f: for line in f: url_li.append(line.strip().split('" title=')[0].split('