import urllib.request

import chardet


def main(url_list_path='D:\\urls.txt', output_pattern='D:\\url_%d.txt'):
    """Download every URL listed in a text file and save each page as text.

    The list file is read line by line, one URL per line. Each page is
    fetched, its character encoding is guessed with ``chardet``, and the
    decoded text is appended to a numbered output file.

    Args:
        url_list_path: Path of the text file containing one URL per line.
        output_pattern: ``%``-style pattern for output file names; it
            receives the 1-based index of the URL being saved.

    Raises:
        OSError: If the list file or an output file cannot be opened.
        urllib.error.URLError: If a page cannot be fetched.
        ValueError: If a line is not a valid URL.
    """
    count = 1
    with open(url_list_path) as url_file:
        for line in url_file:
            # Lines keep their trailing newline; a blank line would
            # otherwise reach urlopen() as an invalid, empty URL.
            url = line.strip()
            if not url:
                continue

            # Close the HTTP response as soon as the body has been read.
            with urllib.request.urlopen(url) as response:
                raw = response.read()

            # Detect the page encoding. chardet reports None when it
            # cannot decide (e.g. an empty body), so fall back to UTF-8.
            encoding = chardet.detect(raw)['encoding'] or 'utf-8'
            if encoding == 'GB2312':
                # GBK is a superset of GB2312 and decodes pages that are
                # labelled GB2312 but use characters outside it.
                encoding = 'GBK'

            # Decode; a wrong guess must not abort the whole batch, so
            # undecodable bytes are replaced rather than raising.
            text = raw.decode(encoding, errors='replace')

            # Output file name for this URL.
            file_name = output_pattern % count

            # Write the content (append mode, as in the original script).
            # errors='replace' keeps replacement characters produced above
            # from failing in codecs that cannot encode them.
            with open(file_name, 'a', encoding=encoding,
                      errors='replace') as out_file:
                out_file.write(text)

            count += 1


if __name__ == '__main__':
    main()