有一个包含链接的 9980 行文本文件。字典从这些页面中解析出来并写入表中。该程序运行良好,但只处理一半的链接。我不明白原因。告诉我有什么问题吗?
from openpyxl import Workbook
from openpyxl.worksheet.table import Table, TableStyleInfo
import requests
from bs4 import BeautifulSoup as bs
import json
num = int(1)
wb = Workbook()
ws = wb.active
ws.append(["Наименование организацтт", "ИНН", "Юридический адресс", "Дата регистрации", "Руководитель", "e-mail", "Номер телефона", "Номер факса", "Web-site"])
keys = 'fullName','inn','address','regDate','director','email','phoneNumber','faxNumber','webSiteUrl'
with open("data_links.txt", 'r') as links_file:
for link in links_file:
r = requests.get(links_file.readline())
soup = str(bs(r.text, "html.parser"))
data = json.loads(soup)
data = {k: data[k] for k in keys}
finish_data = []
for value in data.values():
finish_data.append(value)
ws.append(finish_data)
print(num)
num += 1
wb.save("Organizations.xlsx")