我有以下代码:
import datetime
import os
import re
import time
import urllib.error
import urllib.request
#from urllib.request import request, urlopen
#from urllib import request

import numpy as np
import openpyxl
import pandas as pd
from bs4 import BeautifulSoup

# Fetch the iborrowdesk report page for every ticker and print the HTML
# tables that carry the report's CSS classes.
# NOTE(review): `symbols` is not defined in this snippet; it is assumed to be
# an iterable of ticker strings defined earlier -- confirm against the caller.
for symbol in symbols:
    #ua = UserAgent()
    url = "https://iborrowdesk.com/report/" + symbol
    # test urls: https://iborrowdesk.com/report/wmt
    print("Extracting Values for " + symbol + ".")
    try:
        # The context manager closes the HTTP response once it is parsed.
        with urllib.request.urlopen(url) as page:
            soup = BeautifulSoup(page, "html.parser", from_encoding="iso-8859-1")
    except urllib.error.URLError as exc:
        # HTTPError is a subclass of URLError, so this covers both network
        # failures and non-2xx responses. Report and move on to the next
        # ticker instead of aborting the whole run.
        print(f"Could not fetch {url}: {exc}")
        continue
    value_label_value = soup.find_all('table', {'class': 'table table-condensed table-hover'})
    print(value_label_value)
页面上的表格数据来自浏览器开发者工具“网络”(Network)选项卡中可以看到的API调用。您可以按如下方式重新创建该表:
import pandas as pd
import requests

# Query the JSON endpoint for one ticker directly instead of scraping HTML.
# A timeout keeps the call from hanging forever on an unresponsive server.
response = requests.get('https://iborrowdesk.com/api/ticker/wmt', timeout=30)
# Fail loudly on an HTTP error status rather than trying to decode an error
# page as JSON.
response.raise_for_status()
data = response.json()

# Build the table from the 'real_time' entry of the response payload.
df = pd.DataFrame(data['real_time'])
# In a notebook/REPL this bare expression displays the table; in a plain
# script use print(df) instead.
df