Spaces:

mdj1412
/

stock_news_summaries_AI

Runtime error

mdj1412

commit first

c109682 over 1 year ago

1.3 kB

	from bs4 import BeautifulSoup
	import urllib.request
	import pandas as pd

	# Wikipedia page that get_SP500() downloads and parses.
	url = "https://en.wikipedia.org/wiki/List_of_S%26P_500_companies"

	def get_SP500():
	    """Scrape the S&P 500 company table from the page at ``url``.

	    Downloads the page, locates the first table that carries both the
	    ``wikitable`` and ``sortable`` CSS classes, and converts every row
	    after the header row into a dict via ``return_comment_form``.

	    Returns:
	        list[dict]: One dict with the keys ``'ticker'``, ``'name'``,
	        ``'sector'`` and ``'industry'`` per table row, in page order.

	    Raises:
	        urllib.error.URLError: If the page cannot be downloaded.
	        ValueError: If the page contains no matching table.
	    """
	    # Fetch the HTML; the context manager closes the connection even when
	    # reading fails.
	    with urllib.request.urlopen(url) as response:
	        html = response.read()
	    soup = BeautifulSoup(html, 'html.parser')

	    # Select by CSS classes instead of the exact attribute string
	    # "wikitable sortable": an exact-string search stops matching as soon
	    # as the table carries any additional class.
	    table = soup.select_one("table.wikitable.sortable")
	    if table is None:
	        raise ValueError(f"No 'wikitable sortable' table found at {url}")

	    # The first <tr> holds the column headers, so it is skipped.
	    return [
	        return_comment_form(
	            get_ticker(row),
	            get_name(row),
	            get_sector(row),
	            get_industry(row),
	        )
	        for row in table.find_all("tr")[1:]
	    ]





	def return_comment_form(ticker, name, sector, industry):
	    """Bundle the four company fields into a single record dict.

	    Returns:
	        dict: ``{'ticker': ..., 'name': ..., 'sector': ..., 'industry': ...}``
	        with the arguments stored unchanged, in that key order.
	    """
	    return dict(ticker=ticker, name=name, sector=sector, industry=industry)






	def get_ticker(row):
	    """Return the whitespace-stripped text of the row's first ``<td>`` cell."""
	    cells = row.select('td')
	    return cells[0].text.strip()

	def get_name(row):
	    """Return the whitespace-stripped text of the row's second ``<td>`` cell."""
	    cells = row.select('td')
	    return cells[1].text.strip()

	def get_sector(row):
	    """Return the whitespace-stripped text of the row's fourth ``<td>`` cell."""
	    # NOTE(review): index 3 is hard-coded to the table layout (the cell at
	    # index 2 is skipped) - confirm it still points at the sector column.
	    cells = row.select('td')
	    return cells[3].text.strip()

	def get_industry(row):
	    """Return the whitespace-stripped text of the row's fifth ``<td>`` cell."""
	    # NOTE(review): index 4 is hard-coded to the table layout - confirm it
	    # still points at the industry column.
	    cells = row.select('td')
	    return cells[4].text.strip()




	if __name__ == '__main__':
	    # Manual smoke run: scrape the table and print it as a DataFrame.
	    sp500_records = get_SP500()
	    frame = pd.DataFrame(sp500_records)

	    print(frame)
	    print("Finish")