unstoppable_app / get_gun_endorsements.py
veeps
merging all endorsements into one file
cf66726
raw
history blame contribute delete
752 Bytes
from bs4 import BeautifulSoup
import pandas as pd
# Extract candidate names from a locally saved HTML page ("giffords.html")
# and write them, together with an endorser label, to a CSV file.

# Open and read the HTML file
with open("giffords.html", 'r', encoding='utf-8') as file:
    html_content = file.read()

# Parse the HTML content
soup = BeautifulSoup(html_content, 'html.parser')

# Find every card-title heading; the name is read from the link inside it.
h3 = soup.find_all('h3', class_='gif-card__title')

# Collect the stripped link text of each heading.
data = []
for heading in h3:
    anchor = heading.find('a')
    if anchor is None:
        # No link inside this heading, so there is no name to read; skip it
        # rather than failing with AttributeError on `None.text`.
        continue
    data.append(anchor.text.strip())

# Make dataframe. The column must be named explicitly: a DataFrame built from
# a plain list labels its only column 0, so the df["Candidate"] lookups below
# would otherwise raise KeyError.
df = pd.DataFrame(data, columns=["Candidate"])

# NOTE(review): the input is giffords.html, yet the label below and the output
# file name both refer to education endorsements. This looks like a leftover
# from another scraper -- confirm the intended values before merging outputs.
df["Endorsed by"] = "Education Votes"

# Clean candidate name. regex=False forces literal matching: interpreted as
# regular expressions, "(D)" would be a capture group (never matching the
# parentheses themselves) and the "." in "Rep. " would match any character.
df["Candidate"] = df["Candidate"].str.replace('\xa0(D)', '', regex=False)
df["Candidate"] = df["Candidate"].str.replace('Rep. ', '', regex=False)

# write to csv
df.to_csv("edu_endorsements.csv", index=False)