Joshua Wallace's Blog: Project #7

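For my seventh project, I wrote a program that scrapes real-estate listings from a webpage and prints the details of each one (address, price, bedrooms, bathrooms, square footage, and extra features) in the terminal.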

import requests
from bs4 import BeautifulSoup

# Download the listings page. The request sends a desktop Firefox User-agent
# header, and the timeout stops the script from waiting forever on a stalled
# connection.
r = requests.get(
    "http://www.pyclass.com/real-estate/rock-springs-wy/LCWYROCKSPRINGS/",
    headers={'User-agent': 'Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:61.0) Gecko/20100101 Firefox/61.0'},
    timeout=30,
)
c = r.content

soup = BeautifulSoup(c, "html.parser")

# Each <div class="propertyRow"> is handled as one listing.
listings = soup.find_all("div", {"class": "propertyRow"})


def print_field(lookup, missing="No Info"):
    """Print the value returned by ``lookup()``, or ``missing`` if it is absent.

    ``lookup`` is a zero-argument callable that digs one value out of a
    listing. When a tag is not present, ``find`` returns ``None`` (so the next
    attribute access raises ``AttributeError``), and indexing a too-short
    ``find_all`` result raises ``IndexError``. Only those two errors count as
    "missing"; anything else is left to propagate instead of being hidden.
    """
    try:
        value = lookup()
    except (AttributeError, IndexError):
        value = missing
    print(value)


# Pulling data from each listing and printing it in the terminal.

for listing in listings:
    # The address is split across two "propAddressCollapse" spans.
    address_spans = listing.find_all("span", {"class": "propAddressCollapse"})
    print_field(lambda: address_spans[0].text)
    print_field(lambda: address_spans[1].text)

    # The price text is padded with newlines and spaces; strip them out.
    print_field(
        lambda: listing.find("h4", {"class": "propPrice"})
        .text.replace("\n", "")
        .replace(" ", "")
    )

    # Beds, full baths, half baths and square footage each keep their value
    # in a <b> tag nested inside the corresponding span.
    print_field(lambda: listing.find("span", {"class": "infoBed"}).find("b").text)
    print_field(
        lambda: listing.find("span", {"class": "infoValueFullBath"}).find("b").text
    )
    print_field(
        lambda: listing.find("span", {"class": "infoValueHalfBath"}).find("b").text,
        missing="No half bath",
    )
    print_field(lambda: listing.find("span", {"class": "infoSqFt"}).find("b").text)

    # Extra features: within each column group, pair every "featureGroup"
    # span with the "featureName" span at the same position.
    for column_group in listing.find_all("div", {"class": "columnGroup"}):
        feature_groups = column_group.find_all("span", {"class": "featureGroup"})
        feature_names = column_group.find_all("span", {"class": "featureName"})
        for feature_group, feature_name in zip(feature_groups, feature_names):
            print(feature_group.text, feature_name.text)

    # Separator line between listings.
    print(" ")

Joshua Wallace's Blog

Wednesday, February 12, 2020

Project #7 - Web Scraper

No comments:

Post a Comment

Project #8 - Stock Tracking Graph

Search This Blog