DataAnalysis/웹크롤링

쿠우쿠우 웹크롤링 전국매장 정보 가져오기 (beautifulsoup)

_DAMI 2022. 4. 22. 23:29
import requests
from bs4 import BeautifulSoup
import pandas as pd
import matplotlib.pyplot as plt
import matplotlib

# Scrape the QooQoo (쿠우쿠우) store-list board page by page and collect one
# [loc, name, addr, tel] row per store into `result`.
result = []
# Pages 1..7 are requested; the page count is hard-coded
# (TODO confirm it still matches the live board).
for pageNum in range(1, 8):
    url = f'http://www.qooqoo.co.kr/bbs/board.php?bo_table=storeship&&page={pageNum}'
    # Without a timeout a stalled connection would block forever; with one,
    # requests raises requests.exceptions.Timeout instead.
    response = requests.get(url, timeout=10)

    print('-------------------------- " ', pageNum)

    # Non-200 responses are reported and the page is skipped.
    if response.status_code != 200:
        print(response.status_code)
        continue

    html = response.content
    # The raw bytes are decoded as cp949 by the parser.
    soup = BeautifulSoup(html, 'html.parser', from_encoding='cp949')

    tbody = soup.find('tbody')
    if tbody is None:
        # No table body on this page (layout change, error page, ...):
        # report it instead of crashing on tbody.find_all below.
        print(f'page {pageNum}: no <tbody> found, skipping')
        continue

    # Only every other <tr> is read, starting with the first
    # (presumably the rows in between are not store entries -- verify
    # against the page markup).
    for tr in tbody.find_all('tr')[::2]:
        loc = tr.find('span', class_="color-grey").text  # region
        # The second <a> inside the subject cell carries the branch name.
        name = tr.find('div', class_="td-subject ellipsis").find_all('a')[1].text
        # NOTE(review): the original comments labelled `tel` as "address" and
        # `addr` as "number", contradicting the variable names. Confirm on the
        # live page which cell holds which value before trusting the columns.
        tel = tr.find('td', class_="hidden-xs").find('a').text
        addr = tr.find('td', class_="hidden-xs td-width").find('a').text
        result.append([loc, name, addr, tel])
        print(loc, name, addr, tel)

# Turn the scraped rows into a table and persist it as a cp949-encoded CSV.
# NOTE(review): the file name says "caffenbay" although the rows come from the
# QooQoo board -- looks like a leftover from another script; confirm before
# renaming, since other tooling may read this path.
pdResult = pd.DataFrame(data=result, columns=['loc', 'name', 'addr', 'tel'])
pdResult.to_csv(path_or_buf='caffenbay_stores.csv', encoding='cp949')

# Per-region summary: describe() is computed for each `loc` group and only the
# first column of that summary table is printed.
acount = pdResult.groupby(by=['loc']).describe()
print(acount.iloc[:, :1])