import requests
from bs4 import BeautifulSoup
import pandas as pd
import warnings
warnings.filterwarnings('ignore')

url = 'https://movie.naver.com/movie/running/current.naver'

# A timeout keeps the script from hanging forever on a stalled connection, and
# raise_for_status() stops us from silently parsing an HTTP error page.
resp = requests.get(url, timeout=10)
resp.raise_for_status()

# Name the parser explicitly so the parse tree does not depend on which
# optional parsers (lxml, html5lib) happen to be installed.
soup = BeautifulSoup(resp.text, 'html.parser')

# Probe the first <dl class="lst_dsc"> entry to check the selectors used by
# the full loop further down.
lst_dsc = soup.find_all('dl', class_='lst_dsc')[0]
dt_tit = lst_dsc.find('dt', class_='tit')
dl_info_star = lst_dsc.find('dl', class_='info_star')

# Look the rating spans up once instead of once per field.
nums = dl_info_star.find_all('span', class_='num')
net = nums[0].get_text()  # first span.num (presumably the audience rating)
# An entry may carry only one rating; fall back to None instead of raising
# IndexError on the second one (presumably the critics' rating).
gija = nums[1].get_text() if len(nums) > 1 else None
print(net)
print(gija)
# Build one row per <dl class="lst_dsc"> entry on the page.
lst_dsc = soup.find_all('dl', class_='lst_dsc')

# Rows are collected in a plain list and turned into a DataFrame once at the
# end: DataFrame.append was removed in pandas 2.0 and copied the whole frame
# on every call.
rows = []
for dsc in lst_dsc:
    dt_tit = dsc.find('dt', class_='tit')
    title = dt_tit.find('a').get_text()

    dl_info_star = dsc.find('dl', class_='info_star')
    nums = dl_info_star.find_all('span', class_='num')
    net = nums[0].get_text()

    # The second rating is only read when exactly two span.num elements are
    # present. Otherwise record NaN, so this movie does not inherit the value
    # left over from the previous iteration.
    gija = nums[1].get_text() if len(nums) == 2 else 'nan'

    rows.append({
        'title': title,
        'net': float(net),
        'gija': float(gija),  # float('nan') -> NaN for a missing rating
    })

# Explicit columns keep the frame's schema stable even when no entries matched.
df = pd.DataFrame(rows, columns=['title', 'net', 'gija'])
# Quick inspection of the scraped table: first rows, last rows, summary
# statistics for the two rating columns, then the frame's info() report.
# Only info() writes output on its own; the other results are discarded
# unless an interactive session displays them.
_rating_cols = ['gija', 'net']
df.head()
df.tail()
df[_rating_cols].describe()
df.info()