웹 크롤링/Web Crawling
[Web Crawling] 3. 정적페이지,html
by Jasonify97
2023. 2. 27.
import pandas as pd
import requests
from bs4 import BeautifulSoup
1. 웹페이지 분석: URL
# Search term whose related keywords will be collected.
query = '삼성전자'
# Search endpoint kept separate from the query string for readability.
search_endpoint = 'https://search.naver.com/search.naver'
url = f'{search_endpoint}?query={query}'
2. request > response(html)
# Fetch the search result page. Without a timeout, requests waits
# indefinitely on a stalled connection, so bound the wait explicitly.
response = requests.get(url, timeout=10)
# Fail loudly on 4xx/5xx instead of parsing an error page as if it
# were the search results.
response.raise_for_status()
3. str > bs object
# Parse the response body into a BeautifulSoup tree using the
# built-in 'html.parser' backend.
dom = BeautifulSoup(markup=response.text, features='html.parser')
4. bs object > css-selector > str
# CSS selector matching each <li> under the related-keywords list.
related_item_selector = '#nx_right_related_keywords > div > div.related_srch > ul > li'
elements = dom.select(related_item_selector)
# Look at the first match to check the selector before extracting all items.
element = elements[0]
# Text of the '.tit' node inside that first item (displayed when run in a notebook).
element.select_one('.tit').get_text()
5. str > dataframe
# Collect the text of the '.tit' node from every matched list item.
keywords = []
for item in elements:
    keywords.append(item.select_one('.tit').text)
# One row per keyword, plus a column recording the search term used.
df = pd.DataFrame({'keyword': keywords}).assign(query=query)
df