HTML/HTML

[Python_HTML] 파이썬 웹 크롤링

꾸압 2021. 3. 4. 10:15

 

from selenium import webdriver
from selenium.webdriver.common.keys import Keys
from webdriver_manager.chrome import ChromeDriverManager
from selenium.webdriver.common.by import By

# Launch Chrome using a chromedriver binary downloaded by webdriver_manager.
# NOTE(review): passing the driver path positionally is accepted by Selenium 3
# and early Selenium 4 releases; newer releases expect a Service object --
# confirm against the installed Selenium version.
driver = webdriver.Chrome(ChromeDriverManager().install())

try:
    # Visit pages 1 through 10 and print the text of the first element with
    # class "list_post_article" on each page.
    # NOTE(review): Naver's blog home is usually served from a blog-specific
    # host rather than naver.com -- confirm this URL still resolves.
    for page in range(1, 11):
        url = f'https://naver.com/BlogHome.nhn?directoryNo=0&currentPage={page}&groupId=0'
        driver.get(url)

        # find_element(By.CLASS_NAME, ...) replaces find_element_by_class_name,
        # which was removed in Selenium 4.3; this form works on Selenium 3 and 4.
        elem = driver.find_element(By.CLASS_NAME, 'list_post_article')
        print(elem.text)

    # Block until the user presses Enter so the browser stays open for inspection.
    input()
except Exception as e:
    # Top-level boundary of a demo script: report the failure message only.
    print(e)
finally:
    # Always close the browser, even when navigation or a lookup failed.
    driver.quit()

네이버 블로그 크롤링

 

네이버 기사 메인 화면 호출

 

from selenium import webdriver
from selenium.webdriver.common.keys import Keys
from webdriver_manager.chrome import ChromeDriverManager
from selenium.webdriver.common.by import By

# Launch Chrome using a chromedriver binary downloaded by webdriver_manager.
# NOTE(review): passing the driver path positionally is accepted by Selenium 3
# and early Selenium 4 releases; newer releases expect a Service object --
# confirm against the installed Selenium version.
driver = webdriver.Chrome(ChromeDriverManager().install())

try:
    driver.get('http://pann.nate.com')

    # find_element(By.ID, ...) / find_elements(By.XPATH, ...) replace the
    # find_element_by_* helpers, which were removed in Selenium 4.3; this form
    # works on Selenium 3 and 4.
    container = driver.find_element(By.ID, 'container')

    # The XPath is relative to the container: every <ul> that sits directly
    # inside one of the container's direct <div> children.
    ul_blocks = container.find_elements(By.XPATH, './div/ul')
    for ul_block in ul_blocks:
        print(ul_block.text)

    # Block until the user presses Enter so the browser stays open for inspection.
    input()
except Exception as e:
    # Top-level boundary of a demo script: report the failure message only.
    print(e)
finally:
    # Always close the browser, even when navigation or a lookup failed.
    driver.quit()

네이트 판 메인 화면 호출