개발

Insta 해시태그 크롤링 코딩 소스

Byunpa24 2021. 1. 20. 16:07
반응형

import os
import time
from urllib.parse import quote_plus
from urllib.request import urlopen

from bs4 import BeautifulSoup
from selenium import webdriver

 

# https://www.instagram.com/dlwlrma.16/

 

# Open an Instagram hashtag page in Chrome, then for every post tile found
# in the rendered HTML print its link and save its image as
# ./img/<tag><n>.jpg, where <n> counts saved images starting at 1.
baseUrl = 'https://www.instagram.com/explore/tags/'
plusUrl = input('검색할 태그를 입력하세요 : ')
# quote_plus percent-encodes the tag so it can be appended to the URL safely.
url = baseUrl + quote_plus(plusUrl)

# open() does not create missing directories; make sure the target exists.
os.makedirs('./img', exist_ok=True)

driver = webdriver.Chrome()
try:
    driver.get(url)

    # Fixed pause before reading the page source -- presumably to let the
    # page finish rendering its post grid.
    time.sleep(3)

    html = driver.page_source
    # Name the parser explicitly so the result does not depend on which
    # optional parsers happen to be installed (and bs4 emits no warning).
    soup = BeautifulSoup(html, 'html.parser')

    # NOTE(review): these look like generated front-end class names; confirm
    # they still match the live page markup before relying on them.
    insta = soup.select('.v1Nh3.kIKUG._bz0w')

    n = 1
    for i in insta:
        link = i.a
        thumb = i.select_one('.KL4Bh')
        # Skip tiles missing the anchor or image instead of aborting the run.
        if link is None or thumb is None or thumb.img is None:
            continue

        print('https://instagram.com' + link['href'])
        imgUrl = thumb.img['src']

        with urlopen(imgUrl) as f:
            # Binary mode: the payload is raw image bytes.
            with open('./img/' + plusUrl + str(n) + '.jpg', 'wb') as h:
                img = f.read()
                h.write(img)
        n += 1

        print(imgUrl)
        print()
finally:
    # quit() ends the whole WebDriver session (close() only closes the
    # current window), and running it in `finally` releases the browser
    # even when scraping fails part-way.
    driver.quit()

 

반응형