-
이곳저곳 이미지 썸네일 크롤러 — ESG부트캠프/파이썬 · 2022. 10. 21. 17:38
구글
# Google image-search thumbnail crawler.
#
# Opens a Google image-search results page, keeps paging down (clicking the
# "show more results" button while it can be clicked) until the page stops
# growing, collects the `src` of every thumbnail, and saves each one as
# <save_path>/<img_name><index>.jpg.
import os
import time
import urllib.request

from selenium import webdriver
from selenium.common.exceptions import WebDriverException
from selenium.webdriver.common.by import By
from selenium.webdriver.common.keys import Keys

chromedriver = "크롬 드라이버 경로"  # path to the chromedriver executable
img_name = "저장할 이미지 이름"  # file-name prefix for the saved images
save_path = "이미지 저장 경로"  # directory the images are written to

# NOTE(review): passing the driver path positionally is how the original
# script starts Chrome; newer Selenium 4 releases appear to require a
# Service object instead — confirm against the installed version.
driver = webdriver.Chrome(chromedriver)
try:
    driver.implicitly_wait(1)
    driver.get("구글 이미지 검색 url")  # Google image-search result URL
    element = driver.find_element(By.TAG_NAME, "body")

    while True:
        # If the crawl seems to stop early, raise this in steps of 100.
        for _ in range(100):
            element.send_keys(Keys.PAGE_DOWN)
            time.sleep(0.1)

        # Click "show more results". Once the button is missing or can no
        # longer be clicked there is nothing left to load, so stop scrolling.
        # Only Selenium errors end the loop; Ctrl-C and genuine programming
        # errors are no longer swallowed.
        try:
            driver.find_element(
                By.XPATH,
                "/html/body/div[2]/c-wiz/div[3]/div[1]/div/div/div/div[1]/div[2]/div[2]/input",
            ).click()
        except WebDriverException:
            break

    # Read each thumbnail's src once and drop the ones that have none.
    sources = (
        image.get_attribute("src")
        for image in driver.find_elements(By.CSS_SELECTOR, "img.rg_i.Q4LuWd")
    )
    links = [src for src in sources if src is not None]

    time.sleep(2)

    # Join path components properly so save_path works with or without a
    # trailing separator, and make sure the directory exists.
    os.makedirs(str(save_path), exist_ok=True)
    for idx, link in enumerate(links):
        target = os.path.join(str(save_path), str(img_name) + str(idx) + ".jpg")
        urllib.request.urlretrieve(link, target)
finally:
    # quit() ends the whole WebDriver session (browser and driver process),
    # and runs even when the crawl fails part-way through.
    driver.quit()

# Next section of the post: Naver (네이버)
# Naver image-search thumbnail crawler.
#
# Searches Naver images for `img_name`, scrolls the result page `scroll_num`
# times, collects the `src` of every listed thumbnail, downloads each one to
# <save_path>/<img_name><index>.jpg, and rewrites it as an RGB image resized
# to img_width x img_height.
import os
import time
import urllib.parse
import urllib.request

from keras.utils.image_utils import load_img
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.common.keys import Keys

chromedriver = "크롬 드라이버 경로"  # path to the chromedriver executable
img_name = "검색 키워드"  # search keyword (also the file-name prefix)
save_path = "이미지 저장 위치"  # directory the images are written to
img_width = 256  # output size in pixels
img_height = 256
scroll_num = 30  # number of scroll rounds

driver = webdriver.Chrome(chromedriver)
try:
    driver.implicitly_wait(1)
    # Percent-encode the keyword so spaces, '&', '#', etc. cannot corrupt the
    # query string.
    driver.get(
        "https://search.naver.com/search.naver?where=image&sm=tab_jum&query="
        + urllib.parse.quote(img_name, safe="")
    )
    element = driver.find_element(By.TAG_NAME, "body")

    for _ in range(scroll_num):
        for _ in range(10):
            element.send_keys(Keys.PAGE_DOWN)
        # NOTE(review): the original indentation was lost; the pause is placed
        # after each batch of ten key presses — confirm.
        time.sleep(2)

    # Read each thumbnail's src once and drop the ones that have none.
    sources = (
        image.get_attribute("src")
        for image in driver.find_elements(By.CSS_SELECTOR, "img._image._listImage")
    )
    links = [src for src in sources if src is not None]
finally:
    # quit() ends the whole WebDriver session (browser and driver process),
    # and runs even when the crawl fails part-way through.
    driver.quit()

# Join path components properly so save_path works with or without a trailing
# separator, and make sure the directory exists.
os.makedirs(str(save_path), exist_ok=True)
for idx, link in enumerate(links):
    target = os.path.join(str(save_path), str(img_name) + str(idx) + ".jpg")
    urllib.request.urlretrieve(link, target)

    # Normalise the download in place: RGB, fixed output size.
    img = load_img(target)
    img = img.convert("RGB")
    img = img.resize((img_width, img_height))
    img.save(target)

# Next section of the post: Pinterest (핀터레스트)
# Pinterest search thumbnail crawler.
#
# Searches Pinterest for `img_name`, harvests the pin image `src` values that
# are present at each of `scroll_num` scroll positions, downloads every
# distinct one to <save_path>/<img_name><index>.jpg, and rewrites it as an RGB
# image resized to img_width x img_height.
import os
import time
import urllib.parse
import urllib.request

from keras.utils.image_utils import load_img
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.common.keys import Keys

chromedriver = "크롬 드라이버 경로"  # path to the chromedriver executable
img_name = "검색 키워드"  # search keyword (also the file-name prefix)
save_path = "이미지 저장 경로"  # directory the images are written to
img_width = 256  # output size in pixels
img_height = 256
scroll_num = 5  # number of scroll rounds

driver = webdriver.Chrome(chromedriver)
try:
    driver.implicitly_wait(1)
    # Percent-encode the keyword so spaces, '&', '#', etc. cannot corrupt the
    # query string.
    driver.get(
        "https://www.pinterest.co.kr/search/pins/?q="
        + urllib.parse.quote(img_name, safe="")
        + "&rs=rs&eq=&etslf=1719"
    )
    element = driver.find_element(By.TAG_NAME, "body")

    # Accumulate across ALL scroll rounds. The original re-created the list
    # inside the loop, so only the images found at the final scroll position
    # were ever downloaded. `seen` keeps first-seen order while skipping
    # images that are still on screen from the previous round.
    links = []
    seen = set()
    for _ in range(scroll_num):
        for image in driver.find_elements(By.CSS_SELECTOR, "img.hCL.kVc.L4E.MIw"):
            src = image.get_attribute("src")
            # An <img> without src would make urlretrieve() fail later.
            if src is not None and src not in seen:
                seen.add(src)
                links.append(src)
        for _ in range(5):
            element.send_keys(Keys.PAGE_DOWN)
        # Brief pause so newly loaded pins can render before the next harvest.
        time.sleep(2)
finally:
    # quit() ends the whole WebDriver session (browser and driver process),
    # and runs even when the crawl fails part-way through.
    driver.quit()

# Join path components properly so save_path works with or without a trailing
# separator, and make sure the directory exists.
os.makedirs(str(save_path), exist_ok=True)
for idx, link in enumerate(links):
    target = os.path.join(str(save_path), str(img_name) + str(idx) + ".jpg")
    urllib.request.urlretrieve(link, target)

    # Normalise the download in place: RGB, fixed output size.
    img = load_img(target)
    img = img.convert("RGB")
    img = img.resize((img_width, img_height))
    img.save(target)

# Author's closing note from the post: "just in case.." (혹시 몰라서..)
'ESG부트캠프 > 파이썬' 카테고리의 다른 글
AI Hub 데이터 bounding box 변환(Json to txt) (0) 2022.11.11