언어/python

크롤러 - 임시

파아랑새 2018. 1. 2. 12:48
import requests
import pprint
from urllib.request import urlopen
from bs4 import BeautifulSoup
def main():
    """Download the images found on a Google image-search result page.

    Requests the hard-coded search URL with the query ``test``, parses the
    returned HTML for ``<img>`` tags, and writes each image that can be
    fetched to the working directory as ``test0.jpg``, ``test1.jpg``, ...
    Images that cannot be fetched are reported with a message and skipped.
    """
    # Local import: only needed for the download error handling below.
    from http.client import HTTPException

    timeout = 10  # seconds; keeps a stalled connection from hanging the run

    payload = {'q': 'test', 'oq': 'test'}
    url = "https://www.google.co.kr/search?hl=ko&tbm=isch&source=hp&biw=1041&bih=781&ei=quxKWuidKca20QT9uJIo"
    response = requests.get(url, params=payload, timeout=timeout)
    soup = BeautifulSoup(response.text, 'html.parser')

    num = 0
    for img in soup.find_all('img'):
        # An <img> tag is not guaranteed to carry a src attribute; skip it
        # instead of letting a KeyError abort the whole run.
        src = img.get('src')
        if not src:
            print("fail ... !!!")
            continue
        print(src)

        try:
            # The context manager closes the HTTP response once it is read.
            with urlopen(src, timeout=timeout) as remote:
                mem = remote.read()
        except (OSError, ValueError, HTTPException):
            # OSError covers URLError/HTTPError and socket timeouts,
            # ValueError is raised for URLs without a usable scheme, and
            # HTTPException for malformed or truncated responses.
            print("fail ... !!!")
            continue

        save_name = "test{}.jpg".format(num)
        print(save_name)
        with open(save_name, mode='wb') as f:
            f.write(mem)
        # Advance only after a successful save so file names stay contiguous.
        num += 1

# Run the crawler only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()