I want to search company information automatically in google. Please see my code as below. HTTP Error 403: Forbidden or HTTP Error 404: Forbidden is happen.
from urllib.request import urlopen
from bs4 import BeautifulSoup
from urllib import parse
import openpyxl
wd = openpyxl.load_workbook('C:/Users/Lee Jung
Un/Documents/hopeyouwork.xlsx')#locate of excel file.
ws = wd.active
def bs(Eng_name):
url = "https://www.google.co.kr/search?ei=hWEaW-bKEMnb8QWa1IrQDw&q="
q = parse.quote(Eng_name)
html = urlopen(url + q)
bsObj = BeautifulSoup(html, "html.parser")
twg = bsObj.select("div.ifM9O > div:nth-child(2) > div.kp-header > div >
div.DI6Ufb > div > div > div.d1rFIf > div.kno-ecr-pt.kno-fb-ctx > span")
if bool(twg):
return twg.text
else:
info = "none"
return info
def companyname():
for r in ws.rows:
row_index = r[0].row
Eng_name = r[1].value
Kor_name = bs(Eng_name)
ws.cell(row=row_index, column=1).value = row_index
ws.cell(row=row_index, column=2).value = Eng_name
ws.cell(row=row_index, column=3).value = Kor_name
wd.save("Done.xlsx")
wd.close()
companyname()