我想先登录,然后爬取该网站。
通过 Python 登录后,我需要获取每个职级(员工级别)的薪资。
登录网址:https://www.jobplanet.co.kr/users/sign_in ;各职级的薪资网址:https://www.jobplanet.co.kr/companies/20575/salaries/
from bs4 import BeautifulSoup
import urllib,http.cookiejar
# Sign in to jobplanet.co.kr through a cookie-aware opener, then download the
# salaries page for company 20575 over the same opener so that any session
# cookies set by the sign-in response are sent along with the second request.
cj = http.cookiejar.LWPCookieJar()
opener = urllib.request.build_opener(urllib.request.HTTPCookieProcessor(cj))
# Installing the opener makes plain urllib.request.urlopen() calls share `cj`.
urllib.request.install_opener(opener)

# Sent with both requests in place of urllib's default User-Agent.
headers = {'User-Agent': 'Mozilla/5.0'}

# Form-encode the credentials; urllib requires the request body as bytes.
# NOTE(review): the field names below are kept exactly as originally written.
# Confirm them against the site's real sign-in form (it may expect different
# names and/or a CSRF token scraped from the sign-in page) -- TODO verify.
params = urllib.parse.urlencode({"mode":"login","user_email":"*******","user_password":"******"})
params = params.encode('utf-8')

# Supplying `data` turns this into a POST. The request must actually be opened
# for the login to happen; previously it was only constructed, so the salaries
# page was fetched without ever signing in.
req = urllib.request.Request("https://www.jobplanet.co.kr/users/sign_in", data=params, headers=headers)
with opener.open(req) as login_res:
    # Drain the body; cookies from the response are stored in `cj` by the opener.
    login_res.read()

# Fetch the salaries page with the same opener (and therefore the same cookies).
rej = urllib.request.Request("https://www.jobplanet.co.kr/companies/20575/salaries/",headers=headers)
with opener.open(rej) as res:
    # Raw response bytes; decode or hand to an HTML parser downstream.
    html = res.read()