这篇博文为大家分享如何使用R包爬取智联招聘的信息,以上海市目前数据分析师岗位为例,愿为即将找工作的你提供帮助。

1、爬取主界面信息

library(rvest)
library(stringr)
url1='http://sou.zhaopin.com/jobs/searchresult.ashx?jl=%e4%b8%8a%e6%b5%b7&kw=%e6%95%b0%e6%8d%ae%e5%88%86%e6%9e%90&isadv=0&sg=d916c075b66b48249d6dba31c11b39e0&p='
zhiwei=company=salary=adress=time=zwhref=NULL
for( i in 1:10){
  url=paste(url1,i,sep = '')
  web = read_html(url)
  zhiwei1=web %>% html_nodes('td.zwmc')%>% html_nodes('a')%>%html_text()
  zhiwei = c(zhiwei,zhiwei1[str_length(zhiwei1) !=0])
  company1= web %>% html_nodes('td.gsmc')%>% html_nodes('a')%>%html_text()
  company = c(company,company1[str_length(company1) !=0])
  salary=c(salary,web %>% html_nodes('td.zwyx')%>% html_text())
  adress=c(adress,web %>% html_nodes('td.gzdd')%>
………………………………