福特抓取网页

uat-temp-castle-2502241152-fordFetchWeb
臧学普 2 months ago
parent 0ed0d4e43f
commit 37843777b5

@ -12,9 +12,9 @@ import cn.estsh.impp.framework.boot.exception.ImppExceptionBuilder;
import cn.hutool.http.HttpRequest; import cn.hutool.http.HttpRequest;
import cn.hutool.http.HttpResponse; import cn.hutool.http.HttpResponse;
import lombok.extern.slf4j.Slf4j; import lombok.extern.slf4j.Slf4j;
import org.apache.commons.lang3.StringUtils;
import org.jsoup.Jsoup; import org.jsoup.Jsoup;
import org.jsoup.nodes.Document; import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements; import org.jsoup.select.Elements;
import org.springframework.beans.factory.annotation.Autowired; import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.stereotype.Service; import org.springframework.stereotype.Service;
@ -99,38 +99,41 @@ public class MesFordFetchWebServiceImpl implements IFordFetchWebService {
log.info("doFetchData-查询出来的内容为:{}",response.body()); log.info("doFetchData-查询出来的内容为:{}",response.body());
Document doc = Jsoup.parse(response.body()); Document doc = Jsoup.parse(response.body());
Elements trList = doc.select("tr"); Elements trList = doc.select("tr");
for (Element tr : trList) { for (int i = 1; i < trList.size(); i++) {
Elements tdList = tr.select("td"); Elements tdList = trList.get(i).select("td");
MesFordJsaSortInfoWithFetchWeb webInfo = new MesFordJsaSortInfoWithFetchWeb(); MesFordJsaSortInfoWithFetchWeb webInfo = new MesFordJsaSortInfoWithFetchWeb();
webInfo.setSeq(Long.parseLong(tdList.get(0).text())); if (tdList.get(0).text().equals("无数据") || StringUtils.isBlank(tdList.get(0).text())){
webInfo.setFetchDate(tdList.get(1).text()); break;
webInfo.setFetchTime(tdList.get(2).text()); }
webInfo.setVinCode(tdList.get(3).text()); webInfo.setSeq(Long.parseLong(tdList.get(0).text()));
webInfo.setPartNo(tdList.get(4).text()); webInfo.setFetchDate(tdList.get(1).text());
webInfo.setPartName(tdList.get(5).text()); webInfo.setFetchTime(tdList.get(2).text());
webInfo.setColorCode(tdList.get(6).text()); webInfo.setVinCode(tdList.get(3).text());
webInfo.setInfo0008(tdList.get(7).text()); webInfo.setPartNo(tdList.get(4).text());
webInfo.setSeqContext(tdList.get(8).text()); webInfo.setPartName(tdList.get(5).text());
webInfo.setRemark(tdList.get(9).text()); webInfo.setColorCode(tdList.get(6).text());
webInfo.setInfoPointDesc(tdList.get(10).text()); webInfo.setInfo0008(tdList.get(7).text());
webInfo.setFetchType(1); //抓取类型 webInfo.setSeqContext(tdList.get(8).text());
webInfo.setDataStatus(200); webInfo.setRemark(tdList.get(9).text());
webInfo.setOrganizeCode(organizeCode); webInfo.setInfoPointDesc(tdList.get(10).text());
webInfo.setInfoPointCode(parameter.getInfoPointCode()); webInfo.setFetchType(1); //抓取类型
webInfo.setCustOrganizeCode(parameter.getCustOrganizeCode()); webInfo.setDataStatus(200);
ConvertBean.saveOrUpdate(webInfo,"doFetchData"); webInfo.setOrganizeCode(organizeCode);
//校验是否已经查询过 webInfo.setInfoPointCode(parameter.getInfoPointCode());
DdlPackBean webInfoPackBean = DdlPackBean.getDdlPackBean(organizeCode); webInfo.setCustOrganizeCode(parameter.getCustOrganizeCode());
DdlPreparedPack.getNumEqualPack(webInfo.getSeq(),"seq",webInfoPackBean); ConvertBean.saveOrUpdate(webInfo,"doFetchData");
DdlPreparedPack.getNumEqualPack(webInfo.getFetchDate(),"fetchDate",webInfoPackBean); //校验是否已经查询过
DdlPreparedPack.getNumEqualPack(webInfo.getFetchTime(),"fetchTime",webInfoPackBean); DdlPackBean webInfoPackBean = DdlPackBean.getDdlPackBean(organizeCode);
int count = fetchWebRao.findByHqlWhereCount(webInfoPackBean); DdlPreparedPack.getNumEqualPack(webInfo.getSeq(),"seq",webInfoPackBean);
if (count > 0){ DdlPreparedPack.getStringEqualPack(webInfo.getFetchDate(),"fetchDate",webInfoPackBean);
continue; DdlPreparedPack.getStringEqualPack(webInfo.getFetchTime(),"fetchTime",webInfoPackBean);
int count = fetchWebRao.findByHqlWhereCount(webInfoPackBean);
if (count > 0){
continue;
}
fetchWebRao.insert(webInfo);
infoList.add(webInfo);
} }
fetchWebRao.insert(webInfo);
infoList.add(webInfo);
}
return infoList; return infoList;
} }

Loading…
Cancel
Save