|
|
@@ -130,19 +130,22 @@ public class Crawler4LoveFootServiceImpl implements Crawler4LoveFootService {
|
|
|
String sourceUrl = sourceSelect.select("a").attr("abs:href");
|
|
|
|
|
|
Integer statusInt = 2;
|
|
|
+ LocalDate clockDate = null;
|
|
|
+ LocalDate updateDate = null;
|
|
|
+ String keywords = null;
|
|
|
try {
|
|
|
loveFootDetailDocument = JsoupUtil.requestDocument(sourceUrl, JsoupUtil.HTTP_GET, proxy, null, header2Map, null);
|
|
|
String clockDateStr = loveFootDetailDocument.select("div.viral").select("li.icon-clock").text();
|
|
|
String updateDateStr = loveFootDetailDocument.select("div.viral").select("li.icon-update").text();
|
|
|
- LocalDate clockDate = LocalDate.parse(clockDateStr, DateUtils.dateFormatter3);
|
|
|
- LocalDate updateDate = LocalDate.parse(updateDateStr, DateUtils.dateFormatter3);
|
|
|
+ clockDate = LocalDate.parse(clockDateStr, DateUtils.dateFormatter3);
|
|
|
+ updateDate = LocalDate.parse(updateDateStr, DateUtils.dateFormatter3);
|
|
|
|
|
|
if (updateDate.isBefore(latestDate) || updateDate.isEqual(latestDate)) {
|
|
|
break outer;
|
|
|
}
|
|
|
|
|
|
// 获取关键词
|
|
|
- String keywords = loveFootDetailDocument.select("div.postContents").select("td:contains(タイトル)").next("td").text();
|
|
|
+ keywords = loveFootDetailDocument.select("div.postContents").select("td:contains(タイトル)").next("td").text();
|
|
|
if (StringUtils.isNotEmpty(keywords)) {
|
|
|
statusInt = 1;
|
|
|
log.warn("jsoupLoveFoot4avnoashiSub parseDetailToKeywords success,sourceUrl={},keywords={}", sourceUrl, keywords);
|
|
|
@@ -169,6 +172,9 @@ public class Crawler4LoveFootServiceImpl implements Crawler4LoveFootService {
|
|
|
CrawlerLoveFoot crawlerLoveFoot = new CrawlerLoveFoot();
|
|
|
crawlerLoveFoot.setIdentificationCode(UUID.randomUUID().toString());
|
|
|
crawlerLoveFoot.setOrginUrl(sourceUrl);
|
|
|
+ crawlerLoveFoot.setClockDate(clockDate);
|
|
|
+ crawlerLoveFoot.setUpdateDate(updateDate);
|
|
|
+ crawlerLoveFoot.setName(keywords);
|
|
|
crawlerLoveFoot.setType(1);
|
|
|
crawlerLoveFoot.setStatus(statusInt);
|
|
|
crawlerLoveFoot.setCreateTime(LocalDateTime.now());
|