From 7c6f116beb7b62e8defaf292cfacd9d003231e0d Mon Sep 17 00:00:00 2001 From: cff <302959274@qq.com> Date: Tue, 17 Jul 2018 22:21:31 +0800 Subject: [PATCH] =?UTF-8?q?=E6=8D=A2=E7=BD=91=E7=AB=99http://www.ruiwen.co?= =?UTF-8?q?m/jiaocai/?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- tamguo-crawler/src/main/java/com/tamguo/model/vo/BookVo.java | 2 +- .../src/main/java/com/tamguo/service/impl/BookService.java | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/tamguo-crawler/src/main/java/com/tamguo/model/vo/BookVo.java b/tamguo-crawler/src/main/java/com/tamguo/model/vo/BookVo.java index 9a80c74..19f9dcd 100644 --- a/tamguo-crawler/src/main/java/com/tamguo/model/vo/BookVo.java +++ b/tamguo-crawler/src/main/java/com/tamguo/model/vo/BookVo.java @@ -9,7 +9,7 @@ import java.util.List; @PageSelect(cssQuery = "body") public class BookVo { - @PageFieldSelect(cssQuery = ".ih3") + @PageFieldSelect(cssQuery = ".text") private List name; public List getName() { diff --git a/tamguo-crawler/src/main/java/com/tamguo/service/impl/BookService.java b/tamguo-crawler/src/main/java/com/tamguo/service/impl/BookService.java index 5459b7f..4c467a1 100644 --- a/tamguo-crawler/src/main/java/com/tamguo/service/impl/BookService.java +++ b/tamguo-crawler/src/main/java/com/tamguo/service/impl/BookService.java @@ -28,7 +28,7 @@ public class BookService implements IBookService { @Override public void crawlerBook() { XxlCrawler crawler = new XxlCrawler.Builder() - .setUrls("http://www.dzkbw.com") + .setUrls("http://www.ruiwen.com/jiaocai/") .setAllowSpread(false) .setFailRetryCount(5) .setThreadCount(20) @@ -37,7 +37,7 @@ public class BookService implements IBookService { public void parse(Document html, Element pageVoElement, BookVo bookVo) { // 解析封装 PageVo 对象 String pageUrl = html.baseUri(); - if (pageUrl.equals("http://www.dzkbw.com")) { + if (pageUrl.equals("http://www.ruiwen.com/jiaocai/")) { logger.info("开始解析书本信息:{}", pageUrl); List books = bookVo.getName(); books.forEach(item -> {