From 4111b07263579e4e7f714547f1b5bc2e0fa46b4f Mon Sep 17 00:00:00 2001 From: "yihua.huang" Date: Sat, 17 Jun 2017 10:36:41 +0800 Subject: [PATCH] more error log on page code error #601 --- webmagic-core/src/main/java/us/codecraft/webmagic/Spider.java | 2 ++ .../us/codecraft/webmagic/downloader/HttpClientDownloader.java | 3 +-- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/Spider.java b/webmagic-core/src/main/java/us/codecraft/webmagic/Spider.java index 69096188..62c989f1 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/Spider.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/Spider.java @@ -418,6 +418,8 @@ public class Spider implements Runnable, Task { pipeline.process(page.getResultItems(), this); } } + } else { + logger.info("page status code error, page {} , code: {}", request.getUrl(), page.getStatusCode()); } sleep(site.getSleepTime()); return; diff --git a/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientDownloader.java b/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientDownloader.java index 7119d107..6d4442a6 100644 --- a/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientDownloader.java +++ b/webmagic-core/src/main/java/us/codecraft/webmagic/downloader/HttpClientDownloader.java @@ -76,7 +76,6 @@ public class HttpClientDownloader extends AbstractDownloader { if (task == null || task.getSite() == null) { throw new NullPointerException("task or site can not be null"); } - logger.debug("downloading page {}", request.getUrl()); CloseableHttpResponse httpResponse = null; CloseableHttpClient httpClient = getHttpClient(task.getSite()); Proxy proxy = proxyProvider != null ? proxyProvider.getProxy(task) : null; @@ -86,7 +85,7 @@ public class HttpClientDownloader extends AbstractDownloader { httpResponse = httpClient.execute(requestContext.getHttpUriRequest(), requestContext.getHttpClientContext()); page = handleResponse(request, task.getSite().getCharset(), httpResponse, task); onSuccess(request); - logger.debug("downloading page success {}", page); + logger.info("downloading page success {}", request.getUrl()); return page; } catch (IOException e) { logger.warn("download page {} error", request.getUrl(), e);