Commit 4111b072 authored by yihua.huang

more error log on page code error #601

parent 6bd1eed2
...@@ -418,6 +418,8 @@ public class Spider implements Runnable, Task { ...@@ -418,6 +418,8 @@ public class Spider implements Runnable, Task {
pipeline.process(page.getResultItems(), this); pipeline.process(page.getResultItems(), this);
} }
} }
} else {
logger.info("page status code error, page {} , code: {}", request.getUrl(), page.getStatusCode());
} }
sleep(site.getSleepTime()); sleep(site.getSleepTime());
return; return;
......
...@@ -76,7 +76,6 @@ public class HttpClientDownloader extends AbstractDownloader { ...@@ -76,7 +76,6 @@ public class HttpClientDownloader extends AbstractDownloader {
if (task == null || task.getSite() == null) { if (task == null || task.getSite() == null) {
throw new NullPointerException("task or site can not be null"); throw new NullPointerException("task or site can not be null");
} }
logger.debug("downloading page {}", request.getUrl());
CloseableHttpResponse httpResponse = null; CloseableHttpResponse httpResponse = null;
CloseableHttpClient httpClient = getHttpClient(task.getSite()); CloseableHttpClient httpClient = getHttpClient(task.getSite());
Proxy proxy = proxyProvider != null ? proxyProvider.getProxy(task) : null; Proxy proxy = proxyProvider != null ? proxyProvider.getProxy(task) : null;
...@@ -86,7 +85,7 @@ public class HttpClientDownloader extends AbstractDownloader { ...@@ -86,7 +85,7 @@ public class HttpClientDownloader extends AbstractDownloader {
httpResponse = httpClient.execute(requestContext.getHttpUriRequest(), requestContext.getHttpClientContext()); httpResponse = httpClient.execute(requestContext.getHttpUriRequest(), requestContext.getHttpClientContext());
page = handleResponse(request, task.getSite().getCharset(), httpResponse, task); page = handleResponse(request, task.getSite().getCharset(), httpResponse, task);
onSuccess(request); onSuccess(request);
logger.debug("downloading page success {}", page); logger.info("downloading page success {}", request.getUrl());
return page; return page;
} catch (IOException e) { } catch (IOException e) {
logger.warn("download page {} error", request.getUrl(), e); logger.warn("download page {} error", request.getUrl(), e);
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment