Commit 160a149b authored by yihua.huang

todo bugfix

parent 583a0eba
...@@ -482,7 +482,7 @@ public class Spider implements Runnable, Task { ...@@ -482,7 +482,7 @@ public class Spider implements Runnable, Task {
/** /**
* Exit when complete. <br/> * Exit when complete. <br/>
* True: exit when all url of the site is downloaded. <br/> * True: exit when all url of the site is downloaded. <br/>
* False: not exit until call stop manually.<br/> * False: not exit until call stop() manually.<br/>
* *
* @param exitWhenComplete * @param exitWhenComplete
* @return * @return
......
...@@ -90,11 +90,15 @@ public class HttpClientDownloader implements Downloader { ...@@ -90,11 +90,15 @@ public class HttpClientDownloader implements Downloader {
HttpClient httpClient = getHttpClientPool().getClient(site); HttpClient httpClient = getHttpClientPool().getClient(site);
try { try {
HttpGet httpGet = new HttpGet(request.getUrl()); HttpGet httpGet = new HttpGet(request.getUrl());
if (headers!=null){ if (headers!=null){
for (Map.Entry<String, String> headerEntry : headers.entrySet()) { for (Map.Entry<String, String> headerEntry : headers.entrySet()) {
httpGet.addHeader(headerEntry.getKey(),headerEntry.getValue()); httpGet.addHeader(headerEntry.getKey(),headerEntry.getValue());
} }
} }
if (!httpGet.containsHeader("Accept-Encoding")) {
httpGet.addHeader("Accept-Encoding", "gzip");
}
HttpResponse httpResponse = null; HttpResponse httpResponse = null;
int tried = 0; int tried = 0;
boolean retry; boolean retry;
...@@ -168,6 +172,7 @@ public class HttpClientDownloader implements Downloader { ...@@ -168,6 +172,7 @@ public class HttpClientDownloader implements Downloader {
HeaderElement[] codecs = ceheader.getElements(); HeaderElement[] codecs = ceheader.getElements();
for (HeaderElement codec : codecs) { for (HeaderElement codec : codecs) {
if (codec.getName().equalsIgnoreCase("gzip")) { if (codec.getName().equalsIgnoreCase("gzip")) {
//todo bugfix
httpResponse.setEntity( httpResponse.setEntity(
new GzipDecompressingEntity(httpResponse.getEntity())); new GzipDecompressingEntity(httpResponse.getEntity()));
} }
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment