Commit 689e89a9 authored by Yihua Huang

Merge pull request #157 from zhugw/patch-1

Update FileCacheQueueScheduler.java
parents 147401ce 1db940a0
@@ -145,6 +145,8 @@ public class FileCacheQueueScheduler extends DuplicateRemovedScheduler implement
 if (!inited.get()) {
 init(task);
 }
+if(urls.contains(request.getUrl())) //已存在此URL 表示已抓取过 跳过
+return;
 queue.add(request);
 fileUrlWriter.println(request.getUrl());
 }
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment