mirror of
https://github.com/yacy/yacy_search_server.git
synced 2024-09-19 00:01:41 +02:00
Check the document's protocol and host values before forming the final URL.
This commit is contained in:
parent
962aaec0c0
commit
5268ae2ce9
|
@ -617,6 +617,10 @@ public class CrawlQueues {
|
|||
deep = true;
|
||||
}
|
||||
DigestURL url;
|
||||
if (doc.getFieldValue("url_protocol_s") == null || doc.getFieldValue("host_s") == null) {
|
||||
//Skip this document if either of these values is null.
|
||||
continue;
|
||||
}
|
||||
final String u = doc.getFieldValue("url_protocol_s").toString() + "://" + doc.getFieldValue("host_s").toString();
|
||||
try {
|
||||
url = new DigestURL(u);
|
||||
|
|
Loading…
Reference in New Issue
Block a user