From bd54b85d46d448b61dfedc7f4f3f1ef3c337519c Mon Sep 17 00:00:00 2001 From: Michael Peter Christen Date: Fri, 28 Mar 2014 14:44:52 +0100 Subject: [PATCH] fix for relative sitemap urls --- htroot/Crawler_p.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/htroot/Crawler_p.java b/htroot/Crawler_p.java index 4bb106d23..a96752bbd 100644 --- a/htroot/Crawler_p.java +++ b/htroot/Crawler_p.java @@ -473,7 +473,7 @@ public class Crawler_p { } } else if ("sitemap".equals(crawlingMode)) { try { - final DigestURL sitemapURL = new DigestURL(sitemapURLStr); + final DigestURL sitemapURL = sitemapURLStr.indexOf("//") > 0 ? new DigestURL(sitemapURLStr) : new DigestURL(rootURLs.iterator().next(), sitemapURLStr); // fix for relative paths which should not exist but are used anyway sb.crawler.putActive(handle, profile); final SitemapImporter importer = new SitemapImporter(sb, sitemapURL, profile); importer.start();