StringpartitioningQuery=partitioningKey+":\""+partitioningValue+"\" AND ("+collection1query+")";
postprocessingActivity="collecting "+partitioning.get(partitioningValue)+" documents from partition \""+partitioningValue+"\" (averall "+count+") from the collection for harvestkey "+harvestkey+", partitioned by "+partitioningKey;
CollectionSchema.host_subdomain_s.getSolrFieldName()+" asc,"+// sort on subdomain to get hosts without subdomain first; that gives an opportunity to set www_unique_b flag to false
CollectionSchema.host_subdomain_s.getSolrFieldName()+" asc,"+// sort on subdomain to get hosts without subdomain first; that gives an opportunity to set www_unique_b flag to false
CollectionSchema.url_protocol_s.getSolrFieldName()+" asc"// sort on protocol to get http before https; that gives an opportunity to set http_unique_b flag to false
CollectionSchema.url_protocol_s.getSolrFieldName()+" asc"// sort on protocol to get http before https; that gives an opportunity to set http_unique_b flag to false
@ -1297,11 +1312,6 @@ public class CollectionConfiguration extends SchemaConfiguration implements Seri
ConcurrentLog.info("CollectionConfiguration","cleanup_processing: deleting "+failids.size()+" documents which have permanent execution fails");
ConcurrentLog.info("CollectionConfiguration","cleanup_processing: deleting "+failids.size()+" documents which have permanent execution fails");
collectionConnector.deleteByIds(failids);
collectionConnector.deleteByIds(failids);
}
}
if(count!=countcheck.get())ConcurrentLog.warn("CollectionConfiguration","ambiguous collection document count for harvestkey "+harvestkey+": expected="+count+", counted="+countcheck);// big gap for harvestkey = null
if(count!=countcheck.get())ConcurrentLog.warn("CollectionConfiguration","ambiguous collection document count for harvestkey "+harvestkey+": expected="+count+", counted="+countcheck+"; countquery="+collection1query);// big gap for harvestkey = null
ConcurrentLog.info("CollectionConfiguration","cleanup_processing: re-calculated "+proccount+" new documents, "+
ConcurrentLog.info("CollectionConfiguration","cleanup_processing: re-calculated "+proccount+" new documents, "+