in core/src/main/java/org/apache/stormcrawler/filtering/basic/BasicURLNormalizer.java [172:211]
public void configure(@NotNull Map<String, Object> stormConf, @NotNull JsonNode paramNode) {
    /*
     * Applies the optional settings found in paramNode to this instance.
     *
     * Recognised keys: removeAnchorPart, unmangleQueryString, checkValidURI,
     * removeHashes, hostIDNtoASCII (booleans) and queryElementsToRemove (array).
     * A key that is absent leaves the corresponding field untouched.
     * stormConf is not consulted by this method.
     */
    removeAnchorPart = booleanParam(paramNode, "removeAnchorPart", removeAnchorPart);
    unmangleQueryString = booleanParam(paramNode, "unmangleQueryString", unmangleQueryString);

    JsonNode toRemove = paramNode.get("queryElementsToRemove");
    if (toRemove != null) {
        if (toRemove.isArray()) {
            // Entries are appended to the existing collection, not substituted for it.
            for (JsonNode element : toRemove) {
                queryElementsToRemove.add(element.asText());
            }
        } else {
            LOG.warn("Failed to configure queryElementsToRemove. Not an array: {}", toRemove);
        }
    }

    checkValidURI = booleanParam(paramNode, "checkValidURI", checkValidURI);
    removeHashes = booleanParam(paramNode, "removeHashes", removeHashes);
    hostIDNtoASCII = booleanParam(paramNode, "hostIDNtoASCII", hostIDNtoASCII);
}

/**
 * Reads one boolean option from the configuration node.
 *
 * <p>{@code JsonNode.booleanValue()} yields {@code false} for every non-boolean node, which
 * would silently switch an option off when the value is written as e.g. the string
 * {@code "true"}. This helper uses {@code asBoolean(current)} instead, so convertible values
 * are honoured and unconvertible ones keep the current setting; a warning is logged whenever
 * the node is not a JSON boolean.
 *
 * @param paramNode configuration node to read from
 * @param key name of the option
 * @param current value to keep when the key is absent or cannot be converted
 * @return the configured value, or {@code current} if none could be determined
 */
private boolean booleanParam(JsonNode paramNode, String key, boolean current) {
    JsonNode node = paramNode.get(key);
    if (node == null) {
        return current;
    }
    if (!node.isBoolean()) {
        LOG.warn("Failed to configure {}. Not a boolean: {}", key, node);
    }
    return node.asBoolean(current);
}