From 16734d528a9a6d2d86f4c277333864a8ba13a1c8 Mon Sep 17 00:00:00 2001
From: Pascal Essiembre
* <code>toField</code> is ignored unless the <code>keep</code>
* attribute is set to <code>true</code>.
@@ -46,29 +40,22 @@
*/
@Data
@Accessors(chain = true)
-@SuppressWarnings("javadoc")
public class BaseChecksummerConfig {
/**
* Whether to keep the metadata checksum value as a new metadata field.
- * @param keep <code>true</code> to keep the checksum
- * @return <code>true</code> to keep the checksum
*/
private boolean keep;
/**
* The metadata field to use to store the checksum value.
- * Default value is set by checksummer implementations.
+ * A default field name may be set by checksummer implementations.
* Only applicable if {@link #isKeep()} returns {@code true}
- * @param toField the metadata field name
- * @return metadata field name
*/
private String toField;
/**
* The property setter to use when a value is set.
- * @param onSet property setter
- * @return property setter
*/
private PropertySetter onSet;
}
diff --git a/crawler/core/src/main/java/com/norconex/crawler/core/doc/operations/checksum/impl/Md5DocumentChecksummer.java b/crawler/core/src/main/java/com/norconex/crawler/core/doc/operations/checksum/impl/Md5DocumentChecksummer.java
index 697c0711d..b65ce7114 100644
--- a/crawler/core/src/main/java/com/norconex/crawler/core/doc/operations/checksum/impl/Md5DocumentChecksummer.java
+++ b/crawler/core/src/main/java/com/norconex/crawler/core/doc/operations/checksum/impl/Md5DocumentChecksummer.java
@@ -38,10 +38,11 @@
*
* You have the option to keep the checksum as a document metadata field.
- * When {@link #setKeep(boolean)} is <code>true</code>, the checksum will be
+ * When {@link Md5DocumentChecksummerConfig#setKeep(boolean)} is
+ * <code>true</code>, the checksum will be
* stored in the target field name specified. If you do not specify any,
* it stores it under the metadata field name
- * {@link CrawlDocMetadata#CHECKSUM_METADATA}.
+ * {@value CrawlDocMetadata#CHECKSUM_METADATA}.
*
@@ -54,38 +55,11 @@ * will ignore the content while specifying none will only use the content. *
* - * {@nx.xml.usage - *
* <code>toField</code> is ignored unless the <code>keep</code>
* attribute is set to <code>true</code>.
*
- * The above example uses the document body (default) to make the checksum. - *
- * - *
- * Since 2.0.0, a self-closing
- * <code>&lt;documentChecksummer/&gt;</code> tag without any attributes
- * is used to disable checksum generation.
- *
- * Implementation of {@link DocumentChecksummer} which
- * returns a MD5 checksum value of the extracted document content unless
- * one or more given source fields are specified, in which case the MD5
- * checksum value is constructed from those fields. This checksum is normally
- * performed right after the document has been imported.
- *
- *
- * You have the option to keep the checksum as a document metadata field.
- * When {@link #setKeep(boolean)} is <code>true</code>, the checksum will be
- * stored in the target field name specified. If you do not specify any,
- * it stores it under the metadata field name
- * {@link CrawlDocMetadata#CHECKSUM_METADATA}.
- *
- * Since 1.9.0, it is possible to use a combination of document content
- * and fields to create the checksum by setting
- * <code>combineFieldsAndContent</code> to <code>true</code>.
- * If you combine fields and content but you don't define a field matcher,
- * it will be the equivalent of adding all fields.
- * If you do not combine the two, specifying a field matcher
- * will ignore the content while specifying none will only use the content.
- *
- * <code>toField</code> is ignored unless the <code>keep</code>
- * attribute is set to <code>true</code>.
- *
- * The above example uses the document body (default) to make the checksum. - *
- * - *
- * Since 2.0.0, a self-closing
- * <code>&lt;documentChecksummer/&gt;</code> tag without any attributes
- * is used to disable checksum generation.
- *
true
if combining fields
- * and content checksums
- * @return <code>true</code> if combining fields and content checksums
*/
private boolean combineFieldsAndContent;
-
}