case class SimilarityConfig(normOrgLegalformWeight: Double = 0.25, normOrgCountryWeight: Double = 0.5, nameElementSimilarityForHit: Double = 0.9, matchSelectionMode: Int = 0, checkDateForSearchHit: Boolean = true, dateComparisonMethod: Int = 0, maxDateYearDifferenceForHit: Int = 2, checkCountryForSearchHit: Boolean = true, similarityValueForSearchHit: Double = 0.9, numberOfHitsForSearchHit: Int = 2, maxNumberOfCandidatesFromSearch: Int = 10000, searchEntityGroupMode: Int = 0, allowOneLetterAbbreviation: Boolean = false, oneLetterAbbreviationWeight: Double = 0.5) extends Product with Serializable
Configuration class for normalization and similarity computation. Important: Make sure you use the same configuration for indexing and for searching/comparing; otherwise there may be unwanted side effects.
- normOrgLegalformWeight
Weight (reduction) of a legal form match (recommended: < 1, default is 0.25).
- normOrgCountryWeight
Weight (reduction) of a country match (recommended: < 1, default is 0.5).
- nameElementSimilarityForHit
Minimum similarity to mark as hit. Default is 0.9.
- matchSelectionMode
Method by which a match is determined: 0 = Based on similarity. 1 = Based on nofHits (number of hits). Default is 0.
- checkDateForSearchHit
Defines whether the date should be taken into account or not. Default is true.
- maxDateYearDifferenceForHit
Defines the uncertainty/tolerance of the year comparison in number of years (+/-). Default is 2.
- checkCountryForSearchHit
Defines whether the country should be considered or not. Default is true.
- similarityValueForSearchHit
Value of the similarity from which the comparison is classified as a hit. Default is 0.9.
- numberOfHitsForSearchHit
Value of the nofHits (number of hits) from which the comparison is classified as a hit. Default is 2.
- maxNumberOfCandidatesFromSearch
Defines the maximum number of candidates to be considered by the IR search, from which hits are then determined. Default is 10000.
- searchEntityGroupMode
Defines the field by which the hits are to be grouped. Depends on which value is unique: 0 = externalId, 1 = Id. Default is 0.
- allowOneLetterAbbreviation
Defines whether one-letter abbreviations are taken into account. With true, for example, Benjamin is a hit with B. Default is false.
- oneLetterAbbreviationWeight
If abbreviations are taken into account, this value defines the weight (reduction) of such a hit. Default is 0.5.
- Alphabetic
- By Inheritance
- SimilarityConfig
- Serializable
- Product
- Equals
- AnyRef
- Any
- Hide All
- Show All
- Public
- Protected
Instance Constructors
- new SimilarityConfig(normOrgLegalformWeight: Double = 0.25, normOrgCountryWeight: Double = 0.5, nameElementSimilarityForHit: Double = 0.9, matchSelectionMode: Int = 0, checkDateForSearchHit: Boolean = true, dateComparisonMethod: Int = 0, maxDateYearDifferenceForHit: Int = 2, checkCountryForSearchHit: Boolean = true, similarityValueForSearchHit: Double = 0.9, numberOfHitsForSearchHit: Int = 2, maxNumberOfCandidatesFromSearch: Int = 10000, searchEntityGroupMode: Int = 0, allowOneLetterAbbreviation: Boolean = false, oneLetterAbbreviationWeight: Double = 0.5)
- normOrgLegalformWeight
Weight (reduction) of a legal form match (recommended: < 1, default is 0.25).
- normOrgCountryWeight
Weight (reduction) of a country match (recommended: < 1, default is 0.5).
- nameElementSimilarityForHit
Minimum similarity to mark as hit. Default is 0.9.
- matchSelectionMode
Method by which a match is determined: 0 = Based on similarity. 1 = Based on nofHits (number of hits). Default is 0.
- checkDateForSearchHit
Defines whether the date should be taken into account or not. Default is true.
- maxDateYearDifferenceForHit
Defines the uncertainty/tolerance of the year comparison in number of years (+/-). Default is 2.
- checkCountryForSearchHit
Defines whether the country should be considered or not. Default is true.
- similarityValueForSearchHit
Value of the similarity from which the comparison is classified as a hit. Default is 0.9.
- numberOfHitsForSearchHit
Value of the nofHits (number of hits) from which the comparison is classified as a hit. Default is 2.
- maxNumberOfCandidatesFromSearch
Defines the maximum number of candidates to be considered by the IR search, from which hits are then determined. Default is 10000.
- searchEntityGroupMode
Defines the field by which the hits are to be grouped. Depends on which value is unique: 0 = externalId, 1 = Id. Default is 0.
- allowOneLetterAbbreviation
Defines whether one-letter abbreviations are taken into account. With true, for example, Benjamin is a hit with B. Default is false.
- oneLetterAbbreviationWeight
If abbreviations are taken into account, this value defines the weight (reduction) of such a hit. Default is 0.5.
Value Members
- final def !=(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
- final def ##: Int
- Definition Classes
- AnyRef → Any
- final def ==(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
- val allowOneLetterAbbreviation: Boolean
- final def asInstanceOf[T0]: T0
- Definition Classes
- Any
- val checkCountryForSearchHit: Boolean
- val checkDateForSearchHit: Boolean
- def clone(): AnyRef
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws(classOf[java.lang.CloneNotSupportedException]) @native() @HotSpotIntrinsicCandidate()
- val dateComparisonMethod: Int
- final def eq(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
- final def getClass(): Class[_ <: AnyRef]
- Definition Classes
- AnyRef → Any
- Annotations
- @native() @HotSpotIntrinsicCandidate()
- final def isInstanceOf[T0]: Boolean
- Definition Classes
- Any
- val matchSelectionMode: Int
- val maxDateYearDifferenceForHit: Int
- val maxNumberOfCandidatesFromSearch: Int
- val nameElementSimilarityForHit: Double
- final def ne(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
- val normOrgCountryWeight: Double
- val normOrgLegalformWeight: Double
- final def notify(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native() @HotSpotIntrinsicCandidate()
- final def notifyAll(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native() @HotSpotIntrinsicCandidate()
- val numberOfHitsForSearchHit: Int
- val oneLetterAbbreviationWeight: Double
- def productElementNames: Iterator[String]
- Definition Classes
- Product
- val searchEntityGroupMode: Int
- val similarityValueForSearchHit: Double
- final def synchronized[T0](arg0: => T0): T0
- Definition Classes
- AnyRef
- final def wait(arg0: Long, arg1: Int): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws(classOf[java.lang.InterruptedException])
- final def wait(arg0: Long): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws(classOf[java.lang.InterruptedException]) @native()
- final def wait(): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws(classOf[java.lang.InterruptedException])
Deprecated Value Members
- def finalize(): Unit
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws(classOf[java.lang.Throwable]) @Deprecated
- Deprecated