diff --git a/dictionary_example.txt b/dictionary_example.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca9371347746fb9acb8eb4419be88e92d3af31ea --- /dev/null +++ b/dictionary_example.txt @@ -0,0 +1,52 @@ + +|CONFIG| +%% Type that will be used to identify the annotations. +_annotationType=Inexact_Lookup + +%% Whether the search is case-sensitive. Use YES or NO. +_caseSensitive=NO + +%% Maximum value accepted for the EditDistance search. +_maxEditDistance=0 + +%% Number of best similarity values that will be used. Annotations with the same similarity count as only one. +_numberBetterSimilarity=1 + +%% Minimum value accepted for the similarity. +_minAcceptedSimilarity=0.9 + +%% Name of the feature that will store the EditDistance value obtained from the search. +_editDistanceFeatureName=ED + +%% Class and method that implement the algorithm used to calculate the similarity. +%% The method used must receive two Strings and return a Float. +_similarityClass=org.apache.lucene.search.spell.JaroWinklerDistance +_similarityMethod=getDistance + +%% Class and method of transformation. The method must receive a String and return another String. +%% To disable the transformation, remove or comment out both lines below. +_transformationClass=org.apache.commons.codec.language.DoubleMetaphone +_transformationMethod=doubleMetaphone + +%% Name of the feature that will store the value from the similarity algorithm. +_similarityFeatureName=Similarity + +%% Character used on the entry lines below to separate features. +_featureSeparator=; + +%% Character used on the entry lines below to separate the name and value of each feature. +_featureNameValueSeparator=: + +%% Character used on the entry lines below that indicates the end of the entry. +_entrieDelimiter=# +|/CONFIG| + +%% List of features that are applied to all entries below. Do NOT use comments in this section. +|Features4ALL| +Group=XYZ +|/Features4ALL| + +%% List of entries used to build the trie. Do NOT use comments in this section. 
+|ENTRIES| +Sheffield#Type:city +Maryland#Type:state \ No newline at end of file