# Sample input for Rover Semantic Relatedness Batch Processing
#
# Use a configuration to narrow down the GermaNet searches and
# to specify parameters for the relatedness calculations.
#
# Word search constraints can be configured separately for both words.
# The search constraint options are:
#
# wordCategories_1, wordCategories_2 (POS):
#   possible values: one or more of: adj, nomen, verben
#   default value: list of all possible values
#   Note that the current measures can only calculate relatedness of
#   words that belong to the same word category, so the intersection of
#   these two sets should not be empty.
#
# wordClasses_1, wordClasses_2 (semantic fields):
#   possible values: see https://uni-tuebingen.de/en/142844 for details
#   default value: list of all possible values
#
# orthFormVariants_1, orthFormVariants_2:
#   possible values: one or more of: orthForm, orthVar, oldOrthForm, oldOrthVar
#   default value: list of all possible values
#
# ignoreCase_1, ignoreCase_2:
#   possible values: true, false
#   default value: false
#
# Relatedness calculation options:
#
# measures:
#   possible values: SimplePath, WuAndPalmer, LeacockAndChodorow, Resnik, Lin, JiangAndConrath
#   default value: list of all possible values
#
# normalizedMax:
#   The raw values returned by relatedness calculations are often difficult to
#   interpret. Normalization makes it easy to interpret the results of an
#   individual measure, and also allows comparison of the results of different
#   measures. Results will be normalized to be between 0 (or near 0) and this value.
#   possible values: any non-negative integer, where 0 indicates no normalization
#   default value: 1
#
# decimalPlaces:
#   Results will be rounded to this many decimal places.
#   possible values: positive integer
#   default value: 5
#
#
# To use the default value for a given config option, either delete
# its entry, comment out the entry with '#', or include all values.
#
# To use all default values, remove or comment out the entire config.
#
# The config is specified in a JSON-like format, except that string
# values do not need to be placed in quotes, and comments are allowed.
#
# Sample config: both words are restricted to nouns in the Tier and Mensch
# word classes, matched case-insensitively; relatedness is computed with the
# SimplePath and Lin measures, normalized to a maximum of 1 and rounded to
# 5 decimal places.
config: {
  wordCategories_1: [nomen],
  wordClasses_1: [Tier, Mensch],
  orthFormVariants_1: [orthForm, orthVar],
  ignoreCase_1: true,
  wordCategories_2: [nomen],
  wordClasses_2: [Tier, Mensch],
  orthFormVariants_2: [orthForm, orthVar],
  ignoreCase_2: true,
  measures: [SimplePath, Lin],
  normalizedMax: 1,
  decimalPlaces: 5
}

# The data section consists of word pairs, one pair per line, with the
# two words of each pair separated by a comma.
#
# The maximum number of word pairs is 200. Comments are allowed.
data:
Hund, Katze
Hund, Spinne
Pferd, Schwein