add item package

dmeoli · Jun 24, 2018 · 20399c9 · 20399c9
1 parent 99da357
commit 20399c9
Show file tree

Hide file tree

Showing 34 changed files with 611 additions and 308 deletions.
diff --git a/LICENSE b/LICENSE
@@ -552,7 +552,7 @@ License would be to refrain entirely from conveying the Program.
   13. Use with the GNU Affero General Public License.
 
   Notwithstanding any other provision of this License, you have
-permission to link or combine any covered work with a work licensed
+permission to link or combine any covered work with a work licensed
 under version 3 of the GNU Affero General Public License into a single
 combined work, and to convey the resulting work.  The terms of this
 License will continue to apply to the part which is the covered work,

diff --git a/dict/cntlist b/dict/cntlist
@@ -3158,7 +3158,7 @@
 14 make%2:36:05:: 11
 14 long_ago%4:02:00:: 1
 14 live%2:42:00:: 5
-14 link%2:31:00:: 1
+14 point%2:31:00:: 1
 14 light%3:00:01:: 1
 14 lie%2:42:03:: 4
 14 left%5:00:00:unexhausted:00 2
@@ -8563,8 +8563,8 @@
 5 literally%4:02:00:: 1
 5 liter%1:23:00:: 1
 5 liquid%1:26:00:: 2
-5 link%1:24:00:: 1
-5 link%1:06:00:: 2
+5 point%1:24:00:: 1
+5 point%1:06:00:: 2
 5 line%2:35:00:: 2
 5 line%1:25:01:: 12
 5 life%1:28:02:: 7
@@ -13026,7 +13026,7 @@
 3 literalness%1:07:00:: 1
 3 liquid_air%1:27:00:: 1
 3 lint%1:27:02:: 1
-3 link%2:35:00:: 2
+3 point%2:35:00:: 2
 3 linguistic%3:01:01:: 2
 3 linger%2:42:02:: 1
 3 lined%5:00:00:bordered:00 1
@@ -29175,8 +29175,8 @@
 1 liquid%5:00:00:clear:02 3
 1 lipped%3:00:00:: 1
 1 linoleum%1:27:00:: 1
-1 links%1:06:00:: 1
-1 link%2:42:01:: 3
+1 points%1:06:00:: 1
+1 point%2:42:01:: 3
 1 linguistically%4:02:01:: 1
 1 linguistic_unit%1:10:00:: 1
 1 lingually%4:02:00:: 1

diff --git a/dict/cntlist.rev b/dict/cntlist.rev
@@ -18935,12 +18935,12 @@ linguistic%3:01:01:: 2 3
 linguistic_unit%1:10:00:: 1 1
 linguistically%4:02:01:: 1 1
 linguistics%1:09:00:: 1 2
-link%1:06:00:: 2 5
-link%1:24:00:: 1 5
-link%2:31:00:: 1 14
-link%2:35:00:: 2 3
-link%2:42:01:: 3 1
-links%1:06:00:: 1 1
+point%1:06:00:: 2 5
+point%1:24:00:: 1 5
+point%2:31:00:: 1 14
+point%2:35:00:: 2 3
+point%2:42:01:: 3 1
+points%1:06:00:: 1 1
 linoleum%1:27:00:: 1 1
 lint%1:27:02:: 1 3
 lion%1:05:00:: 1 2

diff --git a/dict/index.verb b/dict/index.verb
@@ -2542,7 +2542,7 @@ cross-fertilise v 2 3 @ > + 2 0 00053889 00053656
 cross-fertilize v 2 3 @ > + 2 0 00053889 00053656  
 cross-file v 1 2 @ ~ 1 0 02472033  
 cross-index v 1 2 @ + 1 0 02472958  
-cross-link v 1 2 @ + 1 0 01291527  
+cross-point v 1 2 @ + 1 0 01291527
 cross-pollinate v 1 2 @ + 1 0 00054059  
 cross-refer v 1 1 @ 1 0 01025935  
 cross_examine v 1 2 @ + 1 0 00787049  
@@ -6077,7 +6077,7 @@ linearise v 1 1 @ 1 0 00489145
 linearize v 1 1 @ 1 0 00489145  
 linger v 5 5 ! @ ~ ^ + 5 4 02731242 02639075 02011560 02058590 02640906  
 linger_over v 1 1 @ 1 0 02640226  
-link v 4 4 @ ~ + ; 4 3 00713167 01354673 02622234 01492052  
+point v 4 4 @ ~ + ; 4 3 00713167 01354673 02622234 01492052
 link_up v 3 3 @ ~ + 3 0 02622234 01354673 00713167  
 lionise v 1 1 @ 1 0 02398956  
 lionize v 1 2 @ + 1 1 02398956  

diff --git a/src/main/config/WS4J.conf b/src/main/config/WS4J.conf
@@ -1,92 +1,143 @@
-# This is a master list of comments as used in the example configuration  
-# files found in this directory. This is not intended to be used as a 
-# configuration file but rather as a plain text summary of possible options  
-# and their values. In fact, the measures will not accept this as a  
+# ----------------------------------------------------------------------
+# This is a master list of comments as used in the example configuration
+# files found in this directory. This is not intended to be used as a
+# configuration file but rather as a plain text summary of possible options
+# and their values. In fact, the measures will not accept this as a
 # configuration file.
 # 
-# All of these options have default values that are described below. The  
-# only exception to this is vectordb, which has no default. If an option is  
-# listed without a value (as in trace:: or cache:: ), then the default value  
+# All of these options have default values that are described below. The 
+# only exception to this is vectordb, which has no default. If an option is 
+# listed without a value (as in trace:: or cache:: ), then the default value
 # is used. 
 # 
-# Note that in the configuration files anything following a # is treated as  
-# a comment, so the following text can be used directly in a configuration 
+# Note that in the configuration files anything following a # is treated as
+# a comment, so the following text can be used directly in a configuration
 # file. You will want to make sure to change the value of an option as fits 
 # your needs however!
 
 # ----------------------------------------------------------------------
 # The following options are supported for all measures
 
-trace = 0          # Turns off (0) tracing. Turn on tracing by setting
-                   # to 1 or 2. The effect of these different levels will
-                   # depend on the measure being used. The default value
-                   # is off (0). If the value is omitted, then the default
-                   # is used. 0, 1, and 2 are the only valid settings.
+trace = 0         # Turns off (0) tracing. Turn on tracing by setting
+                  # to 1 or 2. The effect of these different levels will
+                  # depend on the measure being used. The default value 
+                  # is off (0). If the value is omitted, then the default 
+                  # is used. 0, 1, and 2 are the only valid settings.
 
-cache = 1          # Turns on (1) caching. Turn off caching by setting
-                   # to 0. The default is on (1). If the value is omitted,
-                   # then the default is used. 0 and 1 are the only valid
-                   # settings.
+cache = 1         # Turns on (1) caching. Turn off caching by setting 
+                  # to 0. The default is on (1). If the value is omitted,
+                  # then the default is used. 0 and 1 are the only valid
+                  # settings.
 
-memoryDB = 0       # WordNet DB is loaded on memory when memoryDB (1).
-                   # WordNet DB stays on disk when memoryDB (0).
+memoryDB = 0      # WordNet DB is loaded into memory when memoryDB is on (1).
+                  # WordNet DB stays on disk when memoryDB is off (0).
 
-MFS = 0            # Use Most Frequent Sense when (1).
-                   # Use all sense combinations when (0).
-                   # MFS increases calculation speed up
+MFS = 1           # Use Most Frequent Sense when (1).
+                  # Use all sense combinations when (0). 
+                  # MFS speeds up the calculation.
 
 # ----------------------------------------------------------------------
-# In the future, the following option will be supported by:
-# path, lch, wup, res, lin and jcn measure
-# 
-# rootNode = 1     # Turns on (1) a (hypothetical) top-level root node for
-#                  # the nouns, and another for the verbs. Turn off the
-#                  # root nodes by setting to 0.  The default is to use (1)
-#                  # a unique top-level root node.  If the value is omitted,
-#                  # then the default is used.  0 and 1 are the only valid
-#                  # settings.
-#                  # THIS VALUE IS ALWAYS 1 IN CURRENT IMPLEMENTATION.
+# In the future, the following option will be supported by the path, lch,
+# wup, res, lin and jcn measures
+
+# rootNode = 1    # Turns on (1) a (hypothetical) top-level root node for
+                  # the nouns, and another for the verbs. Turn off the 
+                  # root nodes by setting to 0. The default is to use (1) 
+                  # a unique top-level root node. If the value is omitted,
+                  # then the default is used. 0 and 1 are the only valid
+                  # settings. 
+                  # THIS VALUE IS ALWAYS 1 IN CURRENT IMPLEMENTATION.
 
 # ----------------------------------------------------------------------
-# The following option is supported by: res, lin and jcn measure
+# The following option is supported by the res, lin and jcn measures
 
 infoContent = ic-semcor.dat
 
-                   # Specifies the name of an information content file under
-                   # data/. The value of this option must be the name of a
-                   # file, or a relative or absolute path name. The default
-                   # value of this option IC-semcor.dat.
+                  # Specifies the name of an information content file under 
+                  # data/. The value of this option must be the name of a
+                  # file, or a relative or absolute path name. The default
+                  # value of this option is ic-semcor.dat.
 
 # ----------------------------------------------------------------------
-# The following options are supported by lesk measure
+# The following options are supported by the vector and lesk measures
 
-stem = 0           # Turns on (1) stemming. Turn off stemming by setting
-                   # this value to 0. The default value is off (0).  When
-                   # stemming is on (1), all the words in a gloss are stemmed
-                   # by the Porter stemmer before overlaps are identified.
+stem = 0          # Turns on (1) stemming. Turn off stemming by setting
+                  # this value to 0. The default value is off (0). When 
+                  # stemming is on (1), all the words in a gloss are stemmed
+                  # by the Porter stemmer before overlaps are identified.
 
 stopList = stopList.txt
 
-                   # Specifies the name of a stop list, which consists of
-                   # words that are to be ignored in a gloss overlap. The
-                   # value of this must be a file name, or an absolute or
-                   # relative path name. The default is to not use a stop
-                   # list. If the value is omitted, then the default is used.
-                   # The default value of this option is stopList.txt
-
-# leskRelation = lesk-relation.dat
-
-                   # Specifies a lesk relation file. This value can be a file 
-                   # name, or an absolute or relative path name. The default
-                   # is to use the file lesk-relation.dat, 
-                   # Please note that the format of the lesk relation file is not the same as 
-                   # that of the vector relation file. The lesk relation file
-                   # consists of relation pairs that specify glosses that  
-                   # are to be compared for overlaps. 
-
-leskNormalize = 1  # Turns on (1) normalization of lesk scoring. Turn off
-                   # by setting this value to 0. The default value is on 
-                   # (1).  If the  value is omitted, then the default is used.  
-                   # When normalization is enabled, the gloss overlap score 
-                   # is normalized by the size of the glosses. The details 
-                   # are described in Banerjee and Pedersen (2002).
+                  # Specifies the name of a stop list, which consists of
+                  # words that are to be ignored in a gloss overlap. The
+                  # value of this must be a file name, or an absolute or
+                  # relative path name. The default is to not use a stop
+                  # list. If the value is omitted, then the default is used.
+                  # The default value of this option is stopList.txt.
+
+# ----------------------------------------------------------------------
+# The following options are supported by the lesk measure
+
+# (currently not supported)
+# leskRelation = leskRelation.dat
+
+                  # Specifies a lesk relation file. This value can be a file
+                  # name, or an absolute or relative path name. The default 
+                  # is to use the file lesk-relation.dat.
+                  # Please note that the format of the lesk relation file is 
+                  # not the same as that of the vector relation file. The lesk 
+                  # relation file consists of relation pairs that specify 
+                  # glosses that are to be compared for overlaps. 
+
+leskNormalize = 1 # Turns on (1) normalization of lesk scoring. Turn off
+                  # by setting this value to 0. The default value is on 
+                  # (1). If the value is omitted, then the default is used. 
+                  # When normalization is enabled, the gloss overlap score 
+                  # is normalized by the size of the glosses. The details 
+                  # are described in Banerjee and Pedersen (2002).
+
+# ----------------------------------------------------------------------
+# In the future, the following options will be supported by the vector measure
+
+# vectorDB = wordVectors.dat
+
+                  # Specifies a database file containing word vectors.
+                  # The value of this option must be a file name, or an
+                  # absolute or relative path name. utils/wordVectors.pl 
+                  # must be used to generate this file. This option is
+                  # required, and there is no default value. If the 
+                  # option is not specified, or if the option is specified
+                  # without a value, the vector measure will fail.
+
+# vectorRelation = vectorRelation.dat
+
+                  # Specifies a vector relation file. This value can be a file
+                  # name, or an absolute or relative path name. The default 
+                  # is to use the glos-example relation. If the value is 
+                  # omitted, then the default is used. Please note that the
+                  # format of the vector relation file is not the same as 
+                  # that of the lesk relation file. The vector relation file
+                  # consists of single relations that specify which glosses
+                  # of a word will be used in constructing the gloss vector.
+
+# compounds = wn30compounds.txt
+
+                  # Specifies a file of WordNet compounds. The value of
+                  # this option must be a file name, or an absolute or
+                  # relative path. The program utils/compounds.pl can
+                  # be used to generate this file. When compounds are 
+                  # specified, compound words that occur in glosses are
+                  # identified prior to creating word vectors. The default 
+                  # is to ignore compound words. If the value of this 
+                  # option is omitted, then the default is used. 
+
+# ----------------------------------------------------------------------
+# In the future, the following option may be supported by the random measure
+
+# maxRand = 1     # The random measure will generate measures between 0
+                  # and this value. The value of this option may be an
+                  # integer or a real number. The default value is 1.
+                  # If the value of this option is omitted, then the 
+                  # default is used. 
+
+# ----------------------------------------------------------------------
diff --git a/src/main/java/edu/uniba/di/lacam/kdde/lexical_db/ILexicalDatabase.java b/src/main/java/edu/uniba/di/lacam/kdde/lexical_db/ILexicalDatabase.java
@@ -1,8 +1,8 @@
 package edu.uniba.di.lacam.kdde.lexical_db;
 
 import edu.uniba.di.lacam.kdde.lexical_db.data.Concept;
-import edu.uniba.di.lacam.kdde.lexical_db.data.Link;
-import edu.uniba.di.lacam.kdde.lexical_db.data.POS;
+import edu.uniba.di.lacam.kdde.lexical_db.item.Link;
+import edu.uniba.di.lacam.kdde.lexical_db.item.POS;
 
 import java.util.List;
 
@@ -16,9 +16,9 @@ public interface ILexicalDatabase {
 
     List<Concept> getAllConcepts(String lemma, POS pos);
 
-    List<String> linkToSynsets(String synset, Link link);
+    List<String> linkToSynsets(String synset, Link point);
 
     List<String> findWordsBySynset(String synset);
 
-    List<String> getGloss(Concept synset, String link);
+    List<String> getGloss(Concept synset, Link link);
 }