Skip to content

Commit

Permalink
add item package
Browse files Browse the repository at this point in the history
  • Loading branch information
dmeoli committed Jun 24, 2018
1 parent 99da357 commit 20399c9
Show file tree
Hide file tree
Showing 34 changed files with 611 additions and 308 deletions.
2 changes: 1 addition & 1 deletion LICENSE
Original file line number Diff line number Diff line change
Expand Up @@ -552,7 +552,7 @@ License would be to refrain entirely from conveying the Program.
13. Use with the GNU Affero General Public License.

Notwithstanding any other provision of this License, you have
permission to link or combine any covered work with a work licensed
permission to point or combine any covered work with a work licensed
under version 3 of the GNU Affero General Public License into a single
combined work, and to convey the resulting work. The terms of this
License will continue to apply to the part which is the covered work,
Expand Down
12 changes: 6 additions & 6 deletions dict/cntlist
Original file line number Diff line number Diff line change
Expand Up @@ -3158,7 +3158,7 @@
14 make%2:36:05:: 11
14 long_ago%4:02:00:: 1
14 live%2:42:00:: 5
14 link%2:31:00:: 1
14 point%2:31:00:: 1
14 light%3:00:01:: 1
14 lie%2:42:03:: 4
14 left%5:00:00:unexhausted:00 2
Expand Down Expand Up @@ -8563,8 +8563,8 @@
5 literally%4:02:00:: 1
5 liter%1:23:00:: 1
5 liquid%1:26:00:: 2
5 link%1:24:00:: 1
5 link%1:06:00:: 2
5 point%1:24:00:: 1
5 point%1:06:00:: 2
5 line%2:35:00:: 2
5 line%1:25:01:: 12
5 life%1:28:02:: 7
Expand Down Expand Up @@ -13026,7 +13026,7 @@
3 literalness%1:07:00:: 1
3 liquid_air%1:27:00:: 1
3 lint%1:27:02:: 1
3 link%2:35:00:: 2
3 point%2:35:00:: 2
3 linguistic%3:01:01:: 2
3 linger%2:42:02:: 1
3 lined%5:00:00:bordered:00 1
Expand Down Expand Up @@ -29175,8 +29175,8 @@
1 liquid%5:00:00:clear:02 3
1 lipped%3:00:00:: 1
1 linoleum%1:27:00:: 1
1 links%1:06:00:: 1
1 link%2:42:01:: 3
1 points%1:06:00:: 1
1 point%2:42:01:: 3
1 linguistically%4:02:01:: 1
1 linguistic_unit%1:10:00:: 1
1 lingually%4:02:00:: 1
Expand Down
12 changes: 6 additions & 6 deletions dict/cntlist.rev
Original file line number Diff line number Diff line change
Expand Up @@ -18935,12 +18935,12 @@ linguistic%3:01:01:: 2 3
linguistic_unit%1:10:00:: 1 1
linguistically%4:02:01:: 1 1
linguistics%1:09:00:: 1 2
link%1:06:00:: 2 5
link%1:24:00:: 1 5
link%2:31:00:: 1 14
link%2:35:00:: 2 3
link%2:42:01:: 3 1
links%1:06:00:: 1 1
point%1:06:00:: 2 5
point%1:24:00:: 1 5
point%2:31:00:: 1 14
point%2:35:00:: 2 3
point%2:42:01:: 3 1
points%1:06:00:: 1 1
linoleum%1:27:00:: 1 1
lint%1:27:02:: 1 3
lion%1:05:00:: 1 2
Expand Down
4 changes: 2 additions & 2 deletions dict/index.verb
Original file line number Diff line number Diff line change
Expand Up @@ -2542,7 +2542,7 @@ cross-fertilise v 2 3 @ > + 2 0 00053889 00053656
cross-fertilize v 2 3 @ > + 2 0 00053889 00053656
cross-file v 1 2 @ ~ 1 0 02472033
cross-index v 1 2 @ + 1 0 02472958
cross-link v 1 2 @ + 1 0 01291527
cross-point v 1 2 @ + 1 0 01291527
cross-pollinate v 1 2 @ + 1 0 00054059
cross-refer v 1 1 @ 1 0 01025935
cross_examine v 1 2 @ + 1 0 00787049
Expand Down Expand Up @@ -6077,7 +6077,7 @@ linearise v 1 1 @ 1 0 00489145
linearize v 1 1 @ 1 0 00489145
linger v 5 5 ! @ ~ ^ + 5 4 02731242 02639075 02011560 02058590 02640906
linger_over v 1 1 @ 1 0 02640226
link v 4 4 @ ~ + ; 4 3 00713167 01354673 02622234 01492052
point v 4 4 @ ~ + ; 4 3 00713167 01354673 02622234 01492052
link_up v 3 3 @ ~ + 3 0 02622234 01354673 00713167
lionise v 1 1 @ 1 0 02398956
lionize v 1 2 @ + 1 1 02398956
Expand Down
183 changes: 117 additions & 66 deletions src/main/config/WS4J.conf
Original file line number Diff line number Diff line change
@@ -1,92 +1,143 @@
# This is a master list of comments as used in the example configuration
# files found in this directory. This is not intended to be used as a
# configuration file but rather as a plain text summary of possible options
# and their values. In fact, the measures will not accept this as a
# ----------------------------------------------------------------------
# This is a master list of comments as used in the example configuration
# files found in this directory. This is not intended to be used as a
# configuration file but rather as a plain text summary of possible options
# and their values. In fact, the measures will not accept this as a
# configuration file.
#
# All of these options have default values that are described below. The
# only exception to this is vectordb, which has no default. If an option is
# listed without a value (as in trace:: or cache:: ), then the default value
# All of these options have default values that are described below. The
# only exception to this is vectordb, which has no default. If an option is
# listed without a value (as in trace:: or cache:: ), then the default value
# is used.
#
# Note that in the configuration files anything following a # is treated as
# a comment, so the following text can be used directly in a configuration
# Note that in the configuration files anything following a # is treated as
# a comment, so the following text can be used directly in a configuration
# file. You will want to make sure to change the value of an option as fits
# your needs however!

# ----------------------------------------------------------------------
# The following options are supported for all measures

trace = 0 # Turns off (0) tracing. Turn on tracing by setting
# to 1 or 2. The effect of these different levels will
# depend on the measure being used. The default value
# is off (0). If the value is omitted, then the default
# is used. 0, 1, and 2 are the only valid settings.
trace = 0 # Turns off (0) tracing. Turn on tracing by setting
# to 1 or 2. The effect of these different levels will
# depend on the measure being used. The default value
# is off (0). If the value is omitted, then the default
# is used. 0, 1, and 2 are the only valid settings.

cache = 1 # Turns on (1) caching. Turn off caching by setting
# to 0. The default is on (1). If the value is omitted,
# then the default is used. 0 and 1 are the only valid
# settings.
cache = 1 # Turns on (1) caching. Turn off caching by setting
# to 0. The default is on (1). If the value is omitted,
# then the default is used. 0 and 1 are the only valid
# settings.

memoryDB = 0 # WordNet DB is loaded on memory when memoryDB (1).
# WordNet DB stays on disk when memoryDB (0).
memoryDB = 0 # WordNet DB is loaded into memory when memoryDB is on (1).
# WordNet DB stays on disk when memoryDB is off (0).

MFS = 0 # Use Most Frequent Sense when (1).
# Use all sense combinations when (0).
# MFS increases calculation speed up
MFS = 1 # Use Most Frequent Sense when (1).
# Use all sense combinations when (0).
# Using MFS speeds up the calculation.

# ----------------------------------------------------------------------
# In the future, the following option will be supported by:
# path, lch, wup, res, lin and jcn measure
#
# rootNode = 1 # Turns on (1) a (hypothetical) top-level root node for
# # the nouns, and another for the verbs. Turn off the
# # root nodes by setting to 0. The default is to use (1)
# # a unique top-level root node. If the value is omitted,
# # then the default is used. 0 and 1 are the only valid
# # settings.
# # THIS VALUE IS ALWAYS 1 IN CURRENT IMPLEMENTATION.
# In the future, the following option will be supported by the path, lch,
# wup, res, lin and jcn measures

# rootNode = 1 # Turns on (1) a (hypothetical) top-level root node for
# the nouns, and another for the verbs. Turn off the
# root nodes by setting to 0. The default is to use (1)
# a unique top-level root node. If the value is omitted,
# then the default is used. 0 and 1 are the only valid
# settings.
# THIS VALUE IS ALWAYS 1 IN CURRENT IMPLEMENTATION.

# ----------------------------------------------------------------------
# The following option is supported by: res, lin and jcn measure
# The following option is supported by the res, lin and jcn measures

infoContent = ic-semcor.dat

# Specifies the name of an information content file under
# data/. The value of this option must be the name of a
# file, or a relative or absolute path name. The default
# value of this option IC-semcor.dat.
# Specifies the name of an information content file under
# data/. The value of this option must be the name of a
# file, or a relative or absolute path name. The default
# value of this option is ic-semcor.dat.

# ----------------------------------------------------------------------
# The following options are supported by lesk measure
# The following options are supported by the vector and lesk measures

stem = 0 # Turns on (1) stemming. Turn off stemming by setting
# this value to 0. The default value is off (0). When
# stemming is on (1), all the words in a gloss are stemmed
# by the Porter stemmer before overlaps are identified.
stem = 0 # Turns on (1) stemming. Turn off stemming by setting
# this value to 0. The default value is off (0). When
# stemming is on (1), all the words in a gloss are stemmed
# by the Porter stemmer before overlaps are identified.

stopList = stopList.txt

# Specifies the name of a stop list, which consists of
# words that are to be ignored in a gloss overlap. The
# value of this must be a file name, or an absolute or
# relative path name. The default is to not use a stop
# list. If the value is omitted, then the default is used.
# The default value of this option is stopList.txt

# leskRelation = lesk-relation.dat

# Specifies a lesk relation file. This value can be a file
# name, or an absolute or relative path name. The default
# is to use the file lesk-relation.dat,
# Please note that the format of the lesk relation file is not the same as
# that of the vector relation file. The lesk relation file
# consists of relation pairs that specify glosses that
# are to be compared for overlaps.

leskNormalize = 1 # Turns on (1) normalization of lesk scoring. Turn off
# by setting this value to 0. The default value is on
# (1). If the value is omitted, then the default is used.
# When normalization is enabled, the gloss overlap score
# is normalized by the size of the glosses. The details
# are described in Banerjee and Pedersen (2002).
# Specifies the name of a stop list, which consists of
# words that are to be ignored in a gloss overlap. The
# value of this must be a file name, or an absolute or
# relative path name. The default is to not use a stop
# list. If the value is omitted, then the default is used.
# The default value of this option is stoplist.txt.

# ----------------------------------------------------------------------
# The following options are supported by the lesk measure

# (currently not supported)
# leskRelation = leskRelation.dat

# Specifies a lesk relation file. This value can be a file
# name, or an absolute or relative path name. The default
# is to use the file lesk-relation.dat.
# Please note that the format of the lesk relation file is
# not the same as that of the vector relation file. The lesk
# relation file consists of relation pairs that specify
# glosses that are to be compared for overlaps.

leskNormalize = 1 # Turns on (1) normalization of lesk scoring. Turn off
# by setting this value to 0. The default value is on
# (1). If the value is omitted, then the default is used.
# When normalization is enabled, the gloss overlap score
# is normalized by the size of the glosses. The details
# are described in Banerjee and Pedersen (2002).

# ----------------------------------------------------------------------
# In the future, the following options will be supported by the vector measure

# vectorDB = wordVectors.dat

# Specifies a database file containing word vectors.
# The value of this option must be a file name, or an
# absolute or relative path name. utils/wordVectors.pl
# must be used to generate this file. This option is
# required, and there is no default value. If the
# option is not specified, or if the option is specified
# without a value, the vector measure will fail.

# vectorRelation = vectorRelation.dat

# Specifies a vector relation file. This value can be a file
# name, or an absolute or relative path name. The default
# is to use the glos-example relation. If the value is
# omitted, then the default is used. Please note that the
# format of the vector relation file is not the same as
# that of the lesk relation file. The vector relation file
# consists of single relations that specify which glosses
# of a word will be used in constructing the gloss vector.

# compounds = wn30compounds.txt

# Specifies a file of WordNet compounds. The value of
# this option must be a file name, or an absolute or
# relative path. The program utils/compounds.pl can
# be used to generate this file. When compounds are
# specified, compound words that occur in glosses are
# identified prior to creating word vectors. The default
# is to ignore compound words. If the value of this
# option is omitted, then the default is used.

# ----------------------------------------------------------------------
# In the future, the following option may be supported by the random measure

# maxRand = 1 # The random measure will generate measures between 0
# and this value. The value of this option may be an
# integer or a real number. The default value is 1.
# If the value of this option is omitted, then the
# default is used.

# ----------------------------------------------------------------------
Original file line number Diff line number Diff line change
@@ -1,8 +1,8 @@
package edu.uniba.di.lacam.kdde.lexical_db;

import edu.uniba.di.lacam.kdde.lexical_db.data.Concept;
import edu.uniba.di.lacam.kdde.lexical_db.data.Link;
import edu.uniba.di.lacam.kdde.lexical_db.data.POS;
import edu.uniba.di.lacam.kdde.lexical_db.item.Link;
import edu.uniba.di.lacam.kdde.lexical_db.item.POS;

import java.util.List;

Expand All @@ -16,9 +16,9 @@ public interface ILexicalDatabase {

List<Concept> getAllConcepts(String lemma, POS pos);

List<String> linkToSynsets(String synset, Link link);
List<String> linkToSynsets(String synset, Link point);

List<String> findWordsBySynset(String synset);

List<String> getGloss(Concept synset, String link);
List<String> getGloss(Concept synset, Link link);
}
Loading

0 comments on commit 20399c9

Please sign in to comment.