p_FeatureExtractors) {
40 | super(p_FeatureExtractors);
41 | }
42 | }
43 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/feature/CCollocation.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.feature;
21 |
22 | /**
23 | * Collocation feature: a concrete AListFeature subclass that declares no instance fields of its own.
24 | *
25 | * @author zhongzhi
26 | *
27 | */
28 | public class CCollocation extends AListFeature {
29 |
30 | /**
31 | * Serialization version identifier.
32 | */
33 | private static final long serialVersionUID = 1L;
34 |
35 | public CCollocation() {
36 | }
37 |
38 | /*
39 | * Builds a new CCollocation and assigns this instance's m_Key and m_Value to it as-is (no further copying here).
40 | * @see sg.edu.nus.comp.nlp.ims.feature.AListFeature#clone()
41 | */
42 | public Object clone() {
43 | CCollocation clone = new CCollocation();
44 | clone.m_Key = this.m_Key;
45 | clone.m_Value = this.m_Value;
46 | return clone;
47 | }
48 | }
49 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/feature/CPOSFeature.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.feature;
21 |
22 | /**
23 | * Part-of-speech (POS) feature: a concrete AListFeature subclass that declares no instance fields of its own.
24 | *
25 | * @author zhongzhi
26 | *
27 | */
28 | public class CPOSFeature extends AListFeature {
29 |
30 | /**
31 | * Serialization version identifier.
32 | */
33 | private static final long serialVersionUID = 1L;
34 |
35 | /*
36 | * Builds a new CPOSFeature and assigns this instance's m_Key and m_Value to it as-is (no further copying here).
37 | * @see sg.edu.nus.comp.nlp.ims.feature.AListFeature#clone()
38 | */
39 | public Object clone() {
40 | CPOSFeature clone = new CPOSFeature();
41 | clone.m_Key = this.m_Key;
42 | clone.m_Value = this.m_Value;
43 | return clone;
44 | }
45 | }
46 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/feature/CSurroundingWord.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.feature;
21 |
22 | /**
23 | * Surrounding word feature: a concrete ABinaryFeature subclass whose value is set to true on construction.
24 | *
25 | * @author zhongzhi
26 | *
27 | */
28 | public class CSurroundingWord extends ABinaryFeature {
29 |
30 | /**
31 | * Serialization version identifier.
32 | */
33 | private static final long serialVersionUID = 1L;
34 |
35 | /**
36 | * Creates a feature with no key yet (m_Key is null) and m_Value set to true.
37 | */
38 | public CSurroundingWord() {
39 | this.m_Key = null;
40 | this.m_Value = true;
41 | }
42 |
43 | /*
44 | * Builds a new CSurroundingWord and copies only m_Key; m_Value is not copied and stays as the constructor set it (true).
45 | * @see sg.edu.nus.comp.nlp.ims.feature.ABinaryFeature#clone()
46 | */
47 | public Object clone() {
48 | CSurroundingWord clone = new CSurroundingWord();
49 | clone.m_Key = this.m_Key;
50 | return clone;
51 | }
52 | }
53 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/feature/package.html:
--------------------------------------------------------------------------------
1 |
3 |
4 |
5 |
6 | Package related to features used in WSD.
7 |
8 |
9 |
10 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/implement/package.html:
--------------------------------------------------------------------------------
1 |
3 |
4 |
5 |
6 | Package containing the main WSD API.
7 |
8 |
9 |
10 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/instance/package.html:
--------------------------------------------------------------------------------
1 |
3 |
4 |
5 |
6 | Package related to wsd instance.
7 |
8 |
9 |
10 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/io/IModelWriter.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.io;
21 |
22 | import java.io.IOException;
23 |
24 | /**
25 | * Model writer interface: implementations persist a model and accept string options.
26 | *
27 | * @author zhongzhi
28 | *
29 | */
30 | public interface IModelWriter {
31 |
32 | /**
33 | * Writes a model.
34 | *
35 | * @param p_ModelInfo
36 | * the model to write (declared as Object; the expected concrete type is not specified here)
37 | * @throws IOException
38 | * if an error occurs while saving the model
39 | */
40 | public void write(Object p_ModelInfo) throws IOException;
41 |
42 | /**
43 | * Sets the writer's options.
44 | *
45 | * @param p_Options
46 | * options as an array of strings (their format is not specified by this interface)
47 | */
48 | public void setOptions(String[] p_Options);
49 | }
50 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/io/IResultWriter.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.io;
21 |
22 | import java.io.IOException;
23 |
24 | /**
25 | * Result writer interface: implementations save results, render them as strings and accept string options.
26 | *
27 | * @author zhongzhi
28 | *
29 | */
30 | public interface IResultWriter {
31 | /**
32 | * Writes results.
33 | *
34 | * @param p_Result
35 | * the result to write (declared as Object; the expected concrete type is not specified here)
36 | * @throws IOException
37 | * if an error occurs while saving the result
38 | */
39 | public void write(Object p_Result) throws IOException;
40 |
41 | /**
42 | * Converts a result to its string form.
43 | *
44 | * @param p_Result
45 | * the classification result to convert
46 | * @return the result in string format
47 | */
48 | public String toString(Object p_Result);
49 |
50 | /**
51 | * Sets the writer's options.
52 | *
53 | * @param p_Options
54 | * options as an array of strings (their format is not specified by this interface)
55 | */
56 | public void setOptions(String[] p_Options);
57 | }
58 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/io/package.html:
--------------------------------------------------------------------------------
1 |
3 |
4 |
5 |
6 | Package related to IO.
7 |
8 |
9 |
10 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/lexelt/CCollocationFeatureSelector.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.lexelt;
21 |
22 | import sg.edu.nus.comp.nlp.ims.feature.CCollocation;
23 |
24 | /**
25 | * Collocation feature selector: an AListFeatureSelector configured for the CCollocation feature class.
26 | *
27 | * @author zhongzhi
28 | *
29 | */
30 | public class CCollocationFeatureSelector extends AListFeatureSelector {
31 | /**
32 | * Stores the cut-off in m_M2 and sets m_FeatureName to the class name of CCollocation.
33 | *
34 | * @param p_M2
35 | * cut-off value (how it is applied is defined outside this class)
36 | */
37 | public CCollocationFeatureSelector(int p_M2) {
38 | this.m_M2 = p_M2;
39 | this.m_FeatureName = CCollocation.class.getName();
40 | }
41 |
42 | }
43 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/lexelt/CModelInfo.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.lexelt;
21 |
22 | /**
23 | * Weka model information: a plain holder with three public fields and no methods.
24 | *
25 | * @author zhongzhi
26 | *
27 | */
28 | public class CModelInfo {
29 | // model id (the lexelt this model is stored under)
30 | public String lexelt;
31 | // weka model (declared as Object, so the concrete model type is not fixed here)
32 | public Object model;
33 | // statistic kept alongside the model (declared as Object; concrete type not visible here)
34 | public Object statistic;
35 | }
36 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/lexelt/CPOSFeatureSelector.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.lexelt;
21 |
22 | import sg.edu.nus.comp.nlp.ims.feature.CPOSFeature;
23 |
24 | /**
25 | * POS tag feature selector: an AListFeatureSelector configured for the CPOSFeature feature class.
26 | *
27 | * @author zhongzhi
28 | *
29 | */
30 | public class CPOSFeatureSelector extends AListFeatureSelector {
31 | /**
32 | * Stores the threshold in m_M2 and sets m_FeatureName to the class name of CPOSFeature.
33 | *
34 | * @param p_M2
35 | * threshold value (how it is applied is defined outside this class)
36 | */
37 | public CPOSFeatureSelector(int p_M2) {
38 | this.m_M2 = p_M2;
39 | this.m_FeatureName = CPOSFeature.class.getName();
40 | }
41 |
42 | }
43 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/lexelt/package.html:
--------------------------------------------------------------------------------
1 |
3 |
4 |
5 |
6 | Package related to a set of instances that share the same lexelt.
7 |
8 |
9 |
10 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/util/CPair.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.util;
21 |
22 | /**
23 | * Pair template: holds a first value of type F and a second value of type S.
24 | * @author zhongzhi
25 | * The type parameters F and S are declared on the class header so the fields and accessors below resolve.
26 | */
27 | public class CPair<F, S> {
28 | // first value
29 | protected F m_First;
30 | // second value
31 | protected S m_Second;
32 |
33 | /**
34 | * Creates a pair from the two given values; both are stored as passed, without checks.
35 | * @param p_First first value
36 | * @param p_Second second value
37 | */
38 | public CPair(F p_First, S p_Second) {
39 | m_First = p_First;
40 | m_Second = p_Second;
41 | }
42 |
43 | /**
44 | * Returns the first value.
45 | * @return first
46 | */
47 | public F getFirst() {
48 | return m_First;
49 | }
50 |
51 | /**
52 | * Returns the second value.
53 | * @return second
54 | */
55 | public S getSecond() {
56 | return m_Second;
57 | }
58 |
59 | }
60 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/util/ILemmatizer.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.util;
21 |
22 | /**
23 | * Lemmatizer interface: maps a string-array input to a lemma or to a lexelt.
24 | *
25 | * @author zhongzhi
26 | *
27 | */
28 | public interface ILemmatizer {
29 | /**
30 | * Lemmatizes the input.
31 | * @param p_Input input information (the layout of the array is not specified here - TODO confirm with implementations)
32 | * @return lemma
33 | */
34 | public String lemmatize(String[] p_Input);
35 |
36 | /**
37 | * Guesses the lexelt of the input (how this differs from getLexelt is not specified here - TODO confirm).
38 | * @param p_Input input
39 | * @return lexelt
40 | */
41 | public String guessLexelt(String[] p_Input);
42 |
43 | /**
44 | * Gets the lexelt of the input.
45 | * @param p_Input input
46 | * @return lexelt
47 | */
48 | public String getLexelt(String[] p_Input);
49 | }
50 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/util/IPOSTagger.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.util;
21 |
22 | /**
23 | * POS tagger interface: tags a tokenized sentence and splits a tagged token into its tag and its token.
24 | *
25 | * @author zhongzhi
26 | *
27 | */
28 | public interface IPOSTagger {
29 | /**
30 | * Tags a tokenized input sentence.
31 | *
32 | * @param input
33 | * a tokenized sentence, passed as a single string
34 | * @return the sentence with a tag for each token (the tagged format is not specified by this interface)
35 | */
36 | public String tag(String input);
37 |
38 | /**
39 | * Gets the tag of a tagged token.
40 | *
41 | * @param input
42 | * a tagged token
43 | * @return the tag part of the tagged token
44 | */
45 | public String getTag(String input);
46 |
47 | /**
48 | * Gets the original token of a tagged token.
49 | *
50 | * @param input
51 | * a tagged token
52 | * @return the original token, without its tag
53 | */
54 | public String getToken(String input);
55 |
56 | }
57 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/util/ISenseIndex.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.util;
21 |
22 | /**
23 | * Sense index interface. Refer to the index.sense file in WordNet.
24 | *
25 | * @author zhongzhi
26 | *
27 | */
28 | public interface ISenseIndex {
29 | /**
30 | * Gets the first sense of p_Lexelt.
31 | *
32 | * @param p_Lexelt
33 | * lexelt id
34 | * @return the first sense (behaviour for an unknown lexelt is not specified here)
35 | */
36 | public String getFirstSense(String p_Lexelt);
37 |
38 | /**
39 | * Gets the sense number of p_Sense.
40 | *
41 | * @param p_Sense
42 | * sense
43 | * @return the sense number (behaviour for an unknown sense is not specified here)
44 | */
45 | public int getSenseNo(String p_Sense);
46 |
47 | }
48 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/util/ISentenceSplitter.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.util;
21 |
22 | /**
23 | * Sentence splitter interface: turns one input string into an array of sentences.
24 | *
25 | * @author zhongzhi
26 | *
27 | */
28 | public interface ISentenceSplitter {
29 | /**
30 | * Splits the input into sentences.
31 | *
32 | * @param input
33 | * the input string to split
34 | * @return the sentences, one per array element
35 | */
36 | public String[] split(String input);
37 | }
38 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/util/ITokenizer.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * IMS (It Makes Sense) -- NUS WSD System
3 | * Copyright (c) 2013 National University of Singapore.
4 | *
5 | * This program is free software: you can redistribute it and/or modify
6 | * it under the terms of the GNU General Public License as published by
7 | * the Free Software Foundation, either version 3 of the License, or
8 | * (at your option) any later version.
9 | *
10 | * This program is distributed in the hope that it will be useful,
11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | * GNU General Public License for more details.
14 | *
15 | * You should have received a copy of the GNU General Public License
16 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
17 | *
18 | ******************************************************************************/
19 |
20 | package sg.edu.nus.comp.nlp.ims.util;
21 |
22 | /**
23 | * Sentence tokenizer interface: turns one input sentence into an array of tokens.
24 | *
25 | * @author zhongzhi
26 | *
27 | */
28 | public interface ITokenizer {
29 |
30 | /**
31 | * Tokenizes an input sentence into tokens.
32 | *
33 | * @param input
34 | * the input sentence
35 | * @return the tokens, one per array element
36 | */
37 | public String[] tokenize(String input);
38 | }
39 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/main/java/sg/edu/nus/comp/nlp/ims/util/package.html:
--------------------------------------------------------------------------------
1 |
3 |
4 |
5 |
6 | Package related to utility data structures, algorithms and some external API used by multiple other packages.
7 |
8 |
9 |
10 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.ims-gpl/src/test/resources/plain/test.txt:
--------------------------------------------------------------------------------
1 | IMS (It Makes Sense) is a supervised English all-words word sense disambiguation (WSD) system. The flexible framework of IMS allows users to integrate different preprocessing tools, additional features, and different classifiers. By default, we use linear support vector machines as the classifier with multiple features. This implementation of IMS achieves state-of-the-art results on several SensEval and SemEval tasks.
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.twsi-gpl/.license-header.txt:
--------------------------------------------------------------------------------
1 | Copyright ${year}
2 | Ubiquitous Knowledge Processing (UKP) Lab
3 | Technische Universität Darmstadt
4 |
5 | This program is free software: you can redistribute it and/or modify
6 | it under the terms of the GNU General Public License as published by
7 | the Free Software Foundation, either version 3 of the License, or
8 | (at your option) any later version.
9 |
10 | This program is distributed in the hope that it will be useful,
11 | but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | GNU General Public License for more details.
14 |
15 | You should have received a copy of the GNU General Public License
16 | along with this program. If not, see <http://www.gnu.org/licenses/>.
17 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.supervised.twsi-gpl/pom.xml:
--------------------------------------------------------------------------------
1 |
21 |
22 | 4.0.0
23 |
24 | de.tudarmstadt.ukp.dkpro.wsd
25 | de.tudarmstadt.ukp.dkpro.wsd-gpl
26 | ../de.tudarmstadt.ukp.dkpro.wsd-gpl
27 | 1.3.0-SNAPSHOT
28 |
29 | de.tudarmstadt.ukp.dkpro.wsd.supervised.twsi-gpl
30 |
31 |
32 | de.tudarmstadt.ukp.dkpro.wsd
33 |
34 | de.tudarmstadt.ukp.dkpro.wsd.si.twsi-gpl
35 |
36 |
37 |
38 | DKPro WSD GPL - TWSI disambiguation
39 | DKPro WSD GPL modules for the Turk Bootstrap Word Sense Inventory disambiguation system
40 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/pom.xml:
--------------------------------------------------------------------------------
1 |
18 |
19 | 4.0.0
20 |
21 | de.tudarmstadt.ukp.dkpro.wsd-asl
22 | ../de.tudarmstadt.ukp.dkpro.wsd-asl
23 | de.tudarmstadt.ukp.dkpro.wsd
24 | 1.3.0-SNAPSHOT
25 |
26 | de.tudarmstadt.ukp.dkpro.wsd.testing
27 |
28 |
29 |
30 | maven-javadoc-plugin
31 |
32 | de.tudarmstadt.ukp.dkpro.wsd.testing
33 |
34 |
35 |
36 |
37 | DKPro WSD - Testing
38 | Data used in JUnit tests by various DKPro WSD modules
39 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/java/de/tudarmstadt/ukp/dkpro/wsd/testing/package-info.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * Copyright 2017
3 | * Ubiquitous Knowledge Processing (UKP) Lab
4 | * Technische Universität Darmstadt
5 | *
6 | * Licensed under the Apache License, Version 2.0 (the "License");
7 | * you may not use this file except in compliance with the License.
8 | * You may obtain a copy of the License at
9 | *
10 | * http://www.apache.org/licenses/LICENSE-2.0
11 | *
12 | * Unless required by applicable law or agreed to in writing, software
13 | * distributed under the License is distributed on an "AS IS" BASIS,
14 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15 | * See the License for the specific language governing permissions and
16 | * limitations under the License.
17 | ******************************************************************************/
18 |
19 | /**
20 | * This module contains shared resources for JUnit tests. The
21 | * package has no classes.
22 | */
23 | package de.tudarmstadt.ukp.dkpro.wsd.testing;
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/masc/tell-v/tell-v.txt:
--------------------------------------------------------------------------------
1 | I am a canon builder," he told me.
2 | But I told the third person that I am only telling you once.
3 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/senseval/index.sense:
--------------------------------------------------------------------------------
1 | call_for%2:32:03:: 01063695 3 1
2 | call_for%2:32:04:: 00752764 1 24
3 | call_for%2:40:00:: 02305586 4 0
4 | call_for%2:42:00:: 02627934 2 21
5 | call%1:10:01:: 06272803 1 9
6 | call%1:10:02:: 07120524 3 3
7 | call%1:10:03:: 06796642 5 1
8 | call%1:10:04:: 07190693 9 0
9 | call%1:10:05:: 07192129 4 2
10 | call%1:10:06:: 07192511 8 0
11 | call%1:10:07:: 06582761 10 0
12 | call%1:10:08:: 07192661 7 0
13 | animal%1:03:00:: 00015388 1 67
14 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/senseval/semeval1aw.dtd:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 |
6 |
7 |
8 |
9 |
10 |
11 |
12 |
13 |
14 |
15 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/senseval/semeval1aw.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 | Eggs
6 | looked
7 | like
8 | food
9 | .
10 |
11 |
12 |
13 |
14 | Hello
15 | .
16 |
17 |
18 | He
19 | is
20 | good
21 | .
22 |
23 |
24 |
25 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/senseval/semeval2aw.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 |
6 | Eggs
7 | looked
8 | up
9 | like
10 | food
11 | .
12 |
13 |
14 |
15 |
16 | Hello
17 | .
18 |
19 |
20 | He
21 | is
22 | good
23 | .
24 |
25 |
26 |
27 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/senseval/senseval2aw.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 | He
6 | thought
7 | on
8 | the
9 | spur
10 | of
11 | the
12 | moment
13 | ,
14 | as
15 | a
16 | matter
17 | of
18 | fact
19 | .
20 |
21 |
22 |
23 |
24 |
25 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/senseval/senseval2ls.key:
--------------------------------------------------------------------------------
1 | call.v call.1 call_for%2:32:03::/0.6 call_for%2:42:00::/0.4 !! this is a comment
2 | animal.n animal.1 animal%1:03:00:: U
3 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/senseval/senseval2ls.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 | Eggs call for food.
6 |
7 |
8 |
9 |
10 |
11 | Dave is an animal.
12 |
13 |
14 |
15 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/senseval/senseval2ls_lsr.key:
--------------------------------------------------------------------------------
1 | call.v call.1 art#933420|artistic_creation#933420|artistic_production#933420|---n/0.6 art#5638987|artistry#5638987|prowess#5638987|---n/0.4 !! this is a comment
2 | animal.n animal.1 bar#2937469|cake#2937469|---n U
3 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/senseval/senseval2ls_test.key:
--------------------------------------------------------------------------------
1 | call.v call.2 call_for%2:32:03::/0.0 call_for%2:42:00::/1.0 !! this is a comment
2 | animal.n animal.1 animal%1:03:00::/0.75 U/0.0 foo/0.5
3 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/webcage/webcage.dtd:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 |
6 |
7 |
8 |
9 |
10 |
11 |
12 |
13 |
14 |
15 |
16 |
17 |
18 |
19 |
20 |
21 |
22 |
23 |
24 |
25 |
26 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/webcage/webcage0.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 | Vor und während eines Krieges kommt es häufig zum Abbruch der diplomatischen Beziehungen.
5 | Nach dem Unwetter blieb uns nur eine Lösung: Abbruch der Zelte.
6 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.testing/src/main/resources/webcage/webcage1.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 | Der Ladevorgang einer Internetseite kann in verschiedenen Webbrowsern mit der Escape-Taste unterbrochen werden. In den meisten Dialogfenstern von Windows-Anwendungen entspricht das Drücken der Escape-Taste einem Klick auf die Schaltfläche „Abbrechen“. Ein Druck auf die Escape-Taste bricht auch eine bereits begonnene Eingabe in einem Textfeld ab und stellt den Ursprungszustand wieder her.
6 |
7 |
8 | Im Augenblick sind vierzehn Kasinos 24 Stunden am Tag geöffnet, zu Lande oder auf dem Meer, in denen Spielergruppen - weitaus leiser, als man vermuten möchte - ohne Unterbrechung in fensterlosen Sälen unter gleißendem Neonlicht zocken.
9 |
10 |
11 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.wrapper-gpl/.license-header.txt:
--------------------------------------------------------------------------------
1 | Copyright ${year}
2 | Ubiquitous Knowledge Processing (UKP) Lab
3 | Technische Universität Darmstadt
4 |
5 | This program is free software: you can redistribute it and/or modify
6 | it under the terms of the GNU General Public License as published by
7 | the Free Software Foundation, either version 3 of the License, or
8 | (at your option) any later version.
9 |
10 | This program is distributed in the hope that it will be useful,
11 | but WITHOUT ANY WARRANTY; without even the implied warranty of
12 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 | GNU General Public License for more details.
14 |
15 | You should have received a copy of the GNU General Public License
16 | along with this program. If not, see <http://www.gnu.org/licenses/>.
17 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.wrapper-gpl/src/main/java/de/tudarmstadt/ukp/dkpro/wsd/wrapper/Disambiguator.java:
--------------------------------------------------------------------------------
1 | /**
2 | * Copyright 2017
3 | * Ubiquitous Knowledge Processing (UKP) Lab
4 | * Technische Universität Darmstadt
5 | *
6 | * This program is free software: you can redistribute it and/or modify
7 | * it under the terms of the GNU General Public License as published by
8 | * the Free Software Foundation, either version 3 of the License, or
9 | * (at your option) any later version.
10 | *
11 | * This program is distributed in the hope that it will be useful,
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 | * GNU General Public License for more details.
15 | *
16 | * You should have received a copy of the GNU General Public License
17 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
18 | */
19 | package de.tudarmstadt.ukp.dkpro.wsd.wrapper;
20 |
21 | import java.io.IOException;
22 | import java.util.List;
23 |
24 | /**
25 | * A disambiguator that returns senses for an input text
26 | * @author nico.erbs@gmail.com
27 | *
28 | */
29 | public interface Disambiguator {
30 |
31 |     /**
32 |      * Disambiguates an input text and reports the senses found in it.
33 |      * @param inputText The input text.
34 |      * @return The list of strings with the senses disambiguated in the input text.
35 |      * @throws IOException declared for implementations; this interface does not specify when it is raised.
36 |      */
37 |     List<String> disambiguate(String inputText) throws IOException;
38 |
39 |     /**
40 |      * @return The name of the disambiguator.
41 |      */
42 |     String getName();
43 |
44 |     /**
45 |      * @return A string with the configuration details of this word sense disambiguator.
46 |      */
47 |     String getConfigurationDetails();
48 |
49 | }
50 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.wrapper-gpl/src/main/resources/stopwords/german_stopwords.txt:
--------------------------------------------------------------------------------
1 | "
2 | '
3 | ?
4 | !
5 | ,
6 | ;
7 | :
8 | .
9 | +
10 | (
11 | )
12 | [
13 | ]
14 | {
15 | }
16 | /
17 | \
18 | aber
19 | als
20 | am
21 | an
22 | auch
23 | auf
24 | aus
25 | bei
26 | bin
27 | bis
28 | bist
29 | da
30 | dadurch
31 | daher
32 | darum
33 | das
34 | daß
35 | dass
36 | dein
37 | deine
38 | dem
39 | den
40 | der
41 | des
42 | dessen
43 | deshalb
44 | die
45 | dies
46 | dieser
47 | dieses
48 | doch
49 | dort
50 | du
51 | durch
52 | ein
53 | eine
54 | einem
55 | einen
56 | einer
57 | eines
58 | er
59 | es
60 | euer
61 | eure
62 | für
63 | hatte
64 | hatten
65 | hattest
66 | hattet
67 | hier hinter
68 | ich
69 | ihr
70 | ihre
71 | im
72 | in
73 | ist
74 | ja
75 | jede
76 | jedem
77 | jeden
78 | jeder
79 | jedes
80 | jener
81 | jenes
82 | jetzt
83 | kann
84 | kannst
85 | können
86 | könnt
87 | machen
88 | mein
89 | meine
90 | mit
91 | muß
92 | mußt
93 | musst
94 | müssen
95 | müßt
96 | nach
97 | nachdem
98 | nein
99 | nicht
100 | nun
101 | oder
102 | seid
103 | sein
104 | seine
105 | sich
106 | sie
107 | sind
108 | soll
109 | sollen
110 | sollst
111 | sollt
112 | sonst
113 | soweit
114 | sowie
115 | und
116 | unser
117 | unsere
118 | unter
119 | vom
120 | von
121 | vor
122 | wann
123 | warum
124 | was
125 | weiter
126 | weitere
127 | wenn
128 | wer
129 | werde
130 | werden
131 | werdet
132 | weshalb
133 | wie
134 | wieder
135 | wieso
136 | wir
137 | wird
138 | wirst
139 | wo
140 | woher
141 | wohin
142 | zu
143 | zum
144 | zur
145 | über
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.wrapper-gpl/src/main/resources/stopwords/punctuation.txt:
--------------------------------------------------------------------------------
1 | .
2 | ,
3 | :
4 | ;
5 | ?
6 | !
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.wrapper-gpl/src/main/resources/stopwords/stoplist_de.txt:
--------------------------------------------------------------------------------
1 | aber
2 | als
3 | am
4 | an
5 | auch
6 | auf
7 | aus
8 | bei
9 | bin
10 | bis
11 | bist
12 | da
13 | dadurch
14 | daher
15 | darum
16 | das
17 | daß
18 | dass
19 | dein
20 | deine
21 | dem
22 | den
23 | der
24 | des
25 | dessen
26 | deshalb
27 | die
28 | dies
29 | dieser
30 | dieses
31 | doch
32 | dort
33 | du
34 | durch
35 | ein
36 | eine
37 | einem
38 | einen
39 | einer
40 | eines
41 | er
42 | es
43 | euer
44 | eure
45 | für
46 | hatte
47 | hatten
48 | hattest
49 | hattet
50 | hier hinter
51 | ich
52 | ihr
53 | ihre
54 | im
55 | in
56 | ist
57 | ja
58 | jede
59 | jedem
60 | jeden
61 | jeder
62 | jedes
63 | jener
64 | jenes
65 | jetzt
66 | kann
67 | kannst
68 | können
69 | könnt
70 | machen
71 | mein
72 | meine
73 | mit
74 | muß
75 | mußt
76 | musst
77 | müssen
78 | müßt
79 | nach
80 | nachdem
81 | nein
82 | nicht
83 | nun
84 | oder
85 | seid
86 | sein
87 | seine
88 | sich
89 | sie
90 | sind
91 | soll
92 | sollen
93 | sollst
94 | sollt
95 | sonst
96 | soweit
97 | sowie
98 | und
99 | unser
100 | unsere
101 | unter
102 | vom
103 | von
104 | vor
105 | wann
106 | warum
107 | was
108 | weiter
109 | weitere
110 | wenn
111 | wer
112 | werde
113 | werden
114 | werdet
115 | weshalb
116 | wie
117 | wieder
118 | wieso
119 | wir
120 | wird
121 | wirst
122 | wo
123 | woher
124 | wohin
125 | zu
126 | zum
127 | zur
128 | über
129 | ,
130 | .
131 | -
132 | •
133 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.wrapper-gpl/src/test/java/de/tudarmstadt/ukp/dkpro/wsd/wrapper/LinkDatabaseLinkMeasureDisambiguatorTest.java:
--------------------------------------------------------------------------------
1 | /**
2 | * Copyright 2017
3 | * Ubiquitous Knowledge Processing (UKP) Lab
4 | * Technische Universität Darmstadt
5 | *
6 | * This program is free software: you can redistribute it and/or modify
7 | * it under the terms of the GNU General Public License as published by
8 | * the Free Software Foundation, either version 3 of the License, or
9 | * (at your option) any later version.
10 | *
11 | * This program is distributed in the hope that it will be useful,
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 | * GNU General Public License for more details.
15 | *
16 | * You should have received a copy of the GNU General Public License
17 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
18 | */
19 | package de.tudarmstadt.ukp.dkpro.wsd.wrapper;
20 |
21 | import static org.junit.Assert.*;
22 |
23 | import java.io.IOException;
24 | import java.util.ArrayList;
25 | import java.util.List;
26 |
27 | import org.junit.Ignore;
28 | import org.junit.Test;
29 |
30 | public class LinkDatabaseLinkMeasureDisambiguatorTest {
31 |     /** Compares the senses returned for a fixed sentence with a gold list; disabled via {@code @Ignore}. */
32 |     @Test
33 |     @Ignore
34 |     public void disambiguateTest() throws IOException {
35 |         String input = "Please disambiguate this text.";
36 |
37 |         Disambiguator disambiguator = new LinkDatabaseLinkMeasureDisambiguator();
38 |         List<String> senses = disambiguator.disambiguate(input);
39 |         System.out.println(senses);
40 |
41 |         List<String> goldSenses = new ArrayList<String>();
42 |         goldSenses.add("word_sense_disambiguation");
43 |         // The result must have as many senses as the gold list, and each one must be a gold sense.
44 |         assertEquals(goldSenses.size(), senses.size());
45 |         for (String sense : senses) {
46 |             assertTrue(goldSenses.contains(sense));
47 |         }
48 |     }
49 | }
50 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.wrapper-gpl/src/test/java/de/tudarmstadt/ukp/dkpro/wsd/wrapper/LinkDatabaseMFSDisambiguatorTest.java:
--------------------------------------------------------------------------------
1 | /**
2 | * Copyright 2017
3 | * Ubiquitous Knowledge Processing (UKP) Lab
4 | * Technische Universität Darmstadt
5 | *
6 | * This program is free software: you can redistribute it and/or modify
7 | * it under the terms of the GNU General Public License as published by
8 | * the Free Software Foundation, either version 3 of the License, or
9 | * (at your option) any later version.
10 | *
11 | * This program is distributed in the hope that it will be useful,
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 | * GNU General Public License for more details.
15 | *
16 | * You should have received a copy of the GNU General Public License
17 | * along with this program. If not, see <http://www.gnu.org/licenses/>.
18 | */
19 | package de.tudarmstadt.ukp.dkpro.wsd.wrapper;
20 |
21 | import static org.junit.Assert.*;
22 |
23 | import java.io.IOException;
24 | import java.util.ArrayList;
25 | import java.util.List;
26 |
27 | import org.junit.Ignore;
28 | import org.junit.Test;
29 |
30 | public class LinkDatabaseMFSDisambiguatorTest {
31 |     /** Compares the senses returned for a fixed sentence with a gold list; disabled via {@code @Ignore}. */
32 |     @Test
33 |     @Ignore
34 |     public void disambiguateTest() throws IOException {
35 |         String input = "Please disambiguate this text.";
36 |
37 |         Disambiguator disambiguator = new LinkDatabaseMFSDisambiguator();
38 |         List<String> senses = disambiguator.disambiguate(input);
39 |         System.out.println(senses);
40 |
41 |         List<String> goldSenses = new ArrayList<String>();
42 |         goldSenses.add("word_sense_disambiguation");
43 |         goldSenses.add("text_user_interface");
44 |         // The result must have as many senses as the gold list, and each one must be a gold sense.
45 |         assertEquals(goldSenses.size(), senses.size());
46 |         for (String sense : senses) {
47 |             assertTrue(goldSenses.contains(sense));
48 |         }
49 |     }
50 | }
51 |
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.wsi/README.txt:
--------------------------------------------------------------------------------
1 | DKPro WSD WSI
2 |
3 | This package contains parts of the UKP system participating in the SemEval 2013 Task 11
4 | "Word Sense Induction & Disambiguation within an End-User Application".
5 |
6 | In particular, it contains:
7 | * a reader for the dataset (AMBIENTReader),
8 | * an annotator for marking the target words (WSIAnnotator),
9 | * a loadable sense inventory (JSONSenseInventory), which may use an induced inventory, and
10 | * the WSD step and a writer that produces input files for the official evaluation package (Semeval2013Task11Evaluator).
11 |
12 | What is missing to run the actual system is
13 |
14 | * the actual WSI algorithm, which was written in R. An older version of this algorithm is included
15 | as SimpleGraphClusterinInductionAlgorithm and I am planning to port back the improvements from the
16 | R implementation.
17 |
18 | * the co-occurrence database. The code to generate such a database will soon be available as part of the
19 | DKPro BigData package (https://code.google.com/p/dkpro-bigdata/).
20 |
21 | * the distributional thesaurus for lexical expansion. The code to generate the thesaurus is available
22 | from http://www.jobimtext.org.
23 |
24 | The documentation will be updated soon. If you want to make use of this module, do not hesitate to contact
25 | me at hpzorn@gmail.com.
26 |
27 | August 2013,
28 | Hans-Peter Zorn
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.wsi/src/main/java/de/tudarmstadt/ukp/dkpro/wsd/wsi/algorithm/SenseInductionAlgorithm.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * Copyright 2017
3 | * Ubiquitous Knowledge Processing (UKP) Lab
4 | * Technische Universität Darmstadt
5 | *
6 | * Licensed under the Apache License, Version 2.0 (the "License");
7 | * you may not use this file except in compliance with the License.
8 | * You may obtain a copy of the License at
9 | *
10 | * http://www.apache.org/licenses/LICENSE-2.0
11 | *
12 | * Unless required by applicable law or agreed to in writing, software
13 | * distributed under the License is distributed on an "AS IS" BASIS,
14 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15 | * See the License for the specific language governing permissions and
16 | * limitations under the License.
17 | ******************************************************************************/
18 | package de.tudarmstadt.ukp.dkpro.wsd.wsi.algorithm;
19 |
20 | import java.util.Collection;
21 |
22 | import de.tudarmstadt.ukp.dkpro.wsd.WSDException;
23 | import de.tudarmstadt.ukp.dkpro.wsd.si.SenseInventory;
24 |
25 | public interface SenseInductionAlgorithm
26 | {
27 |     /**
28 |      * Starts a batch induction.
29 |      * @param targetWords the target words of the batch
30 |      * @return a sense inventory; NOTE(review): presumably the one holding the induced senses - confirm
31 |      */
32 |     public SenseInventory induce(Collection<String> targetWords);
33 |
34 |     /**
35 |      * @param term a single term; the method name suggests its senses are induced - TODO confirm
36 |      * @throws WSDException declared here; when it is raised depends on the implementation
37 |      */
38 |     public void induceSenses(String term)
39 |         throws WSDException;
40 |     /** @return the sense inventory of this algorithm */
41 |     public SenseInventory getSenseInventory();
42 | }
--------------------------------------------------------------------------------
/de.tudarmstadt.ukp.dkpro.wsd.wsi/src/main/java/de/tudarmstadt/ukp/dkpro/wsd/wsi/algorithm/WSIAlgorithmBase.java:
--------------------------------------------------------------------------------
1 | /*******************************************************************************
2 | * Copyright 2017
3 | * Ubiquitous Knowledge Processing (UKP) Lab
4 | * Technische Universität Darmstadt
5 | *
6 | * Licensed under the Apache License, Version 2.0 (the "License");
7 | * you may not use this file except in compliance with the License.
8 | * You may obtain a copy of the License at
9 | *
10 | * http://www.apache.org/licenses/LICENSE-2.0
11 | *
12 | * Unless required by applicable law or agreed to in writing, software
13 | * distributed under the License is distributed on an "AS IS" BASIS,
14 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15 | * See the License for the specific language governing permissions and
16 | * limitations under the License.
17 | ******************************************************************************/
18 | package de.tudarmstadt.ukp.dkpro.wsd.wsi.algorithm;
19 |
20 | import de.tudarmstadt.ukp.dkpro.wsd.si.SenseInventory;
21 | import de.tudarmstadt.ukp.dkpro.wsd.wsi.si.InducedSenseInventory;
22 |
23 | /** Common base for sense induction algorithms: holds a sense inventory field and exposes it. */
24 | public abstract class WSIAlgorithmBase
25 |     implements SenseInductionAlgorithm
26 | {
27 |     /** Inventory returned by {@link #getSenseInventory()}; this class itself never assigns it. */
28 |     protected InducedSenseInventory senseInventory;
29 |     /** Creates the base object and leaves {@link #senseInventory} untouched. */
30 |     public WSIAlgorithmBase()
31 |     {
32 |     }
33 |
34 |     /** @return the current value of {@link #senseInventory} */
35 |     @Override
36 |     public SenseInventory getSenseInventory()
37 |     {
38 |         return this.senseInventory;
39 |     }
40 | }
--------------------------------------------------------------------------------