From f59de6c4091f192179ddf61ebfc8978f8d151dd8 Mon Sep 17 00:00:00 2001
From: vicmak <vitiokm@gmail.com>
Date: Tue, 22 Apr 2014 23:16:29 +0300
Subject: [PATCH] Concatenated values of word net suggestions

The values that are suggested from wordnet are here concatenated. this
is done for further indexing and retrieval operations in GATE ANNIC
platform. That is for saving in searchable lucene datastore, and
performing querying on the corpus.
In addition soundex value for each word is added. This is done for
searching at homophone confusion
---
 src/org/philgooch/WordNetSuggester.java | 522 ++++++------------------
 1 file changed, 133 insertions(+), 389 deletions(-)
diff --git a/src/org/philgooch/WordNetSuggester.java b/src/org/philgooch/WordNetSuggester.java
index 03ddfc4..27bf678 100644
--- a/src/org/philgooch/WordNetSuggester.java
+++ b/src/org/philgooch/WordNetSuggester.java
@@ -2,7 +2,7 @@
  * To change this template, choose Tools | Templates
  * and open the template in the editor.
  */
-package org.philgooch;
+package wordnetsuggester;
 
 import gate.*;
 import gate.creole.*;
@@ -11,6 +11,7 @@
 
 import gate.Annotation;
 import gate.AnnotationSet;
+import gate.Document;
 import gate.Factory;
 import gate.FeatureMap;
 
@@ -20,11 +21,15 @@
 import java.io.*;
 import java.net.*;
 
+import org.apache.commons.codec.language.Soundex;
+
 /**
  *
- * @author philipgooch
+ * @author victor
+ * This class was edited to add concatenated annotations for further
+ * indexing and retrieving purposes
  */
-@CreoleResource(name = "WordNet Suggester",
+@CreoleResource(name = "WordNet Suggester Concatenated",
 helpURL = "",
 comment = "Plugin that wraps the WordNet API to add synonyms and hyponyms to features in the input/output annotations defined.")
 public class WordNetSuggester extends AbstractLanguageAnalyser implements
@@ -33,40 +38,27 @@ public class WordNetSuggester extends AbstractLanguageAnalyser implements
 
     private WordNet wordNet;        // WordNet instance
     private URL configFileURL;      // URL to WordNet configuration file
+    
     private String inputASName;     //  Input AnnotationSet name
     private String outputASName;    // Output AnnotationSet set name
     private ArrayList<String> inputASTypes; // list of input annotations from which string content will be taken for input to WordNet
     private String outputASType;    // Output annotation name within outputASName for holding WordNet features
-    private ArrayList<String> inputASTypeFeatures;      // List of features within inputASTypes from which string content will be submitted to WordNet
-    // These are evaluated in order, e.g. if string and root are specified, then
-    // the string feature is used, if it is empty, the root feature is used,
-    // if both are empty, the annotation content is used if useTokensOnMissingInputFeature is set
+    private String inputASTypeFeature;      // Name of feature within inputASTypes from which string content will be submitted to WordNet
     private String tokASName;     //  Name of AnnotationSet containing Tokens
     private String tokName;         //  Name of Token annotation (default to Token)
     private String tokRoot;         //  Root or string content of Token (default to string)
     private String tokCategory;     //  POS category of Token (default to category)
     private Integer shortestWord;       // ignore words under this threshold
-    private Boolean ignoreMissingInputFeature;     // if true, don't use underlying annotation content if no inputASTypeFeatures exist
-    private Boolean addGloss;                       // output WordNet gloss
-    private Boolean outputFullHypernymHierarchy;              // if true, output full class hierarchy
-
     private OutputFormat outputListFormat;      // Output Lists as strings or as a List object
     // Exit gracefully if exception caught on init()
     private boolean gracefulExit;
     private Integer truncateSize;               // truncate candidates lists to N size
     private boolean createNewAnnot;        // create a new annot to hold WordNet output
     private AnnotationSet outputAS;         // output AnnotationSet
-    private Boolean matchPOS;                   // only output WordNet synonyms if the POS matches the POS of the input Token
-    private ArrayList<String> excludeIfContains;    // don't get wordnet synonyms if term contains one of these annots
-    private ArrayList<String> excludeIfWithin;      // don't get wordnet synonyms if term occurs inside one of these annots
-    private Boolean attemptFullMatch;               // Attempt to match on complete phrase first before matching on each token
-    private String outputASTypeName;
-    private String outputASTypeFeatureName;         // can specify outputASType in the form Ann.feature=value
-    private String outputASTypeFeatureValue;
+    private Soundex m_soundex;
 
     // Output Lists as strings or as a List object
     public enum OutputFormat {
-
         String, List
     }
 
@@ -76,23 +68,21 @@ public Resource init() throws ResourceInstantiationException {
 
         // Default input to WordNet is by Token
         inputASTypes = new ArrayList<String>();
-        inputASTypes.add(ANNIEConstants.TOKEN_ANNOTATION_TYPE);
+        inputASTypes.add("Token");
 
-        inputASTypeFeatures = new ArrayList<String>();
-        inputASTypeFeatures.add(ANNIEConstants.TOKEN_STRING_FEATURE_NAME);
-        
+        m_soundex = new Soundex();
         // If there is an instance of the WordNet LR already loaded, use that,
         // otherwise, load a new instance of the WordNet LR
         try {
             Gate.getCreoleRegister().registerDirectories(
-                    new File(Gate.getGateHome().getAbsolutePath()
-                    + "/plugins/WordNet").toURI().toURL());
+              new File(Gate.getGateHome().getAbsolutePath()
+                      + "/plugins/WordNet").toURI().toURL());
             try {
                 wordNet = (gate.wordnet.WordNet) Gate.getCreoleRegister().getAllInstances("gate.wordnet.WordNet").get(0);
             } catch (IndexOutOfBoundsException i) {
                 FeatureMap fm = Factory.newFeatureMap();
                 fm.put("propertyUrl", configFileURL);
-                wordNet = (WordNet) gate.Factory.createResource("gate.wordnet.JWNLWordNetImpl", fm);
+                wordNet = (WordNet)gate.Factory.createResource("gate.wordnet.JWNLWordNetImpl", fm);
             }
         } catch (MalformedURLException m) {
             gate.util.Err.println("Unable to locate WordNet plugin. Please check that it is installed.");
@@ -100,11 +90,13 @@ public Resource init() throws ResourceInstantiationException {
         } catch (GateException g) {
             gate.util.Err.println("Unable to initialise WordNet plugin. Please check that it is installed and configured correctly.");
             gracefulExit = true;
-        }
+        } 
 
         return this;
     } // end init()
 
+
+    
     @Override
     public void execute() throws ExecutionException {
         // quit if setup failed
@@ -122,111 +114,35 @@ public void execute() throws ExecutionException {
         // Get all Tokens that are words
         FeatureMap tokFeats = Factory.newFeatureMap();
 
-        tokFeats.put(ANNIEConstants.TOKEN_KIND_FEATURE_NAME, "word");
+        tokFeats.put("kind", "word");
         AnnotationSet tokenAS = (tokASName == null || tokASName.trim().length() == 0) ? document.getAnnotations().get(tokName, tokFeats) : document.getAnnotations(tokASName).get(tokName, tokFeats);
 
         String docContent = document.getContent().toString();
 
-        
-        if (outputASType == null || outputASType.isEmpty()) {
-            createNewAnnot = false;
-        } else {        // Allow output annotation to have a feature name and value
-            createNewAnnot = true;
-            String[] outputAnnArr = outputASType.split("(\\.)|(=)");
-            if (outputAnnArr.length == 3) {
-                outputASTypeName = outputAnnArr[0];
-                outputASTypeFeatureName = outputAnnArr[1];
-                outputASTypeFeatureValue = outputAnnArr[2];
-            } else {
-                outputASTypeName = outputAnnArr[0];
-                outputASTypeFeatureName = null;
-                outputASTypeFeatureValue = null;
-            }
-        }
+        createNewAnnot = (outputASType == null || outputASType.isEmpty()) ? false : true;
+
         // process the content of each annot in inputASTypes
-        for (String inputAnnType : inputASTypes) {
-
-            AnnotationSet inputAnnSet;
-
-            // We allow inputAnnType of the form
-            // Annotation.feature == value
-            String annName = inputAnnType;  // assume just a simple ann name to start with
-            String annFeature;
-            String annFeatureValue;
-            String[] inputAnnArr = inputAnnType.split("(\\.)|(==)");
-            if (inputAnnArr.length == 3 || inputAnnArr.length == 2) {
-                annName = inputAnnArr[0];
-                annFeature = inputAnnArr[1];
-                if (inputAnnArr.length == 2) {
-                    Set<String> feats = new HashSet<String>();
-                    feats.add(annFeature);
-                    inputAnnSet = inputAS.get(annName, feats);
-                } else {
-                    FeatureMap annFeats = Factory.newFeatureMap();
-                    annFeatureValue = inputAnnArr[2];
-                    annFeats.put(annFeature, annFeatureValue);
-                    inputAnnSet = inputAS.get(annName, annFeats);
-                }
+        for (String inputAnnName : inputASTypes) {
 
-            } else {
-                inputAnnSet = inputAS.get(inputAnnType);
-            }
+            AnnotationSet inputAnnSet = inputAS.get(inputAnnName);
 
             for (Annotation ann : inputAnnSet) {
-                boolean skip = false;
-                boolean hasInputASTypeFeature = false;
-
                 Long annStart = ann.getStartNode().getOffset();
                 Long annEnd = ann.getEndNode().getOffset();
 
-                // Don't look up this term if it occurs within or wraps any of these annots
-                if (excludeIfWithin != null && !(excludeIfWithin.isEmpty())) {
-                    for (String excludeAnnName : excludeIfWithin) {
-                        if (!inputAS.getCovering(excludeAnnName, annStart, annEnd).isEmpty()) {
-                            skip = true;
-                            break;
-                        }
-                    }
-                }
-                if (excludeIfContains != null && !(excludeIfContains.isEmpty())) {
-                    for (String excludeAnnName : excludeIfContains) {
-                        if (!inputAS.getContained(annStart, annEnd).get(excludeAnnName).isEmpty()) {
-                            skip = true;
-                            break;
-                        }
-                    }
-                }
-                if (skip) {
-                    continue;
-                }
-
                 List<Annotation> innerToks = new ArrayList<Annotation>(tokenAS.getContained(annStart, annEnd));
                 Collections.sort(innerToks, new OffsetComparator());
 
                 String strTerm = "";            // Annotation string content
 
-                FeatureMap annFeats = ann.getFeatures();
-                String annFeatureContent = null;
-
-                // Iterate through inputASTypeFeatures and use the first non-empty one
-                if (inputASTypeFeatures != null && !inputASTypeFeatures.isEmpty()) {
-                    for (String inputASTypeFeature : inputASTypeFeatures) {
-                        Object feat = annFeats.get(inputASTypeFeature);
-                        annFeatureContent = (feat == null) ? "" : feat.toString();
-                        if (annFeatureContent != null && annFeatureContent.trim().length() > 0) {
-                            strTerm = annFeatureContent.trim();
-                            hasInputASTypeFeature = true;
-                            break;
-                        }
-                    }
-                }
+                Object o = ann.getFeatures().get(inputASTypeFeature);
+                String annFeatureContent = (o == null) ? "" : o.toString();
 
-
-                // If annFeatureContent is null then there are no non-empty inputASTypeFeatures,
-                // so we use the docContent substring
+                // Use the content of a named feature as input ?
                 if (annFeatureContent == null || annFeatureContent.trim().length() == 0) {
                     strTerm = docContent.substring(annStart.intValue(), annEnd.intValue()).trim();
-                    hasInputASTypeFeature = false;
+                } else {
+                    strTerm = annFeatureContent.trim();
                 }
 
                 // Skip processing for short words
@@ -234,164 +150,45 @@ public void execute() throws ExecutionException {
                     continue;
                 }
 
-                // Try to match the whole phrase
+                // Try to match the whole phrase, and treat it as a noun
                 // if no match, then match individual tokens
                 try {
                     boolean fullMatch = false;
-                    // Attempt to match the whole phrase?
-                    if (attemptFullMatch) {
-                        fullMatch = wordNetSuggest(strTerm, ann);
+                    // Attempt to match the whole phrase if it's not a Token or has not been tokenized
+                    if (!inputAnnName.equals(tokName) && (innerToks.isEmpty() || innerToks.size() > 1)) {
+                        fullMatch = wordNetSuggest(strTerm, ann, WordNet.POS_NOUN);
                     }
 
                     if (!fullMatch) {
-                        if (hasInputASTypeFeature) {
-                            // Tokenize the contents of the input feature and run WordNet on each word
-                            String strTermArr[] = strTerm.split("[\\W\\s\\xA0]+");
-                            for (String str : strTermArr) {
-                                if (str.length() >= shortestWord) {
-                                    wordNetSuggest(str, ann);
-                                }
-                            }
-                        } else if (! ignoreMissingInputFeature) {
-                            // Use the inputAS tokens
-                            for (Annotation tok : innerToks) {
-                                Object oStr = tok.getFeatures().get(tokRoot);
-                                strTerm = (oStr == null) ? "" : oStr.toString();
-                                if (strTerm.length() >= shortestWord) {
-                                    wordNetSuggest(strTerm, tok);
-                                }
-                            }
+                        for (Annotation tok : innerToks) {
+                            Object oStr = tok.getFeatures().get(tokRoot);
+                            strTerm = (oStr == null) ? "" : oStr.toString();
+                            wordNetSuggest(strTerm, tok);
                         }
-                    } // end if
+                    }
 
                 } catch (WordNetException w) {
                     gate.util.Err.println(w.getMessage());
-                } // end try
-            } // end for
-        } // end for
-        fireProcessFinished();
-    } // end execute()
-
-    private boolean wordNetSuggest(String strTerm1, Annotation ann, int pos) throws WordNetException {
-        // Replace spaces with underscore so compound terms get matched if possible
-        String strTerm = strTerm1.replaceAll("[\\s\\xA0]+", "_");
-        FeatureMap fm = ann.getFeatures();
-
-        List<WordSense> senseList = wordNet.lookupWord(strTerm, pos);
-        if (senseList == null || senseList.isEmpty()) {
-            return false;
-        }
-
-        int iter = 0;
-        for (WordSense sense : senseList) {
-            // Create a new FeatureMap for each new annot
-            if (createNewAnnot) {
-                fm = Factory.newFeatureMap();
-                if (outputASTypeFeatureName != null) {
-                    fm.put(outputASTypeFeatureName, outputASTypeFeatureValue);
                 }
             }
-
-            // only iterate over N candidates as specified by truncateSize parameter
-            if (++iter > truncateSize) {
-                break;
-            }
-
-            Synset s = sense.getSynset();
-
-            if (createNewAnnot) {
-                outputAS.add(ann.getStartNode(), ann.getEndNode(), outputASTypeName, fm);
-            } else if (iter > 1) {
-                // If we're not creating new annotations,
-                // we can only output features for the first candidate
-                break;
-            }
-
-            if (addGloss) {
-                fm.put("gloss", s.getGloss());
-            }
-
-            List<WordSense> synonyms = s.getWordSenses();
-
-            // Get synonyms and similar words
-            List<String> synList = new ArrayList<String>();
-            for (WordSense ws : synonyms) {
-                synList.add(ws.getWord().getLemma());
-            }
-
-            // Adjectives have a similar-to relation, source of other synonyms
-            if (pos == WordNet.POS_ADJECTIVE || sense.getPOS() == WordNet.POS_ADJECTIVE) {
-                synList.addAll(getSemanticRelation(s, SemanticRelation.REL_SIMILAR_TO));
-            }
-            this.addFeature("synonyms", fm, synList);
-            synList.clear();
-
-            // Adjectives have a related noun
-            if (pos == WordNet.POS_ADJECTIVE || sense.getPOS() == WordNet.POS_ADJECTIVE) {
-                synList.addAll(getLexicalRelation(sense, LexicalRelation.REL_DERIVED_FROM_ADJECTIVE));
-                this.addFeature("derived", fm, synList);
-                synList.clear();
-            }
-
-            // Verbs have related verb group
-            if (pos == WordNet.POS_VERB || sense.getPOS() == WordNet.POS_VERB) {
-                synList.addAll(getSemanticRelation(s, SemanticRelation.REL_VERB_GROUP));
-                this.addFeature("verb_group", fm, synList);
-                synList.clear();
-            }
-
-            synList.addAll(getSemanticRelation(s, SemanticRelation.REL_ANTONYM));
-            synList.addAll(getLexicalRelation(sense, LexicalRelation.REL_ANTONYM));
-            this.addFeature("antonyms", fm, synList);
-            synList.clear();
-
-            synList.addAll(getSemanticRelation(s, SemanticRelation.REL_HYPERNYM));
-            this.addFeature("hypernyms", fm, synList);
-            synList.clear();
-
-            synList.addAll(getSemanticRelation(s, SemanticRelation.REL_HYPONYM));
-            this.addFeature("hyponyms", fm, synList);
-            synList.clear();
-
-            // For simplicity, we don't distinguish between has_part, has_member, has_substance
-            // - just use has_part
-            synList.addAll(getSemanticRelation(s, SemanticRelation.REL_PART_MERONYM));
-            synList.addAll(getSemanticRelation(s, SemanticRelation.REL_MEMBER_MERONYM));
-            synList.addAll(getSemanticRelation(s, SemanticRelation.REL_SUBSTANCE_MERONYM));
-            this.addFeature("meronyms", fm, synList);
-            synList.clear();
-
-            // For simplicity, we don't distinguish between part_of, member_of, substance_of
-            // - just use part_of
-            synList.addAll(getSemanticRelation(s, SemanticRelation.REL_PART_HOLONYM));
-            synList.addAll(getSemanticRelation(s, SemanticRelation.REL_MEMBER_HOLONYM));
-            synList.addAll(getSemanticRelation(s, SemanticRelation.REL_SUBSTANCE_HOLONYM));
-            this.addFeature("holonyms", fm, synList);
-            synList.clear();
-
-            synList.addAll(getSemanticRelation(s, SemanticRelation.REL_ATTRIBUTE));
-            this.addFeature("attributes", fm, synList);
-            synList.clear();
-
         }
+        fireProcessFinished();
+    } // end execute()
 
-        return true;
-    }
 
+    
     /**
      * 
-     * @param strTerm               The text to be looked up
-     * @param ann                   The annotation that spans the text
-     * @return                      True if matched, false if not
+     * @param strTerm       The text to be looked up
+     * @param ann           The annotation that spans the text
+     * @return              True if matched, false if not
      * @throws WordNetException
      */
-    private boolean wordNetSuggest(String strTerm1, Annotation ann) throws WordNetException {
-        // Replace spaces with underscore so compound terms get matched if possible
-        String strTerm = strTerm1.replaceAll("[\\s\\xA0]+", "_");
+    private boolean wordNetSuggest(String strTerm, Annotation ann) throws WordNetException {
         FeatureMap fm = ann.getFeatures();
-
-        String posFeat = "NN";
         int pos = WordNet.POS_NOUN;
+        String posFeat = "NN";
+
         // Does it contain POS information
         if (fm.containsKey(tokCategory)) {
             posFeat = fm.get(tokCategory).toString();
@@ -407,44 +204,48 @@ private boolean wordNetSuggest(String strTerm1, Annotation ann) throws WordNetEx
             pos = WordNet.POS_ADVERB;
         }
 
-        List<WordSense> senseList = wordNet.lookupWord(strTerm);
+        return wordNetSuggest(strTerm, ann, pos);
+    }
+
+    /**
+     * 
+     * @param strTerm               The text to be looked up
+     * @param ann                   The annotation that spans the text
+     * @param pos                   POS identifier
+     * @return                      True if matched, false if not
+     * @throws WordNetException
+     */
+    private boolean wordNetSuggest(String strTerm1, Annotation ann, int pos) throws WordNetException {
+        // Replace spaces with underscore so compound terms get matched if possible
+        String strTerm = strTerm1.replaceAll("[\\s\\xA0]+", "_");
+        FeatureMap fm = ann.getFeatures();
+
+        this.addPhoneticFeature(fm, strTerm);
+        
+        List<WordSense> senseList = wordNet.lookupWord(strTerm, pos);
         if (senseList == null || senseList.isEmpty()) {
             return false;
         }
 
         int iter = 0;
         for (WordSense sense : senseList) {
-            if (matchPOS && sense.getPOS() != pos) {
-                // WordNet sense does not match the POS of the input
-                continue;
-            }
-
             // Create a new FeatureMap for each new annot
-            if (createNewAnnot) {
-                fm = Factory.newFeatureMap();
-                if (outputASTypeFeatureName != null) {
-                    fm.put(outputASTypeFeatureName, outputASTypeFeatureValue);
-                }
-            }
+            if (createNewAnnot) { fm = Factory.newFeatureMap(); }
 
             // only iterate over N candidates as specified by truncateSize parameter
-            if (++iter > truncateSize) {
-                break;
-            }
-
+            if (++iter > truncateSize) { break; }
+            
             Synset s = sense.getSynset();
 
             if (createNewAnnot) {
-                outputAS.add(ann.getStartNode(), ann.getEndNode(), outputASTypeName, fm);
+                outputAS.add(ann.getStartNode(), ann.getEndNode(), outputASType, fm);
             } else if (iter > 1) {
                 // If we're not creating new annotations,
                 // we can only output features for the first candidate
                 break;
             }
 
-            if (addGloss) {
-                fm.put("gloss", s.getGloss());
-            }
+            fm.put("gloss", s.getGloss());
 
             List<WordSense> synonyms = s.getWordSenses();
 
@@ -455,21 +256,21 @@ private boolean wordNetSuggest(String strTerm1, Annotation ann) throws WordNetEx
             }
 
             // Adjectives have a similar-to relation, source of other synonyms
-            if (sense.getPOS() == WordNet.POS_ADJECTIVE) {
+            if (pos == WordNet.POS_ADJECTIVE || sense.getPOS() == WordNet.POS_ADJECTIVE) {
                 synList.addAll(getSemanticRelation(s, SemanticRelation.REL_SIMILAR_TO));
             }
-            this.addFeature("synonyms", fm, synList);
+            this.addFeatureConcateneted("synonyms", fm, synList);
             synList.clear();
 
             // Adjectives have a related noun
-            if (sense.getPOS() == WordNet.POS_ADJECTIVE) {
+            if (pos == WordNet.POS_ADJECTIVE || sense.getPOS() == WordNet.POS_ADJECTIVE) {
                 synList.addAll(getLexicalRelation(sense, LexicalRelation.REL_DERIVED_FROM_ADJECTIVE));
                 this.addFeature("derived", fm, synList);
                 synList.clear();
             }
 
             // Verbs have related verb group
-            if (sense.getPOS() == WordNet.POS_VERB) {
+            if (pos == WordNet.POS_VERB || sense.getPOS() == WordNet.POS_VERB) {
                 synList.addAll(getSemanticRelation(s, SemanticRelation.REL_VERB_GROUP));
                 this.addFeature("verb_group", fm, synList);
                 synList.clear();
@@ -477,31 +278,15 @@ private boolean wordNetSuggest(String strTerm1, Annotation ann) throws WordNetEx
 
             synList.addAll(getSemanticRelation(s, SemanticRelation.REL_ANTONYM));
             synList.addAll(getLexicalRelation(sense, LexicalRelation.REL_ANTONYM));
-            this.addFeature("antonyms", fm, synList);
+            this.addFeatureConcateneted("antonyms", fm, synList);
             synList.clear();
 
-            // HYPERNYMS
-            List<String> hypernymList = new ArrayList<String>();
-            if (outputFullHypernymHierarchy) {
-                List<SemanticRelation> hypernyms = s.getSemanticRelations(SemanticRelation.REL_HYPERNYM);
-                while (! hypernyms.isEmpty()) {
-                    for (SemanticRelation hypernym : hypernyms) {
-                        Synset target = hypernym.getTarget();
-                        List<WordSense> srTargetList = target.getWordSenses();
-                        for (WordSense targWs : srTargetList) {
-                            hypernymList.add(targWs.getWord().getLemma());
-                        }
-                        hypernyms = target.getSemanticRelations(SemanticRelation.REL_HYPERNYM);
-                    }
-                }
-            } else {
-                hypernymList = getSemanticRelation(s, SemanticRelation.REL_HYPERNYM);
-            }
-            this.addFeature("hypernyms", fm, hypernymList);
+            synList.addAll(getSemanticRelation(s, SemanticRelation.REL_HYPERNYM));
+            this.addFeatureConcateneted("hypernyms", fm, synList);
+            synList.clear();
 
-            // HYPONYMS
             synList.addAll(getSemanticRelation(s, SemanticRelation.REL_HYPONYM));
-            this.addFeature("hyponyms", fm, synList);
+            this.addFeatureConcateneted("hyponyms", fm, synList);
             synList.clear();
 
             // For simplicity, we don't distinguish between has_part, has_member, has_substance
@@ -509,7 +294,7 @@ private boolean wordNetSuggest(String strTerm1, Annotation ann) throws WordNetEx
             synList.addAll(getSemanticRelation(s, SemanticRelation.REL_PART_MERONYM));
             synList.addAll(getSemanticRelation(s, SemanticRelation.REL_MEMBER_MERONYM));
             synList.addAll(getSemanticRelation(s, SemanticRelation.REL_SUBSTANCE_MERONYM));
-            this.addFeature("meronyms", fm, synList);
+            this.addFeatureConcateneted("meronyms", fm, synList);
             synList.clear();
 
             // For simplicity, we don't distinguish between part_of, member_of, substance_of
@@ -517,7 +302,7 @@ private boolean wordNetSuggest(String strTerm1, Annotation ann) throws WordNetEx
             synList.addAll(getSemanticRelation(s, SemanticRelation.REL_PART_HOLONYM));
             synList.addAll(getSemanticRelation(s, SemanticRelation.REL_MEMBER_HOLONYM));
             synList.addAll(getSemanticRelation(s, SemanticRelation.REL_SUBSTANCE_HOLONYM));
-            this.addFeature("holonyms", fm, synList);
+            this.addFeatureConcateneted("holonyms", fm, synList);
             synList.clear();
 
             synList.addAll(getSemanticRelation(s, SemanticRelation.REL_ATTRIBUTE));
@@ -529,6 +314,7 @@ private boolean wordNetSuggest(String strTerm1, Annotation ann) throws WordNetEx
         return true;
     }
 
+    
     /**
      * 
      * @param feat              String feature name
@@ -536,7 +322,7 @@ private boolean wordNetSuggest(String strTerm1, Annotation ann) throws WordNetEx
      * @param synList           List<String> to add to FeatureMap
      */
     private void addFeature(String feat, FeatureMap fm, List<String> synList) {
-        if (!synList.isEmpty() && !fm.containsKey(feat)) {
+        if (!synList.isEmpty()) {
             if (outputListFormat == OutputFormat.List) {
                 fm.put(feat, new ArrayList<String>(synList));
             } else {
@@ -544,8 +330,49 @@ private void addFeature(String feat, FeatureMap fm, List<String> synList) {
             }
         }
     }
+    
+    /**
+     * Adds the members of a particular semantic set in a concatenated manner
+     * This way indexing and querying with GATE gets easier. Will be further used with ANNIC adaptation
+     * @param feat is the current feature being updated
+     * @param fm is the feature map
+     * @param synList is the list of member for calling member semantic set
+     */
+    private void addFeatureConcateneted(String feat, FeatureMap fm, List<String> synList) {
+        if (!synList.isEmpty()) {
+            
+        	String concatenated_value = "";
+        	for (Iterator iterator = synList.iterator(); iterator.hasNext();) {
+				String current_member = (String) iterator.next();
+				concatenated_value = concatenated_value + current_member;
+			}
+        	
+        	fm.put(feat, concatenated_value);
+        	
+        }
+    }
+
+    private void addPhoneticFeature(FeatureMap fm, String word)
+    {
+    	if (m_soundex != null && word != null)
+    	{
+    		try{
+    			fm.put("phonetic", m_soundex.encode(word));	
+    		}
+    		catch(IllegalArgumentException e)
+    		{
+    			return;
+    		}
+    		
+    	}
+    	else
+    	{
+    		fm.put("phonetic", "NO_SOUND");
+    	}
+    }
 
     /**
+     * 
      *
      * @param sense                 WordSense object
      * @return                      List<String> of related lemmas
@@ -578,9 +405,7 @@ private List<String> getLexicalRelation(List<LexicalRelation> lrList) throws Wor
         List<String> ret = new ArrayList<String>();
         int iter = 0;
         for (LexicalRelation lr : lrList) {
-            if (++iter > truncateSize) {
-                break;
-            }
+            if (++iter > truncateSize) { break; }
             // System.out.println(lr.getLabel() + ":" + lr.getType());
             WordSense target = lr.getTarget();
             Synset t = target.getSynset();
@@ -626,22 +451,19 @@ private List<String> getSemanticRelation(List<SemanticRelation> semrel) throws W
         int iter1 = 0;
         int iter2 = 0;
         for (SemanticRelation sr : semrel) {
-            if (++iter1 > truncateSize) {
-                break;
-            }
+            if (++iter1 > truncateSize) { break; }
             // System.out.println(sr.getLabel() + ":" + sr.getType());
             Synset target = sr.getTarget();
             List<WordSense> srTargetList = target.getWordSenses();
             for (WordSense targWs : srTargetList) {
-                if (++iter2 > truncateSize) {
-                    break;
-                }
+                if (++iter2 > truncateSize) { break; }
                 ret.add(targWs.getWord().getLemma());
             }
         }
         return ret;
     }
 
+
     @CreoleParameter(defaultValue = "resources/wordnet-config.xml",
     comment = "Location of configuration file")
     public void setConfigFileURL(URL configFileURL) {
@@ -655,12 +477,12 @@ public URL getConfigFileURL() {
     @Optional
     @RunTime
     @CreoleParameter(comment = "If set, only send the content of the given feature from annotations within inputASTypes to WordNet")
-    public void setInputASTypeFeatures(ArrayList<String> inputASTypeFeatures) {
-        this.inputASTypeFeatures = inputASTypeFeatures;
+    public void setInputASTypeFeature(String inputASTypeFeature) {
+        this.inputASTypeFeature = inputASTypeFeature;
     }
 
-    public ArrayList<String> getInputASTypeFeatures() {
-        return inputASTypeFeatures;
+    public String getInputASTypeFeature() {
+        return inputASTypeFeature;
     }
 
     @Optional
@@ -783,82 +605,4 @@ public void setTruncateSize(Integer truncateSize) {
     public Integer getTruncateSize() {
         return truncateSize;
     }
-
-    @Optional
-    @RunTime
-    @CreoleParameter(comment = "Don't look up terms that contain these annotations")
-    public void setExcludeIfContains(ArrayList<String> excludeIfContains) {
-        this.excludeIfContains = excludeIfContains;
-    }
-
-    public ArrayList<String> getExcludeIfContains() {
-        return excludeIfContains;
-    }
-
-    @Optional
-    @RunTime
-    @CreoleParameter(comment = "Don't look up terms that are within these annotations")
-    public void setExcludeIfWithin(ArrayList<String> excludeIfWithin) {
-        this.excludeIfWithin = excludeIfWithin;
-    }
-
-    public ArrayList<String> getExcludeIfWithin() {
-        return excludeIfWithin;
-    }
-
-    @RunTime
-    @CreoleParameter(defaultValue = "true",
-    comment = "Match WordNet output to the POS of the input Token")
-    public void setMatchPOS(Boolean matchPOS) {
-        this.matchPOS = matchPOS;
-    }
-
-    public Boolean getMatchPOS() {
-        return matchPOS;
-    }
-
-    @RunTime
-    @CreoleParameter(defaultValue = "false",
-    comment = "Attempt to match whole phrase before matching each token")
-    public void setAttemptFullMatch(Boolean attemptFullMatch) {
-        this.attemptFullMatch = attemptFullMatch;
-    }
-
-    public Boolean getAttemptFullMatch() {
-        return attemptFullMatch;
-    }
-
-    @RunTime
-    @CreoleParameter(defaultValue = "false",
-    comment = "If true, don't attempt to use underlying annotation content if no inputASTypeFeatures found")
-    public void setIgnoreMissingInputFeature(Boolean ignoreMissingInputFeature) {
-        this.ignoreMissingInputFeature = ignoreMissingInputFeature;
-    }
-
-    public Boolean getIgnoreMissingInputFeature() {
-        return ignoreMissingInputFeature;
-    }
-
-    @RunTime
-    @CreoleParameter(defaultValue = "false",
-    comment = "Output the WordNet description?")
-    public void setAddGloss(Boolean addGloss) {
-        this.addGloss = addGloss;
-    }
-
-    public Boolean getAddGloss() {
-        return addGloss;
-    }
-
-    @RunTime
-    @CreoleParameter(defaultValue = "false",
-    comment = "Output the full WordNet hypernym hierarchy?")
-    public void setoutputFullHypernymHierarchy(Boolean outputFullHypernymHierarchy) {
-        this.outputFullHypernymHierarchy = outputFullHypernymHierarchy;
-    }
-
-    public Boolean getoutputFullHypernymHierarchy() {
-        return outputFullHypernymHierarchy;
-    }
-
 }