com.digitalpebble.behemoth.gate.GATEAnnotationFilters.java Source code

Java tutorial

Introduction

Here is the source code for com.digitalpebble.behemoth.gate.GATEAnnotationFilters.java

Source

/**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.digitalpebble.behemoth.gate;

import java.util.ArrayList;
import java.util.Collections;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.Set;

import org.apache.hadoop.conf.Configuration;

/** Container for the annotation filters which is built from **/

public class GATEAnnotationFilters {

    HashSet<String> types;
    Map<String, Set<String>> featfilts;
    String annotationSetName;
    HashSet<String> docFeatureNames;

    public static GATEAnnotationFilters getFilters(Configuration config) {
        GATEAnnotationFilters filter = new GATEAnnotationFilters();

        filter.annotationSetName = config.get("gate.annotationset.output", "");
        String[] stypes = config.getStrings("gate.annotations.filter", "");
        String[] sFeatFilt = config.getStrings("gate.features.filter", "");
        String[] docFeatFilt = config.getStrings("gate.docfeatures.filter", "");

        // the featurefilters have the following form : Type.featureName
        filter.featfilts = new HashMap<String, Set<String>>();
        for (String ff : sFeatFilt) {
            String[] fp = ff.split("\\.");
            if (fp.length != 2)
                continue;
            Set<String> fnames = filter.featfilts.get(fp[0]);
            if (fnames == null) {
                fnames = new HashSet<String>();
                filter.featfilts.put(fp[0], fnames);
            }
            fnames.add(fp[1]);
        }

        filter.types = new HashSet<String>();
        for (String s : stypes) {
            s = s.trim();
            if (s.length() > 0)
                filter.types.add(s);
        }

        filter.docFeatureNames = new HashSet<String>();
        for (String s : docFeatFilt) {
            s = s.trim();
            if (s.length() > 0)
                filter.docFeatureNames.add(s);
        }

        return filter;
    }

    public HashSet<String> getTypes() {
        return types;
    }

    public HashSet<String> getDocFeaturesFilter() {
        return docFeatureNames;
    }

    public Map<String, Set<String>> getFeatureFilters() {
        return featfilts;
    }

    public String getAnnotationSetName() {
        return annotationSetName;
    }

    public void setTypes(HashSet<String> types) {
        this.types = types;
    }

    public void setFeatfilts(Map<String, Set<String>> featfilts) {
        this.featfilts = featfilts;
    }

    public void setAnnotationSetName(String annotationSetName) {
        this.annotationSetName = annotationSetName;
    }

    /**
     * Returns a unmodifiable sorted list of all known annotations and feature
     * names so that we can use their position in the serialisation instead of
     * writing them as strings
     ***/
    public List<String> getLexicon() {
        HashSet<String> lexicon = new HashSet<String>();
        lexicon.addAll(types);
        Iterator<Set<String>> iter = featfilts.values().iterator();
        while (iter.hasNext()) {
            lexicon.addAll(iter.next());
        }
        ArrayList<String> temp = new ArrayList<String>(lexicon);
        Collections.sort(temp);
        return Collections.unmodifiableList(temp);
    }

}