org.apache.uima.ruta.action.MarkTableAction.java Source code

Java tutorial

Introduction

Here is the source code for org.apache.uima.ruta.action.MarkTableAction.java

Source

/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 * 
 * http://www.apache.org/licenses/LICENSE-2.0
 * 
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package org.apache.uima.ruta.action;

import java.util.Collection;
import java.util.HashMap;
import java.util.List;
import java.util.Map;

import org.apache.commons.lang3.StringUtils;
import org.apache.uima.cas.Feature;
import org.apache.uima.cas.FeatureStructure;
import org.apache.uima.cas.Type;
import org.apache.uima.cas.text.AnnotationFS;
import org.apache.uima.jcas.cas.TOP;
import org.apache.uima.jcas.tcas.Annotation;
import org.apache.uima.ruta.RutaBlock;
import org.apache.uima.ruta.RutaStream;
import org.apache.uima.ruta.UIMAConstants;
import org.apache.uima.ruta.expression.bool.IBooleanExpression;
import org.apache.uima.ruta.expression.bool.SimpleBooleanExpression;
import org.apache.uima.ruta.expression.number.INumberExpression;
import org.apache.uima.ruta.expression.resource.WordTableExpression;
import org.apache.uima.ruta.expression.string.IStringExpression;
import org.apache.uima.ruta.expression.type.TypeExpression;
import org.apache.uima.ruta.resource.RutaTable;
import org.apache.uima.ruta.resource.RutaWordList;
import org.apache.uima.ruta.rule.RuleElement;
import org.apache.uima.ruta.rule.RuleMatch;
import org.apache.uima.ruta.visitor.InferenceCrowd;

public class MarkTableAction extends AbstractRutaAction {

    private final TypeExpression typeExpr;

    private final WordTableExpression tableExpr;

    private final Map<IStringExpression, INumberExpression> featureMap;

    private final INumberExpression indexExpr;

    private final IBooleanExpression ignoreCase;

    private final INumberExpression ignoreLength;

    private final IStringExpression ignoreChar;

    private final INumberExpression maxIgnoreChar;

    private IBooleanExpression ignoreWS = new SimpleBooleanExpression(true);

    public MarkTableAction(TypeExpression typeExpr, INumberExpression indexExpr, WordTableExpression tableExpr,
            Map<IStringExpression, INumberExpression> featureMap, IBooleanExpression ignoreCase,
            INumberExpression ignoreLength, IStringExpression ignoreChar, INumberExpression maxIgnoreChar) {
        super();
        this.typeExpr = typeExpr;
        this.indexExpr = indexExpr;
        this.tableExpr = tableExpr;
        this.featureMap = featureMap;
        this.ignoreCase = ignoreCase;
        this.ignoreLength = ignoreLength;
        this.ignoreChar = ignoreChar;
        this.maxIgnoreChar = maxIgnoreChar;
    }

    public void setIgnoreWS(IBooleanExpression ignoreWS) {
        this.ignoreWS = ignoreWS;
    }

    @Override
    public void execute(RuleMatch match, RuleElement element, RutaStream stream, InferenceCrowd crowd) {
        RutaBlock block = element.getParent();
        RutaTable table = tableExpr.getTable(block);
        int index = indexExpr.getIntegerValue(block, match, element, stream);
        Type type = typeExpr.getType(block);
        Map<String, Integer> map = new HashMap<String, Integer>();
        for (IStringExpression each : featureMap.keySet()) {
            map.put(each.getStringValue(block, match, element, stream),
                    featureMap.get(each).getIntegerValue(block, match, element, stream));
        }

        boolean ignoreCaseValue = ignoreCase != null
                ? ignoreCase.getBooleanValue(element.getParent(), match, element, stream)
                : false;
        int ignoreLengthValue = ignoreLength != null
                ? ignoreLength.getIntegerValue(element.getParent(), match, element, stream)
                : 0;
        String ignoreCharValue = ignoreChar != null
                ? ignoreChar.getStringValue(element.getParent(), match, element, stream)
                : "";
        int maxIgnoreCharValue = maxIgnoreChar != null
                ? maxIgnoreChar.getIntegerValue(element.getParent(), match, element, stream)
                : 0;
        boolean ignoreWSValue = ignoreWS != null
                ? ignoreWS.getBooleanValue(element.getParent(), match, element, stream)
                : false;

        RutaWordList wordList = table.getWordList(index, element.getParent());
        Collection<AnnotationFS> found = wordList.find(stream, ignoreCaseValue, ignoreLengthValue,
                ignoreCharValue.toCharArray(), maxIgnoreCharValue, ignoreWSValue);
        for (AnnotationFS annotationFS : found) {
            // HOTFIX: for feature assignment
            String candidate = stream.getVisibleCoveredText(annotationFS);
            if (!StringUtils.isBlank(ignoreCharValue)) {
                for (int i = 0; i < maxIgnoreCharValue; i++) {
                    candidate = candidate.replaceFirst("[" + ignoreCharValue + "]", "");
                }
            }
            List<String> rowWhere = table.getRowWhere(index - 1, candidate);
            if (rowWhere.isEmpty() && ignoreCaseValue && candidate.length() > ignoreLengthValue) {
                // TODO: does not cover all variants
                rowWhere = table.getRowWhere(index - 1, candidate.toLowerCase());
            }
            FeatureStructure newFS = stream.getCas().createFS(type);
            if (newFS instanceof Annotation) {
                Annotation a = (Annotation) newFS;
                a.setBegin(annotationFS.getBegin());
                a.setEnd(annotationFS.getEnd());
                stream.addAnnotation(a, match);
            }
            TOP newStructure = null;
            if (newFS instanceof TOP) {
                newStructure = (TOP) newFS;
                fillFeatures(newStructure, map, annotationFS, element, rowWhere, stream);
                newStructure.addToIndexes();
            }
        }
    }

    private void fillFeatures(TOP structure, Map<String, Integer> map, AnnotationFS annotationFS,
            RuleElement element, List<String> row, RutaStream stream) {
        List<?> featuresList = structure.getType().getFeatures();
        for (int i = 0; i < featuresList.size(); i++) {
            Feature targetFeature = (Feature) featuresList.get(i);
            String name = targetFeature.getName();
            String shortFName = name.substring(name.indexOf(":") + 1, name.length());
            Integer entryIndex = map.get(shortFName);
            Type range = targetFeature.getRange();
            if (entryIndex != null && row.size() >= entryIndex) {
                String value = row.get(entryIndex - 1);
                if (range.getName().equals(UIMAConstants.TYPE_STRING)) {
                    structure.setStringValue(targetFeature, value);
                } else if (range.getName().equals(UIMAConstants.TYPE_INTEGER)) {
                    Integer integer = Integer.parseInt(value);
                    structure.setIntValue(targetFeature, integer);
                } else if (range.getName().equals(UIMAConstants.TYPE_DOUBLE)) {
                    Double d = Double.parseDouble(value);
                    structure.setDoubleValue(targetFeature, d);
                } else if (range.getName().equals(UIMAConstants.TYPE_FLOAT)) {
                    Float d = Float.parseFloat(value);
                    structure.setFloatValue(targetFeature, d);
                } else if (range.getName().equals(UIMAConstants.TYPE_BYTE)) {
                    Byte d = Byte.parseByte(value);
                    structure.setByteValue(targetFeature, d);
                } else if (range.getName().equals(UIMAConstants.TYPE_SHORT)) {
                    Short d = Short.parseShort(value);
                    structure.setShortValue(targetFeature, d);
                } else if (range.getName().equals(UIMAConstants.TYPE_LONG)) {
                    Long d = Long.parseLong(value);
                    structure.setLongValue(targetFeature, d);
                } else if (range.getName().equals(UIMAConstants.TYPE_BOOLEAN)) {
                    Boolean b = Boolean.parseBoolean(value);
                    structure.setBooleanValue(targetFeature, b);
                } else {
                }
            }

        }
    }

    public TypeExpression getTypeExpr() {
        return typeExpr;
    }

    public WordTableExpression getTableExpr() {
        return tableExpr;
    }

    public Map<IStringExpression, INumberExpression> getFeatureMap() {
        return featureMap;
    }

    public INumberExpression getIndexExpr() {
        return indexExpr;
    }

    public IBooleanExpression getIgnoreCase() {
        return ignoreCase;
    }

    public INumberExpression getIgnoreLength() {
        return ignoreLength;
    }

    public IStringExpression getIgnoreChar() {
        return ignoreChar;
    }

    public INumberExpression getMaxIgnoreChar() {
        return maxIgnoreChar;
    }
}