com.scaleunlimited.classify.vectors.TfNormalizer.java Source code

Java tutorial

Introduction

Here is the source code for com.scaleunlimited.classify.vectors.TfNormalizer.java

Source

/**
 * Copyright (c) 2009-2015 Scale Unlimited, Inc.
 * 
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 * 
 *     http://www.apache.org/licenses/LICENSE-2.0
 * 
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.scaleunlimited.classify.vectors;

import org.apache.mahout.math.Vector;
import org.apache.mahout.math.function.DoubleDoubleFunction;

/**
 * Normalizer that converts a vector of raw term counts into term frequency
 * (TF) values by dividing every element by the sum of all elements.
 *
 * <p>Normalization is performed in place on the vector handed to
 * {@link #normalize(Vector)}.</p>
 */
@SuppressWarnings("serial")
public class TfNormalizer extends BaseNormalizer {

    /**
     * Divides each element of {@code vector} by the sum of all its elements,
     * modifying the vector in place.
     *
     * <p>If the elements sum to zero (for example an empty or all-zero count
     * vector) there is nothing to scale, so the vector is left untouched
     * rather than being filled with NaN/Infinity by a division by zero.</p>
     *
     * @param vector the count vector to normalize in place
     */
    @Override
    public void normalize(Vector vector) {
        double totalCount = vector.zSum();

        // Guard against 0/0 (NaN): a zero total means there are no counts to
        // turn into frequencies, so keep the vector exactly as it is.
        if (totalCount == 0.0) {
            return;
        }

        vector.assign(new DoubleDoubleFunction() {

            @Override
            public double apply(double curValue, double divisor) {
                // divisor is the total count passed as assign()'s second argument.
                return curValue / divisor;
            }
        }, totalCount);
    }
}