org.apache.lucene.analysis.kr.test.CNounsUtils.java Source code

Java tutorial

Introduction

Here is the source code for org.apache.lucene.analysis.kr.test.CNounsUtils.java

Source

/*
 * Copyright 2011-2013 the original author or authors.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.lucene.analysis.kr.test;

import junit.framework.TestCase;
import lombok.extern.slf4j.Slf4j;
import org.apache.commons.io.FileUtils;
import org.apache.commons.lang3.StringUtils;

import java.io.File;
import java.io.IOException;
import java.util.*;

@Slf4j
public class CNounsUtils extends TestCase {

    public void testAdjust() throws Exception {

        List<String> strs = FileUtils.readLines(new File("cnouns_all.txt"));

        Map<String, String> compoundList = new TreeMap<String, String>();
        Map<String, String> nounList = new TreeMap<String, String>();

        for (String str : strs) {
            System.out.println(str);
            if (str == null || str.length() < 1)
                continue;

            str = str.trim();
            String[] infoNouns = StringUtils.split(str, ":");
            if (infoNouns.length == 2) {
                infoNouns[0] = infoNouns[0].trim();
                if (compoundList.get(infoNouns[0]) == null)
                    compoundList.put(infoNouns[0], str);
            } else {
                if (compoundList.get(str) == null && str.length() > 1)
                    nounList.put(str, str);
            }
        }

        writeResult(compoundList, "compounds.txt");
        writeResult(nounList, "noun.txt");

    }

    private void writeResult(Map map, String fName) throws IOException {

        Iterator<String> iter = map.keySet().iterator();
        List list = new ArrayList();
        while (iter.hasNext()) {
            String str = iter.next();
            list.add(map.get(str));
        }

        FileUtils.writeLines(new File(fName), list);
    }

}