org.aliuge.crawler.extractor.selector.action.string.StringSplitAction.java Source code

Java tutorial

Introduction

Here is the source code for org.aliuge.crawler.extractor.selector.action.string.StringSplitAction.java

Source

/**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.aliuge.crawler.extractor.selector.action.string;

import java.util.Set;

import org.aliuge.crawler.extractor.selector.action.StringSelectorAction;
import org.apache.commons.lang3.StringUtils;

import com.google.common.collect.Sets;

/**
 * @author 
 * @date 2014911
 * @desc ?????Split???</br>
 * ?()??
 */
public class StringSplitAction extends StringSelectorAction {
    /**
     * 
     */
    private String split;
    private String newsplit = "|";
    private Set<Integer> set = Sets.newLinkedHashSet();

    /**
     * 
     * @param split
     * @param index
     */
    public StringSplitAction(String split, String index) {
        if (StringUtils.isNotBlank(split)) {
            this.split = split;
        } else {
            this.split = ",";
        }
        if (StringUtils.isNotBlank(index)) {
            String is[] = index.split(",");
            for (String i : is) {
                if (StringUtils.isNumeric(i)) {
                    set.add(Integer.parseInt(i));
                }
            }
        }
    }

    public StringSplitAction(String split, String index, String newsplit) {
        if (StringUtils.isNotBlank(split)) {
            this.split = split;
        } else {
            this.split = ",";
        }
        if (StringUtils.isNotBlank(index)) {
            String is[] = index.split(",");
            for (String i : is) {
                if (StringUtils.isNumeric(i)) {
                    set.add(Integer.parseInt(i));
                }
            }
            if (set.size() > 0) {
                if (StringUtils.isNotBlank(newsplit))
                    this.newsplit = newsplit;
            }
        }
    }

    /**
     * ?????Split???</br>
     * ?()??</br>
     * ?0?
     */
    @Override
    public String doAction(String content) {
        if (StringUtils.isNotBlank(content)) {
            if (set.size() > 0) {
                String[] subs = StringUtils.split(content, this.split);
                StringBuilder sb = new StringBuilder();
                for (Integer i : set) {
                    if (i < subs.length) {
                        if (i > -1)
                            sb.append(subs[i]).append(newsplit);
                    }
                }
                if (sb.length() > 0)
                    return sb.substring(0, sb.length() - 1);
            } else {
                return StringUtils.split(content, this.split)[0];
            }
        }
        return "";
    }

}