package edu.fudan.nlp.pipe.seq;
import edu.fudan.ml.types.Instance;
import edu.fudan.nlp.cn.Chars;
import edu.fudan.nlp.pipe.Pipe;
/**
* 处理混合语言字符串
* @author Feng Ji
*
*/
public class MixedString2Sequence extends Pipe {
@Override
public void addThruPipe(Instance inst) throws Exception {
String str = (String) inst.getData();
char[] toks = str.toCharArray();
StringBuilder sb = new StringBuilder();
for(int i = 0; i < toks.length; i++) {
if (Chars.isChar(toks[i])) {
sb.append(toks[i]);
sb.append(" ");
}
}
}
}