package com.cse10.duplicateDetector;
import java.util.ArrayList;
import java.util.List;
/**
 * Word segmenter that splits a document into overlapping character 2-grams,
 * i.e. every pair of adjacent {@code char}s in the input.
 * Created by Chamath on 1/2/2015.
 */
public class BinoryWordSegmenter extends WordSegmenter {

    /**
     * Creates a segmenter. The instance holds no state of its own.
     */
    public BinoryWordSegmenter() {
        // Intentionally empty: 2-grams are built without any per-instance buffer.
    }

    /**
     * Produces the overlapping 2-grams of {@code document} in order of occurrence.
     * For example {@code "abcd"} yields {@code ["ab", "bc", "cd"]}. Duplicates are
     * kept, and pairs are formed from {@code char} values exactly as stored in the
     * string.
     *
     * @param document the text to segment
     * @return a new mutable list with {@code document.length() - 1} entries, or an
     *         empty list when the document has fewer than two characters
     * @throws NullPointerException if {@code document} is {@code null}
     */
    @Override
    protected List<String> getWords(String document) {
        // A document of length n has n - 1 adjacent pairs; clamp for the empty string.
        final int gramCount = Math.max(0, document.length() - 1);
        List<String> binaryWords = new ArrayList<String>(gramCount);
        for (int start = 0; start < gramCount; start++) {
            // substring keeps this method free of shared mutable state.
            binaryWords.add(document.substring(start, start + 2));
        }
        return binaryWords;
    }
}