/* * Copyright (c) 2015 Villu Ruusmann * * This file is part of JPMML-SkLearn * * JPMML-SkLearn is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * JPMML-SkLearn is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Affero General Public License for more details. * * You should have received a copy of the GNU Affero General Public License * along with JPMML-SkLearn. If not, see <http://www.gnu.org/licenses/>. */ package sklearn.preprocessing; import java.util.Arrays; import java.util.Collections; import java.util.List; import numpy.core.NDArray; import org.dmg.pmml.DataField; import org.dmg.pmml.DataType; import org.dmg.pmml.FieldName; import org.dmg.pmml.OpType; import org.jpmml.converter.BinaryFeature; import org.jpmml.converter.CategoricalFeature; import org.jpmml.converter.Feature; import org.jpmml.converter.PMMLUtil; import org.jpmml.converter.WildcardFeature; import org.jpmml.sklearn.SkLearnEncoder; import org.junit.Test; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertTrue; public class LabelBinarizerTest { @Test public void encode(){ SkLearnEncoder encoder = new SkLearnEncoder(); DataField dataField = encoder.createDataField(FieldName.create("x"), OpType.CATEGORICAL, DataType.STRING); Feature inputFeature = new WildcardFeature(encoder, dataField); NDArray array = new NDArray(); array.put("data", Arrays.asList("low", "medium", "high")); array.put("fortran_order", Boolean.FALSE); LabelBinarizer binarizer = new LabelBinarizer("sklearn.preprocessing.label", "LabelBinarizer"); binarizer.put("classes_", array); binarizer.put("pos_label", 1d); binarizer.put("neg_label", -1d); List<Feature> outputFeatures = binarizer.encodeFeatures(Collections.singletonList(inputFeature), encoder); for(Feature outputFeature : outputFeatures){ assertTrue(outputFeature instanceof CategoricalFeature); } assertEquals(Arrays.asList("low", "medium", "high"), PMMLUtil.getValues(dataField)); binarizer.put("neg_label", 0d); outputFeatures = binarizer.encodeFeatures(Collections.singletonList(inputFeature), encoder); for(Feature outputFeature : outputFeatures){ assertTrue(outputFeature instanceof BinaryFeature); } assertEquals(Arrays.asList("low", "medium", "high"), PMMLUtil.getValues(dataField)); } }