/*
* Licensed to Elasticsearch under one or more contributor
* license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright
* ownership. Elasticsearch licenses this file to you under
* the Apache License, Version 2.0 (the "License"); you may
* not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.elasticsearch.ml.modelinput;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
/**
 * Turns a list of {@link VectorRange}s into a single sparse vector representation.
 * <p>
 * Instances always mark themselves as sparse. The default {@link #vector(Map)} implementation
 * returns a map with the keys {@code "values"}, {@code "indices"} and {@code "length"}; the nested
 * subclasses either add extra state or replace that representation.
 */
public class VectorRangesToVectorPMML extends VectorRangesToVector {

    /**
     * Creates a sparse converter over the given ranges.
     *
     * @param fieldsToVectors the ranges that are queried, in order, when a vector is built
     * @param numEntries      the value stored under the {@code "length"} key of the built vector
     */
    public VectorRangesToVectorPMML(List<VectorRange> fieldsToVectors, int numEntries) {
        this.vectorRangeList = fieldsToVectors;
        this.numEntries = numEntries;
        this.sparse = true;
    }

    /**
     * Looks up the values of every field referenced by the configured ranges and builds the
     * vector from them via {@link #vector(Map)}.
     * <p>
     * Ranges whose field name is {@code null} contribute no lookup.
     *
     * @param dataSource the source the field values are read from
     * @return whatever {@link #vector(Map)} produces for the collected field values
     */
    @SuppressWarnings("unchecked")
    public Object vector(DataSource dataSource) {
        HashMap<String, List<Object>> valuesByField = new HashMap<>();
        for (VectorRange range : this.vectorRangeList) {
            // TODO: a vector range can depend on several fields, only one is handled here
            String fieldName = range.getField();
            if (fieldName == null) {
                continue;
            }
            // TODO: this assumes the lookup always yields something; a missing value is not handled
            valuesByField.put(fieldName, dataSource.getValues(fieldName));
        }
        return vector(valuesByField);
    }

    /**
     * Builds the sparse vector from already collected field values.
     * <p>
     * Every range is asked for its vector, which is expected to be an
     * {@link EsSparseNumericVector} (checked by an {@code assert} only). The index and value
     * arrays of all ranges are then concatenated in range order, without modifying the indices.
     *
     * @param fieldValues field name to values, handed unchanged to each range
     * @return a {@link HashMap} holding {@code "values"} (a {@code double[]}), {@code "indices"}
     *         (an {@code int[]}) and {@code "length"} (the configured number of entries)
     */
    public Object vector(Map<String, List<Object>> fieldValues) {
        List<EsSparseNumericVector> parts = new ArrayList<>();
        int totalEntries = 0;
        for (VectorRange range : this.vectorRangeList) {
            EsVector produced = range.getVector(fieldValues);
            assert produced instanceof EsSparseNumericVector;
            EsSparseNumericVector part = (EsSparseNumericVector) produced;
            parts.add(part);
            totalEntries += part.values.v1().length;
        }

        Map<String, Object> result = new HashMap<>();
        double[] values = new double[totalEntries];
        int[] indices = new int[totalEntries];

        // Copy each part behind the previous one; offset is the start of the current part.
        int offset = 0;
        for (EsSparseNumericVector part : parts) {
            int partSize = part.values.v1().length;
            for (int k = 0; k < partSize; k++) {
                indices[offset + k] = part.values.v1()[k];
                values[offset + k] = part.values.v2()[k];
            }
            offset += partSize;
        }

        result.put("values", values);
        result.put("indices", indices);
        result.put("length", numEntries);
        return result;
    }

    /**
     * Variant that additionally carries an ordered list of parameter names. The vector
     * construction itself is inherited unchanged.
     */
    public static class VectorRangesToVectorPMMLGeneralizedRegression extends VectorRangesToVectorPMML {

        private final String[] orderedParameterList;

        /**
         * @param features             the ranges that are queried when a vector is built
         * @param numEntries           the value stored under the {@code "length"} key of the built vector
         * @param orderedParameterList the parameter names; the array is stored as given, not copied
         */
        public VectorRangesToVectorPMMLGeneralizedRegression(List<VectorRange> features, int numEntries,
                                                             String[] orderedParameterList) {
            super(features, numEntries);
            this.orderedParameterList = orderedParameterList;
        }

        /**
         * @return the parameter name array passed to the constructor (the same instance, not a copy)
         */
        public String[] getOrderedParameterList() {
            return orderedParameterList;
        }
    }

    /**
     * Variant whose vector is a plain name-to-value map instead of index/value arrays. The number
     * of entries is taken to be the number of ranges.
     */
    public static class VectorRangesToVectorPMMLTreeModel extends VectorRangesToVectorPMML {

        /**
         * @param fieldsToVectors the ranges that are queried when a vector is built
         */
        public VectorRangesToVectorPMMLTreeModel(List<VectorRange> fieldsToVectors) {
            super(fieldsToVectors, fieldsToVectors.size());
        }

        /**
         * Merges the value maps of all ranges into one map; entries of later ranges replace
         * entries of earlier ranges that use the same key.
         * <p>
         * Each range is expected to be a {@code PMMLVectorRange.FieldToValue} (checked by an
         * {@code assert} only) and its vector is cast to {@link EsValueMapVector}.
         *
         * @param fieldValues field name to values, handed unchanged to each range
         * @return a {@link HashMap} containing the merged entries of all ranges
         */
        @Override
        public Object vector(Map<String, List<Object>> fieldValues) {
            Map<String, Object> merged = new HashMap<>();
            for (VectorRange range : vectorRangeList) {
                assert range instanceof PMMLVectorRange.FieldToValue;
                EsValueMapVector mapVector = (EsValueMapVector) range.getVector(fieldValues);
                merged.putAll(mapVector.getValues());
            }
            return merged;
        }
    }
}