/*
* This file is part of ELKI:
* Environment for Developing KDD-Applications Supported by Index-Structures
*
* Copyright (C) 2017
* ELKI Development Team
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
package de.lmu.ifi.dbs.elki.datasource;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
import de.lmu.ifi.dbs.elki.data.DoubleVector;
import de.lmu.ifi.dbs.elki.data.type.SimpleTypeInformation;
import de.lmu.ifi.dbs.elki.data.type.TypeUtil;
import de.lmu.ifi.dbs.elki.data.type.VectorFieldTypeInformation;
import de.lmu.ifi.dbs.elki.database.ids.DBIDFactory;
import de.lmu.ifi.dbs.elki.datasource.bundle.MultipleObjectsBundle;
import de.lmu.ifi.dbs.elki.utilities.exceptions.AbortException;
/**
* Import an existing data matrix (<code>double[rows][cols]</code>) into an ELKI
* database.
*
* For efficiency, the data is <em>not</em> copied. If you modify the array
* afterwards, you can break indexes and algorithm results. It is your
* responsbility to not do this!
*
* Note: this class is not parameterizable, but can only be used from Java.
*
* @author Erich Schubert
* @since 0.5.0
*/
public class ArrayAdapterDatabaseConnection implements DatabaseConnection {
/**
* The actual data.
*/
double[][] data;
/**
* Object labels.
*/
String[] labels;
/**
* Starting ID for fixed object ids.
*/
Integer startid = null;
/**
* Constructor.
*
* @param data Existing data matrix
*/
public ArrayAdapterDatabaseConnection(double[][] data) {
this(data, null, null);
}
/**
* Constructor.
*
* @param data Existing data matrix
* @param labels Object labels
*/
public ArrayAdapterDatabaseConnection(double[][] data, String[] labels) {
this(data, labels, null);
}
/**
* Constructor.
*
* @param data Existing data matrix
* @param labels Object labels
* @param startid Starting object ID
*/
public ArrayAdapterDatabaseConnection(double[][] data, String[] labels, Integer startid) {
super();
this.data = data;
this.labels = labels;
this.startid = startid;
}
@Override
public MultipleObjectsBundle loadData() {
MultipleObjectsBundle b = new MultipleObjectsBundle();
if(startid != null) {
b.setDBIDs(DBIDFactory.FACTORY.generateStaticDBIDRange(startid, data.length));
}
int mind = Integer.MAX_VALUE;
int maxd = 0;
List<DoubleVector> vecs = new ArrayList<>(data.length);
for(int i = 0; i < data.length; i++) {
mind = Math.min(mind, data[i].length);
maxd = Math.max(maxd, data[i].length);
vecs.add(DoubleVector.wrap(data[i]));
}
SimpleTypeInformation<DoubleVector> type = new VectorFieldTypeInformation<>(DoubleVector.FACTORY, mind, maxd, DoubleVector.FACTORY.getDefaultSerializer());
b.appendColumn(type, vecs);
if(labels != null) {
if(labels.length != data.length) {
throw new AbortException("Label and DBID columns must have the same size.");
}
b.appendColumn(TypeUtil.STRING, Arrays.asList(labels));
}
return b;
}
}