/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.mahout.math.hadoop.stochasticsvd;
import java.util.Arrays;
import java.util.Iterator;
import org.apache.mahout.math.Vector;
import org.apache.mahout.math.Vector.Element;
/**
* simplistic implementation for Omega matrix in Stochastic SVD method
*/
public class Omega {
private static final double UNIFORM_DIVISOR = Math.pow(2.0, 64);
private final long seed;
private final int kp;
public Omega(long seed, int k, int p) {
this.seed = seed;
kp = k + p;
}
/**
* Get omega element at (x,y) uniformly distributed within [-1...1)
*
* @param row
* omega row
* @param column
* omega column
*/
public double getQuick(int row, int column) {
long hash = murmur64((long) row << Integer.SIZE | column, 8, seed);
return hash / UNIFORM_DIVISOR;
}
/**
* compute YRow=ARow*Omega.
*
* @param aRow
* row of matrix A (size n)
* @param yRow
* row of matrix Y (result) must be pre-allocated to size of (k+p)
*/
@Deprecated
public void computeYRow(Vector aRow, double[] yRow) {
// assert yRow.length == kp;
Arrays.fill(yRow, 0.0);
if (aRow.isDense()) {
int n = aRow.size();
for (int j = 0; j < n; j++) {
accumDots(j, aRow.getQuick(j), yRow);
}
} else {
for (Iterator<Element> iter = aRow.iterateNonZero(); iter.hasNext();) {
Element el = iter.next();
accumDots(el.index(), el.get(), yRow);
}
}
}
/**
* A version to compute yRow as a sparse vector in case of extremely sparse
* matrices
*
* @param aRow
* @param yRowOut
*/
public void computeYRow(Vector aRow, Vector yRowOut) {
yRowOut.assign(0.0);
if (aRow.isDense()) {
int n = aRow.size();
for (int j = 0; j < n; j++) {
accumDots(j, aRow.getQuick(j), yRowOut);
}
} else {
for (Iterator<Element> iter = aRow.iterateNonZero(); iter.hasNext();) {
Element el = iter.next();
accumDots(el.index(), el.get(), yRowOut);
}
}
}
protected void accumDots(int aIndex, double aElement, double[] yRow) {
for (int i = 0; i < kp; i++) {
yRow[i] += getQuick(aIndex, i) * aElement;
}
}
protected void accumDots(int aIndex, double aElement, Vector yRow) {
for (int i = 0; i < kp; i++) {
yRow.setQuick(i, yRow.getQuick(i) + getQuick(aIndex, i) * aElement);
}
}
/**
* Shortened version for data < 8 bytes packed into {@code len} lowest bytes
* of {@code val}.
*
* @param val
* the value
* @param len
* the length of data packed into this many low bytes of {@code val}
* @param seed
* the seed to use
* @return murmur hash
*/
public static long murmur64(long val, int len, long seed) {
// assert len > 0 && len <= 8;
long m = 0xc6a4a7935bd1e995L;
long h = seed ^ len * m;
long k = val;
k *= m;
int r = 47;
k ^= k >>> r;
k *= m;
h ^= k;
h *= m;
h ^= h >>> r;
h *= m;
h ^= h >>> r;
return h;
}
public static long murmur64(byte[] val, int offset, int len, long seed) {
long m = 0xc6a4a7935bd1e995L;
int r = 47;
long h = seed ^ (len * m);
int lt = len >>> 3;
for (int i = 0; i < lt; i++, offset += 8) {
long k = 0;
for (int j = 0; j < 8; j++) {
k <<= 8;
k |= val[offset + j] & 0xff;
}
k *= m;
k ^= k >>> r;
k *= m;
h ^= k;
h *= m;
}
if (offset < len) {
long k = 0;
while (offset < len) {
k <<= 8;
k |= val[offset] & 0xff;
offset++;
}
h ^= k;
h *= m;
}
h ^= h >>> r;
h *= m;
h ^= h >>> r;
return h;
}
}