/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.mahout.cf.taste.similarity.precompute.example;
import org.apache.mahout.cf.taste.impl.recommender.GenericItemBasedRecommender;
import org.apache.mahout.cf.taste.impl.similarity.LogLikelihoodSimilarity;
import org.apache.mahout.cf.taste.impl.similarity.precompute.FileSimilarItemsWriter;
import org.apache.mahout.cf.taste.impl.similarity.precompute.MultithreadedBatchItemSimilarities;
import org.apache.mahout.cf.taste.model.DataModel;
import org.apache.mahout.cf.taste.recommender.ItemBasedRecommender;
import org.apache.mahout.cf.taste.similarity.precompute.BatchItemSimilarities;
import java.io.File;
/**
* Example that precomputes all item similarities of the Movielens1M dataset
*
* Usage: download movielens1M from http://www.grouplens.org/node/73 , unzip it and invoke this code with the path
* to the ratings.dat file as argument
*
*/
public final class BatchItemSimilaritiesGroupLens {
private BatchItemSimilaritiesGroupLens() {}
public static void main(String[] args) throws Exception {
if (args.length != 1) {
System.err.println("Need path to ratings.dat of the movielens1M dataset as argument!");
System.exit(-1);
}
File resultFile = new File(System.getProperty("java.io.tmpdir"), "similarities.csv");
if (resultFile.exists()) {
resultFile.delete();
}
DataModel dataModel = new GroupLensDataModel(new File(args[0]));
ItemBasedRecommender recommender = new GenericItemBasedRecommender(dataModel,
new LogLikelihoodSimilarity(dataModel));
BatchItemSimilarities batch = new MultithreadedBatchItemSimilarities(recommender, 5);
int numSimilarities = batch.computeItemSimilarities(Runtime.getRuntime().availableProcessors(), 1,
new FileSimilarItemsWriter(resultFile));
System.out.println("Computed " + numSimilarities + " similarities for " + dataModel.getNumItems() + " items "
+ "and saved them to " + resultFile.getAbsolutePath());
}
}