package eu.dnetlib.iis.wf.affmatching.bucket.projectorg.read; import java.io.Serializable; import org.apache.spark.api.java.JavaRDD; import org.apache.spark.api.java.JavaSparkContext; import eu.dnetlib.iis.wf.affmatching.bucket.projectorg.model.AffMatchDocumentProject; /** * Reader of relations between documents and projects. * * @author mhorst */ public interface DocumentProjectReader extends Serializable { /** * Reads document to project relations that are in <code>inputPath</code>. * The relations that are in <code>inputPath</code> can be in any format. * The implementation of the reader, however, must return them as rdd of {@link AffMatchDocumentProject}. */ JavaRDD<AffMatchDocumentProject> readDocumentProjects(JavaSparkContext sc, String inputPath); }