TupleWriter.java example

Explorer
myria-master
package edu.washington.escience.myria;

import java.io.IOException;
import java.io.OutputStream;
import java.io.Serializable;
import java.util.List;

import com.fasterxml.jackson.annotation.JsonSubTypes;
import com.fasterxml.jackson.annotation.JsonSubTypes.Type;
import com.fasterxml.jackson.annotation.JsonTypeInfo;

import edu.washington.escience.myria.storage.ReadableTable;

/**
 * A {@link TupleWriter} is an object that can serialize a {@link ReadableTable}. The assumption is that most classes
 * that implement {@link TupleWriter} will write the data to an {@link java.io.OutputStream}, e.g.
 *
 * There are three functions:
 *
 * <ul>
 * <li>{@link writeColumnHeaders} - called once at the start of a batch of tuples to enable the writer to label columns
 * if desired.</li>
 * <li>{@link writeTuples} - called when there are new tuples to serialize.</li>
 * <li>{@link done} - called when there will be no more tuples.</li>
 * </ul>
 *
 *
 */
@JsonTypeInfo(
  use = JsonTypeInfo.Id.NAME,
  include = JsonTypeInfo.As.PROPERTY,
  property = "writerType"
)
@JsonSubTypes({
  @Type(name = "CSV", value = CsvTupleWriter.class),
  @Type(name = "JSON", value = JsonTupleWriter.class),
  @Type(name = "PostgresBinary", value = PostgresBinaryTupleWriter.class)
})
public interface TupleWriter extends Serializable {
  /**
   * This will initialize the {@link TupleWriter} {@link java.io.OutputStream}.
   */
  void open(OutputStream stream) throws IOException;

  /**
   * Inform the {@link TupleWriter} of the column headers. In the standard case (CSV output, see {@link CsvTupleWriter}
   * ), they are written out directly. In some cases, they may be cached and output with the data (see
   * {@link JsonTupleWriter}).
   *
   * @param columnNames the names of the columns.
   * @throws IOException if there is an error writing the tuples.
   */
  void writeColumnHeaders(List<String> columnNames) throws IOException;

  /**
   * Provide a {@link TupleWriter} with tuples to serialize.
   *
   * @param tuples the batch of tuples to be serialized.
   * @throws IOException if there is an error writing the tuples.
   */
  void writeTuples(ReadableTable tuples) throws IOException;

  /**
   * Inform the {@link TupleWriter} that no more tuples will come. It may close and flush an
   * {@link java.io.OutputStream}, for example.
   *
   * @throws IOException if there is an error writing the tuples.
   */
  void done() throws IOException;

  /**
   * Called when the query filling in the {@link TupleWriter} has experienced an error. The {@link TupleWriter} should
   * close the stream, preferably also informing the end-point of the error.
   *
   * @throws IOException if there is an error manipulating the state.
   */
  void error() throws IOException;
}