/* The contents of this file are subject to the license and copyright terms * detailed in the license directory at the root of the source tree (also * available online at http://fedora-commons.org/license/). */ package fedora.server.storage.translation; import fedora.common.Constants; import fedora.common.Models; import fedora.common.PID; import fedora.common.xml.format.XMLFormat; import fedora.server.errors.ObjectIntegrityException; import fedora.server.errors.StreamIOException; import fedora.server.storage.types.Datastream; import fedora.server.storage.types.DatastreamXMLMetadata; import fedora.server.storage.types.DigitalObject; import fedora.server.utilities.DateUtility; import fedora.server.utilities.StreamUtility; import fedora.utilities.MimeTypeUtils; import org.apache.abdera.Abdera; import org.apache.abdera.ext.thread.ThreadHelper; import org.apache.abdera.i18n.iri.IRI; import org.apache.abdera.model.Entry; import org.apache.abdera.model.Feed; import org.apache.abdera.model.Link; import org.apache.abdera.util.MimeTypeHelper; import org.apache.commons.io.IOUtils; import java.io.ByteArrayInputStream; import java.io.IOException; import java.io.InputStream; import java.io.OutputStream; import java.io.Reader; import java.io.StringReader; import java.io.UnsupportedEncodingException; import java.util.Date; import java.util.Iterator; import java.util.zip.ZipEntry; import java.util.zip.ZipOutputStream; /** * <p>Serializes a Fedora Object in Atom with Threading Extensions.</p> * * <p>A Fedora Digital Object is represented as an atom:feed and * Datastreams are represented as an atom:entries.</p> * * <p>The hierarchy of Datastreams their Datastream Versions is * represented via the Atom Threading Extensions. * For convenience, a datastream entry references its latest datastream * version entry with an atom:link element. For example, a DC datastream * entry with a reference to its most recent version: <br/> * <code><link href="info:fedora/demo:foo/DC/2008-04-01T12:30:15.123" rel="alternate"/></code></p> * * <p>Each datastream version refers to its parent datastream via a * thr:in-reply-to element. For example, the entry for a DC datastream * version would include:<br/> * <code><thr:in-reply-to ref="info:fedora/demo:foo/DC"/></code></p> * * @see <a href="http://atomenabled.org/developers/syndication/atom-format-spec.php">The Atom Syndication Format</a> * @see <a href="http://www.ietf.org/rfc/rfc4685.txt">Atom Threading Extensions</a> * * @author Edwin Shin * @since 3.0 * @version $Id$ */ public class AtomDOSerializer implements DOSerializer, Constants { /** * The format this serializer will write if unspecified at construction. * This defaults to the latest ATOM format. */ public static final XMLFormat DEFAULT_FORMAT = ATOM1_1; private final static Abdera abdera = Abdera.getInstance(); private DigitalObject m_obj; private String m_encoding; /** The current translation context. */ private int m_transContext; /** The format this serializer writes. */ private final XMLFormat m_format; private PID m_pid; protected Feed m_feed; private ZipOutputStream m_zout; public AtomDOSerializer() { this(DEFAULT_FORMAT); } public AtomDOSerializer(XMLFormat format) { if (format.equals(ATOM1_1) || format.equals(ATOM_ZIP1_1)) { m_format = format; } else { throw new IllegalArgumentException("Not an ATOM format: " + format.uri); } } /** * {@inheritDoc} */ public DOSerializer getInstance() { return new AtomDOSerializer(m_format); } /** * {@inheritDoc} */ public void serialize(DigitalObject obj, OutputStream out, String encoding, int transContext) throws ObjectIntegrityException, StreamIOException, UnsupportedEncodingException { m_obj = obj; m_encoding = (encoding == null || encoding == "") ? "UTF-8" : encoding; m_transContext = transContext; m_pid = PID.getInstance(m_obj.getPid()); m_feed = abdera.newFeed(); if (m_format.equals(ATOM_ZIP1_1)) { m_zout = new ZipOutputStream(out); } addObjectProperties(); m_feed .setIcon("http://www.fedora-commons.org/images/logo_vertical_transparent_200_251.png"); addDatastreams(); if (m_format.equals(ATOM_ZIP1_1)) { try { m_zout.putNextEntry(new ZipEntry("atommanifest.xml")); m_feed.writeTo("prettyxml", m_zout); m_zout.closeEntry(); m_zout.close(); } catch (IOException e) { throw new StreamIOException(e.getMessage(), e); } } else { try { m_feed.writeTo("prettyxml", out); } catch (IOException e) { throw new StreamIOException(e.getMessage(), e); } } } private void addObjectProperties() throws ObjectIntegrityException { String state = DOTranslationUtility.getStateAttribute(m_obj); String ownerId = m_obj.getOwnerId(); String label = m_obj.getLabel(); Date cdate = m_obj.getCreateDate(); Date mdate = m_obj.getLastModDate(); m_feed.setId(m_pid.toURI()); m_feed.setTitle(label == null ? "" : label); m_feed.setUpdated(mdate); m_feed.addAuthor(ownerId == null ? "" : StreamUtility.enc(ownerId)); m_feed.addCategory(MODEL.STATE.uri, state, null); if (cdate != null) { m_feed.addCategory(MODEL.CREATED_DATE.uri, DateUtility .convertDateToString(cdate), null); } // TODO not sure I'm satisfied with this representation of extProperties for (String extProp : m_obj.getExtProperties().keySet()) { m_feed.addCategory(MODEL.EXT_PROPERTY.uri, extProp, m_obj .getExtProperty(extProp)); } } private void addDatastreams() throws ObjectIntegrityException, UnsupportedEncodingException, StreamIOException { Iterator<String> iter = m_obj.datastreamIdIterator(); String dsid; while (iter.hasNext()) { dsid = iter.next(); // AUDIT datastream is rebuilt from the latest in-memory audit trail // which is a separate array list in the DigitalObject class. // So, ignore it here. if (dsid.equals("AUDIT") || dsid.equals("FEDORA-AUDITTRAIL")) { continue; } Entry dsEntry = m_feed.addEntry(); Datastream latestCreated = null; long latestCreateTime = -1; for (Datastream v : m_obj.datastreams(dsid)) { Datastream dsv = DOTranslationUtility.setDatastreamDefaults(v); // Keep track of the most recent datastream version if (dsv.DSCreateDT.getTime() > latestCreateTime) { latestCreateTime = dsv.DSCreateDT.getTime(); latestCreated = dsv; } Entry dsvEntry = m_feed.addEntry(); dsvEntry.setId(m_pid.toURI() + "/" + dsv.DatastreamID + "/" + DateUtility.convertDateToString(dsv.DSCreateDT)); dsvEntry.setTitle(dsv.DSVersionID); dsvEntry.setUpdated(dsv.DSCreateDT); ThreadHelper.addInReplyTo(dsvEntry, m_pid.toURI() + "/" + dsv.DatastreamID); String altIds = DOTranslationUtility.oneString(dsv.DatastreamAltIDs); if (altIds != null && !altIds.equals("")) { dsvEntry.addCategory(MODEL.ALT_IDS.uri, altIds, null); } if (dsv.DSFormatURI != null && !dsv.DSFormatURI.equals("")) { dsvEntry.addCategory(MODEL.FORMAT_URI.uri, dsv.DSFormatURI, null); } dsvEntry.addCategory(MODEL.LABEL.uri, dsv.DSLabel == null ? "" : dsv.DSLabel, null); // include checksum if it has a value String csType = dsv.getChecksumType(); if (csType != null && csType.length() > 0 && !csType.equals(Datastream.CHECKSUMTYPE_DISABLED)) { dsvEntry.addCategory(MODEL.DIGEST_TYPE.uri, csType, null); dsvEntry.addCategory(MODEL.DIGEST.uri, dsv.getChecksum(), null); } // include size if it's non-zero if (dsv.DSSize != 0) { dsvEntry.addCategory(MODEL.LENGTH.uri, Long .toString(dsv.DSSize), null); } setContent(dsvEntry, dsv); } // The "main" entry for the Datastream with a link to the atom:id // of the most recent datastream version dsEntry.setId(m_pid.toURI() + "/" + latestCreated.DatastreamID); dsEntry.setTitle(latestCreated.DatastreamID); dsEntry.setUpdated(latestCreated.DSCreateDT); dsEntry .addLink(m_pid.toURI() + "/" + latestCreated.DatastreamID + "/" + DateUtility .convertDateToString(latestCreated.DSCreateDT), Link.REL_ALTERNATE); dsEntry.addCategory(MODEL.STATE.uri, latestCreated.DSState, null); dsEntry.addCategory(MODEL.CONTROL_GROUP.uri, latestCreated.DSControlGrp, null); dsEntry.addCategory(MODEL.VERSIONABLE.uri, Boolean .toString(latestCreated.DSVersionable), null); } addAuditDatastream(); } /** * AUDIT datastream is rebuilt from the latest in-memory audit trail which * is a separate array list in the DigitalObject class. Audit trail * datastream re-created from audit records. There is only ONE version of * the audit trail datastream * * @throws ObjectIntegrityException * @throws StreamIOException */ private void addAuditDatastream() throws ObjectIntegrityException, StreamIOException { if (m_obj.getAuditRecords().size() == 0) { return; } String dsId = m_pid.toURI() + "/AUDIT"; String dsvId = dsId + "/" + DateUtility .convertDateToString(m_obj.getCreateDate()); Entry dsEntry = m_feed.addEntry(); dsEntry.setId(dsId); dsEntry.setTitle("AUDIT"); dsEntry.setUpdated(m_obj.getCreateDate()); // create date? dsEntry.addCategory(MODEL.STATE.uri, "A", null); dsEntry.addCategory(MODEL.CONTROL_GROUP.uri, "X", null); dsEntry.addCategory(MODEL.VERSIONABLE.uri, "false", null); dsEntry.addLink(dsvId, Link.REL_ALTERNATE); Entry dsvEntry = m_feed.addEntry(); dsvEntry.setId(dsvId); dsvEntry.setTitle("AUDIT.0"); dsvEntry.setUpdated(m_obj.getCreateDate()); ThreadHelper.addInReplyTo(dsvEntry, m_pid.toURI() + "/AUDIT"); dsvEntry.addCategory(MODEL.FORMAT_URI.uri, AUDIT1_0.uri, null); dsvEntry .addCategory(MODEL.LABEL.uri, "Audit Trail for this object", null); if (m_format.equals(ATOM_ZIP1_1)) { String name = "AUDIT.0.xml"; try { m_zout.putNextEntry(new ZipEntry(name)); Reader r = new StringReader(DOTranslationUtility.getAuditTrail(m_obj)); IOUtils.copy(r, m_zout, m_encoding); m_zout.closeEntry(); r.close(); } catch(IOException e) { throw new StreamIOException(e.getMessage(), e); } IRI iri = new IRI(name); dsvEntry.setSummary("AUDIT.0"); dsvEntry.setContent(iri, "text/xml"); } else { dsvEntry.setContent(DOTranslationUtility.getAuditTrail(m_obj), "text/xml"); } } private void setContent(Entry entry, Datastream vds) throws UnsupportedEncodingException, StreamIOException { if (vds.DSControlGrp.equalsIgnoreCase("X")) { setInlineXML(entry, (DatastreamXMLMetadata) vds); } else if (vds.DSControlGrp.equalsIgnoreCase("E") || vds.DSControlGrp.equalsIgnoreCase("R")) { setReferencedContent(entry, vds); } else if (vds.DSControlGrp.equalsIgnoreCase("M")) { setManagedContent(entry, vds); } } private void setInlineXML(Entry entry, DatastreamXMLMetadata ds) throws UnsupportedEncodingException, StreamIOException { String content; if (m_obj.hasContentModel( Models.SERVICE_DEPLOYMENT_3_0) && (ds.DatastreamID.equals("SERVICE-PROFILE") || ds.DatastreamID .equals("WSDL"))) { content = DOTranslationUtility .normalizeInlineXML(new String(ds.xmlContent, m_encoding), m_transContext); } else { content = new String(ds.xmlContent, m_encoding); } if (m_format.equals(ATOM_ZIP1_1)) { String name = ds.DSVersionID + ".xml"; try { m_zout.putNextEntry(new ZipEntry(name)); InputStream is = new ByteArrayInputStream(content.getBytes(m_encoding)); IOUtils.copy(is, m_zout); m_zout.closeEntry(); is.close(); } catch(IOException e) { throw new StreamIOException(e.getMessage(), e); } IRI iri = new IRI(name); entry.setSummary(ds.DSVersionID); entry.setContent(iri, ds.DSMIME); } else { entry.setContent(content, ds.DSMIME); } } private void setReferencedContent(Entry entry, Datastream vds) throws StreamIOException { entry.setSummary(vds.DSVersionID); String dsLocation = StreamUtility.enc(DOTranslationUtility .normalizeDSLocationURLs(m_obj.getPid(), vds, m_transContext).DSLocation); IRI iri = new IRI(dsLocation); entry.setContent(iri, vds.DSMIME); } private void setManagedContent(Entry entry, Datastream vds) throws StreamIOException { // If the ARCHIVE context is selected, inline & base64 encode the content, // unless the format is ZIP. if (m_transContext == DOTranslationUtility.SERIALIZE_EXPORT_ARCHIVE && !m_format.equals(ATOM_ZIP1_1)) { String mimeType = vds.DSMIME; if (MimeTypeHelper.isText(mimeType) || MimeTypeHelper.isXml(mimeType)) { try { entry.setContent(IOUtils.toString(vds.getContentStream(), m_encoding), mimeType); } catch (IOException e) { throw new StreamIOException(e.getMessage(), e); } } else { entry.setContent(vds.getContentStream(), mimeType); } } else { String dsLocation; IRI iri; if (m_format.equals(ATOM_ZIP1_1) && m_transContext != DOTranslationUtility.AS_IS) { dsLocation = vds.DSVersionID + "." + MimeTypeUtils.fileExtensionForMIMEType(vds.DSMIME); try { m_zout.putNextEntry(new ZipEntry(dsLocation)); IOUtils.copy(vds.getContentStream(), m_zout); m_zout.closeEntry(); } catch(IOException e) { throw new StreamIOException(e.getMessage(), e); } } else { dsLocation = StreamUtility.enc(DOTranslationUtility .normalizeDSLocationURLs(m_obj.getPid(), vds, m_transContext).DSLocation); } iri = new IRI(dsLocation); entry.setSummary(vds.DSVersionID); entry.setContent(iri, vds.DSMIME); } } }