/** * OLAT - Online Learning and Training<br> * http://www.olat.org * <p> * Licensed under the Apache License, Version 2.0 (the "License"); <br> * you may not use this file except in compliance with the License.<br> * You may obtain a copy of the License at * <p> * http://www.apache.org/licenses/LICENSE-2.0 * <p> * Unless required by applicable law or agreed to in writing,<br> * software distributed under the License is distributed on an "AS IS" BASIS, <br> * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. <br> * See the License for the specific language governing permissions and <br> * limitations under the License. * <p> * Copyright (c) since 2004 at Multimedia- & E-Learning Services (MELS),<br> * University of Zurich, Switzerland. * <hr> * <a href="http://www.openolat.org"> * OpenOLAT - Online Learning and Training</a><br> * This file has been modified by the OpenOLAT community. Changes are licensed * under the Apache 2.0 license as the original file. */ package org.olat.search.service.document.file; import java.io.IOException; import java.io.InputStream; import org.apache.lucene.document.Document; import org.olat.core.gui.util.CSSHelper; import org.olat.core.logging.OLog; import org.olat.core.logging.Tracing; import org.olat.core.util.FileUtils; import org.olat.core.util.filter.impl.NekoHTMLFilter; import org.olat.core.util.filter.impl.NekoHTMLFilter.NekoContent; import org.olat.core.util.vfs.VFSLeaf; import org.olat.search.service.SearchResourceContext; /** * Lucene document mapper. * @author Christian Guretzki */ public class XmlDocument extends FileDocument { private static final long serialVersionUID = -5486191227086694167L; private static final OLog log = Tracing.createLoggerFor(XmlDocument.class); public static final String FILE_TYPE = "type.file.html"; public XmlDocument() { // } public static Document createDocument(SearchResourceContext leafResourceContext, VFSLeaf leaf) throws IOException,DocumentException,DocumentAccessException { XmlDocument htmlDocument = new XmlDocument(); htmlDocument.init(leafResourceContext,leaf); htmlDocument.setFileType(FILE_TYPE); htmlDocument.setCssIcon(CSSHelper.createFiletypeIconCssClassFor(leaf.getName())); if (log.isDebug() ) log.debug(htmlDocument.toString()); return htmlDocument.getLuceneDocument(); } //fxdiff FXOLAT-97: index run in infinite loop protected FileContent readContent(VFSLeaf leaf) throws IOException { InputStream is = leaf.getInputStream(); // Remove all HTML and   Tags NekoContent output; try { output = new NekoHTMLFilter().filter(is); if (log.isDebug() ) log.debug("HTML content without tags :" + output); } catch (Exception e) { throw new IOException(e); } finally { FileUtils.closeSafely(is); } return new FileContent(output.getTitle(), output.getContent()); } }