/* * Copyright 2010-2011 Øyvind Berg (elacin@gmail.com) * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.elacin.pdfextract; /** * Created by IntelliJ IDEA. User: elacin Date: 16.01.11 Time: 19.57 To change this template use * File | Settings | File Templates. */ @SuppressWarnings({ "RedundantFieldInitialization" }) public class Constants { /* column finder */ public static final float COLUMNS_MIN_COLUMN_WIDTH = 2.0f; public static final int RENDER_DPI = 2*72; public static final int RENDER_RESOLUTION = 100; public static final String SIMPLE_OUTPUT_EXTENSION = ".pxml"; public static final String TEI_OUTPUT_EXTENSION = ".xml"; // ------------------------------ FIELDS ------------------------------ /* segmentation */ public static final boolean USE_EXISTING_WHITESPACE = true; public static final boolean SPLIT_PARAGRAPHS_BY_STYLES = true; /* what to render */ public static final boolean RENDER_WHITESPACE = true; public static final boolean RENDER_REAL_PAGE = true; public static final boolean RENDER_PARAGRAPHS = false; public static final boolean RENDER_PARAGRAPH_NUMBERS = false; public static final boolean RENDER_PAGE_REGIONS = false; public static final boolean RENDER_LINE_NODES = true; public static final boolean RENDER_GRAPHIC_NODES = true; public static final boolean RENDER_WORD_NODES = true; /* rendering */ public static final boolean RENDER_ENABLED = false; public static final boolean RENDER_COLUMNS = true; public static final boolean RENDER_COLUMN_CANDIDATES = false; /* technical */ public static final boolean RECTANGLE_COLLECTION_CACHE_ENABLED = true; /* xmls output */ public static final boolean VERBOSE_OUTPUT = false; public static final boolean TEI_OUTPUT_ENABLED = true; public static final boolean SIMPLE_OUTPUT_ENABLED = true; public static final boolean ESCAPE_HTML = false; /* whitespace cover algorithm */ public static final boolean WHITESPACE_CHECK_LOCAL_HEIGHT = true; public static final boolean WHITESPACE_CHECK_TEXT_BOTH_SIDES = true; public static final boolean WHITESPACE_CHECK_CONNECTED_FROM_EDGE = true; public static final float WHITESPACE_FUZZINESS = 0.2f; public static final boolean WHITESPACE_FUZZY_EMPTY_CHECK = true; public static final float WHITESPACE_OBSTACLE_OVERLAP = 1.5f; public static final int WHITESPACE_MAX_QUEUE_SIZE = 100000; public static final int WHITESPACE_NUMBER_WANTED = 50; public static final boolean WHITESPACE_USE_WHOLE_PAGE = false; /* columns */ public static final boolean COLUMNS_ENABLE_TEXT_SPLIT_CHECK = true; public static final boolean COLUMNS_ENABLE_COLUMN_HEIGHT_ADJUSTMENT = true; public static final boolean COLUMNS_ENABLE_COLUMN_DETECTION = true; }