/******************************************************************************
 * Copyright (c) 2010 Basis Technology Corp.
 *
 * Basis Technology Corp. licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package com.basistech.readability;

/**
 * Contract for components that read HTML pages and return their content
 * as text.
 */
public interface PageReader {

    /**
     * Reads the content of the page identified by {@code url}.
     *
     * <p>Dealing with the page's character set is the responsibility of
     * the implementation, not of the caller.
     *
     * <p>NOTE(review): earlier documentation of this method stated that
     * problems are logged and reported by returning {@code null}, while the
     * signature declares {@link PageReadException}. Until that is confirmed
     * against the implementations, callers should be prepared for either
     * outcome.
     *
     * @param url the location of the page to read
     * @return the content of the page
     * @throws PageReadException declared for failures while reading the
     *         page; see the review note above regarding {@code null} returns
     */
    String readPage(String url) throws PageReadException;

    /**
     * Supplies the character set detector for this reader.
     *
     * <p>NOTE(review): presumably the detector is consulted by
     * {@link #readPage(String)} when it deals with the page's charset;
     * confirm against the implementations.
     *
     * @param detector the character set detector to provide to this reader
     */
    void setCharsetDetector(PageCharsetDetector detector);
}