HTMLParser.java example

Explorer

lwuit-master
- Apps
  - Browser
    - BrowserDesktop
      - src
        com
        sun
        lwuit
        browser
        Main.java
    - BrowserMIDP
      - src
        com
        sun
        lwuit
        browser
        Browser.java
    - BrowserRIM
      - src
        com
        sun
        lwuit
        browser
        Browser.java
    - src
      - com
        sun
        lwuit
        browser
        BrowserApp.java
        BrowserForm.java
        BrowserStorage.java
        BrowserToolbar.java
        ExtHTMLComponent.java
        HttpRequestHandler.java
  - IODemo
    - src
      - net
        java
        lwuit
        demo
        iodemo
        Main.java
        MainMIDlet.java
        ResultRenderer.java
  - LWUITBrowser
    - src
      - com
        sun
        lwuit
        browser
        BrowserForm.java
        BrowserMIDlet.java
        BrowserToolbar.java
        ExtHTMLComponent.java
        HttpRequestHandler.java
        Storage.java
  - LWUITDemo
    - LWUITDemoCDC
      - src
        com
        sun
        lwuit
        uidemo
        LWUITXlet.java
    - LWUITDemoDesktop
      - src
        com
        sun
        lwuit
        uidemo
        LWUITApplet.java
        Main.java
    - LWUITDemoMIDP
      - src
        com
        sun
        lwuit
        uidemo
        Main.java
    - LWUITDemoRIM
      - src
        com
        sun
        lwuit
        uidemo
        Main.java
    - src
      - com
        sun
        lwuit
        uidemo
        AnimationDemo.java
        ButtonsDemo.java
        Demo.java
        DialogDemo.java
        FontDemo.java
        HTMLDemo.java
        LayoutDemo.java
        RenderingDemo.java
        ScrollDemo.java
        TableDemo.java
        TabsDemo.java
        ThemeDemo.java
        TransitionDemo.java
        TreeDemo.java
        UIDemoMain.java
  - LWUITSpeed
    - src
      - net
        java
        dev
        lwuit
        speed
        BitmapFontRate.java
        ComponentTest.java
        DrawingRate.java
        Framerate3D.java
        FramerateTest.java
        GradientRate.java
        IndexedImageTest.java
        ListTest.java
        ResultsForm.java
        ScalingRate.java
        SpeedMIDlet.java
  - Makeover
    - MakeoverDesktop
      - src
        com
        sun
        me
        web
        sample
        local
        Main.java
    - MakeoverMIDP
      - src
        com
        sun
        me
        web
        sample
        local
        Main.java
    - MakeoverRIM
      - src
        com
        sun
        me
        web
        sample
        local
        Main.java
    - src
      - com
        sun
        me
        web
        sample
        local
        InfiniteProgressIndicator.java
        LocalApp.java
  - TimeZone
    - Desktop
      - src
        desktop
        LWUITApplet.java
        Main.java
    - MIDP
      - src
        userclasses
        MainMIDlet.java
    - RIM
      - src
        userclasses
        MainMIDlet.java
    - src
      - generated
        StateMachineBase.java
      - userclasses
        StateMachine.java
  - Tipster
    - Desktop
      - src
        desktop
        LWUITApplet.java
        Main.java
    - MIDP
      - src
        userclasses
        MainMIDlet.java
    - RIM
      - src
        userclasses
        MainMIDlet.java
    - src
      - generated
        StateMachineBase.java
      - userclasses
        StateMachine.java
- IO
  - src
    - com
      - sun
        lwuit
        io
        CacheMap.java
        ConnectionRequest.java
        Cookie.java
        Externalizable.java
        FileSystemStorage.java
        NetworkEvent.java
        NetworkManager.java
        Storage.java
        html
        AsyncDocumentRequestHandlerImpl.java
        impl
        IOImplementation.java
        PlatformImplementation.java
        services
        GoogleRESTService.java
        ImageDownloadService.java
        RSSService.java
        TwitterRESTService.java
        ui
        FileEncodedImage.java
        FileEncodedImageAsync.java
        FileTree.java
        FileTreeModel.java
        Progress.java
        RSSReader.java
        SliderBridge.java
        StorageImage.java
        WebBrowser.java
        util
        BufferedInputStream.java
        BufferedOutputStream.java
        IOProgressListener.java
        JSONParseCallback.java
        JSONParser.java
        Log.java
        Oauth2.java
        Util.java
- Ports
  - CDC_PBP
    - UI_CDC
      - src
        com
        sun
        lwuit
        impl
        ImplementationFactory.java
        cdc
        CDCImplementation.java
  - MIDP
    - IO_MIDP
      - src
        com
        sun
        lwuit
        io
        impl
        MIDPImpl.java
        PlatformImplementation.java
    - UI
      - src
        com
        sun
        lwuit
        M3G.java
        animations
        Transition3D.java
        impl
        ImplementationFactory.java
        midp
        CanvasImplementation.java
        GameCanvasImplementation.java
        MMAPIPlayer.java
        SVGImplementation.java
        SVGImplementationFactory.java
        VKBImplementationFactory.java
        VirtualKeyboard.java
        util
        Log.java
  - Nokia
    - IO_Nokia
      - src
        com
        sun
        lwuit
        io
        impl
        NokiaAPImplementation.java
        PlatformImplementation.java
    - NokiaIAP_API
      - src
        com
        nokia
        mid
        iapinfo
        AccessPoint.java
        IAPInfo.java
        IAPInfoException.java
  - RIM
    - IO_RIM
      - src
        com
        sun
        lwuit
        io
        impl
        PlatformImplementation.java
        RIMImplementation.java
    - UI_RIM
      - src
        com
        sun
        lwuit
        impl
        ImplementationFactory.java
        blackberry
        BlackBerryCanvas.java
        BlackBerryImplementation.java
        BlackBerryTouchImplementation.java
        BlackBerryTouchSupport.java
        BlackBerryVirtualKeyboard.java
        MMAPIPlayer.java
  - SE
    - IO_SE
      - src
        com
        sun
        lwuit
        io
        impl
        PlatformImplementation.java
    - UI_SE
      - src
        com
        sun
        lwuit
        awtport
        AwtImpl.java
        impl
        ImplementationFactory.java
- UI
  - src
    - com
      - sun
        lwuit
        BrowserComponent.java
        Button.java
        ButtonGroup.java
        Calendar.java
        CheckBox.java
        ComboBox.java
        Command.java
        Component.java
        ComponentGroup.java
        Container.java
        CustomFont.java
        Dialog.java
        Display.java
        EncodedImage.java
        Font.java
        Form.java
        Graphics.java
        Image.java
        IndexedImage.java
        Label.java
        List.java
        M3G.java
        MediaComponent.java
        MenuBar.java
        Painter.java
        PeerComponent.java
        RGBImage.java
        RadioButton.java
        RunnableWrapper.java
        Slider.java
        StaticAnimation.java
        TabbedPane.java
        Tabs.java
        TextArea.java
        TextField.java
        VideoComponent.java
        VirtualKeyboard.java
        animations
        Animation.java
        AnimationObject.java
        CommonTransitions.java
        Motion.java
        Timeline.java
        Transition.java
        Transition3D.java
        events
        ActionEvent.java
        ActionListener.java
        DataChangedListener.java
        FocusListener.java
        SelectionListener.java
        StyleListener.java
        geom
        Dimension.java
        Rectangle.java
        html
        AsyncDocumentRequestHandler.java
        CSSBgPainter.java
        CSSElement.java
        CSSEngine.java
        CSSParser.java
        CSSParserCallback.java
        CellConstraint.java
        DefaultDocumentRequestHandler.java
        DefaultHTMLCallback.java
        DocumentInfo.java
        DocumentRequestHandler.java
        HTMLCallback.java
        HTMLComponent.java
        HTMLElement.java
        HTMLEventsListener.java
        HTMLFont.java
        HTMLForm.java
        HTMLImageMap.java
        HTMLInputFormat.java
        HTMLLink.java
        HTMLListItem.java
        HTMLParser.java
        HTMLTable.java
        HTMLTableModel.java
        HTMLUtils.java
        ImageMapData.java
        MultiComboBox.java
        OptionItem.java
        ResourceThreadQueue.java
        impl
        ImplementationFactory.java
        LWUITImplementation.java
        VirtualKeyboardInterface.java
        layouts
        BorderLayout.java
        BoxLayout.java
        CoordinateLayout.java
        FlowLayout.java
        GridLayout.java
        GroupLayout.java
        LayeredLayout.java
        Layout.java
        LayoutStyle.java
        list
        CellRenderer.java
        ContainerList.java
        DefaultListCellRenderer.java
        DefaultListModel.java
        GenericListCellRenderer.java
        ListCellRenderer.java
        ListModel.java
        painter
        BackgroundPainter.java
        PainterChain.java
        plaf
        Border.java
        DefaultLookAndFeel.java
        LookAndFeel.java
        Style.java
        UIManager.java
        spinner
        DateTimeRenderer.java
        Spinner.java
        SpinnerDateModel.java
        SpinnerNumberModel.java
        table
        DefaultTableModel.java
        Table.java
        TableLayout.java
        TableModel.java
        tree
        Tree.java
        TreeModel.java
        util
        Effects.java
        EmbeddedContainer.java
        EventDispatcher.java
        Resources.java
        UIBuilder.java
        xml
        Element.java
        ParserCallback.java
        XMLParser.java
- tools

/*
 * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.  Oracle designates this
 * particular file as subject to the "Classpath" exception as provided
 * by Oracle in the LICENSE file that accompanied this code.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores
 * CA 94065 USA or visit www.oracle.com if you need additional information or
 * have any questions.
 */
package com.sun.lwuit.html;

import com.sun.lwuit.xml.Element;
import com.sun.lwuit.xml.XMLParser;
import java.io.IOException;
import java.io.InputStreamReader;
import java.io.Reader;

/**
 * The HTMLParser class is used to parse an XHTML-MP 1.0 document into a DOM object (Element).
 * Unsupported tags and attributes as well as comments are dropped in the parsing process.
 * The parser also makes use of CSSParser for embedded CSS segments (the content of 'style' tags),
 * provided it has been paired with an HTMLComponent.
 *
 * @author Ofir Leitner
 */
public class HTMLParser extends XMLParser {

    /**
     * The HTMLComponent that uses this parser.
     * Remains null until {@link #setHTMLComponent(HTMLComponent)} is called with a non-null value.
     */
    HTMLComponent htmlC;

    /**
     * The list of empty tags (tags that naturally don't have any children).
     * This is used to enable empty tags to be closed also in a non-strict way (i.e. &lt;br&gt; instead of &lt;br/&gt;).
     * Some of these tags are not a part of the XHTML-MP 1.0 standard, but including them here allows
     * smoother parsing if the document is not strictly XHTML-MP 1.0.
     */
    private static final String[] EMPTY_TAGS = {"br","link","meta","base","area","basefont","col","frame","hr","img","input","isindex","param"};

    /**
     * Constructs a new instance of HTMLParser
     */
    public HTMLParser() {
        // Add common char entities that are above the HTML 2.0 char entities range
        addCharEntity("bull", 8226);
        addCharEntity("euro", 8364);
        setIncludeWhitespacesBetweenTags(true);
    }

    /**
     * Pair this HTMLParser with the HTMLComponent that uses it.
     * This pairing is necessary to allow access to the htmlC in parseTagContent upon finding a CSS embedded segment.
     * Passing null removes the current pairing; passing a non-null component while already paired is rejected.
     *
     * @param htmlC The HTMLComponent that uses this parser, or null to unpair
     * @throws IllegalStateException if htmlC is not null and this parser is already paired with an HTMLComponent
     */
    void setHTMLComponent(HTMLComponent htmlC) {
        if ((htmlC != null) && (this.htmlC != null)) {
            throw new IllegalStateException("This HTMLParser is already paired with an HTMLComponent");
        }
        this.htmlC = htmlC;
    }

    /**
     * Overrides XMLParser.parseTagContent to enable embedded CSS segments (Style tags).
     * When CSS is supported, the parser is paired with an HTMLComponent that loads CSS, and the
     * element is a 'style' tag, the tag content is handed to CSSParser and the result is added to the
     * component's embedded CSS. In every other case the content is parsed by the super implementation.
     *
     * @param element The current parent element
     * @param is The reader containing the XML
     * @throws IOException if an I/O error in the stream is encountered
     */
    protected void parseTagContent(Element element, Reader is) throws IOException {
        // htmlC is null when the parser was never paired (or was unpaired); without a component there is
        // nowhere to store embedded CSS, so skip the CSS branch instead of failing with a NullPointerException.
        // We aren't strict and don't require type="text/css" on the style tag.
        if ((HTMLComponent.SUPPORT_CSS) && (htmlC != null) && (htmlC.loadCSS)
                && (((HTMLElement) element).getTagId() == HTMLElement.TAG_STYLE)) {
            CSSElement embeddedCSS = CSSParser.getInstance().parseCSSSegment(is, null, htmlC, null);
            htmlC.addToEmebeddedCSS(embeddedCSS);
            return;
        }

        super.parseTagContent(element, is);
    }

    /**
     * Overrides XMLParser.createNewElement to return an HTMLElement instance
     *
     * @param name The HTMLElement's name
     * @return a new instance of the named HTMLElement
     */
    protected Element createNewElement(String name) {
        return new HTMLElement(name);
    }

    /**
     * Overrides XMLParser.createNewTextElement to return an HTMLElement instance
     *
     * @param text The HTMLElement's text
     * @return a new instance of the HTMLElement
     */
    protected Element createNewTextElement(String text) {
        return new HTMLElement(text, true);
    }

    /**
     * Overrides XMLParser.convertCharEntity to add in HTML char entities.
     * The conversion is first attempted with HTMLUtils; if that rejects the entity with an
     * IllegalArgumentException, the super implementation is used instead.
     *
     * @param charEntity The char entity to convert
     * @return A string containing a single char, or the original char entity string (with & and ;) if the char entity couldn't be resolved
     */
    protected String convertCharEntity(String charEntity) {
        try {
            return HTMLUtils.convertCharEntity(charEntity, true, null);
        } catch (IllegalArgumentException iae) {
            // Not resolvable as an HTML entity - let the generic XML parser handle it
            return super.convertCharEntity(charEntity);
        }
    }

    /**
     * Checks whether the specified tag is an empty tag as defined in EMPTY_TAGS.
     * The comparison is case sensitive.
     *
     * @param tagName The tag name to check (a null name is never an empty tag)
     * @return true if that tag is defined as an empty tag, false otherwise
     */
    protected boolean isEmptyTag(String tagName) {
        for (int i = 0; i < EMPTY_TAGS.length; i++) {
            // Comparing from the constant side keeps a null tagName from throwing
            if (EMPTY_TAGS[i].equals(tagName)) {
                return true;
            }
        }
        return false;
    }

    /**
     * A convenience method that casts the returned type of the parse method to HTMLElement.
     * Basically calling this method is similar to calling parse and casting to HTMLElement.
     *
     * @param isr The input stream containing the HTML
     * @return The HTML document
     */
    public HTMLElement parseHTML(InputStreamReader isr) {
        return (HTMLElement) super.parse(isr);
    }

    /**
     * {@inheritDoc}
     */
    protected String getSupportedStandardName() {
        return "XHTML-MP 1.0";
    }

    /**
     * Lets the parser know which tags are supported in XHTML-MP 1.0.
     *
     * @param element The element to check, expected to be an HTMLElement
     * @return true if the element's tag id is anything other than HTMLElement.TAG_UNSUPPORTED, false otherwise
     */
    protected boolean isSupported(Element element) {
        return (((HTMLElement) element).getTagId() != HTMLElement.TAG_UNSUPPORTED);
    }

    /**
     * Returns false for the script tag so that it is skipped entirely, since it may contain characters
     * like greater-than and lesser-than which may break the HTML.
     * All other tags are evaluated (i.e. added including all their children to the tree), even if not supported
     * (but of course their functionality is ignored by HTMLComponent).
     *
     * @param element The element to check, expected to be an HTMLElement
     * @return false if the element has an unsupported tag id and is named "script" (ignoring case), true otherwise
     */
    protected boolean shouldEvaluate(Element element) {
        boolean supportedTag = ((HTMLElement) element).getTagId() != HTMLElement.TAG_UNSUPPORTED;
        // Literal-first comparison so that an element without a tag name does not throw
        return supportedTag || (!"script".equalsIgnoreCase(element.getTagName()));
    }

}