/* * Copyright (C) 2009 Google Inc. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.google.sites.liberation.parsers; import static com.google.common.base.Preconditions.checkNotNull; import static com.google.sites.liberation.parsers.ParserUtils.hasClass; import com.google.gdata.data.Person; import org.w3c.dom.Element; import org.w3c.dom.Node; import org.w3c.dom.NodeList; /** * Implements AuthorParser to parse an html element for authorship. * * @author bsimon@google.com (Benjamin Simon) */ final class AuthorParserImpl implements AuthorParser { @Override public Person parseAuthor(Element element) { checkNotNull(element); Person author = new Person(); parseElement(element, author); return author; } /** * Parses the given element and populates the given Person object accordingly. */ private void parseElement(Element element, Person author) { NodeList nodeList = element.getChildNodes(); for (int i = 0; i < nodeList.getLength(); i++) { Node node = nodeList.item(i); if (node.getNodeType() == Node.ELEMENT_NODE) { Element child = (Element) node; if (hasClass(child, "vcard")) { parseHCard(child, author); } else { parseElement(child, author); } } } } private void parseHCard(Element element, Person author) { NodeList nodeList = element.getChildNodes(); for (int i = 0; i < nodeList.getLength(); i++) { Node node = nodeList.item(i); if (node.getNodeType() == Node.ELEMENT_NODE) { Element child = (Element) node; if (hasClass(child, "fn")) { author.setName(child.getTextContent()); String href = child.getAttribute("href"); if (href.startsWith("mailto:") && (author.getEmail() == null)) { author.setEmail(href.substring(7)); } } else if (hasClass(child, "n")) { author.setName(child.getTextContent()); } else if (hasClass(child, "email")) { author.setEmail(child.getTextContent()); } else { parseHCard(child, author); } } } } }