package com.hua.goddess.utils;

import java.util.ArrayList;

import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;

import com.hua.goddess.vo.CommentVO;
import com.hua.goddess.vo.NewsContentVo;

/**
 * Converts HTML fragments (news article bodies and comment lists) into value objects
 * using jsoup.
 */
public class HtmlResolving {

    /** Value passed to {@code NewsContentVo.setIsImg} for a text entry. */
    private static final int TYPE_TEXT = 0;

    /** Value passed to {@code NewsContentVo.setIsImg} for an image entry. */
    private static final int TYPE_IMAGE = 1;

    /**
     * Parses the HTML of a news article into an ordered list of content entries.
     *
     * <p>The text of every {@code <span>} element is emitted first, as text entries. Then each
     * {@code <p>} element is visited in document order: a paragraph that has text becomes a text
     * entry; a paragraph without text that carries an {@code align} attribute consumes the next
     * element from the document-wide list of elements having a {@code src} attribute, and an
     * image entry (holding the {@code src} value) is added when that element is an {@code <img>}.
     *
     * @param news_detaiol HTML of the article; {@code null} yields an empty list
     * @return the parsed entries, never {@code null}
     */
    public ArrayList<NewsContentVo> getNewsContent(String news_detaiol) {
        ArrayList<NewsContentVo> contents = new ArrayList<NewsContentVo>();
        if (news_detaiol == null) {
            // Jsoup.parse rejects null input; treat it as "nothing to parse".
            return contents;
        }

        Document document = Jsoup.parse(news_detaiol);

        for (Element span : document.getElementsByTag("span")) {
            contents.add(newEntry(TYPE_TEXT, span.text()));
        }

        Elements paragraphs = document.getElementsByTag("p");
        Elements media = document.select("[src]");

        // NOTE(review): the index starts at 1, so the first [src] element in the document is
        // never used, and the index advances even when the element is not an <img>. This is
        // kept exactly as the original behaved -- presumably the first [src] element is not
        // part of the article body; confirm against real article markup.
        int mediaIndex = 1;
        for (Element paragraph : paragraphs) {
            if (paragraph.hasText()) {
                contents.add(newEntry(TYPE_TEXT, paragraph.text()));
                continue;
            }
            if (paragraph.hasAttr("align") && media.size() > mediaIndex) {
                Element src = media.get(mediaIndex);
                if (src.tagName().equals("img")) {
                    contents.add(newEntry(TYPE_IMAGE, src.attr("src")));
                }
                mediaIndex++;
            }
        }
        return contents;
    }

    /**
     * Parses the HTML of a comment list into comment value objects.
     *
     * <p>Each element with class {@code content} yields one comment: the text of its first child
     * element is used as the time, the text of its second child element as the name, and the
     * element's own text (excluding text of its children) as the comment body. When a child is
     * missing, the corresponding field is set to an empty string instead of failing.
     *
     * @param comments HTML of the comment list; {@code null} yields an empty list
     * @return the parsed comments, never {@code null}
     */
    public ArrayList<CommentVO> getCommentContent(String comments) {
        ArrayList<CommentVO> comm = new ArrayList<CommentVO>();
        if (comments == null) {
            // Jsoup.parse rejects null input; treat it as "nothing to parse".
            return comm;
        }

        Document document = Jsoup.parse(comments);
        for (Element element : document.getElementsByClass("content")) {
            // Element.child(int) throws when the index is out of range, so look the
            // children up once and fall back to "" for any that are absent.
            Elements children = element.children();

            CommentVO cvo = new CommentVO();
            cvo.setTime(children.size() > 0 ? children.get(0).text() : "");
            cvo.setName(children.size() > 1 ? children.get(1).text() : "");
            cvo.setContent(element.ownText());
            comm.add(cvo);
        }
        return comm;
    }

    /** Builds a single content entry with the given type flag and payload. */
    private static NewsContentVo newEntry(int isImg, String value) {
        NewsContentVo entry = new NewsContentVo();
        entry.setIsImg(isImg);
        entry.setContentList(value);
        return entry;
    }
}