SafeHtml.java example

Explorer

jforum3-master
- src
  - main
    - java
      - net
        jforum
        actions
        extensions
        TopicWatchExtension.java
        helpers
        ActionUtils.java
        Actions.java
        ApproveInfo.java
        AttachedFile.java
        Domain.java
        PostFormOptions.java
        interceptors
        ControllerSecurityInterceptor.java
        ExtendsAnnotationInterceptor.java
        MethodSecurityInterceptor.java
        SecurityInterceptor.java
        SessionManagerInterceptor.java
        api
        JForumExecutionContext.java
        controllers
        AdminController.java
        AvatarAdminController.java
        BadWordAdminController.java
        BanlistAdminController.java
        CategoryAdminController.java
        ConfigController.java
        ForumAdminController.java
        ForumController.java
        GroupAdminController.java
        HibernateStatisticsController.java
        LuceneAdminController.java
        MessageController.java
        ModerationController.java
        PostController.java
        PostReportController.java
        PrivateMessageController.java
        RSSController.java
        RankingAdminController.java
        RecentTopicsController.java
        SearchController.java
        SmilieAdminController.java
        ThemeController.java
        TopicController.java
        UserAdminController.java
        UserController.java
        core
        PageExtensionRedirectFilter.java
        Role.java
        SecurityConstraint.java
        SessionManager.java
        UrlPattern.java
        UserSessionListener.java
        VRaptorCustomPathResolver.java
        VRaptorSpringProvider.java
        events
        category
        NewCategoryGroupPermissionsEvent.java
        forum
        NewForumGroupPermissionsEvent.java
        post
        BadWordEvent.java
        ForumPostEvent.java
        TopicPostEvent.java
        TopicReplyEvent.java
        TopicWatchPostEvent.java
        topic
        ForumTopicEvent.java
        TopicWatchTopicEvent.java
        exceptions
        AccessRuleException.java
        DatabaseException.java
        ForumException.java
        MailException.java
        ValidationException.java
        support
        hibernate
        CacheEvictionRules.java
        QueryCache.java
        QueryCacheFactory.java
        SessionFactoryCreator.java
        SpringInterceptor.java
        SpringSessionFactory.java
        spring
        HttpServletRequestFactoryBean.java
        HttpServletResponseFactoryBean.java
        RoleManagerFactoryBean.java
        tags
        DisplayCategoriesTag.java
        DisplayFormattedMessageTag.java
        DisplayForumsTag.java
        FormatSignatureTag.java
        Functions.java
        I18nTag.java
        ImportFileTag.java
        ImportResponseWrapper.java
        JForumTag.java
        SettingsTag.java
        TemplateResourceTag.java
        URLTag.java
        entities
        Attachment.java
        AttachmentExtension.java
        AttachmentExtensionGroup.java
        AttachmentQuota.java
        Avatar.java
        AvatarType.java
        BadWord.java
        Banlist.java
        Category.java
        Config.java
        Forum.java
        ForumStats.java
        ForumWatch.java
        Group.java
        ModerationLog.java
        ModerationLogType.java
        MostUsersEverOnline.java
        Poll.java
        PollOption.java
        PollVoter.java
        Post.java
        PostReport.java
        PostReportStatus.java
        PrivateMessage.java
        PrivateMessageType.java
        Ranking.java
        Role.java
        Session.java
        Smilie.java
        Theme.java
        Topic.java
        TopicWatch.java
        User.java
        UserSession.java
        util
        PaginatedResult.java
        Pagination.java
        SearchMatchType.java
        SearchParams.java
        SearchResult.java
        SearchSort.java
        SearchSortType.java
        events
        EmptyCategoryEvent.java
        EmptyForumEvent.java
        EmptyPostEvent.java
        EmptyTopicEvent.java
        Event.java
        listeners
        AbstractListener.java
        CategoryEventListener.java
        ForumEventListener.java
        PostEventListener.java
        TopicEventListener.java
        extensions
        ActionExtension.java
        ActionExtensionManager.java
        Extends.java
        PostReportCounterOperation.java
        RequestOperation.java
        RequestOperationChain.java
        formatters
        BBCode.java
        BBCodeConfigParser.java
        BBConfigFormatter.java
        Formatter.java
        HtmlEntitiesFormatter.java
        NewLineToHtmlBreakFormatter.java
        PostFormatters.java
        PostOptions.java
        SafeHtmlAttributesFormatter.java
        SafeHtmlTagsFormatter.java
        SmiliesFormatter.java
        plugins
        post
        ForumAdminExtension.java
        ForumLimitedTime.java
        ForumLimitedTimeRepository.java
        PostEditInterceptor.java
        repository
        AttachmentRepository.java
        AvatarRepository.java
        BadWordRepository.java
        BanlistRepository.java
        CategoryRepository.java
        ConfigRepository.java
        ForumRepository.java
        GroupRepository.java
        HibernateGenericDAO.java
        ModerationLogRepository.java
        PollRepository.java
        PostReportRepository.java
        PostRepository.java
        PrivateMessageRepository.java
        RSSRepository.java
        RankingRepository.java
        RecentTopicsRepository.java
        Repository.java
        SearchRepository.java
        SessionRepository.java
        SmilieRepository.java
        ThemeRepository.java
        TopicRepository.java
        TopicWatchRepository.java
        UserRepository.java
        security
        AccessForumRule.java
        AccessRule.java
        AdministrationRule.java
        AuthenticatedRule.java
        ChangePostRule.java
        CreateNewTopicRule.java
        DownloadAttachmentRule.java
        EditUserRule.java
        EmptyRule.java
        ModerationRule.java
        PrivateMessageEnabledRule.java
        PrivateMessageOwnerRule.java
        ReplyTopicRule.java
        RoleManager.java
        TopicFilter.java
        services
        AttachmentService.java
        AvatarService.java
        CategoryService.java
        ConfigService.java
        ForumService.java
        GroupService.java
        LostPasswordService.java
        MessageFormatService.java
        ModerationLogService.java
        ModerationService.java
        MostUsersEverOnlineService.java
        PollService.java
        PostService.java
        PrivateMessageService.java
        RSSService.java
        RankingService.java
        SmilieService.java
        TopicService.java
        TopicWatchService.java
        UserService.java
        sso
        DefaultLoginAuthenticator.java
        LoginAuthenticator.java
        RemoteUserSSO.java
        SSO.java
        SSOUtils.java
        util
        CategoryOrderComparator.java
        ConfigKeys.java
        GroupInteractionFilter.java
        I18n.java
        ImageInfo.java
        ImageUtils.java
        JForumConfig.java
        MD5.java
        SafeHtml.java
        SecurityConstants.java
        URLBuilder.java
        UploadUtils.java
        mail
        ActivationKeySpammer.java
        EmailSenderTask.java
        IdentifiableMimeMessage.java
        LostPasswordSpammer.java
        MessageId.java
        PrivateMessageSpammer.java
        Spammer.java
        SpammerFactory.java
        SpammerTaskExecutor.java
        TopicReplySpammer.java
  - test
    - java
      - net
        jforum
        actions
        extensions
        TopicWatchExtensionTestCase.java
        helpers
        PaginationTestCase.java
        bbcode
        AutoEmail_TestCase.java
        BBCodeConfigParserTestCase.java
        B_TestCase.java
        Color_TestCase.java
        DescriptiveUrl_TestCase.java
        Google_TestCase.java
        HtmlEntitiesFormatterTestCase.java
        IMG_TestCase.java
        I_TestCase.java
        NewLineToHtmBreakFormatterTestCase.java
        SimpleUrl_TestCase.java
        Size_TestCase.java
        SmiliesFormatterTestCase.java
        TagBaseTest.java
        U_TestCase.java
        YouTube_TestCase.java
        controllers
        AdminControllerTestCase.java
        AdminTestCase.java
        AvatarAdminControllerTestCase.java
        BadWordControllerActionsTestCase.java
        BanlistAdminControllerTestCase.java
        CategoryAdminControllerTestCase.java
        ForumAdminControllerTestCase.java
        ForumControllerTestCase.java
        GroupAdminControllerTestCase.java
        MessageControllerTestCase.java
        ModerationControllerTestCase.java
        PostControllerTestCase.java
        PostReportControllerTestCase.java
        PrivateMessageControllerTestCase.java
        RSSControllerTestCase.java
        RankingAdminControllerTestCase.java
        RecentTopicsControllerTestCase.java
        SearchControllerTestCase.java
        SmilieAdminControllerTestCase.java
        TopicControllerTestCase.java
        UserAdminControllerTestCase.java
        UserControllerTestCase.java
        core
        SessionManagerTestCase.java
        events
        category
        NewCategoryGroupPermissionsEventTestCase.java
        forum
        NewForumGroupPermissionsEventTestCase.java
        post
        BadWordEventTestCase.java
        ForumPostEventTestCase.java
        TopicPostEventTestCase.java
        TopicWatchPostEventTestCase.java
        topic
        ForumTopicEventTestCase.java
        TopicWatchTopicEventTestCase.java
        hibernate
        AbstractDAOTestCase.java
        AvatarDAOTestCase.java
        BadWordDAOTestCase.java
        BanlistDAOTestCase.java
        CategoryDAOTestCase.java
        ConfigDAOTestCase.java
        ForumDAOTestCase.java
        GroupDAOTestCase.java
        PostDAOTestCase.java
        PostReportDAOTestCase.java
        PrivateMessageDAOTestCase.java
        RSSDAOTestCase.java
        RankingDAOTestCase.java
        RecentTopicsDAOTestCase.java
        SessionDAOTestCase.java
        SmilieDAOTestCase.java
        TopicDAOTestCase.java
        TopicWatchDAOTestCase.java
        UserDAOTestCase.java
        tests
        EmptyCache.java
        EmptyCacheProvider.java
        support
        hibernate
        CacheEvictionRulesTestCase.java
        entities
        ForumTestCase.java
        GroupTestCase.java
        SearchParamsTest.java
        TopicTestCase.java
        UserSessionTestCase.java
        extensions
        PostReportCounterOperationTestCase.java
        plugins
        post
        ForumAdminTestCase.java
        FourmLimitedTimeDAOTestCase.java
        security
        AccessForumRuleTestCase.java
        AdministrationRuleTestCase.java
        AuthenticatedRuleTestCase.java
        ChangePostRuleTestCase.java
        CreateNewTopicRuleTestCase.java
        EditUserRuleTestCase.java
        ModerationRuleTestCase.java
        PrivateMessageEnabledRuleTestCase.java
        PrivateMessageOwnerRuleTestCase.java
        ReplyTopicRuleTestCase.java
        RoleManagerTestCase.java
        services
        AvatarServiceTestCase.java
        CategoryServiceTestCase.java
        ForumServiceTestCase.java
        GroupServiceTestCase.java
        ModerationServiceTestCase.java
        MostUsersEverOnlineServiceTestCase.java
        PollServiceTestCase.java
        PostServiceTestCase.java
        PrivateMessageServiceTestCase.java
        RSSServiceTestCase.java
        RankingServiceTestCase.java
        SmilieServiceTestCase.java
        TopicServiceTestCase.java
        TopicWatchServiceTestCase.java
        UserServiceTestCase.java
        sso
        DefaultLoginAuthenticatorTestCase.java
        RemoteUserSSOTestCase.java
        util
        GroupInteractionFilterTestCase.java
        I18nTestCase.java
        JDBCLoader.java
        SafeHtmlTestCase.java
        TestCaseUtils.java
        mail
        LostPasswordSpammerTestCase.java
        MailTestCase.java
        TopicReplySpammerTestCase.java

/*
 * Copyright (c) JForum Team
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms,
 * with or without modification, are permitted provided
 * that the following conditions are met:
 *
 * 1) Redistributions of source code must retain the above
 * copyright notice, this list of conditions and the
 * following  disclaimer.
 * 2)  Redistributions in binary form must reproduce the
 * above copyright notice, this list of conditions and
 * the following disclaimer in the documentation and/or
 * other materials provided with the distribution.
 * 3) Neither the name of "Rafael Steil" nor
 * the names of its contributors may be used to endorse
 * or promote products derived from this software without
 * specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
 * HOLDERS AND CONTRIBUTORS "AS IS" AND ANY
 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING,
 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR
 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL
 * THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,
 * OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
 * IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
 * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
 * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE
 *
 * This file creation date: 27/09/2004 23:59:10
 * The JForum Project
 * http://www.jforum.net
 */
package net.jforum.util;

import java.util.HashSet;
import java.util.Iterator;
import java.util.Locale;
import java.util.Set;
import java.util.Vector;

import net.jforum.core.exceptions.ForumException;

import org.apache.commons.lang.StringUtils;
import org.htmlparser.Attribute;
import org.htmlparser.Node;
import org.htmlparser.Tag;
import org.htmlparser.lexer.Lexer;
import org.htmlparser.nodes.TextNode;

import br.com.caelum.vraptor.ioc.ApplicationScoped;
import br.com.caelum.vraptor.ioc.Component;

/**
 * Process text with html and remove possible malicious tags and attributes.
 * Work based on tips from Amit Klein and the following documents: <br>
 * <li>http://ha.ckers.org/xss.html
 * <li>http://quickwired.com/kallahar/smallprojects/php_xss_filter_function.php <br>
 *
 * @author Rafael Steil
 */
@Component
@ApplicationScoped
public class SafeHtml {
	private Set<String> welcomeTags = new HashSet<String>();
	private Set<String> welcomeAttributes = new HashSet<String>();
	private Set<String> allowedProtocols = new HashSet<String>();

	private JForumConfig config;

	public SafeHtml(JForumConfig config) {
		this.config = config;

		this.splitAndTrim(ConfigKeys.HTML_TAGS_WELCOME, this.welcomeTags);
		this.splitAndTrim(ConfigKeys.HTML_ATTRIBUTES_WELCOME, this.welcomeAttributes);
		this.splitAndTrim(ConfigKeys.HTML_LINKS_ALLOW_PROTOCOLS, this.allowedProtocols);
	}

	private void splitAndTrim(String s, Set<String> data) {
		if (this.config.containsKey(s)) {
			String value = this.config.getValue(s);
			String[] parts = value.split(",");

			for (String part : parts) {
				part = part.trim();

				if (!StringUtils.isEmpty(part)) {
					data.add(part.toUpperCase());
				}
			}
		}
	}

	/**
	 * Given an input, analyze each HTML tag and remove unsecure attributes from them.
	 *
	 * @param contents The content to verify
	 * @return the content, secure.
	 */
	public String ensureAllAttributesAreSafe(String contents) {
		StringBuilder sb = new StringBuilder(contents.length());

		try {
			Lexer lexer = new Lexer(contents);
			Node node;

			while ((node = lexer.nextNode()) != null) {
				if (node instanceof Tag) {
					Tag tag = (Tag) node;

					this.checkAndValidateAttributes(tag, false);

					sb.append(tag.toHtml());
				}
				else {
					sb.append(node.toHtml());
				}
			}
		}
		catch (Exception e) {
			throw new ForumException("Problems while parsing HTML: " + e, e);
		}

		return sb.toString();
	}

	/**
	 * Given an input, makes it safe for HTML displaying.
	 * Removes any not allowed HTML tag or attribute, as well unwanted
	 * Javascript statements inside the tags.
	 *
	 * @param contents the input to analyze
	 * @return the modified and safe string
	 */
	public String makeSafe(String contents) {
		if (contents == null || contents.length() == 0) {
			return contents;
		}

		StringBuilder sb = new StringBuilder(contents.length());

		try {
			Lexer lexer = new Lexer(contents);
			Node node;

			while ((node = lexer.nextNode()) != null) {
				boolean isTextNode = node instanceof TextNode;

				if (isTextNode) {
					// Text nodes are raw data, so we just
					// strip off all possible html content
					String text = node.toHtml();

					if (text.indexOf('>') > -1 || text.indexOf('<') > -1) {
						text = StringUtils.replace(text, "<", "<");
						text = StringUtils.replace(text, ">", ">");
						text = StringUtils.replace(text, "\"", """);

						node.setText(text);
					}

					sb.append(node.toHtml());
				}
				else if (node instanceof Tag && this.isTagWelcome(node)) {
					sb.append(node.toHtml());
				}
				else {
					String text = node.toHtml();

					text = StringUtils.replace(text, "<", "<");
					text = StringUtils.replace(text, ">", ">");

					sb.append(text);
				}
			}
		}
		catch (Exception e) {
			throw new ForumException("Error while parsing HTML: " + e, e);
		}

		return sb.toString();
	}

	/**
	 * Returns true if a given tag is allowed. Also, it checks and removes any unwanted attribute the tag may contain.
	 *
	 * @param node The tag node to analyze
	 * @return true if it is a valid tag.
	 */
	private boolean isTagWelcome(Node node) {
		Tag tag = (Tag) node;

		if (!welcomeTags.contains(tag.getTagName())) {
			return false;
		}

		this.checkAndValidateAttributes((Tag)node, true);

		return true;
	}

	/**
	 * Given a tag, check its attributes, removing those unwanted or not secure
	 *
	 * @param tag The tag to analyze
	 * @param checkIfAttributeIsWelcome true if the attribute name should be matched against the list of welcome attributes, set in the main
	 *            configuration file.
	 */
	@SuppressWarnings("unchecked")
	private void checkAndValidateAttributes(Tag tag, boolean checkIfAttributeIsWelcome) {
		Vector<Attribute> newAttributes = new Vector<Attribute>();

		for (Iterator<Attribute> iter = tag.getAttributesEx().iterator(); iter.hasNext();) {
			Attribute a = iter.next();
			String name = a.getName();

			if (name == null) {
				newAttributes.add(a);
			}
			else {
				name = name.toUpperCase();

				if (a.getValue() == null) {
					newAttributes.add(a);
					continue;
				}

				String value = a.getValue().toLowerCase();

				if (checkIfAttributeIsWelcome && !this.isAttributeWelcome(name)) {
					continue;
				}

				if (!this.isAttributeSafe(name, value)) {
					continue;
				}

				if (a.getValue().indexOf("&#") > -1) {
					a.setValue(StringUtils.replace(a.getValue(), "&#", "&#"));
				}

				newAttributes.add(a);
			}
		}

		tag.setAttributesEx(newAttributes);
	}

	/**
	 * Check if the given attribute name is in the list of allowed attributes
	 *
	 * @param name the attribute name
	 * @return true if it is an allowed attribute name
	 */
	private boolean isAttributeWelcome(String name) {
		return welcomeAttributes.contains(name);
	}

	/**
	 * Check if the attribute is safe, checking either its name and value.
	 *
	 * @param name the attribute name
	 * @param value the attribute value
	 * @return true if it is a safe attribute
	 */
	private boolean isAttributeSafe(String name, String value) {
		if (name.length() >= 2 && name.charAt(0) == 'O' && name.charAt(1) == 'N') {
			return false;
		}

		if (value.indexOf('\n') > -1 || value.indexOf('\r') > -1 || value.indexOf('\0') > -1) {
			return false;
		}

		if (("HREF".equals(name) || "SRC".equals(name))) {
			if (!this.isHrefValid(value)) {
				return false;
			}
		}
		else if ("STYLE".equals(name)) {
			// It is much more a try to not allow constructions
			// like style="background-color: url(javascript:xxxx)" than anything else
			if (value.indexOf('(') > -1) {
				return false;
			}
		}

		return true;
	}

	/**
	 * Checks if a given address is valid
	 *
	 * @param href The address to check
	 * @return true if it is valid
	 */
	private boolean isHrefValid(String href) {
		if (this.config.getBoolean(ConfigKeys.HTML_LINKS_ALLOW_RELATIVE) && href.length() > 0 && href.charAt(0) == '/') {
			return true;
		}

		for (String string : allowedProtocols) {
			String protocol = string.toLowerCase();

			if (href.startsWith(protocol)) {
				return true;
			}
		}

		return false;
	}
}