/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.tika.utils; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertNotNull; import static org.junit.Assert.assertTrue; import java.util.List; import org.junit.Test; /** * Test case for {@link RegexUtils}. * * @version $Revision$ $Date$ */ public class RegexUtilsTest { /** * Test {@link RegexUtils#extractLinks(String)} with no links. */ @Test public void testExtractLinksNone() { List<String> links = null; links = RegexUtils.extractLinks(null); assertNotNull(links); assertEquals(0, links.size()); links = RegexUtils.extractLinks(""); assertNotNull(links); assertEquals(0, links.size()); links = RegexUtils.extractLinks( "Test with no links " + "What about www.google.com"); assertNotNull(links); assertEquals(0, links.size()); } /** * Test {@link RegexUtils#extractLinks(String)} for http. */ @Test public void testExtractLinksHttp() { List<String> links = RegexUtils.extractLinks( "Test with http://www.nutch.org/index.html is it found? " + "What about www.google.com at http://www.google.de " + "A longer URL could be http://www.sybit.com/solutions/portals.html"); assertTrue("Url not found!", links.size() == 3); assertEquals("Wrong URL", "http://www.nutch.org/index.html", links.get(0)); assertEquals("Wrong URL", "http://www.google.de", links.get(1)); assertEquals("Wrong URL", "http://www.sybit.com/solutions/portals.html", links.get(2)); } /** * Test {@link RegexUtils#extractLinks(String)} for ftp. */ @Test public void testExtractLinksFtp() { List<String> links = RegexUtils.extractLinks( "Test with ftp://www.nutch.org is it found? " + "What about www.google.com at ftp://www.google.de"); assertTrue("Url not found!", links.size() == 2); assertEquals("Wrong URL", "ftp://www.nutch.org", links.get(0)); assertEquals("Wrong URL", "ftp://www.google.de", links.get(1)); } }