package de.pinyto.ctSESAM;

import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * This class is used to extract domains from urls.
 *
 * <p>Extraction is purely regex based: an optional {@code http://} or {@code https://}
 * prefix is skipped, then a run of dot-terminated host labels is consumed and the last
 * label is joined with the suffix that follows it. No public-suffix list is consulted;
 * the only multi-part suffix recognised is {@code co.<something>} (e.g. {@code co.uk}).
 */
public class DomainExtractor {

    /**
     * Matches hosts that end in a {@code co.xx} style suffix. Group 1 holds the last
     * label before the suffix (including its trailing dot), group 2 the suffix itself.
     * Labels may contain hyphens, which are legal in host names.
     */
    private static final Pattern CO_SUFFIX_PATTERN =
            Pattern.compile("(?:https?://)?([\\w-]+\\.)+(co\\.\\w+).*");

    /**
     * Fallback for every other host. Group 1 holds the last dot-terminated label,
     * group 2 the label that follows it.
     */
    private static final Pattern PLAIN_SUFFIX_PATTERN =
            Pattern.compile("(?:https?://)?([\\w-]+\\.)+(\\w+).*");

    /**
     * Extracts the domain part of a url.
     *
     * <p>Examples: {@code https://www.example.com/path} yields {@code example.com},
     * {@code http://www.example.co.uk/} yields {@code example.co.uk} and
     * {@code https://my-site.com/login} yields {@code my-site.com}.
     *
     * @param url the url (or bare host name) to extract the domain from
     * @return the extracted domain, or {@code url} unchanged if neither pattern matches
     */
    public static String extract(String url) {
        // The co.xx pattern has to be tried first; the plain pattern would otherwise
        // reduce "example.co.uk" to "co.uk".
        String domain = lastLabelPlusSuffix(CO_SUFFIX_PATTERN, url);
        if (domain == null) {
            domain = lastLabelPlusSuffix(PLAIN_SUFFIX_PATTERN, url);
        }
        return domain != null ? domain : url;
    }

    /**
     * Applies {@code pattern} to the whole input and joins its two capturing groups.
     *
     * @return group 1 followed by group 2, or {@code null} if the input does not match
     */
    private static String lastLabelPlusSuffix(Pattern pattern, String url) {
        Matcher matcher = pattern.matcher(url);
        if (!matcher.matches()) {
            return null;
        }
        // For a repeated group the matcher reports the text of its last iteration,
        // so group 1 is the label directly in front of the suffix.
        return matcher.group(1) + matcher.group(2);
    }
}