diff --git a/src/java/org/apache/nutch/util/URLUtil.java b/src/java/org/apache/nutch/util/URLUtil.java index afd6f13857..44c6309d2a 100644 --- a/src/java/org/apache/nutch/util/URLUtil.java +++ b/src/java/org/apache/nutch/util/URLUtil.java @@ -262,7 +262,7 @@ public static String getDomainSuffix(URL url) { EffectiveTldFinder.EffectiveTLD suffix = EffectiveTldFinder.getEffectiveTLD(host, true); if (suffix != null) { - return suffix.getDomain(); + return suffix.getSuffix(); } return null; diff --git a/src/test/org/apache/nutch/util/TestURLUtil.java b/src/test/org/apache/nutch/util/TestURLUtil.java index 32dda0929d..092edb9c18 100644 --- a/src/test/org/apache/nutch/util/TestURLUtil.java +++ b/src/test/org/apache/nutch/util/TestURLUtil.java @@ -147,6 +147,8 @@ public void testGetDomainSuffix() throws Exception { assertEquals("2000.hu", URLUtil.getDomainSuffix(url)); // test non-ASCII + url = new URL("https://www.taiuru.māori.nz/"); + assertEquals("xn--mori-qsa.nz", URLUtil.getDomainSuffix(url)); url = new URL("http://www.example.flå.no"); assertEquals("xn--fl-zia.no", URLUtil.getDomainSuffix(url)); url = new URL("http://www.example.栃木.jp");