// Jimple (Soot-style three-address IR) listing of HostnameExtracter: a final class with only static
// members and a private constructor. Its public entry points are extractHostname,
// extractBrandFromUrl and extractBrandFromEmail.
// NOTE(review): every local in this listing is printed as `v` and every label as `label`, so the
// data flow and branch targets described in the comments below are read from statement order and
// should be confirmed against the original Java source.
public final class nl.basjes.parse.useragent.utils.HostnameExtracter extends java.lang.Object implements java.io.Serializable
{
// Set passed to extractCompanyFromHostName by extractBrandFromUrl; filled in <clinit>.
private static final java.util.Set UNWANTED_URL_BRANDS;
// Set passed to extractCompanyFromHostName by extractBrandFromEmail; filled in <clinit>.
private static final java.util.Set UNWANTED_EMAIL_BRANDS;
// List of SitePathExtract entries iterated by extractCompanyFromSoftwareRepositoryUrl.
private static final java.util.List SITE_PATH_EXTRACTS;
// Pattern compiled in <clinit>; used by extractCompanyFromHostName to split on dots.
private static final java.util.regex.Pattern DOT_SPLITTER;
// Private constructor: only chains to Object.<init>, so the class cannot be instantiated from outside.
private void <init>()
{
nl.basjes.parse.useragent.utils.HostnameExtracter v;
v := @this: nl.basjes.parse.useragent.utils.HostnameExtracter;
specialinvoke v.<java.lang.Object: void <init>()>();
return;
}
// Extracts the host part from a URI-like string.
// Parameter: the string to inspect (may be null).
// Returns: null for null/empty input, for input starting with a single '/', or when URI.create
// throws IllegalArgumentException; otherwise URI.getHost() for inputs starting with "//" or
// containing ':', and for all other inputs the text before the first '/' (or the whole string when
// there is no '/').
// NOTE(review): charAt(1) is called after only an emptiness check, so a one-character input such as
// "/" would throw StringIndexOutOfBoundsException, which the IllegalArgumentException traps below
// do not catch -- confirm whether callers can pass such input.
// NOTE(review): if the cut position can be 0 (input starting with '?' or '&'), substring(0, 0)
// yields "" and the following charAt(0) would throw as well -- confirm.
public static java.lang.String extractHostname(java.lang.String)
{
java.lang.String[] v;
int v, v, v, v, v, v, v, v;
java.lang.String v, v, v;
java.net.URI v;
boolean v, v, v;
char v, v;
java.lang.IllegalArgumentException v;
v := @parameter: java.lang.String;
// Guard: null or empty input yields null.
if v == null goto label;
v = virtualinvoke v.<java.lang.String: boolean isEmpty()>();
if v == 0 goto label;
label:
return null;
label:
// 63 is '?' and 38 is '&': locate the first occurrence of each.
v = virtualinvoke v.<java.lang.String: int indexOf(int)>(63);
v = virtualinvoke v.<java.lang.String: int indexOf(int)>(38);
// Pick a cut position from the two indexes; -1 is the "not found / no cut" sentinel.
// Which index wins in each branch is not recoverable from this listing (all locals are `v`) --
// presumably the '?' position is preferred when both are present; TODO confirm.
v = (int) -1;
v = v;
v = (int) -1;
if v == v goto label;
v = (int) -1;
if v == v goto label;
v = v;
goto label;
label:
v = v;
goto label;
label:
v = (int) -1;
if v == v goto label;
v = v;
label:
// When a cut position was chosen, keep only the text before it.
v = (int) -1;
if v == v goto label;
v = virtualinvoke v.<java.lang.String: java.lang.String substring(int,int)>(0, v);
label:
// 47 is '/': a leading "//" is handed to URI.create; a single leading '/' returns null.
v = virtualinvoke v.<java.lang.String: char charAt(int)>(0);
if v != 47 goto label;
v = virtualinvoke v.<java.lang.String: char charAt(int)>(1);
if v != 47 goto label;
v = staticinvoke <java.net.URI: java.net.URI create(java.lang.String)>(v);
goto label;
label:
return null;
label:
// No leading '/': a string containing ':' is parsed with URI.create.
v = virtualinvoke v.<java.lang.String: boolean contains(java.lang.CharSequence)>(":");
if v == 0 goto label;
v = staticinvoke <java.net.URI: java.net.URI create(java.lang.String)>(v);
goto label;
label:
// Neither a leading '/' nor a ':': return the part before the first '/', or the string itself.
v = virtualinvoke v.<java.lang.String: boolean contains(java.lang.CharSequence)>("/");
if v == 0 goto label;
v = virtualinvoke v.<java.lang.String: java.lang.String[] split(java.lang.String,int)>("/", 2);
v = v[0];
label:
return v;
label:
return v;
label:
// Exception handler: an IllegalArgumentException inside the trapped ranges yields null.
v := @caughtexception;
return null;
label:
// Reached after a successful URI.create: the result is whatever URI.getHost() reports.
v = virtualinvoke v.<java.net.URI: java.lang.String getHost()>();
return v;
// Two trap ranges, both routing IllegalArgumentException to the handler above.
catch java.lang.IllegalArgumentException from label to label with label;
catch java.lang.IllegalArgumentException from label to label with label;
}
// Derives a brand name from a URL string.
// First runs extractHostname and extractCompanyFromHostName with UNWANTED_URL_BRANDS; only when that
// result is null does it fall back to extractCompanyFromSoftwareRepositoryUrl.
// Returns: the result of whichever step produced the value (may be null).
// NOTE(review): the fallback argument is presumably the original URL parameter; if so, a null
// argument would reach String.startsWith in the fallback and throw NullPointerException -- confirm.
public static java.lang.String extractBrandFromUrl(java.lang.String)
{
java.util.Set v;
java.lang.String v, v, v;
v := @parameter: java.lang.String;
v = staticinvoke <nl.basjes.parse.useragent.utils.HostnameExtracter: java.lang.String extractHostname(java.lang.String)>(v);
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_URL_BRANDS>;
v = staticinvoke <nl.basjes.parse.useragent.utils.HostnameExtracter: java.lang.String extractCompanyFromHostName(java.lang.String,java.util.Set)>(v, v);
// Host-based result wins; the repository-URL lookup runs only when it is null.
if v != null goto label;
v = staticinvoke <nl.basjes.parse.useragent.utils.HostnameExtracter: java.lang.String extractCompanyFromSoftwareRepositoryUrl(java.lang.String)>(v);
label:
return v;
}
// Derives a brand name from an e-mail address string.
// When the input contains '@' (code 64), only the text after its first occurrence is used; otherwise
// the input is used unchanged. The value is then passed to extractCompanyFromHostName with
// UNWANTED_EMAIL_BRANDS.
// Returns: the result of extractCompanyFromHostName (may be null).
// NOTE(review): indexOf is invoked with no preceding null test, so a null argument presumably
// throws NullPointerException here -- confirm against callers.
public static java.lang.String extractBrandFromEmail(java.lang.String)
{
int v, v;
java.util.Set v;
java.lang.String v, v, v;
v := @parameter: java.lang.String;
v = v;
v = virtualinvoke v.<java.lang.String: int indexOf(int)>(64);
// A negative index means no '@' was found: skip the substring step.
if v < 0 goto label;
v = v + 1;
v = virtualinvoke v.<java.lang.String: java.lang.String substring(int)>(v);
label:
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_EMAIL_BRANDS>;
v = staticinvoke <nl.basjes.parse.useragent.utils.HostnameExtracter: java.lang.String extractCompanyFromHostName(java.lang.String,java.util.Set)>(v, v);
return v;
}
// Looks for a SITE_PATH_EXTRACTS entry whose prefix the URL starts with and returns the brand taken
// from the path that follows that prefix.
// For the first matching entry: drops prefixLength characters, splits the remainder on "/", and
// passes the element at index brandSegment to Normalize.brand.
// Returns: null when no entry matches, when the split is empty or shorter than brandSegment, or when
// the selected segment is empty; otherwise the value returned by Normalize.brand.
// NOTE(review): the length guard uses `>=`, which appears to let length == brandSegment through to
// the array access; with the entries built in <clinit> (all created with 0) the separate
// length == 0 test covers that case -- confirm before adding entries with a non-zero segment.
private static java.lang.String extractCompanyFromSoftwareRepositoryUrl(java.lang.String)
{
java.lang.String[] v;
int v, v, v, v, v;
java.lang.String v, v, v, v, v;
boolean v, v, v;
java.util.Iterator v;
java.util.List v;
java.lang.Object v;
v := @parameter: java.lang.String;
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.List SITE_PATH_EXTRACTS>;
v = interfaceinvoke v.<java.util.List: java.util.Iterator iterator()>();
label:
// Loop head: leave the loop when the iterator is exhausted.
v = interfaceinvoke v.<java.util.Iterator: boolean hasNext()>();
if v == 0 goto label;
v = interfaceinvoke v.<java.util.Iterator: java.lang.Object next()>();
v = v.<nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract: java.lang.String prefix>;
v = virtualinvoke v.<java.lang.String: boolean startsWith(java.lang.String)>(v);
// No prefix match: try the next entry.
if v == 0 goto label;
// Prefix matched: strip it and split the remaining path into segments.
v = v.<nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract: int prefixLength>;
v = virtualinvoke v.<java.lang.String: java.lang.String substring(int)>(v);
v = virtualinvoke v.<java.lang.String: java.lang.String[] split(java.lang.String)>("/");
v = lengthof v;
if v == 0 goto label;
v = lengthof v;
v = v.<nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract: int brandSegment>;
if v >= v goto label;
label:
return null;
label:
// Select the configured segment; an empty segment yields null.
v = v.<nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract: int brandSegment>;
v = v[v];
v = virtualinvoke v.<java.lang.String: boolean isEmpty()>();
if v == 0 goto label;
return null;
label:
v = staticinvoke <nl.basjes.parse.useragent.utils.Normalize: java.lang.String brand(java.lang.String)>(v);
return v;
label:
// No entry matched the URL.
return null;
}
// Turns a host name into a brand string.
// Parameters: a host name and a Set consulted via contains() to reject unwanted values.
// Steps: null check, lower-casing with Locale.ROOT, lookup in the Set, domain-root lookup through
// the default PublicSuffixMatcher with DomainType.ICANN, then the text before the first dot of that
// result is passed to Normalize.brand.
// Returns: null when the null check fails, the Set lookup hits, or getDomainRoot returns null;
// otherwise the value returned by Normalize.brand.
private static java.lang.String extractCompanyFromHostName(java.lang.String, java.util.Set)
{
java.util.Set v;
java.lang.String[] v;
nl.basjes.parse.useragent.utils.publicsuffixlist.PublicSuffixMatcher v;
nl.basjes.parse.useragent.utils.publicsuffixlist.DomainType v;
java.util.Locale v;
java.lang.String v, v, v, v, v;
java.util.regex.Pattern v;
boolean v;
v := @parameter: java.lang.String;
v := @parameter: java.util.Set;
// Presumably tests the host name parameter (not the Set) for null -- confirm.
if v != null goto label;
return null;
label:
// Locale.ROOT keeps the lower-casing independent of the default locale.
v = <java.util.Locale: java.util.Locale ROOT>;
v = virtualinvoke v.<java.lang.String: java.lang.String toLowerCase(java.util.Locale)>(v);
v = interfaceinvoke v.<java.util.Set: boolean contains(java.lang.Object)>(v);
if v == 0 goto label;
return null;
label:
v = staticinvoke <nl.basjes.parse.useragent.utils.publicsuffixlist.PublicSuffixMatcherLoader: nl.basjes.parse.useragent.utils.publicsuffixlist.PublicSuffixMatcher getDefault()>();
v = <nl.basjes.parse.useragent.utils.publicsuffixlist.DomainType: nl.basjes.parse.useragent.utils.publicsuffixlist.DomainType ICANN>;
v = virtualinvoke v.<nl.basjes.parse.useragent.utils.publicsuffixlist.PublicSuffixMatcher: java.lang.String getDomainRoot(java.lang.String,nl.basjes.parse.useragent.utils.publicsuffixlist.DomainType)>(v, v);
if v != null goto label;
return null;
label:
// Split into at most two pieces on the first dot and keep the first piece.
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.regex.Pattern DOT_SPLITTER>;
v = virtualinvoke v.<java.util.regex.Pattern: java.lang.String[] split(java.lang.CharSequence,int)>(v, 2);
v = v[0];
v = staticinvoke <nl.basjes.parse.useragent.utils.Normalize: java.lang.String brand(java.lang.String)>(v);
return v;
}
// Static initializer: builds the two HashSet-backed sets of unwanted values, the fixed-size list of
// three SitePathExtract entries, and the dot-splitting Pattern.
static void <clinit>()
{
nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract v, v, v;
java.util.HashSet v, v;
java.util.Set v, v, v, v, v, v, v, v;
java.util.List v;
nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract[] v;
java.util.regex.Pattern v;
// UNWANTED_URL_BRANDS: a new HashSet holding five entries.
v = new java.util.HashSet;
specialinvoke v.<java.util.HashSet: void <init>()>();
<nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_URL_BRANDS> = v;
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_URL_BRANDS>;
interfaceinvoke v.<java.util.Set: boolean add(java.lang.Object)>("localhost");
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_URL_BRANDS>;
interfaceinvoke v.<java.util.Set: boolean add(java.lang.Object)>("github.com");
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_URL_BRANDS>;
interfaceinvoke v.<java.util.Set: boolean add(java.lang.Object)>("gitlab.com");
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_URL_BRANDS>;
interfaceinvoke v.<java.util.Set: boolean add(java.lang.Object)>("bit.ly");
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_URL_BRANDS>;
interfaceinvoke v.<java.util.Set: boolean add(java.lang.Object)>("wordpress.com");
// UNWANTED_EMAIL_BRANDS: a new HashSet holding three entries.
v = new java.util.HashSet;
specialinvoke v.<java.util.HashSet: void <init>()>();
<nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_EMAIL_BRANDS> = v;
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_EMAIL_BRANDS>;
interfaceinvoke v.<java.util.Set: boolean add(java.lang.Object)>("localhost");
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_EMAIL_BRANDS>;
interfaceinvoke v.<java.util.Set: boolean add(java.lang.Object)>("gmail.com");
v = <nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.Set UNWANTED_EMAIL_BRANDS>;
interfaceinvoke v.<java.util.Set: boolean add(java.lang.Object)>("outlook.com");
// SITE_PATH_EXTRACTS: three entries, each built from a URL prefix and the int 0.
// The int is presumably the brandSegment index; the constructor body is not visible here -- confirm.
v = newarray (nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract)[3];
v = new nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract;
specialinvoke v.<nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract: void <init>(java.lang.String,int)>("https://github.com/", 0);
v[0] = v;
v = new nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract;
specialinvoke v.<nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract: void <init>(java.lang.String,int)>("https://gitlab.com/", 0);
v[1] = v;
v = new nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract;
specialinvoke v.<nl.basjes.parse.useragent.utils.HostnameExtracter$SitePathExtract: void <init>(java.lang.String,int)>("https://sourceforge.net/projects/", 0);
v[2] = v;
v = staticinvoke <java.util.Arrays: java.util.List asList(java.lang.Object[])>(v);
<nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.List SITE_PATH_EXTRACTS> = v;
// DOT_SPLITTER: the escaped literal below is the regex for a single literal dot.
v = staticinvoke <java.util.regex.Pattern: java.util.regex.Pattern compile(java.lang.String)>("\\.");
<nl.basjes.parse.useragent.utils.HostnameExtracter: java.util.regex.Pattern DOT_SPLITTER> = v;
return;
}
}