// Copyright 2012 The Go Authors. All rights reserved. // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. //go:generate go run gen.go // Package publicsuffix provides a public suffix list based on data from // http://publicsuffix.org/. A public suffix is one under which Internet users // can directly register names. package publicsuffix // import "golang.org/x/net/publicsuffix" // TODO: specify case sensitivity and leading/trailing dot behavior for // func PublicSuffix and func EffectiveTLDPlusOne. import ( "fmt" "net/http/cookiejar" "strings" ) // List implements the cookiejar.PublicSuffixList interface by calling the // PublicSuffix function. var List cookiejar.PublicSuffixList = list{} type list struct{} func (list) PublicSuffix(domain string) string { ps, _ := PublicSuffix(domain) return ps } func (list) String() string { return version } // PublicSuffix returns the public suffix of the domain using a copy of the // publicsuffix.org database compiled into the library. // // icann is whether the public suffix is managed by the Internet Corporation // for Assigned Names and Numbers. If not, the public suffix is privately // managed. For example, foo.org and foo.co.uk are ICANN domains, // foo.dyndns.org and foo.blogspot.co.uk are private domains. // // Use cases for distinguishing ICANN domains like foo.com from private // domains like foo.appspot.com can be found at // https://wiki.mozilla.org/Public_Suffix_List/Use_Cases func PublicSuffix(domain string) (publicSuffix string, icann bool) { lo, hi := uint32(0), uint32(numTLD) s, suffix, wildcard := domain, len(domain), false loop: for { dot := strings.LastIndex(s, ".") if wildcard { suffix = 1 + dot } if lo == hi { break } f := find(s[1+dot:], lo, hi) if f == notFound { break } u := nodes[f] >> (nodesBitsTextOffset + nodesBitsTextLength) icann = u&(1<<nodesBitsICANN-1) != 0 u >>= nodesBitsICANN u = children[u&(1<<nodesBitsChildren-1)] lo = u & (1<<childrenBitsLo - 1) u >>= childrenBitsLo hi = u & (1<<childrenBitsHi - 1) u >>= childrenBitsHi switch u & (1<<childrenBitsNodeType - 1) { case nodeTypeNormal: suffix = 1 + dot case nodeTypeException: suffix = 1 + len(s) break loop } u >>= childrenBitsNodeType wildcard = u&(1<<childrenBitsWildcard-1) != 0 if dot == -1 { break } s = s[:dot] } if suffix == len(domain) { // If no rules match, the prevailing rule is "*". return domain[1+strings.LastIndex(domain, "."):], icann } return domain[suffix:], icann } const notFound uint32 = 1<<32 - 1 // find returns the index of the node in the range [lo, hi) whose label equals // label, or notFound if there is no such node. The range is assumed to be in // strictly increasing node label order. func find(label string, lo, hi uint32) uint32 { for lo < hi { mid := lo + (hi-lo)/2 s := nodeLabel(mid) if s < label { lo = mid + 1 } else if s == label { return mid } else { hi = mid } } return notFound } // nodeLabel returns the label for the i'th node. func nodeLabel(i uint32) string { x := nodes[i] length := x & (1<<nodesBitsTextLength - 1) x >>= nodesBitsTextLength offset := x & (1<<nodesBitsTextOffset - 1) return text[offset : offset+length] } // EffectiveTLDPlusOne returns the effective top level domain plus one more // label. For example, the eTLD+1 for "foo.bar.golang.org" is "golang.org". func EffectiveTLDPlusOne(domain string) (string, error) { suffix, _ := PublicSuffix(domain) if len(domain) <= len(suffix) { return "", fmt.Errorf("publicsuffix: cannot derive eTLD+1 for domain %q", domain) } i := len(domain) - len(suffix) - 1 if domain[i] != '.' { return "", fmt.Errorf("publicsuffix: invalid public suffix %q for domain %q", suffix, domain) } return domain[1+strings.LastIndex(domain[:i], "."):], nil }