Domain Extractor (Draft)

import urllib

# Source of the official list of top-level domains (one per line, upper case,
# with a leading "# Version ..." comment line).
_IANA_TLD_URL = "http://data.iana.org/TLD/tlds-alpha-by-domain.txt"

# Normalized TLD set downloaded from IANA; filled lazily on first use so the
# list is fetched at most once per process.
_cached_tlds = None


def _normalize_tlds(entries):
    """Return a set of lower-case TLD strings built from raw list entries."""
    known = set()
    for entry in entries:
        if isinstance(entry, bytes):
            # urlopen yields bytes on Python 3; the IANA file is plain ASCII.
            entry = entry.decode("ascii", "ignore")
        entry = entry.strip()
        if not entry or entry.startswith("#"):
            continue  # skip blank lines and the version comment header
        known.add(entry.lstrip(".").lower())
    return known


def _load_iana_tlds():
    """Download (once) and return the normalized IANA TLD set."""
    global _cached_tlds
    if _cached_tlds is None:
        # Local import keeps the block usable on both Python 2 and Python 3.
        try:
            from urllib.request import urlopen
        except ImportError:
            from urllib import urlopen
        response = urlopen(_IANA_TLD_URL)
        try:
            _cached_tlds = _normalize_tlds(response.read().splitlines())
        finally:
            response.close()
    return _cached_tlds


def _extract_host(url):
    """Strip scheme, path, query, fragment, userinfo and port from *url*."""
    host = url.strip()
    if "://" in host:
        host = host.split("://", 1)[1]
    elif host.startswith("//"):
        host = host[2:]
    for separator in "/?#":
        host = host.split(separator, 1)[0]
    host = host.rsplit("@", 1)[-1]
    host = host.split(":", 1)[0]
    # A fully-qualified name may end with the root dot ("example.com.").
    return host.rstrip(".")


def get_domain(url, tlds=None):
    """Return the host label that directly precedes the top-level domain.

    For ``"http://www.example.com/page.html"`` this returns ``"example"``.
    Only the host part of *url* is inspected, so dots in the path or query
    string never influence the result. The TLD comparison is exact and
    case-insensitive; the returned label keeps the casing used in *url*.

    Args:
        url: A URL or bare host name.
        tlds: Optional iterable of known TLD strings (for example ``"com"``
            or ``"COM\\n"``). When omitted, the IANA list is downloaded on
            first use and cached for subsequent calls.

    Returns:
        The label before the TLD, or ``None`` when *url* is empty, has no
        such label, or does not end in a known TLD.

    Note:
        Multi-label public suffixes are not recognised: ``example.co.uk``
        yields ``"co"``. Handling those requires the Public Suffix List.
    """
    if not url:
        return None

    known = _load_iana_tlds() if tlds is None else _normalize_tlds(tlds)

    labels = _extract_host(url).split(".")
    if len(labels) < 2 or not labels[-2]:
        return None
    if labels[-1].lower() not in known:
        return None
    return labels[-2]
Advertisements

Leave a Reply

Fill in your details below or click an icon to log in:

WordPress.com Logo

You are commenting using your WordPress.com account. ( Log Out / Change )

Twitter picture

You are commenting using your Twitter account. ( Log Out / Change )

Facebook photo

You are commenting using your Facebook account. ( Log Out / Change )

Google+ photo

You are commenting using your Google+ account. ( Log Out / Change )

Connecting to %s

%d bloggers like this: