2to3port #2
@ -45,7 +45,7 @@ class Parser(object):
|
||||
logging.basicConfig(level=logging.DEBUG)
|
||||
logging.debug("__init__: DEBUG is set to True")
|
||||
|
||||
self.domain = unicode(domain, "utf-8").encode("idna")
|
||||
self.domain = str(domain)
|
||||
|
||||
if not text:
|
||||
raise error.InvalidInputText(text)
|
||||
@ -63,13 +63,13 @@ class Parser(object):
|
||||
|
||||
self.parseDefaultConf = {}
|
||||
logging.debug("__init__: Loading default tld configuration file")
|
||||
execfile(os.path.join(self.tldPath, "default"), {}, self.parseDefaultConf)
|
||||
exec(compile(open(os.path.join(self.tldPath, "default")).read(), os.path.join(self.tldPath, "default"), 'exec'), {}, self.parseDefaultConf)
|
||||
self.parseDefaultConf = self.parseDefaultConf.get("parse")
|
||||
|
||||
self.parseConf = {}
|
||||
|
||||
try:
|
||||
execfile(os.path.join(self.tldPath, self.tld), {}, self.parseConf)
|
||||
exec(compile(open(os.path.join(self.tldPath, self.tld)).read(), os.path.join(self.tldPath, self.tld), 'exec'), {}, self.parseConf)
|
||||
|
||||
self.parseConf = self.parseConf.get("parse")
|
||||
|
||||
@ -113,7 +113,7 @@ class Parser(object):
|
||||
|
||||
logging.debug("__init__: Loading configuration file of tld name %s"%(lcTLD))
|
||||
|
||||
execfile(os.path.join(self.tldPath, "%s"%(lcTLD)), {}, lcConf)
|
||||
exec(compile(open(os.path.join(self.tldPath, "%s"%(lcTLD))).read(), os.path.join(self.tldPath, "%s"%(lcTLD)), 'exec'), {}, lcConf)
|
||||
lcConf = lcConf.get("parse")
|
||||
|
||||
self.parseConf.update(lcConf.get(lcWS))
|
||||
@ -135,7 +135,7 @@ class Parser(object):
|
||||
matches = re.findall(self.parseConf[key], self.text, re.MULTILINE)
|
||||
if matches:
|
||||
logging.debug("run: regex matches found for key %s. %s"%(key, matches))
|
||||
result.update({key: map(lambda x: x.strip(), matches)})
|
||||
result.update({key: [x.strip() for x in matches]})
|
||||
else:
|
||||
logging.debug("run: No match for %s"%(key))
|
||||
|
||||
|
||||
145
whois/parser.py2
Normal file
145
whois/parser.py2
Normal file
@ -0,0 +1,145 @@
|
||||
# -*- coding: utf-8 -*-
|
||||
|
||||
# ______ ______ ______ ______ ______ ______
|
||||
#/\ == \/\ __ \ /\ == \ /\ ___\ /\ ___\ /\ == \
|
||||
#\ \ _-/\ \ __ \\ \ __< \ \___ \\ \ __\ \ \ __<
|
||||
# \ \_\ \ \_\ \_\\ \_\ \_\\/\_____\\ \_____\\ \_\ \_\
|
||||
# \/_/ \/_/\/_/ \/_/ /_/ \/_____/ \/_____/ \/_/ /_/
|
||||
|
||||
from . import error
|
||||
import re
|
||||
import sys
|
||||
import os
|
||||
import time
|
||||
import logging
|
||||
|
||||
def convertDate(s):
|
||||
"""Convert any date string found in WHOIS to a datetime object.
|
||||
"""
|
||||
# Source from https://code.google.com/p/pywhois/source/browse/whois/parser.py
|
||||
known_formats = [
|
||||
'%d-%b-%Y', # 02-jan-2000
|
||||
'%Y-%m-%d', # 2000-01-02
|
||||
'%d.%m.%Y', # 2.1.2000
|
||||
'%Y.%m.%d', # 2000.01.02
|
||||
'%Y/%m/%d', # 2000/01/02
|
||||
'%d-%b-%Y %H:%M:%S %Z', # 24-Jul-2009 13:20:03 UTC
|
||||
'%a %b %d %H:%M:%S %Z %Y', # Tue Jun 21 23:59:59 GMT 2011
|
||||
'%Y-%m-%dT%H:%M:%SZ', # 2007-01-26T19:10:31Z
|
||||
'%Y. %m. %d.', # 2012. 04. 03. - whois.krnic.net
|
||||
'%d/%m/%Y %H:%M:%S', # 14/09/2013 00:59:59 - whois.nic.im
|
||||
'%Y/%m/%d %H:%M:%S (%Z)', # 2012/07/01 01:05:01 (JST) - whois.jprs.jp
|
||||
]
|
||||
|
||||
for known_format in known_formats:
|
||||
try:
|
||||
return time.mktime(time.strptime(s.strip(), known_format))
|
||||
except ValueError as e:
|
||||
pass # Wrong format, keep trying
|
||||
|
||||
return s
|
||||
|
||||
class Parser(object):
|
||||
def __init__(self, domain, text, whoisServer=None, debug=False):
|
||||
if debug:
|
||||
logging.basicConfig(level=logging.DEBUG)
|
||||
logging.debug("__init__: DEBUG is set to True")
|
||||
|
||||
self.domain = unicode(domain, "utf-8").encode("idna")
|
||||
|
||||
if not text:
|
||||
raise error.InvalidInputText(text)
|
||||
|
||||
self.text = text
|
||||
self.whoisServer = whoisServer and whoisServer or "default"
|
||||
|
||||
self.tld = self.domain.split(".")[-1]
|
||||
|
||||
self.currPath = os.path.dirname(os.path.realpath(__file__))
|
||||
self.tldPath = os.path.join(self.currPath, "tlds")
|
||||
|
||||
logging.debug("__init__: Setting initial variables...\nself.domain: %s\nself.text = %s\nself.whoisServer = %s\nself.tld = %s\nself.currPath = %s\nself.tldPath = %s"
|
||||
%(self.domain, self.text, self.whoisServer, self.tld, self.currPath, self.tldPath))
|
||||
|
||||
self.parseDefaultConf = {}
|
||||
logging.debug("__init__: Loading default tld configuration file")
|
||||
execfile(os.path.join(self.tldPath, "default"), {}, self.parseDefaultConf)
|
||||
self.parseDefaultConf = self.parseDefaultConf.get("parse")
|
||||
|
||||
self.parseConf = {}
|
||||
|
||||
try:
|
||||
execfile(os.path.join(self.tldPath, self.tld), {}, self.parseConf)
|
||||
|
||||
self.parseConf = self.parseConf.get("parse")
|
||||
|
||||
# THERE IS NO "parse" in the tld config AND THERE IS regex for specified server in default conf
|
||||
if not self.parseConf and whoisServer not in self.parseDefaultConf:
|
||||
self.parseConf = self.parseDefaultConf.get("default")
|
||||
|
||||
# THERE IS NO "parse" in the tld config
|
||||
elif not self.parseConf:
|
||||
self.parseConf = self.parseDefaultConf.get(whoisServer)
|
||||
|
||||
# THERE IS "parse" in the tld config AND THERE IS regex for specified server
|
||||
elif self.whoisServer in self.parseConf:
|
||||
self.parseConf = self.parseConf.get(self.whoisServer)
|
||||
|
||||
# THERE IS "parse" in the tld config AND THERE IS "default" regex in the tld config AND
|
||||
# THERE IS NO regex for specified server
|
||||
elif "default" in self.parseConf:
|
||||
self.parseConf = self.parseConf.get("default")
|
||||
|
||||
# THEE IS "parse" in the tld config AND THERE IS NO "default" regex in the tld config
|
||||
# MAYBE empty file?
|
||||
else:
|
||||
self.parseConf = self.parseDefaultConf.get("default")
|
||||
|
||||
# Check for LoadConf
|
||||
_parseConf = self.parseConf
|
||||
self.parseConf = {}
|
||||
|
||||
if "LoadConf" in _parseConf:
|
||||
logging.debug("__init__: LoadConf found in parser config")
|
||||
try:
|
||||
# <tld>/<whois server>
|
||||
# e.g. org/whois.publicinternetregistry.net
|
||||
lc = _parseConf["LoadConf"].split("/", 1)
|
||||
|
||||
lcTLD = lc[0]
|
||||
lcWS = lc[1]
|
||||
|
||||
lcConf = {}
|
||||
|
||||
logging.debug("__init__: Loading configuration file of tld name %s"%(lcTLD))
|
||||
|
||||
execfile(os.path.join(self.tldPath, "%s"%(lcTLD)), {}, lcConf)
|
||||
lcConf = lcConf.get("parse")
|
||||
|
||||
self.parseConf.update(lcConf.get(lcWS))
|
||||
|
||||
except:
|
||||
pass
|
||||
|
||||
self.parseConf.update(_parseConf)
|
||||
|
||||
except:
|
||||
self.parseConf = self.parseDefaultConf.get("default")
|
||||
|
||||
|
||||
logging.debug("__init__: self.parseConf = %s"%(self.parseConf))
|
||||
|
||||
def parse(self):
|
||||
result = {}
|
||||
for key in self.parseConf:
|
||||
matches = re.findall(self.parseConf[key], self.text, re.MULTILINE)
|
||||
if matches:
|
||||
logging.debug("run: regex matches found for key %s. %s"%(key, matches))
|
||||
result.update({key: map(lambda x: x.strip(), matches)})
|
||||
else:
|
||||
logging.debug("run: No match for %s"%(key))
|
||||
|
||||
return result
|
||||
|
||||
|
||||
|
||||
145
whois/py3/parser.py
Normal file
145
whois/py3/parser.py
Normal file
@ -0,0 +1,145 @@
|
||||
# -*- coding: utf-8 -*-
|
||||
|
||||
# ______ ______ ______ ______ ______ ______
|
||||
#/\ == \/\ __ \ /\ == \ /\ ___\ /\ ___\ /\ == \
|
||||
#\ \ _-/\ \ __ \\ \ __< \ \___ \\ \ __\ \ \ __<
|
||||
# \ \_\ \ \_\ \_\\ \_\ \_\\/\_____\\ \_____\\ \_\ \_\
|
||||
# \/_/ \/_/\/_/ \/_/ /_/ \/_____/ \/_____/ \/_/ /_/
|
||||
|
||||
from . import error
|
||||
import re
|
||||
import sys
|
||||
import os
|
||||
import time
|
||||
import logging
|
||||
|
||||
def convertDate(s):
|
||||
"""Convert any date string found in WHOIS to a datetime object.
|
||||
"""
|
||||
# Source from https://code.google.com/p/pywhois/source/browse/whois/parser.py
|
||||
known_formats = [
|
||||
'%d-%b-%Y', # 02-jan-2000
|
||||
'%Y-%m-%d', # 2000-01-02
|
||||
'%d.%m.%Y', # 2.1.2000
|
||||
'%Y.%m.%d', # 2000.01.02
|
||||
'%Y/%m/%d', # 2000/01/02
|
||||
'%d-%b-%Y %H:%M:%S %Z', # 24-Jul-2009 13:20:03 UTC
|
||||
'%a %b %d %H:%M:%S %Z %Y', # Tue Jun 21 23:59:59 GMT 2011
|
||||
'%Y-%m-%dT%H:%M:%SZ', # 2007-01-26T19:10:31Z
|
||||
'%Y. %m. %d.', # 2012. 04. 03. - whois.krnic.net
|
||||
'%d/%m/%Y %H:%M:%S', # 14/09/2013 00:59:59 - whois.nic.im
|
||||
'%Y/%m/%d %H:%M:%S (%Z)', # 2012/07/01 01:05:01 (JST) - whois.jprs.jp
|
||||
]
|
||||
|
||||
for known_format in known_formats:
|
||||
try:
|
||||
return time.mktime(time.strptime(s.strip(), known_format))
|
||||
except ValueError as e:
|
||||
pass # Wrong format, keep trying
|
||||
|
||||
return s
|
||||
|
||||
class Parser(object):
|
||||
def __init__(self, domain, text, whoisServer=None, debug=False):
|
||||
if debug:
|
||||
logging.basicConfig(level=logging.DEBUG)
|
||||
logging.debug("__init__: DEBUG is set to True")
|
||||
|
||||
self.domain = str(domain, "utf-8").encode("idna")
|
||||
|
||||
if not text:
|
||||
raise error.InvalidInputText(text)
|
||||
|
||||
self.text = text
|
||||
self.whoisServer = whoisServer and whoisServer or "default"
|
||||
|
||||
self.tld = self.domain.split(".")[-1]
|
||||
|
||||
self.currPath = os.path.dirname(os.path.realpath(__file__))
|
||||
self.tldPath = os.path.join(self.currPath, "tlds")
|
||||
|
||||
logging.debug("__init__: Setting initial variables...\nself.domain: %s\nself.text = %s\nself.whoisServer = %s\nself.tld = %s\nself.currPath = %s\nself.tldPath = %s"
|
||||
%(self.domain, self.text, self.whoisServer, self.tld, self.currPath, self.tldPath))
|
||||
|
||||
self.parseDefaultConf = {}
|
||||
logging.debug("__init__: Loading default tld configuration file")
|
||||
exec(compile(open(os.path.join(self.tldPath, "default")).read(), os.path.join(self.tldPath, "default"), 'exec'), {}, self.parseDefaultConf)
|
||||
self.parseDefaultConf = self.parseDefaultConf.get("parse")
|
||||
|
||||
self.parseConf = {}
|
||||
|
||||
try:
|
||||
exec(compile(open(os.path.join(self.tldPath, self.tld)).read(), os.path.join(self.tldPath, self.tld), 'exec'), {}, self.parseConf)
|
||||
|
||||
self.parseConf = self.parseConf.get("parse")
|
||||
|
||||
# THERE IS NO "parse" in the tld config AND THERE IS regex for specified server in default conf
|
||||
if not self.parseConf and whoisServer not in self.parseDefaultConf:
|
||||
self.parseConf = self.parseDefaultConf.get("default")
|
||||
|
||||
# THERE IS NO "parse" in the tld config
|
||||
elif not self.parseConf:
|
||||
self.parseConf = self.parseDefaultConf.get(whoisServer)
|
||||
|
||||
# THERE IS "parse" in the tld config AND THERE IS regex for specified server
|
||||
elif self.whoisServer in self.parseConf:
|
||||
self.parseConf = self.parseConf.get(self.whoisServer)
|
||||
|
||||
# THERE IS "parse" in the tld config AND THERE IS "default" regex in the tld config AND
|
||||
# THERE IS NO regex for specified server
|
||||
elif "default" in self.parseConf:
|
||||
self.parseConf = self.parseConf.get("default")
|
||||
|
||||
# THEE IS "parse" in the tld config AND THERE IS NO "default" regex in the tld config
|
||||
# MAYBE empty file?
|
||||
else:
|
||||
self.parseConf = self.parseDefaultConf.get("default")
|
||||
|
||||
# Check for LoadConf
|
||||
_parseConf = self.parseConf
|
||||
self.parseConf = {}
|
||||
|
||||
if "LoadConf" in _parseConf:
|
||||
logging.debug("__init__: LoadConf found in parser config")
|
||||
try:
|
||||
# <tld>/<whois server>
|
||||
# e.g. org/whois.publicinternetregistry.net
|
||||
lc = _parseConf["LoadConf"].split("/", 1)
|
||||
|
||||
lcTLD = lc[0]
|
||||
lcWS = lc[1]
|
||||
|
||||
lcConf = {}
|
||||
|
||||
logging.debug("__init__: Loading configuration file of tld name %s"%(lcTLD))
|
||||
|
||||
exec(compile(open(os.path.join(self.tldPath, "%s"%(lcTLD))).read(), os.path.join(self.tldPath, "%s"%(lcTLD)), 'exec'), {}, lcConf)
|
||||
lcConf = lcConf.get("parse")
|
||||
|
||||
self.parseConf.update(lcConf.get(lcWS))
|
||||
|
||||
except:
|
||||
pass
|
||||
|
||||
self.parseConf.update(_parseConf)
|
||||
|
||||
except:
|
||||
self.parseConf = self.parseDefaultConf.get("default")
|
||||
|
||||
|
||||
logging.debug("__init__: self.parseConf = %s"%(self.parseConf))
|
||||
|
||||
def parse(self):
|
||||
result = {}
|
||||
for key in self.parseConf:
|
||||
matches = re.findall(self.parseConf[key], self.text, re.MULTILINE)
|
||||
if matches:
|
||||
logging.debug("run: regex matches found for key %s. %s"%(key, matches))
|
||||
result.update({key: [x.strip() for x in matches]})
|
||||
else:
|
||||
logging.debug("run: No match for %s"%(key))
|
||||
|
||||
return result
|
||||
|
||||
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user