mirror of
https://github.com/adulau/DomainClassifier.git
synced 2024-11-22 18:07:07 +00:00
Update README to match new DomainClassifier
This commit is contained in:
parent
9f4ae469d9
commit
b5bfadb368
1 changed file with 24 additions and 0 deletions
24
README.md
24
README.md
|
@@ -4,11 +4,35 @@ DomainClassifier
|
||||||
DomainClassifier is a simple Python library to extract and classify Internet
|
DomainClassifier is a simple Python library to extract and classify Internet
|
||||||
domains from raw text files according to their existence, localization or attributes.
|
domains from raw text files according to their existence, localization or attributes.
|
||||||
|
|
||||||
|
How To Use It
|
||||||
|
-------------
|
||||||
|
|
||||||
|
```python
|
||||||
|
import domainclassifier
|
||||||
|
|
||||||
|
c = domainclassifier.Extract( rawtext = "this is a text with a domain called test@foo.lu another test abc.lu something a.b.c.d.e end of 1.2.3.4 foo.be www.belnet.be http://www.cert.be/ www.public.lu www.allo.lu quuxtest www.eurodns.com something-broken-www.google.com www.google.lu trailing test")
|
||||||
|
|
||||||
|
# extracting potentially valid domains from rawtext
|
||||||
|
print c.domain()
|
||||||
|
|
||||||
|
# reduce set of potentially valid domains to existing domains
|
||||||
|
# (based on SOA,A,AAAA,CNAME,MX records)
|
||||||
|
print c.validdomain(extended=True)
|
||||||
|
|
||||||
|
# reduce the set of valid domains to those with DNS records associated with a
|
||||||
|
# specified country
|
||||||
|
print "US:"
|
||||||
|
print c.localizedomain(cc='US')
|
||||||
|
print "LU:"
|
||||||
|
print c.localizedomain(cc='LU')
|
||||||
|
print "BE:"
|
||||||
|
print c.localizedomain(cc='BE')
|
||||||
|
```
|
||||||
### Software Required
|
### Software Required
|
||||||
|
|
||||||
* Python (tested successfully on version 2.6)
|
* Python (tested successfully on version 2.6)
|
||||||
* dnspython library - http://www.dnspython.org/
|
* dnspython library - http://www.dnspython.org/
|
||||||
|
* IPy library
|
||||||
|
|
||||||
### License
|
### License
|
||||||
|
|
||||||
|
|
Loading…
Reference in a new issue