| author | Evgeni Kunev <evgeni.kunev@gmail.com> |
| Fri, 15 Aug 2014 17:11:52 +0300 | |
| changeset 35 | 0de2468a27e8 |
| child 70 | 1fe2c20adeba |
| permissions | -rw-r--r-- |
|
35
0de2468a27e8
Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff
changeset
|
1 |
# coding=utf-8 |
|
0de2468a27e8
Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff
changeset
|
2 |
|
|
0de2468a27e8
Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff
changeset
|
3 |
import unittest |
|
0de2468a27e8
Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff
changeset
|
4 |
from whois import extract_domain |
|
0de2468a27e8
Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff
changeset
|
5 |
|
|
0de2468a27e8
Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff
changeset
|
6 |
|
|
0de2468a27e8
Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff
changeset
|
7 |
class TestExtractDomain(unittest.TestCase):
    """Exercise extract_domain on ASCII and non-ASCII (Cyrillic) inputs."""

    def _assert_domain(self, expected, url):
        """Assert that extract_domain(url) equals the expected domain."""
        self.assertEqual(expected, extract_domain(url))

    def test_simple_ascii_domain(self):
        # A bare domain with no scheme or path is expected back unchanged.
        bare = 'google.com'
        self._assert_domain(bare, bare)

    def test_ascii_with_schema_path_and_query(self):
        # Scheme, "www." prefix, path and query string are all expected to
        # be dropped from the result.
        self._assert_domain(
            'google.com',
            'https://www.google.com/search?q=why+is+domain+whois+such+a+mess',
        )

    def test_simple_unicode_domain(self):
        # Non-ASCII label under an ASCII TLD.
        self._assert_domain('нарояци.com', 'http://нарояци.com/')

    def test_unicode_domain_and_tld(self):
        # Both the label and the TLD are non-ASCII.
        self._assert_domain('россия.рф', 'http://россия.рф/')