test/test_main.py
author Evgeni Kunev <evgeni.kunev@gmail.com>
Fri, 15 Aug 2014 17:11:52 +0300
changeset 35 0de2468a27e8
child 70 1fe2c20adeba
permissions -rw-r--r--
Fix extract_domain to work with unicode domains
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
35
0de2468a27e8 Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff changeset
     1
# coding=utf-8
0de2468a27e8 Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff changeset
     2
0de2468a27e8 Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff changeset
     3
import unittest
0de2468a27e8 Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff changeset
     4
from whois import extract_domain
0de2468a27e8 Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff changeset
     5
0de2468a27e8 Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff changeset
     6
0de2468a27e8 Fix extract_domain to work with unicode domains
Evgeni Kunev <evgeni.kunev@gmail.com>
parents:
diff changeset
     7
class TestExtractDomain(unittest.TestCase):
    """Checks of ``extract_domain`` against ASCII and non-ASCII inputs.

    Every test passes an address to ``extract_domain`` and compares the
    result with the domain string expected for that address.
    """

    def test_simple_ascii_domain(self):
        # A bare domain is expected to come back unchanged.
        address = 'google.com'
        self.assertEqual(address, extract_domain(address))

    def test_ascii_with_schema_path_and_query(self):
        # Scheme, "www." prefix, path and query string are all expected
        # to be absent from the result.
        address = (
            'https://www.google.com/search?q=why+is+domain+whois+such+a+mess'
        )
        expected = 'google.com'
        self.assertEqual(expected, extract_domain(address))

    def test_simple_unicode_domain(self):
        # Non-ASCII label combined with an ASCII top-level domain.
        address = 'http://нарояци.com/'
        expected = 'нарояци.com'
        self.assertEqual(expected, extract_domain(address))

    def test_unicode_domain_and_tld(self):
        # Both the label and the top-level domain are non-ASCII.
        address = 'http://россия.рф/'
        expected = 'россия.рф'
        self.assertEqual(expected, extract_domain(address))