From f7a360a0609f2274deca3e52e4bb775b7be628f0 Mon Sep 17 00:00:00 2001
From: PyYoshi <myoshi321go@gmail.com>
Date: Mon, 17 Oct 2016 11:21:12 +0900
Subject: [PATCH] simplify tests

---
 test/tests.py | 566 +++++++-------------------------------------------
 1 file changed, 75 insertions(+), 491 deletions(-)

diff --git a/test/tests.py b/test/tests.py
index ed79481..7eca088 100644
--- a/test/tests.py
+++ b/test/tests.py
@@ -5,428 +5,84 @@ from nose.tools import eq_
 
 import cchardet
 
+encodings_map = {  # sample file path (relative to the test working dir) -> encoding the tests expect cchardet to report
+    r'testdata/bg/ISO-8859-5/wikitop_bg_ISO-8859-5.txt': 'ISO-8859-5',
+    r'testdata/bg/UTF-8/wikitop_bg_UTF-8.txt': 'UTF-8',
+    r'testdata/bg/WINDOWS-1251/wikitop_bg_WINDOWS-1251.txt': 'WINDOWS-1251',
+    r'testdata/cz/ISO-8859-2/wikitop_cz_ISO-8859-2.txt': 'ISO-8859-2',
+    r'testdata/cz/UTF-8/wikitop_cz_UTF-8.txt': 'UTF-8',
+    r'testdata/de/UTF-8/wikitop_de_UTF-8.txt': 'UTF-8',
+    r'testdata/de/WINDOWS-1252/wikitop_de_WINDOWS-1252.txt': 'WINDOWS-1252',
+    r'testdata/dk/UTF-8/wikitop_dk_UTF-8.txt': 'UTF-8',
+    r'testdata/dk/WINDOWS-1252/wikitop_dk_WINDOWS-1252.txt': 'WINDOWS-1252',
+    r'testdata/el/ISO-8859-7/wikitop_el_ISO-8859-7.txt': 'ISO-8859-7',
+    r'testdata/el/UTF-8/wikitop_el_UTF-8.txt': 'UTF-8',
+    r'testdata/en/UTF-8/wikitop_en_UTF-8.txt': 'UTF-8',
+    r'testdata/en/WINDOWS-1252/wikitop_en_WINDOWS-1252.txt': 'WINDOWS-1252',
+    r'testdata/es/UTF-8/wikitop_es_UTF-8.txt': 'UTF-8',
+    r'testdata/es/WINDOWS-1252/wikitop_es_WINDOWS-1252.txt': 'WINDOWS-1252',
+    r'testdata/fi/UTF-8/wikitop_fi_UTF-8.txt': 'UTF-8',
+    r'testdata/fi/WINDOWS-1252/wikitop_fi_WINDOWS-1252.txt': 'WINDOWS-1252',
+    r'testdata/fr/UTF-8/wikitop_fr_UTF-8.txt': 'UTF-8',
+    r'testdata/fr/WINDOWS-1252/wikitop_fr_WINDOWS-1252.txt': 'WINDOWS-1252',
+    r'testdata/he/UTF-8/wikitop_he_UTF-8.txt': 'UTF-8',
+    r'testdata/he/WINDOWS-1255/wikitop_he_WINDOWS-1255.txt': 'WINDOWS-1255',
+    r'testdata/hu/UTF-8/wikitop_hu_UTF-8.txt': 'UTF-8',
+    r'testdata/hu/ISO-8859-2/wikitop_hu_ISO-8859-2.txt': 'ISO-8859-2',
+    r'testdata/it/UTF-8/wikitop_it_UTF-8.txt': 'UTF-8',
+    r'testdata/it/WINDOWS-1252/wikitop_it_WINDOWS-1252.txt': 'WINDOWS-1252',
+    r'testdata/nl/UTF-8/wikitop_nl_UTF-8.txt': 'UTF-8',
+    r'testdata/nl/WINDOWS-1252/wikitop_nl_WINDOWS-1252.txt': 'WINDOWS-1252',
+    r'testdata/no/UTF-8/wikitop_no_UTF-8.txt': 'UTF-8',
+    r'testdata/no/WINDOWS-1252/wikitop_no_WINDOWS-1252.txt': 'WINDOWS-1252',
+    r'testdata/pl/UTF-8/wikitop_pl_UTF-8.txt': 'UTF-8',
+    r'testdata/pl/ISO-8859-2/wikitop_pl_ISO-8859-2.txt': 'ISO-8859-2',
+    r'testdata/pt/UTF-8/wikitop_pt_UTF-8.txt': 'UTF-8',
+    r'testdata/pt/WINDOWS-1252/wikitop_pt_WINDOWS-1252.txt': 'WINDOWS-1252',
+    r'testdata/ru/UTF-8/wikitop_ru_UTF-8.txt': 'UTF-8',
+    r'testdata/ru/WINDOWS-1251/wikitop_ru_WINDOWS-1251.txt': 'WINDOWS-1251',
+    r'testdata/ru/IBM855/wikitop_ru_IBM855.txt': 'IBM855',
+    r'testdata/ru/KOI8-R/wikitop_ru_KOI8-R.txt': 'KOI8-R',
+    r'testdata/ru/X-MAC-CYRILLIC/wikitop_ru_MACCYRILLIC.txt': 'MAC-CYRILLIC',
+    r'testdata/se/UTF-8/wikitop_se_UTF-8.txt': 'UTF-8',
+    r'testdata/se/WINDOWS-1252/wikitop_se_WINDOWS-1252.txt': 'WINDOWS-1252',
+    r'testdata/th/UTF-8/wikitop_th_UTF-8.txt': 'UTF-8',
+    r'testdata/th/TIS-620/utffool_th_TIS-620.txt': 'TIS-620',
+    r'testdata/th/TIS-620/wikitop_th_TIS-620.txt': 'TIS-620',
+    r'testdata/tr/UTF-8/wikitop_tr_UTF-8.txt': 'UTF-8',
+    r'testdata/tr/ISO-8859-9/wikitop_tr_ISO-8859-9.txt': 'ISO-8859-9',
+    r'testdata/zh/UTF-8/wikitop_zh_UTF-8.txt': 'UTF-8',
+    r'testdata/zh/GB18030/wikitop_zh_GB18030.txt': 'GB18030',
+}
 
-class TestCchardet():
-    def test_detect_bg_iso88595(self):
-        encoding = "ISO-8859-5"
-        path = r"testdata/bg/ISO-8859-5/wikitop_bg_ISO-8859-5.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
 
-    def test_detect_bg_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/bg/UTF-8/wikitop_bg_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
+class TestCChardet():
+    def test_detect(self):
+        """One-shot cchardet.detect() must report the expected encoding for every sample file."""
+        for sample_path, expected in encodings_map.items():
+            with open(sample_path, 'rb') as sample:
+                guess = cchardet.detect(sample.read())
+            eq_(expected.lower(), guess['encoding'].lower(), 'Invalid encoding: %s' % sample_path)
 
-    def test_detect_bg_windows1251(self):
-        encoding = "WINDOWS-1251"
-        path = r"testdata/bg/WINDOWS-1251/wikitop_bg_WINDOWS-1251.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
+    def test_detector(self):
+        """Feed each sample line by line; the incremental result must match the expected encoding."""
+        for sample_path, expected in encodings_map.items():
+            detector = cchardet.Detector()
+            with open(sample_path, 'rb') as sample:
+                # Iterating a binary file yields the same lines as repeated readline() calls.
+                for chunk in sample:
+                    detector.feed(chunk)
+                    # Stop feeding as soon as the detector reports it is done.
+                    if detector.done:
+                        break
+            detector.close()
+            eq_(expected.lower(), detector.result['encoding'].lower(), 'Invalid encoding: %s' % sample_path)
 
-    def test_detect_cz_iso88592(self):
-        encoding = "ISO-8859-2"
-        path = r"testdata/cz/ISO-8859-2/wikitop_cz_ISO-8859-2.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_cz_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/cz/UTF-8/wikitop_cz_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_de_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/de/UTF-8/wikitop_de_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_de_windows1252(self):
-        encoding = "WINDOWS-1252"
-        path = r"testdata/de/WINDOWS-1252/wikitop_de_WINDOWS-1252.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_dk_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/dk/UTF-8/wikitop_dk_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_dk_windows1252(self):
-        encoding = "WINDOWS-1252"
-        path = r"testdata/dk/WINDOWS-1252/wikitop_dk_WINDOWS-1252.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_el_iso88597(self):
-        encoding = "ISO-8859-7"
-        path = r"testdata/el/ISO-8859-7/wikitop_el_ISO-8859-7.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_el_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/el/UTF-8/wikitop_el_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_en_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/en/UTF-8/wikitop_en_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_en_windows1252(self):
-        encoding = "WINDOWS-1252"
-        path = r"testdata/en/WINDOWS-1252/wikitop_en_WINDOWS-1252.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_es_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/es/UTF-8/wikitop_es_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_es_windows1252(self):
-        encoding = "WINDOWS-1252"
-        path = r"testdata/es/WINDOWS-1252/wikitop_es_WINDOWS-1252.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_fi_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/fi/UTF-8/wikitop_fi_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_fi_windows1252(self):
-        encoding = "WINDOWS-1252"
-        path = r"testdata/fi/WINDOWS-1252/wikitop_fi_WINDOWS-1252.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_fr_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/fr/UTF-8/wikitop_fr_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_fr_windows1252(self):
-        encoding = "WINDOWS-1252"
-        path = r"testdata/fr/WINDOWS-1252/wikitop_fr_WINDOWS-1252.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_he_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/he/UTF-8/wikitop_he_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_he_windows1255(self):
-        encoding = "WINDOWS-1255"
-        path = r"testdata/he/WINDOWS-1255/wikitop_he_WINDOWS-1255.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_hu_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/hu/UTF-8/wikitop_hu_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_hu_iso55892(self):
-        encoding = "ISO-8859-2"
-        path = r"testdata/hu/ISO-8859-2/wikitop_hu_ISO-8859-2.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_it_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/it/UTF-8/wikitop_it_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_it_windows1252(self):
-        encoding = "WINDOWS-1252"
-        path = r"testdata/it/WINDOWS-1252/wikitop_it_WINDOWS-1252.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_nl_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/nl/UTF-8/wikitop_nl_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_nl_windows1252(self):
-        encoding = "WINDOWS-1252"
-        path = r"testdata/nl/WINDOWS-1252/wikitop_nl_WINDOWS-1252.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_no_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/no/UTF-8/wikitop_no_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_no_windows1252(self):
-        encoding = "WINDOWS-1252"
-        path = r"testdata/no/WINDOWS-1252/wikitop_no_WINDOWS-1252.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_pl_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/pl/UTF-8/wikitop_pl_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_pl_iso88592(self):
-        encoding = "ISO-8859-2"
-        path = r"testdata/pl/ISO-8859-2/wikitop_pl_ISO-8859-2.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_pt_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/pt/UTF-8/wikitop_pt_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_pt_windows1252(self):
-        encoding = "WINDOWS-1252"
-        path = r"testdata/pt/WINDOWS-1252/wikitop_pt_WINDOWS-1252.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_ru_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/ru/UTF-8/wikitop_ru_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_ru_windows1251(self):
-        encoding = "WINDOWS-1251"
-        path = r"testdata/ru/WINDOWS-1251/wikitop_ru_WINDOWS-1251.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_ru_ibm855(self):
-        encoding = "IBM855"
-        path = r"testdata/ru/IBM855/wikitop_ru_IBM855.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_ru_koi8r(self):
-        encoding = "KOI8-R"
-        path = r"testdata/ru/KOI8-R/wikitop_ru_KOI8-R.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_ru_maccyrillic(self):
-        encoding = "MAC-CYRILLIC"
-        path = r"testdata/ru/X-MAC-CYRILLIC/wikitop_ru_MACCYRILLIC.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_se_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/se/UTF-8/wikitop_se_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_se_windows1252(self):
-        encoding = "WINDOWS-1252"
-        path = r"testdata/se/WINDOWS-1252/wikitop_se_WINDOWS-1252.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_th_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/th/UTF-8/wikitop_th_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_th_tis620_1(self):
-        encoding = "TIS-620"
-        path = r"testdata/th/TIS-620/utffool_th_TIS-620.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_th_tis620_2(self):
-        encoding = "TIS-620"
-        path = r"testdata/th/TIS-620/wikitop_th_TIS-620.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_tr_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/tr/UTF-8/wikitop_tr_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_tr_iso88599(self):
-        encoding = "ISO-8859-9"
-        path = r"testdata/tr/ISO-8859-9/wikitop_tr_ISO-8859-9.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_zh_utf8(self):
-        encoding = "UTF-8"
-        path = r"testdata/zh/UTF-8/wikitop_zh_UTF-8.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        print(detected_encoding)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detect_zh_gb18030(self):
-        encoding = "GB18030"
-        path = r"testdata/zh/GB18030/wikitop_zh_GB18030.txt"
-        with open(path, 'rb') as f:
-            msg = f.read()
-        detected_encoding = cchardet.detect(msg)
-        eq_(encoding.lower(), detected_encoding['encoding'].lower())
+    def test_detector_noresult(self):  # a detector fed a single '0' must not report any encoding
+        detector = cchardet.Detector()
+        detector.feed('0')  # one character only; close() is deliberately not called here
+        eq_(detector.done, False)  # detection must not be flagged as finished
+        eq_(detector.result, {'encoding': None, 'confidence': None})  # both result fields stay None
 
 
 class TestCchardetSpeed():
@@ -438,7 +94,7 @@ class TestCchardetSpeed():
             has_chardet = False
         import time
         do_times = 5
-        path = r"testdata/wikipediaJa_One_Thousand_and_One_Nights_SJIS.txt"
+        path = r'testdata/wikipediaJa_One_Thousand_and_One_Nights_SJIS.txt'
         with open(path, 'rb') as f:
             msg = f.read()
         # Test chardet
@@ -456,75 +112,3 @@ class TestCchardetSpeed():
             cchardet.detect(msg)
             result_cchardet += (time.time() - start_cchardet)
         print('cchardet:', 1 / (result_cchardet / do_times), 'call(s)/s')
-
-
-class TestDetector():
-    encodings_map = {
-        r"testdata/bg/ISO-8859-5/wikitop_bg_ISO-8859-5.txt": "ISO-8859-5",
-        r"testdata/bg/UTF-8/wikitop_bg_UTF-8.txt": "UTF-8",
-        r"testdata/bg/WINDOWS-1251/wikitop_bg_WINDOWS-1251.txt": "WINDOWS-1251",
-        r"testdata/cz/ISO-8859-2/wikitop_cz_ISO-8859-2.txt": "ISO-8859-2",
-        r"testdata/cz/UTF-8/wikitop_cz_UTF-8.txt": "UTF-8",
-        r"testdata/de/UTF-8/wikitop_de_UTF-8.txt": "UTF-8",
-        r"testdata/de/WINDOWS-1252/wikitop_de_WINDOWS-1252.txt": "WINDOWS-1252",
-        r"testdata/dk/UTF-8/wikitop_dk_UTF-8.txt": "UTF-8",
-        r"testdata/dk/WINDOWS-1252/wikitop_dk_WINDOWS-1252.txt": "WINDOWS-1252",
-        r"testdata/el/ISO-8859-7/wikitop_el_ISO-8859-7.txt": "ISO-8859-7",
-        r"testdata/el/UTF-8/wikitop_el_UTF-8.txt": "UTF-8",
-        r"testdata/en/UTF-8/wikitop_en_UTF-8.txt": "UTF-8",
-        r"testdata/en/WINDOWS-1252/wikitop_en_WINDOWS-1252.txt": "WINDOWS-1252",
-        r"testdata/es/UTF-8/wikitop_es_UTF-8.txt": "UTF-8",
-        r"testdata/es/WINDOWS-1252/wikitop_es_WINDOWS-1252.txt": "WINDOWS-1252",
-        r"testdata/fi/UTF-8/wikitop_fi_UTF-8.txt": "UTF-8",
-        r"testdata/fi/WINDOWS-1252/wikitop_fi_WINDOWS-1252.txt": "WINDOWS-1252",
-        r"testdata/fr/UTF-8/wikitop_fr_UTF-8.txt": "UTF-8",
-        r"testdata/fr/WINDOWS-1252/wikitop_fr_WINDOWS-1252.txt": "WINDOWS-1252",
-        r"testdata/he/UTF-8/wikitop_he_UTF-8.txt": "UTF-8",
-        r"testdata/he/WINDOWS-1255/wikitop_he_WINDOWS-1255.txt": "WINDOWS-1255",
-        r"testdata/hu/UTF-8/wikitop_hu_UTF-8.txt": "UTF-8",
-        r"testdata/hu/ISO-8859-2/wikitop_hu_ISO-8859-2.txt": "ISO-8859-2",
-        r"testdata/it/UTF-8/wikitop_it_UTF-8.txt": "UTF-8",
-        r"testdata/it/WINDOWS-1252/wikitop_it_WINDOWS-1252.txt": "WINDOWS-1252",
-        r"testdata/nl/UTF-8/wikitop_nl_UTF-8.txt": "UTF-8",
-        r"testdata/nl/WINDOWS-1252/wikitop_nl_WINDOWS-1252.txt": "WINDOWS-1252",
-        r"testdata/no/UTF-8/wikitop_no_UTF-8.txt": "UTF-8",
-        r"testdata/no/WINDOWS-1252/wikitop_no_WINDOWS-1252.txt": "WINDOWS-1252",
-        r"testdata/pl/UTF-8/wikitop_pl_UTF-8.txt": "UTF-8",
-        r"testdata/pl/ISO-8859-2/wikitop_pl_ISO-8859-2.txt": "ISO-8859-2",
-        r"testdata/pt/UTF-8/wikitop_pt_UTF-8.txt": "UTF-8",
-        r"testdata/pt/WINDOWS-1252/wikitop_pt_WINDOWS-1252.txt": "WINDOWS-1252",
-        r"testdata/ru/UTF-8/wikitop_ru_UTF-8.txt": "UTF-8",
-        r"testdata/ru/WINDOWS-1251/wikitop_ru_WINDOWS-1251.txt": "WINDOWS-1251",
-        r"testdata/ru/IBM855/wikitop_ru_IBM855.txt": "IBM855",
-        r"testdata/ru/KOI8-R/wikitop_ru_KOI8-R.txt": "KOI8-R",
-        r"testdata/ru/X-MAC-CYRILLIC/wikitop_ru_MACCYRILLIC.txt": "MAC-CYRILLIC",
-        r"testdata/se/UTF-8/wikitop_se_UTF-8.txt": "UTF-8",
-        r"testdata/se/WINDOWS-1252/wikitop_se_WINDOWS-1252.txt": "WINDOWS-1252",
-        r"testdata/th/UTF-8/wikitop_th_UTF-8.txt": "UTF-8",
-        r"testdata/th/TIS-620/utffool_th_TIS-620.txt": "TIS-620",
-        r"testdata/th/TIS-620/wikitop_th_TIS-620.txt": "TIS-620",
-        r"testdata/tr/UTF-8/wikitop_tr_UTF-8.txt": "UTF-8",
-        r"testdata/tr/ISO-8859-9/wikitop_tr_ISO-8859-9.txt": "ISO-8859-9",
-        r"testdata/zh/UTF-8/wikitop_zh_UTF-8.txt": "UTF-8",
-        r"testdata/zh/GB18030/wikitop_zh_GB18030.txt": "GB18030",
-    }
-
-    def test_detector(self):
-        for path, encoding in self.encodings_map.items():
-            detector = cchardet.Detector()
-            with open(path, 'rb') as f:
-                line = f.readline()
-                while line:
-                    detector.feed(line)
-                    if detector.done:
-                        break
-                    line = f.readline()
-            detector.close()
-            detected_encoding = detector.result
-            eq_(encoding.lower(), detected_encoding['encoding'].lower())
-
-    def test_detector_noresult(self):
-        detector = cchardet.Detector()
-        detector.feed('0')
-        eq_(detector.done, False)
-        eq_(detector.result, {"encoding": None, "confidence": None})