add tests (#18)

* add tests

* add sentencepiece dependency
This commit is contained in:
Maciej Budyś
2022-11-03 21:01:36 +01:00
committed by GitHub
parent 71fe10621a
commit 6309289958
18 changed files with 93 additions and 0 deletions

View File

@@ -11,6 +11,7 @@ numpy
opencv-python
pandas
Pillow
pytest
scikit-image
scikit-learn
scipy

View File

@@ -26,6 +26,7 @@ setup(
"numpy",
"Pillow",
"pyperclip",
"sentencepiece",
"torch>=1.0",
"transformers>=4.12.5",
"unidic_lite",

0
tests/__init__.py Normal file
View File

View File

@@ -0,0 +1,50 @@
[
{
"filename": "00.jpg",
"result": "素直にあやまるしか"
},
{
"filename": "01.jpg",
"result": "立川で見た〝穴〟の下の巨大な眼は:"
},
{
"filename": "02.jpg",
"result": "実戦剣術も一流です"
},
{
"filename": "03.jpg",
"result": "第30話重苦しい闇の奥で静かに呼吸づきながら"
},
{
"filename": "04.jpg",
"result": "きのうハンパーヶとって、ゴメン!!!"
},
{
"filename": "05.jpg",
"result": "ぎゃっ"
},
{
"filename": "06.jpg",
"result": "ピンポーーン"
},
{
"filename": "07.jpg",
"result": "LINK!私達7人の力でガノンの塔の結界をやぶります"
},
{
"filename": "08.jpg",
"result": "ファイアパンチ"
},
{
"filename": "09.jpg",
"result": "少し黙っている"
},
{
"filename": "10.jpg",
"result": "わかるかな〜?"
},
{
"filename": "11.jpg",
"result": "警察にも先生にも町中の人達に!!"
}
]

BIN
tests/data/images/00.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 9.2 KiB

BIN
tests/data/images/01.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 34 KiB

BIN
tests/data/images/02.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 2.8 KiB

BIN
tests/data/images/03.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 18 KiB

BIN
tests/data/images/04.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 89 KiB

BIN
tests/data/images/05.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 3.8 KiB

BIN
tests/data/images/06.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 9.2 KiB

BIN
tests/data/images/07.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 15 KiB

BIN
tests/data/images/08.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 6.9 KiB

BIN
tests/data/images/09.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 6.2 KiB

BIN
tests/data/images/10.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 3.4 KiB

BIN
tests/data/images/11.jpg Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 15 KiB

View File

@@ -0,0 +1,25 @@
import json
from pathlib import Path
from tqdm import tqdm
from manga_ocr import MangaOcr
TEST_DATA_ROOT = Path(__file__).parent / 'data'
def generate_expected_results():
mocr = MangaOcr()
results = []
for path in tqdm(sorted((TEST_DATA_ROOT / 'images').iterdir())):
result = mocr(path)
results.append({'filename': path.name, 'result': result})
(TEST_DATA_ROOT / 'expected_results.json').write_text(json.dumps(results, ensure_ascii=False, indent=2),
encoding='utf-8')
if __name__ == '__main__':
generate_expected_results()

16
tests/test_ocr.py Normal file
View File

@@ -0,0 +1,16 @@
import json
from pathlib import Path
from manga_ocr import MangaOcr
TEST_DATA_ROOT = Path(__file__).parent / 'data'
def test_ocr():
mocr = MangaOcr()
expected_results = json.loads((TEST_DATA_ROOT / 'expected_results.json').read_text(encoding='utf-8'))
for item in expected_results:
result = mocr(TEST_DATA_ROOT / 'images' / item['filename'])
assert result == item['result']