# Patch summary
#   requirements.txt: pin the huridocs/pdf-tokens-type-labeler git dependency
#     to commit 14bf7aef39b40843305ff43d8fe04953be746956 instead of the default branch.
#   src/test_end_to_end.py: add four end-to-end tests that POST korean.pdf and
#     chinese.pdf to the service root URL and to its /fast endpoint, each
#     expecting HTTP 200.
# NOTE(review): the Python indentation below assumes the request and assertion
#   sit inside the `with open(...)` block (the stream must be open while it is
#   uploaded) - confirm against the target file before applying.
diff --git a/requirements.txt b/requirements.txt
index 7ee2c4a..9413282 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -9,5 +9,5 @@ opencv-python==4.9.0.80
 Shapely==2.0.4
 transformers==4.40.1
 pdf2image==1.17.0
-git+https://github.com/huridocs/pdf-tokens-type-labeler
+git+https://github.com/huridocs/pdf-tokens-type-labeler@14bf7aef39b40843305ff43d8fe04953be746956
 git+https://github.com/huridocs/pdf_paragraphs_extraction
\ No newline at end of file
diff --git a/src/test_end_to_end.py b/src/test_end_to_end.py
index 7feaabb..a568547 100644
--- a/src/test_end_to_end.py
+++ b/src/test_end_to_end.py
@@ -90,3 +90,35 @@ def test_regular_pdf_fast(self):
             results = requests.post(f"{self.service_url}/fast", files=files)
 
             self.assertEqual(200, results.status_code)
+
+    def test_korean(self):
+        with open(f"{ROOT_PATH}/test_pdfs/korean.pdf", "rb") as stream:
+            files = {"file": stream}
+
+            results = requests.post(f"{self.service_url}", files=files)
+
+            self.assertEqual(200, results.status_code)
+
+    def test_chinese(self):
+        with open(f"{ROOT_PATH}/test_pdfs/chinese.pdf", "rb") as stream:
+            files = {"file": stream}
+
+            results = requests.post(f"{self.service_url}", files=files)
+
+            self.assertEqual(200, results.status_code)
+
+    def test_korean_fast(self):
+        with open(f"{ROOT_PATH}/test_pdfs/korean.pdf", "rb") as stream:
+            files = {"file": stream}
+
+            results = requests.post(f"{self.service_url}/fast", files=files)
+
+            self.assertEqual(200, results.status_code)
+
+    def test_chinese_fast(self):
+        with open(f"{ROOT_PATH}/test_pdfs/chinese.pdf", "rb") as stream:
+            files = {"file": stream}
+
+            results = requests.post(f"{self.service_url}/fast", files=files)
+
+            self.assertEqual(200, results.status_code)