2022-02-17 19:00:48 +00:00
|
|
|
"""Unit tests for textract-supported APIs."""
|
2022-02-21 15:13:36 +00:00
|
|
|
from random import randint
|
|
|
|
from botocore.exceptions import ClientError, ParamValidationError
|
|
|
|
import pytest
|
2022-02-17 19:00:48 +00:00
|
|
|
import boto3
|
|
|
|
|
2022-02-21 17:56:50 +00:00
|
|
|
from unittest import SkipTest
|
2022-02-21 15:13:36 +00:00
|
|
|
from moto.textract.models import TextractBackend
|
2022-02-21 17:56:50 +00:00
|
|
|
from moto import settings, mock_textract
|
2022-02-17 19:00:48 +00:00
|
|
|
|
|
|
|
# See our Development Tips on writing tests for hints on how to write good tests:
|
|
|
|
# http://docs.getmoto.org/en/latest/docs/contributing/development_tips/tests.html
|
|
|
|
|
|
|
|
|
2022-02-21 15:13:36 +00:00
|
|
|
@mock_textract
|
|
|
|
def test_get_document_text_detection():
|
2022-02-21 17:56:50 +00:00
|
|
|
if settings.TEST_SERVER_MODE:
|
|
|
|
raise SkipTest("Cannot set textract backend values in server mode")
|
|
|
|
|
2022-02-21 15:13:36 +00:00
|
|
|
TextractBackend.JOB_STATUS = "SUCCEEDED"
|
|
|
|
TextractBackend.PAGES = randint(5, 500)
|
|
|
|
TextractBackend.BLOCKS = [
|
|
|
|
{
|
|
|
|
"Text": "This is a test",
|
|
|
|
"Id": "0",
|
|
|
|
"Confidence": "100",
|
|
|
|
"Geometry": {
|
|
|
|
"BoundingBox": {
|
|
|
|
"Width": "0.5",
|
|
|
|
"Height": "0.5",
|
|
|
|
"Left": "0.5",
|
|
|
|
"Top": "0.5",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
]
|
|
|
|
|
|
|
|
client = boto3.client("textract", region_name="us-east-1")
|
|
|
|
job = client.start_document_text_detection(
|
|
|
|
DocumentLocation={"S3Object": {"Bucket": "bucket", "Name": "name"}}
|
|
|
|
)
|
2022-02-17 19:00:48 +00:00
|
|
|
|
2022-02-21 15:13:36 +00:00
|
|
|
resp = client.get_document_text_detection(JobId=job["JobId"])
|
2022-02-17 19:00:48 +00:00
|
|
|
|
2022-02-21 15:13:36 +00:00
|
|
|
resp["Blocks"][0]["Text"].should.equal("This is a test")
|
|
|
|
resp["Blocks"][0]["Id"].should.equal("0")
|
|
|
|
resp["Blocks"][0]["Confidence"].should.equal("100")
|
|
|
|
resp["Blocks"][0]["Geometry"]["BoundingBox"]["Width"].should.equal("0.5")
|
|
|
|
resp["Blocks"][0]["Geometry"]["BoundingBox"]["Height"].should.equal("0.5")
|
|
|
|
resp["Blocks"][0]["Geometry"]["BoundingBox"]["Left"].should.equal("0.5")
|
|
|
|
resp["Blocks"][0]["Geometry"]["BoundingBox"]["Top"].should.equal("0.5")
|
|
|
|
resp["JobStatus"].should.equal("SUCCEEDED")
|
|
|
|
resp["DocumentMetadata"]["Pages"].should.equal(TextractBackend.PAGES)
|
2022-02-17 19:00:48 +00:00
|
|
|
|
|
|
|
|
|
|
|
@mock_textract
|
|
|
|
def test_start_document_text_detection():
|
2022-02-17 19:31:40 +00:00
|
|
|
client = boto3.client("textract", region_name="us-east-1")
|
2022-02-17 19:00:48 +00:00
|
|
|
resp = client.start_document_text_detection(
|
2022-02-21 15:13:36 +00:00
|
|
|
DocumentLocation={"S3Object": {"Bucket": "bucket", "Name": "name"}}
|
2022-02-17 19:00:48 +00:00
|
|
|
)
|
|
|
|
|
2022-02-18 19:49:54 +00:00
|
|
|
resp.should.have.key("JobId")
|
2022-02-21 15:13:36 +00:00
|
|
|
|
|
|
|
|
|
|
|
@mock_textract
|
|
|
|
def test_get_document_text_detection_without_job_id():
|
|
|
|
client = boto3.client("textract", region_name="us-east-1")
|
|
|
|
with pytest.raises(ClientError) as e:
|
|
|
|
client.get_document_text_detection(JobId="Invalid Job Id")
|
|
|
|
|
|
|
|
e.value.response["Error"]["Code"].should.equal("InvalidJobIdException")
|
|
|
|
|
|
|
|
|
|
|
|
@mock_textract
|
|
|
|
def test_get_document_text_detection_without_document_location():
|
|
|
|
client = boto3.client("textract", region_name="us-east-1")
|
|
|
|
with pytest.raises(ParamValidationError) as e:
|
|
|
|
client.start_document_text_detection()
|
|
|
|
|
|
|
|
assert e.typename == "ParamValidationError"
|
|
|
|
assert (
|
|
|
|
'Parameter validation failed:\nMissing required parameter in input: "DocumentLocation"'
|
|
|
|
in e.value.args
|
|
|
|
)
|