moto/tests/test_textract/test_textract.py

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

86 lines
2.9 KiB
Python
Raw Normal View History

2022-02-17 19:00:48 +00:00
"""Unit tests for textract-supported APIs."""
2022-02-21 15:13:36 +00:00
from random import randint
from botocore.exceptions import ClientError, ParamValidationError
import pytest
2022-02-17 19:00:48 +00:00
import boto3
2022-02-21 17:56:50 +00:00
from unittest import SkipTest
2022-02-21 15:13:36 +00:00
from moto.textract.models import TextractBackend
2022-02-21 17:56:50 +00:00
from moto import settings, mock_textract
2022-02-17 19:00:48 +00:00
# See our Development Tips on writing tests for hints on how to write good tests:
# http://docs.getmoto.org/en/latest/docs/contributing/development_tips/tests.html
2022-02-21 15:13:36 +00:00
@mock_textract
def test_get_document_text_detection():
2022-02-21 17:56:50 +00:00
if settings.TEST_SERVER_MODE:
raise SkipTest("Cannot set textract backend values in server mode")
2022-02-21 15:13:36 +00:00
TextractBackend.JOB_STATUS = "SUCCEEDED"
TextractBackend.PAGES = randint(5, 500)
TextractBackend.BLOCKS = [
{
"Text": "This is a test",
"Id": "0",
"Confidence": "100",
"Geometry": {
"BoundingBox": {
"Width": "0.5",
"Height": "0.5",
"Left": "0.5",
"Top": "0.5",
},
},
}
]
client = boto3.client("textract", region_name="us-east-1")
job = client.start_document_text_detection(
DocumentLocation={"S3Object": {"Bucket": "bucket", "Name": "name"}}
)
2022-02-17 19:00:48 +00:00
2022-02-21 15:13:36 +00:00
resp = client.get_document_text_detection(JobId=job["JobId"])
2022-02-17 19:00:48 +00:00
2022-02-21 15:13:36 +00:00
resp["Blocks"][0]["Text"].should.equal("This is a test")
resp["Blocks"][0]["Id"].should.equal("0")
resp["Blocks"][0]["Confidence"].should.equal("100")
resp["Blocks"][0]["Geometry"]["BoundingBox"]["Width"].should.equal("0.5")
resp["Blocks"][0]["Geometry"]["BoundingBox"]["Height"].should.equal("0.5")
resp["Blocks"][0]["Geometry"]["BoundingBox"]["Left"].should.equal("0.5")
resp["Blocks"][0]["Geometry"]["BoundingBox"]["Top"].should.equal("0.5")
resp["JobStatus"].should.equal("SUCCEEDED")
resp["DocumentMetadata"]["Pages"].should.equal(TextractBackend.PAGES)
2022-02-17 19:00:48 +00:00
@mock_textract
def test_start_document_text_detection():
2022-02-17 19:31:40 +00:00
client = boto3.client("textract", region_name="us-east-1")
2022-02-17 19:00:48 +00:00
resp = client.start_document_text_detection(
2022-02-21 15:13:36 +00:00
DocumentLocation={"S3Object": {"Bucket": "bucket", "Name": "name"}}
2022-02-17 19:00:48 +00:00
)
resp.should.have.key("JobId")
2022-02-21 15:13:36 +00:00
@mock_textract
def test_get_document_text_detection_without_job_id():
client = boto3.client("textract", region_name="us-east-1")
with pytest.raises(ClientError) as e:
client.get_document_text_detection(JobId="Invalid Job Id")
e.value.response["Error"]["Code"].should.equal("InvalidJobIdException")
@mock_textract
def test_get_document_text_detection_without_document_location():
client = boto3.client("textract", region_name="us-east-1")
with pytest.raises(ParamValidationError) as e:
client.start_document_text_detection()
assert e.typename == "ParamValidationError"
assert (
'Parameter validation failed:\nMissing required parameter in input: "DocumentLocation"'
in e.value.args
)