# -*- coding: utf-8 -*- from __future__ import unicode_literals import boto3 import sure # noqa from moto import mock_transcribe @mock_transcribe def test_run_medical_transcription_job_minimal_params(): region_name = "us-east-1" client = boto3.client("transcribe", region_name=region_name) job_name = "MyJob" args = { "MedicalTranscriptionJobName": job_name, "LanguageCode": "en-US", "Media": {"MediaFileUri": "s3://my-bucket/my-media-file.wav",}, "OutputBucketName": "my-output-bucket", "Specialty": "PRIMARYCARE", "Type": "CONVERSATION", } resp = client.start_medical_transcription_job(**args) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) # CREATED resp = client.get_medical_transcription_job(MedicalTranscriptionJobName=job_name) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) transcription_job = resp["MedicalTranscriptionJob"] transcription_job["MedicalTranscriptionJobName"].should.equal( args["MedicalTranscriptionJobName"] ) transcription_job["TranscriptionJobStatus"].should.equal("QUEUED") transcription_job["LanguageCode"].should.equal(args["LanguageCode"]) transcription_job["Media"].should.equal(args["Media"]) transcription_job.should.contain("CreationTime") transcription_job.doesnt.contain("StartTime") transcription_job.doesnt.contain("CompletionTime") transcription_job.doesnt.contain("Transcript") transcription_job["Settings"]["ChannelIdentification"].should.equal(False) transcription_job["Settings"]["ShowAlternatives"].should.equal(False) transcription_job["Specialty"].should.equal(args["Specialty"]) transcription_job["Type"].should.equal(args["Type"]) # IN_PROGRESS resp = client.get_medical_transcription_job(MedicalTranscriptionJobName=job_name) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) transcription_job = resp["MedicalTranscriptionJob"] transcription_job["TranscriptionJobStatus"].should.equal("IN_PROGRESS") transcription_job["MediaFormat"].should.equal("wav") transcription_job.should.contain("StartTime") transcription_job.doesnt.contain("CompletionTime") transcription_job.doesnt.contain("Transcript") transcription_job["MediaSampleRateHertz"].should.equal(44100) # COMPLETED resp = client.get_medical_transcription_job(MedicalTranscriptionJobName=job_name) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) transcription_job = resp["MedicalTranscriptionJob"] transcription_job["TranscriptionJobStatus"].should.equal("COMPLETED") transcription_job.should.contain("CompletionTime") transcription_job["Transcript"].should.equal( { "TranscriptFileUri": "https://s3.{}.amazonaws.com/{}/medical/{}.json".format( region_name, args["OutputBucketName"], args["MedicalTranscriptionJobName"], ) } ) # Delete client.delete_medical_transcription_job(MedicalTranscriptionJobName=job_name) client.get_medical_transcription_job.when.called_with( MedicalTranscriptionJobName=job_name ).should.throw(client.exceptions.BadRequestException) @mock_transcribe def test_run_medical_transcription_job_all_params(): region_name = "us-east-1" client = boto3.client("transcribe", region_name=region_name) vocabulary_name = "MyMedicalVocabulary" resp = client.create_medical_vocabulary( VocabularyName=vocabulary_name, LanguageCode="en-US", VocabularyFileUri="https://s3.us-east-1.amazonaws.com/AWSDOC-EXAMPLE-BUCKET/vocab.txt", ) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) job_name = "MyJob2" args = { "MedicalTranscriptionJobName": job_name, "LanguageCode": "en-US", "MediaSampleRateHertz": 48000, "MediaFormat": "flac", "Media": {"MediaFileUri": "s3://my-bucket/my-media-file.dat",}, "OutputBucketName": "my-output-bucket", "OutputEncryptionKMSKeyId": "arn:aws:kms:us-east-1:012345678901:key/37111b5e-8eff-4706-ae3a-d4f9d1d559fc", "Settings": { "ShowSpeakerLabels": True, "MaxSpeakerLabels": 5, "ChannelIdentification": True, "ShowAlternatives": True, "MaxAlternatives": 6, "VocabularyName": vocabulary_name, }, "Specialty": "PRIMARYCARE", "Type": "CONVERSATION", } resp = client.start_medical_transcription_job(**args) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) # CREATED resp = client.get_medical_transcription_job(MedicalTranscriptionJobName=job_name) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) transcription_job = resp["MedicalTranscriptionJob"] transcription_job["MedicalTranscriptionJobName"].should.equal( args["MedicalTranscriptionJobName"] ) transcription_job["TranscriptionJobStatus"].should.equal("QUEUED") transcription_job["LanguageCode"].should.equal(args["LanguageCode"]) transcription_job["Media"].should.equal(args["Media"]) transcription_job.should.contain("CreationTime") transcription_job.doesnt.contain("StartTime") transcription_job.doesnt.contain("CompletionTime") transcription_job.doesnt.contain("Transcript") transcription_job["Settings"]["ShowSpeakerLabels"].should.equal( args["Settings"]["ShowSpeakerLabels"] ) transcription_job["Settings"]["MaxSpeakerLabels"].should.equal( args["Settings"]["MaxSpeakerLabels"] ) transcription_job["Settings"]["ChannelIdentification"].should.equal( args["Settings"]["ChannelIdentification"] ) transcription_job["Settings"]["ShowAlternatives"].should.equal( args["Settings"]["ShowAlternatives"] ) transcription_job["Settings"]["MaxAlternatives"].should.equal( args["Settings"]["MaxAlternatives"] ) transcription_job["Settings"]["VocabularyName"].should.equal( args["Settings"]["VocabularyName"] ) transcription_job["Specialty"].should.equal(args["Specialty"]) transcription_job["Type"].should.equal(args["Type"]) # IN_PROGRESS resp = client.get_medical_transcription_job(MedicalTranscriptionJobName=job_name) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) transcription_job = resp["MedicalTranscriptionJob"] transcription_job["TranscriptionJobStatus"].should.equal("IN_PROGRESS") transcription_job["MediaFormat"].should.equal("flac") transcription_job.should.contain("StartTime") transcription_job.doesnt.contain("CompletionTime") transcription_job.doesnt.contain("Transcript") transcription_job["MediaSampleRateHertz"].should.equal(48000) # COMPLETED resp = client.get_medical_transcription_job(MedicalTranscriptionJobName=job_name) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) transcription_job = resp["MedicalTranscriptionJob"] transcription_job["TranscriptionJobStatus"].should.equal("COMPLETED") transcription_job.should.contain("CompletionTime") transcription_job["Transcript"].should.equal( { "TranscriptFileUri": "https://s3.{}.amazonaws.com/{}/medical/{}.json".format( region_name, args["OutputBucketName"], args["MedicalTranscriptionJobName"], ) } ) @mock_transcribe def test_get_nonexistent_medical_transcription_job(): region_name = "us-east-1" client = boto3.client("transcribe", region_name=region_name) client.get_medical_transcription_job.when.called_with( MedicalTranscriptionJobName="NonexistentJobName" ).should.throw(client.exceptions.BadRequestException) @mock_transcribe def test_run_medical_transcription_job_with_existing_job_name(): region_name = "us-east-1" client = boto3.client("transcribe", region_name=region_name) job_name = "MyJob" args = { "MedicalTranscriptionJobName": job_name, "LanguageCode": "en-US", "Media": {"MediaFileUri": "s3://my-bucket/my-media-file.wav",}, "OutputBucketName": "my-output-bucket", "Specialty": "PRIMARYCARE", "Type": "CONVERSATION", } resp = client.start_medical_transcription_job(**args) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) client.start_medical_transcription_job.when.called_with(**args).should.throw( client.exceptions.ConflictException ) @mock_transcribe def test_run_medical_transcription_job_nonexistent_vocabulary(): region_name = "us-east-1" client = boto3.client("transcribe", region_name=region_name) job_name = "MyJob3" args = { "MedicalTranscriptionJobName": job_name, "LanguageCode": "en-US", "Media": {"MediaFileUri": "s3://my-bucket/my-media-file.dat",}, "OutputBucketName": "my-output-bucket", "Settings": {"VocabularyName": "NonexistentVocabulary"}, "Specialty": "PRIMARYCARE", "Type": "CONVERSATION", } client.start_medical_transcription_job.when.called_with(**args).should.throw( client.exceptions.BadRequestException ) @mock_transcribe def test_list_medical_transcription_jobs(): region_name = "us-east-1" client = boto3.client("transcribe", region_name=region_name) def run_job(index, target_status): job_name = "Job_{}".format(index) args = { "MedicalTranscriptionJobName": job_name, "LanguageCode": "en-US", "Media": {"MediaFileUri": "s3://my-bucket/my-media-file.wav",}, "OutputBucketName": "my-output-bucket", "Specialty": "PRIMARYCARE", "Type": "CONVERSATION", } resp = client.start_medical_transcription_job(**args) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) # IMPLICITLY PROMOTE JOB STATUS TO QUEUED resp = client.get_medical_transcription_job( MedicalTranscriptionJobName=job_name ) # IN_PROGRESS if target_status in ["IN_PROGRESS", "COMPLETED"]: resp = client.get_medical_transcription_job( MedicalTranscriptionJobName=job_name ) # COMPLETED if target_status == "COMPLETED": resp = client.get_medical_transcription_job( MedicalTranscriptionJobName=job_name ) # Run 5 pending jobs for i in range(5): run_job(i, "PENDING") # Run 10 job to IN_PROGRESS for i in range(5, 15): run_job(i, "IN_PROGRESS") # Run 15 job to COMPLETED for i in range(15, 30): run_job(i, "COMPLETED") # List all response = client.list_medical_transcription_jobs() response.should.contain("MedicalTranscriptionJobSummaries") len(response["MedicalTranscriptionJobSummaries"]).should.equal(30) response.shouldnt.contain("NextToken") response.shouldnt.contain("Status") # List IN_PROGRESS response = client.list_medical_transcription_jobs(Status="IN_PROGRESS") response.should.contain("MedicalTranscriptionJobSummaries") len(response["MedicalTranscriptionJobSummaries"]).should.equal(10) response.shouldnt.contain("NextToken") response.should.contain("Status") response["Status"].should.equal("IN_PROGRESS") # List JobName contains "8" response = client.list_medical_transcription_jobs(JobNameContains="8") response.should.contain("MedicalTranscriptionJobSummaries") len(response["MedicalTranscriptionJobSummaries"]).should.equal(3) response.shouldnt.contain("NextToken") response.shouldnt.contain("Status") # Pagination by 11 response = client.list_medical_transcription_jobs(MaxResults=11) response.should.contain("MedicalTranscriptionJobSummaries") len(response["MedicalTranscriptionJobSummaries"]).should.equal(11) response.should.contain("NextToken") response.shouldnt.contain("Status") response = client.list_medical_transcription_jobs( NextToken=response["NextToken"], MaxResults=11 ) response.should.contain("MedicalTranscriptionJobSummaries") len(response["MedicalTranscriptionJobSummaries"]).should.equal(11) response.should.contain("NextToken") response = client.list_medical_transcription_jobs( NextToken=response["NextToken"], MaxResults=11 ) response.should.contain("MedicalTranscriptionJobSummaries") len(response["MedicalTranscriptionJobSummaries"]).should.equal(8) response.shouldnt.contain("NextToken") @mock_transcribe def test_create_medical_vocabulary(): region_name = "us-east-1" client = boto3.client("transcribe", region_name=region_name) vocabulary_name = "MyVocabulary" resp = client.create_medical_vocabulary( VocabularyName=vocabulary_name, LanguageCode="en-US", VocabularyFileUri="https://s3.us-east-1.amazonaws.com/AWSDOC-EXAMPLE-BUCKET/vocab.txt", ) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) # PENDING resp = client.get_medical_vocabulary(VocabularyName=vocabulary_name) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) resp["VocabularyName"].should.equal(vocabulary_name) resp["LanguageCode"].should.equal("en-US") resp["VocabularyState"].should.equal("PENDING") resp.should.contain("LastModifiedTime") resp.shouldnt.contain("FailureReason") resp["DownloadUri"].should.contain(vocabulary_name) # IN_PROGRESS resp = client.get_medical_vocabulary(VocabularyName=vocabulary_name) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) resp["VocabularyState"].should.equal("READY") # Delete client.delete_medical_vocabulary(VocabularyName=vocabulary_name) client.get_medical_vocabulary.when.called_with( VocabularyName=vocabulary_name ).should.throw(client.exceptions.BadRequestException) @mock_transcribe def test_get_nonexistent_medical_vocabulary(): region_name = "us-east-1" client = boto3.client("transcribe", region_name=region_name) client.get_medical_vocabulary.when.called_with( VocabularyName="NonexistentVocabularyName" ).should.throw(client.exceptions.BadRequestException) @mock_transcribe def test_create_medical_vocabulary_with_existing_vocabulary_name(): region_name = "us-east-1" client = boto3.client("transcribe", region_name=region_name) vocabulary_name = "MyVocabulary" args = { "VocabularyName": vocabulary_name, "LanguageCode": "en-US", "VocabularyFileUri": "https://s3.us-east-1.amazonaws.com/AWSDOC-EXAMPLE-BUCKET/vocab.txt", } resp = client.create_medical_vocabulary(**args) resp["ResponseMetadata"]["HTTPStatusCode"].should.equal(200) client.create_medical_vocabulary.when.called_with(**args).should.throw( client.exceptions.ConflictException )