|
30 | 30 | import pytest
|
31 | 31 |
|
32 | 32 | from google.cloud import documentai
|
| 33 | +from google.cloud.storage import Blob, Bucket |
33 | 34 | from google.cloud.documentai_toolbox import document, gcs_utilities
|
34 | 35 |
|
35 | 36 |
|
@@ -397,6 +398,37 @@ def test_document_from_gcs_with_unordered_shards(get_bytes_unordered_files_mock)
|
397 | 398 | assert page.page_number == page_index + 1
|
398 | 399 |
|
399 | 400 |
|
| 401 | +@mock.patch("google.cloud.documentai_toolbox.utilities.gcs_utilities.storage")  # replace the `storage` name inside gcs_utilities with a mock for this test |
| 402 | +def test_document_list_from_gcs_with_multiple_input_files(  # checks Document.list_from_gcs against blobs spread over two sub-directories |
| 403 | + mock_storage,  # the mock injected by the @mock.patch decorator above |
| 404 | + get_bytes_multiple_directories_mock,  # presumably a pytest fixture defined elsewhere in this file - TODO confirm |
| 405 | +): |
| 406 | + client = mock_storage.Client.return_value  # the object any storage.Client(...) call returns while patched |
| 407 | + |
| 408 | + mock_bucket = mock.Mock() |
| 409 | + |
| 410 | + client.Bucket.return_value = mock_bucket  # NOTE(review): google-cloud-storage clients expose bucket()/get_bucket(); confirm a `Bucket` attribute is ever consulted |
| 411 | + |
| 412 | + client.list_blobs.return_value = [  # three shard blobs: two under .../1 and one under .../2 |
| 413 | + Blob(name="documentai/output/123456789/1/test_shard1.json", bucket=None), |
| 414 | + Blob(name="documentai/output/123456789/1/test_shard2.json", bucket=None), |
| 415 | + Blob(name="documentai/output/123456789/2/test_shard3.json", bucket=None), |
| 416 | + ] |
| 417 | + documents = document.Document.list_from_gcs( |
| 418 | + gcs_bucket_name="test-directory", gcs_prefix="documentai/output/123456789/" |
| 419 | + ) |
| 420 | + get_bytes_multiple_directories_mock.assert_called()  # redundant with the call_count assertion on the next line |
| 421 | + assert get_bytes_multiple_directories_mock.call_count == 2  # presumably one fetch per sub-directory - TODO confirm |
| 422 | + |
| 423 | + assert len(documents) == 2  # one document expected per sub-directory listed above |
| 424 | + |
| 425 | + assert documents[0].gcs_bucket_name == "test-directory" |
| 426 | + assert documents[0].gcs_prefix == "documentai/output/123456789/1"  # expected prefix has no trailing slash |
| 427 | + |
| 428 | + assert documents[1].gcs_bucket_name == "test-directory" |
| 429 | + assert documents[1].gcs_prefix == "documentai/output/123456789/2" |
| 430 | + |
| 431 | + |
400 | 432 | def test_document_from_batch_process_metadata_with_multiple_input_files(
|
401 | 433 | get_bytes_multiple_directories_mock,
|
402 | 434 | ):
|
|
0 commit comments