|
14 | 14 |
|
15 | 15 | import json |
16 | 16 | import unittest |
17 | | -from unittest.mock import AsyncMock, patch |
| 17 | +from unittest.mock import AsyncMock, MagicMock, patch |
18 | 18 |
|
19 | 19 | from chunkr_ai.models import Status |
20 | 20 |
|
@@ -119,6 +119,92 @@ async def test_get_task_output_poll_error(self, mock_chunkr_class): |
119 | 119 | mock_chunkr_instance.get_task.assert_called_once_with("test_task_id") |
120 | 120 | mock_task.poll.assert_called_once() |
121 | 121 |
|
| 122 | + def test_chunkr_reader_config_defaults(self): |
| 123 | + """Test ChunkrReaderConfig with default values.""" |
| 124 | + config = ChunkrReaderConfig() |
| 125 | + |
| 126 | + self.assertEqual(config.chunk_processing, 512) |
| 127 | + self.assertEqual(config.high_resolution, True) |
| 128 | + self.assertEqual(config.ocr_strategy, "Auto") |
| 129 | + self.assertEqual(config.kwargs, {}) |
| 130 | + |
| 131 | + def test_chunkr_reader_config_custom_values(self): |
| 132 | + """Test ChunkrReaderConfig with custom values.""" |
| 133 | + config = ChunkrReaderConfig( |
| 134 | + chunk_processing=1024, |
| 135 | + high_resolution=False, |
| 136 | + ocr_strategy="All", |
| 137 | + ) |
| 138 | + |
| 139 | + self.assertEqual(config.chunk_processing, 1024) |
| 140 | + self.assertEqual(config.high_resolution, False) |
| 141 | + self.assertEqual(config.ocr_strategy, "All") |
| 142 | + |
| 143 | + def test_chunkr_reader_config_with_kwargs(self): |
| 144 | + """Test ChunkrReaderConfig with additional kwargs.""" |
| 145 | + config = ChunkrReaderConfig( |
| 146 | + chunk_processing=2048, |
| 147 | + expires_in=3600, |
| 148 | + pipeline="custom_pipeline", |
| 149 | + ) |
| 150 | + |
| 151 | + self.assertEqual(config.chunk_processing, 2048) |
| 152 | + self.assertEqual(config.kwargs["expires_in"], 3600) |
| 153 | + self.assertEqual(config.kwargs["pipeline"], "custom_pipeline") |
| 154 | + |
| 155 | + @patch('chunkr_ai.models.Configuration') |
| 156 | + @patch('chunkr_ai.models.ChunkProcessing') |
| 157 | + @patch('chunkr_ai.models.OcrStrategy') |
| 158 | + def test_to_chunkr_configuration_auto_strategy( |
| 159 | + self, mock_ocr_strategy, mock_chunk_processing, mock_configuration |
| 160 | + ): |
| 161 | + """Test _to_chunkr_configuration with Auto OCR strategy.""" |
| 162 | + config = ChunkrReaderConfig( |
| 163 | + chunk_processing=512, high_resolution=True, ocr_strategy="Auto" |
| 164 | + ) |
| 165 | + |
| 166 | + mock_chunk_processing_instance = MagicMock() |
| 167 | + mock_chunk_processing.return_value = mock_chunk_processing_instance |
| 168 | + mock_ocr_strategy.AUTO = "AUTO" |
| 169 | + |
| 170 | + self.reader._to_chunkr_configuration(config) |
| 171 | + |
| 172 | + mock_chunk_processing.assert_called_once_with(target_length=512) |
| 173 | + mock_configuration.assert_called_once_with( |
| 174 | + chunk_processing=mock_chunk_processing_instance, |
| 175 | + high_resolution=True, |
| 176 | + ocr_strategy="AUTO", |
| 177 | + ) |
| 178 | + |
| 179 | + @patch('chunkr_ai.models.Configuration') |
| 180 | + @patch('chunkr_ai.models.ChunkProcessing') |
| 181 | + @patch('chunkr_ai.models.OcrStrategy') |
| 182 | + def test_to_chunkr_configuration_with_kwargs( |
| 183 | + self, mock_ocr_strategy, mock_chunk_processing, mock_configuration |
| 184 | + ): |
| 185 | + """Test _to_chunkr_configuration with additional kwargs.""" |
| 186 | + config = ChunkrReaderConfig( |
| 187 | + chunk_processing=512, |
| 188 | + high_resolution=True, |
| 189 | + ocr_strategy="Auto", |
| 190 | + expires_in=7200, |
| 191 | + pipeline="test_pipeline", |
| 192 | + ) |
| 193 | + |
| 194 | + mock_chunk_processing_instance = MagicMock() |
| 195 | + mock_chunk_processing.return_value = mock_chunk_processing_instance |
| 196 | + mock_ocr_strategy.AUTO = "AUTO" |
| 197 | + |
| 198 | + result = self.reader._to_chunkr_configuration(config) |
| 199 | + |
| 200 | + mock_chunk_processing.assert_called_once_with(target_length=512) |
| 201 | + mock_configuration.assert_called_once_with( |
| 202 | + chunk_processing=mock_chunk_processing_instance, |
| 203 | + high_resolution=True, |
| 204 | + ocr_strategy="AUTO", |
| 205 | + expires_in=7200, |
| 206 | + pipeline="test_pipeline", |
| 207 | + ) |
122 | 208 |
|
123 | 209 | if __name__ == "__main__": |
124 | 210 | unittest.main() |
0 commit comments