0
# Batch Processing
1
2
Large-scale batch inference and data processing with distributed computing integration and resource optimization.
3
4
## Capabilities
5
6
### Batch Prediction Jobs
7
8
Execute large-scale batch inference with automatic scaling and comprehensive monitoring.
9
10
```python { .api }
11
class BatchPredictionJob:
    """Batch prediction job API surface (signature stub).

    Only signatures are listed here; every body is elided with ``...``.
    """

    @classmethod
    def create(
        cls,
        job_display_name: str,
        model_name: str,
        # NOTE: the original listing declared `instances_format` twice (once
        # without a default, once with 'jsonl') and `predictions_format`
        # twice. Duplicate parameter names are a SyntaxError, so each is
        # declared once, at its first position, with the 'jsonl' default.
        instances_format: str = 'jsonl',
        gcs_source_uris: Optional[List[str]] = None,
        bigquery_source_uri: Optional[str] = None,
        gcs_destination_output_uri_prefix: Optional[str] = None,
        bigquery_destination_output_uri: Optional[str] = None,
        predictions_format: str = 'jsonl',
        model_parameters: Optional[Dict] = None,
        machine_type: Optional[str] = None,
        accelerator_type: Optional[str] = None,
        accelerator_count: Optional[int] = None,
        starting_replica_count: Optional[int] = None,
        max_replica_count: Optional[int] = None,
        batch_size: Optional[int] = None,
        generate_explanation: bool = False,
        explanation_metadata: Optional[explain.ExplanationMetadata] = None,
        explanation_parameters: Optional[explain.ExplanationParameters] = None,
        labels: Optional[Dict[str, str]] = None,
        credentials: Optional[auth_credentials.Credentials] = None,
        encryption_spec_key_name: Optional[str] = None,
        sync: bool = True,
        create_request_timeout: Optional[float] = None,
        **kwargs
    ) -> 'BatchPredictionJob':
        """Create a batch prediction job.

        Only ``job_display_name`` and ``model_name`` are required; every
        other parameter has a default. Parameter semantics are not spelled
        out in this listing -- TODO confirm each against the SDK reference.

        Returns:
            A ``BatchPredictionJob`` (per the return annotation).
        """
        ...

    @classmethod
    def create_from_job_spec(
        cls,
        job_spec: Dict,
        **kwargs
    ) -> 'BatchPredictionJob':
        """Create a batch prediction job from a ``job_spec`` dictionary.

        The expected keys of ``job_spec`` are not shown in this listing --
        TODO confirm against the SDK reference.
        """
        ...

    @property
    def state(self) -> JobState:
        """State of the job, as a ``JobState``."""
        ...

    @property
    def output_info(self) -> Optional[Dict]:
        """Output information for the job; may be ``None``."""
        ...

    @property
    def partial_failures(self) -> Optional[List[Dict]]:
        """Partial failures recorded for the job; may be ``None``."""
        ...
56
```
57
58
## Usage Examples
59
60
**Basic batch prediction:**
61
```python
62
from google.cloud import aiplatform

# Set the project and location used by the calls below.
aiplatform.init(project='my-project', location='us-central1')

# Submit a batch prediction job that reads JSONL instances from Cloud Storage
# and writes its output under the given Cloud Storage prefix.
job = aiplatform.BatchPredictionJob.create(
    job_display_name='batch-prediction-job',
    model_name='projects/my-project/locations/us-central1/models/123456',
    instances_format='jsonl',
    gcs_source_uris=['gs://my-bucket/input.jsonl'],
    gcs_destination_output_uri_prefix='gs://my-bucket/output/',
    machine_type='n1-standard-4',
    starting_replica_count=1,
    max_replica_count=5,
)

print(f'Job created: {job.resource_name}')
print(f'Job state: {job.state}')
79
```