Create a batch prediction job

Creates a batch prediction job using the create_batch_prediction_job method.

Explore further

For detailed documentation that includes this code sample, see the following:

Get batch inferences from a custom trained model

Code sample

Java

Before trying this sample, follow the Java setup instructions in the Vertex AI quickstart using client libraries. For more information, see the Vertex AI Java API reference documentation.

To authenticate to Vertex AI, set up Application Default Credentials. For more information, see Set up authentication for a local development environment.

  import 
  
 com.google.cloud.aiplatform.util. ValueConverter 
 
 ; 
 import 
  
 com.google.cloud.aiplatform.v1. AcceleratorType 
 
 ; 
 import 
  
 com.google.cloud.aiplatform.v1. BatchDedicatedResources 
 
 ; 
 import 
  
 com.google.cloud.aiplatform.v1. BatchPredictionJob 
 
 ; 
 import 
  
 com.google.cloud.aiplatform.v1. GcsDestination 
 
 ; 
 import 
  
 com.google.cloud.aiplatform.v1. GcsSource 
 
 ; 
 import 
  
 com.google.cloud.aiplatform.v1. JobServiceClient 
 
 ; 
 import 
  
 com.google.cloud.aiplatform.v1. JobServiceSettings 
 
 ; 
 import 
  
 com.google.cloud.aiplatform.v1. LocationName 
 
 ; 
 import 
  
 com.google.cloud.aiplatform.v1. MachineSpec 
 
 ; 
 import 
  
 com.google.cloud.aiplatform.v1. ModelName 
 
 ; 
 import 
  
 com.google.protobuf. Value 
 
 ; 
 import 
  
 java.io.IOException 
 ; 
 /**
  * Sample showing how to create a Vertex AI batch prediction job that reads its instances from
  * Cloud Storage and writes its predictions back to Cloud Storage.
  */
 public class CreateBatchPredictionJobSample {

   /** Region used both for the parent location and for the model resource name. */
   private static final String LOCATION = "us-central1";

   /** Service endpoint the job client is configured to talk to. */
   private static final String API_ENDPOINT = "us-central1-aiplatform.googleapis.com:443";

   /**
    * Entry point: fills in placeholder values and submits a batch prediction job.
    *
    * @param args command-line arguments (unused)
    * @throws IOException if the job service client cannot be created
    */
   public static void main(String[] args) throws IOException {
     // TODO(developer): Replace these variables before running the sample.
     String project = "PROJECT";
     String displayName = "DISPLAY_NAME";
     String modelName = "MODEL_NAME";
     String instancesFormat = "INSTANCES_FORMAT";
     String gcsSourceUri = "GCS_SOURCE_URI";
     String predictionsFormat = "PREDICTIONS_FORMAT";
     String gcsDestinationOutputUriPrefix = "GCS_DESTINATION_OUTPUT_URI_PREFIX";
     createBatchPredictionJobSample(
         project,
         displayName,
         modelName,
         instancesFormat,
         gcsSourceUri,
         predictionsFormat,
         gcsDestinationOutputUriPrefix);
   }

   /**
    * Creates a batch prediction job and prints the service response and the job's name.
    *
    * @param project project used for the parent location and the model resource name
    * @param displayName display name to set on the job
    * @param model model identifier combined with the project and location into a model name
    * @param instancesFormat value set as the instances format of the input configuration
    * @param gcsSourceUri Cloud Storage URI added to the input source
    * @param predictionsFormat value set as the predictions format of the output configuration
    * @param gcsDestinationOutputUriPrefix Cloud Storage URI prefix set on the output destination
    * @throws IOException if the job service settings or client cannot be created
    */
   static void createBatchPredictionJobSample(
       String project,
       String displayName,
       String model,
       String instancesFormat,
       String gcsSourceUri,
       String predictionsFormat,
       String gcsDestinationOutputUriPrefix)
       throws IOException {
     JobServiceSettings clientSettings =
         JobServiceSettings.newBuilder().setEndpoint(API_ENDPOINT).build();

     // The client is reusable across requests; try-with-resources calls close() on it once the
     // request is done so that its background resources are released.
     try (JobServiceClient jobClient = JobServiceClient.create(clientSettings)) {
       // The job is submitted with an empty Value as its model parameters.
       Value emptyParameters = ValueConverter.EMPTY_VALUE;

       BatchPredictionJob.InputConfig source = buildInputConfig(instancesFormat, gcsSourceUri);
       BatchPredictionJob.OutputConfig sink =
           buildOutputConfig(predictionsFormat, gcsDestinationOutputUriPrefix);
       BatchDedicatedResources resources = buildDedicatedResources();

       String modelResourceName = ModelName.of(project, LOCATION, model).toString();

       BatchPredictionJob.Builder jobBuilder = BatchPredictionJob.newBuilder();
       jobBuilder.setDisplayName(displayName);
       jobBuilder.setModel(modelResourceName);
       jobBuilder.setModelParameters(emptyParameters);
       jobBuilder.setInputConfig(source);
       jobBuilder.setOutputConfig(sink);
       jobBuilder.setDedicatedResources(resources);
       BatchPredictionJob jobRequest = jobBuilder.build();

       LocationName parentLocation = LocationName.of(project, LOCATION);
       BatchPredictionJob createdJob =
           jobClient.createBatchPredictionJob(parentLocation, jobRequest);

       System.out.printf("response: %s\n", createdJob);
       System.out.printf("\tName: %s\n", createdJob.getName());
     }
   }

   /** Builds the input configuration: instances format plus a single Cloud Storage source URI. */
   private static BatchPredictionJob.InputConfig buildInputConfig(
       String instancesFormat, String gcsSourceUri) {
     GcsSource inputFiles = GcsSource.newBuilder().addUris(gcsSourceUri).build();
     return BatchPredictionJob.InputConfig.newBuilder()
         .setInstancesFormat(instancesFormat)
         .setGcsSource(inputFiles)
         .build();
   }

   /** Builds the output configuration: predictions format plus a Cloud Storage URI prefix. */
   private static BatchPredictionJob.OutputConfig buildOutputConfig(
       String predictionsFormat, String gcsDestinationOutputUriPrefix) {
     GcsDestination outputLocation =
         GcsDestination.newBuilder().setOutputUriPrefix(gcsDestinationOutputUriPrefix).build();
     return BatchPredictionJob.OutputConfig.newBuilder()
         .setPredictionsFormat(predictionsFormat)
         .setGcsDestination(outputLocation)
         .build();
   }

   /**
    * Builds the dedicated resources for the job: an n1-standard-2 machine with one NVIDIA Tesla T4
    * accelerator, with the starting and maximum replica counts both set to 1.
    */
   private static BatchDedicatedResources buildDedicatedResources() {
     MachineSpec machine =
         MachineSpec.newBuilder()
             .setMachineType("n1-standard-2")
             .setAcceleratorType(AcceleratorType.NVIDIA_TESLA_T4)
             .setAcceleratorCount(1)
             .build();
     return BatchDedicatedResources.newBuilder()
         .setMachineSpec(machine)
         .setStartingReplicaCount(1)
         .setMaxReplicaCount(1)
         .build();
   }
 }

Python

Before trying this sample, follow the Python setup instructions in the Vertex AI quickstart using client libraries. For more information, see the Vertex AI Python API reference documentation.