Load a JSON file with autodetect schema

Load a newline-delimited JSON file from Cloud Storage into a BigQuery table, letting BigQuery auto-detect the schema.

Explore further

For detailed documentation that includes this code sample, see the following:

Code sample

Go

Before trying this sample, follow the Go setup instructions in the BigQuery quickstart using client libraries. For more information, see the BigQuery Go API reference documentation.

To authenticate to BigQuery, set up Application Default Credentials. For more information, see Set up authentication for client libraries.

  import 
  
 ( 
  
 "context" 
  
 "fmt" 
  
 "cloud.google.com/go/bigquery" 
 ) 
 // importJSONAutodetectSchema demonstrates loading data from newline-delimited JSON data in Cloud Storage 
 // and using schema autodetection to identify the available columns. 
 func 
  
 importJSONAutodetectSchema 
 ( 
 projectID 
 , 
  
 datasetID 
 , 
  
 tableID 
  
 string 
 ) 
  
 error 
  
 { 
  
 // projectID := "my-project-id" 
  
 // datasetID := "mydataset" 
  
 // tableID := "mytable" 
  
 ctx 
  
 := 
  
 context 
 . 
 Background 
 () 
  
 client 
 , 
  
 err 
  
 := 
  
 bigquery 
 . 
 NewClient 
 ( 
 ctx 
 , 
  
 projectID 
 ) 
  
 if 
  
 err 
  
 != 
  
 nil 
  
 { 
  
 return 
  
 fmt 
 . 
 Errorf 
 ( 
 "bigquery.NewClient: %w" 
 , 
  
 err 
 ) 
  
 } 
  
 defer 
  
 client 
 . 
 Close 
 () 
  
 gcsRef 
  
 := 
  
 bigquery 
 . 
  NewGCSReference 
 
 ( 
 "gs://cloud-samples-data/bigquery/us-states/us-states.json" 
 ) 
  
 gcsRef 
 . 
 SourceFormat 
  
 = 
  
 bigquery 
 . 
  JSON 
 
  
 gcsRef 
 . 
 AutoDetect 
  
 = 
  
 true 
  
 loader 
  
 := 
  
 client 
 . 
 Dataset 
 ( 
 datasetID 
 ). 
 Table 
 ( 
 tableID 
 ). 
  LoaderFrom 
 
 ( 
 gcsRef 
 ) 
  
 loader 
 . 
 WriteDisposition 
  
 = 
  
 bigquery 
 . 
  WriteEmpty 
 
  
 job 
 , 
  
 err 
  
 := 
  
 loader 
 . 
 Run 
 ( 
 ctx 
 ) 
  
 if 
  
 err 
  
 != 
  
 nil 
  
 { 
  
 return 
  
 err 
  
 } 
  
 status 
 , 
  
 err 
  
 := 
  
 job 
 . 
 Wait 
 ( 
 ctx 
 ) 
  
 if 
  
 err 
  
 != 
  
 nil 
  
 { 
  
 return 
  
 err 
  
 } 
  
 if 
  
 status 
 . 
  Err 
 
 () 
  
 != 
  
 nil 
  
 { 
  
 return 
  
 fmt 
 . 
 Errorf 
 ( 
 "job completed with error: %w" 
 , 
  
 status 
 . 
  Err 
 
 ()) 
  
 } 
  
 return 
  
 nil 
 } 
 

Java

Before trying this sample, follow the Java setup instructions in the BigQuery quickstart using client libraries. For more information, see the BigQuery Java API reference documentation.

To authenticate to BigQuery, set up Application Default Credentials. For more information, see Set up authentication for client libraries.

  import 
  
 com.google.cloud.bigquery. BigQuery 
 
 ; 
 import 
  
 com.google.cloud.bigquery. BigQueryException 
 
 ; 
 import 
  
 com.google.cloud.bigquery. BigQueryOptions 
 
 ; 
 import 
  
 com.google.cloud.bigquery. FormatOptions 
 
 ; 
 import 
  
 com.google.cloud.bigquery. Job 
 
 ; 
 import 
  
 com.google.cloud.bigquery. JobInfo 
 
 ; 
 import 
  
 com.google.cloud.bigquery. LoadJobConfiguration 
 
 ; 
 import 
  
 com.google.cloud.bigquery. TableId 
 
 ; 
 // Sample to load JSON data with autodetect schema from Cloud Storage into a new BigQuery table
public class LoadJsonFromGcsAutodetect {

  public static void main(String[] args) {
    // TODO(developer): Replace these variables before running the sample.
    String datasetName = "MY_DATASET_NAME";
    String tableName = "MY_TABLE_NAME";
    String sourceUri = "gs://cloud-samples-data/bigquery/us-states/us-states.json";
    loadJsonFromGcsAutodetect(datasetName, tableName, sourceUri);
  }

  /**
   * Runs a load job that imports the JSON file at {@code sourceUri} into the given table with
   * schema autodetection enabled, then prints whether the load succeeded.
   *
   * @param datasetName dataset that contains the destination table
   * @param tableName destination table name
   * @param sourceUri Cloud Storage URI of the JSON file to load
   */
  public static void loadJsonFromGcsAutodetect(
      String datasetName, String tableName, String sourceUri) {
    try {
      // Initialize client that will be used to send requests. This client only needs to be created
      // once, and can be reused for multiple requests.
      BigQuery bigquery = BigQueryOptions.getDefaultInstance().getService();

      TableId tableId = TableId.of(datasetName, tableName);
      LoadJobConfiguration loadConfig =
          LoadJobConfiguration.newBuilder(tableId, sourceUri)
              .setFormatOptions(FormatOptions.json())
              .setAutodetect(true)
              .build();

      // Load data from a GCS JSON file into the table
      Job job = bigquery.create(JobInfo.of(loadConfig));
      // Blocks until this load table job completes its execution, either failing or succeeding.
      job = job.waitFor();

      // A finished job is "done" whether it succeeded or failed, so success must be decided
      // from the job status. waitFor() returns null when the job no longer exists.
      if (job == null) {
        System.out.println(
            "BigQuery was unable to load into the table because the job no longer exists");
      } else if (job.getStatus().getError() != null) {
        System.out.println(
            "BigQuery was unable to load into the table due to an error:"
                + job.getStatus().getError());
      } else {
        System.out.println("Json Autodetect from GCS successfully loaded in a table");
      }
    } catch (BigQueryException e) {
      System.out.println("Json Autodetect from GCS was not loaded \n" + e.toString());
    } catch (InterruptedException e) {
      // Restore the interrupt flag so callers further up the stack can observe it.
      Thread.currentThread().interrupt();
      System.out.println("Json Autodetect from GCS was not loaded \n" + e.toString());
    }
  }
}
 

Node.js

Before trying this sample, follow the Node.js setup instructions in the BigQuery quickstart using client libraries. For more information, see the BigQuery Node.js API reference documentation.

To authenticate to BigQuery, set up Application Default Credentials. For more information, see Set up authentication for client libraries.

  // Import the Google Cloud client libraries 
 const 
  
 { 
 BigQuery 
 } 
  
 = 
  
 require 
 ( 
 ' @google-cloud/bigquery 
' 
 ); 
 const 
  
 { 
 Storage 
 } 
  
 = 
  
 require 
 ( 
 ' @google-cloud/storage 
' 
 ); 
 /**
 * TODO(developer): Uncomment the following lines before running the sample.
 */
// const datasetId = "my_dataset";
// const tableId = "my_table";

/**
 * This sample loads the JSON file at
 * https://storage.googleapis.com/cloud-samples-data/bigquery/us-states/us-states.json
 *
 * TODO(developer): Replace the following lines with the path to your file.
 */
const bucketName = 'cloud-samples-data';
const filename = 'bigquery/us-states/us-states.json';

/**
 * Loads the Cloud Storage file named above into the table identified by
 * `datasetId` / `tableId`, asking BigQuery to autodetect the schema, and
 * logs the job ID once the load has finished.
 */
async function loadJSONFromGCSAutodetect() {
  // Instantiate clients
  const bigquery = new BigQuery();
  const storage = new Storage();

  // Load job configuration. For the full list of options, see:
  // https://cloud.google.com/bigquery/docs/reference/rest/v2/Job#JobConfigurationLoad
  const loadOptions = {
    sourceFormat: 'NEWLINE_DELIMITED_JSON',
    autodetect: true,
    location: 'US',
  };

  // Resolve the destination table and the source file, then run the load.
  const destinationTable = bigquery.dataset(datasetId).table(tableId);
  const sourceFile = storage.bucket(bucketName).file(filename);

  // load() waits for the job to finish
  const [job] = await destinationTable.load(sourceFile, loadOptions);

  console.log(`Job ${job.id} completed.`);
}
loadJSONFromGCSAutodetect();
 

PHP

Before trying this sample, follow the PHP setup instructions in the BigQuery quickstart using client libraries. For more information, see the BigQuery PHP API reference documentation.

To authenticate to BigQuery, set up Application Default Credentials. For more information, see Set up authentication for client libraries.

  use Google\Cloud\BigQuery\BigQueryClient; 
 /**
 * Loads a JSON file from Cloud Storage into the given table, letting
 * BigQuery autodetect the schema, and prints the outcome of the job.
 *
 * @param string $projectId The project Id of your Google Cloud Project.
 * @param string $datasetId The BigQuery dataset ID.
 * @param string $tableId The BigQuery table ID.
 */
function import_from_storage_json_autodetect(
    string $projectId,
    string $datasetId,
    string $tableId = 'us_states'
): void {
    // Resolve the destination table through the BigQuery client.
    $bigQuery = new BigQueryClient([
        'projectId' => $projectId,
    ]);
    $dataset = $bigQuery->dataset($datasetId);
    $table = $dataset->table($tableId);

    // Configure and run the load job.
    $gcsUri = 'gs://cloud-samples-data/bigquery/us-states/us-states.json';
    $loadConfig = $table->loadFromStorage($gcsUri)
        ->autodetect(true)
        ->sourceFormat('NEWLINE_DELIMITED_JSON');
    $job = $table->runJob($loadConfig);

    // Refresh the job state and make sure it has finished.
    $job->reload();
    if (!$job->isComplete()) {
        throw new \Exception('Job has not yet completed', 500);
    }

    // No errorResult in the job status means the load succeeded.
    if (!isset($job->info()['status']['errorResult'])) {
        print('Data imported successfully' . PHP_EOL);
        return;
    }

    $error = $job->info()['status']['errorResult']['message'];
    printf('Error running job: %s' . PHP_EOL, $error);
}
 

Python

Before trying this sample, follow the Python setup instructions in the BigQuery quickstart using client libraries. For more information, see the BigQuery Python API reference documentation.

To authenticate to BigQuery, set up Application Default Credentials. For more information, see Set up authentication for client libraries.

  from 
  
 google.cloud 
  
 import 
  bigquery 
 
 # Construct a BigQuery client object.
client = bigquery.Client()

# TODO(developer): Set table_id to the ID of the table to create.
# table_id = "your-project.your_dataset.your_table_name"

# Load configuration: newline-delimited JSON source with schema autodetection.
load_config = bigquery.LoadJobConfig(
    autodetect=True,
    source_format=bigquery.SourceFormat.NEWLINE_DELIMITED_JSON,
)
source_uri = "gs://cloud-samples-data/bigquery/us-states/us-states.json"

# Make an API request to start the load job.
job = client.load_table_from_uri(source_uri, table_id, job_config=load_config)

# Waits for the job to complete.
job.result()

# Fetch the destination table to report how many rows it now holds.
loaded_table = client.get_table(table_id)
print("Loaded {} rows.".format(loaded_table.num_rows))
 

Ruby

Before trying this sample, follow the Ruby setup instructions in the BigQuery quickstart using client libraries. For more information, see the BigQuery Ruby API reference documentation.

To authenticate to BigQuery, set up Application Default Credentials. For more information, see Set up authentication for client libraries.

  require 
  
 "google/cloud/bigquery" 
 # Loads the us-states JSON file from Cloud Storage into the "us_states" table
# of the given dataset, letting BigQuery autodetect the schema, and prints the
# number of rows in the table afterwards.
#
# @param dataset_id [String] ID of the dataset that receives the table.
# @raise [RuntimeError] if the load job finishes with an error.
def load_table_gcs_json_autodetect dataset_id = "your_dataset_id"
  bigquery = Google::Cloud::Bigquery.new
  dataset  = bigquery.dataset dataset_id
  gcs_uri  = "gs://cloud-samples-data/bigquery/us-states/us-states.json"
  table_id = "us_states"

  load_job = dataset.load_job table_id,
                              gcs_uri,
                              format:     "json",
                              autodetect: true
  puts "Starting job #{load_job.job_id}"

  load_job.wait_until_done! # Waits for table load to complete.

  # wait_until_done! returns for failed jobs too; stop here rather than
  # reporting success and reading a table that may not have been loaded.
  raise "Load job #{load_job.job_id} failed: #{load_job.error}" if load_job.failed?

  puts "Job finished."

  table = dataset.table table_id
  puts "Loaded #{table.rows_count} rows to table #{table.id}"
end
 

What's next

To search and filter code samples for other Google Cloud products, see the Google Cloud sample browser.

Create a Mobile Website
View Site in Mobile | Classic
Share by: