Search in sources :

Example 6 with Dataset

use of com.google.api.services.bigquery.model.Dataset in project DataflowJavaSDK-examples by GoogleCloudPlatform.

the class ExampleUtils method setupBigQueryTable.

/**
 * Makes sure the given BigQuery dataset and table exist, creating whichever one is missing.
 *
 * <p>A {@code null} result from {@code executeNullIfNotFound} is treated as "does not exist".
 * When the table is already present, its schema must equal {@code schema}.
 *
 * @param projectId project that owns the dataset and table
 * @param datasetId dataset to look up or create
 * @param tableId table to look up or create
 * @param schema schema used for a newly created table and checked against an existing one
 * @throws IOException declared by the signature; the BigQuery requests and
 *     {@code toPrettyString()} are the calls made here
 * @throws RuntimeException if the table exists and its schema differs from {@code schema}
 */
private void setupBigQueryTable(String projectId, String datasetId, String tableId, TableSchema schema) throws IOException {
    // Build the client lazily on first use and keep it in the field for later calls.
    if (bigQueryClient == null) {
        bigQueryClient = newBigQueryClient(options.as(BigQueryOptions.class)).build();
    }

    // Step 1: create the dataset when the lookup comes back empty.
    Datasets datasets = bigQueryClient.datasets();
    boolean datasetMissing = executeNullIfNotFound(datasets.get(projectId, datasetId)) == null;
    if (datasetMissing) {
        DatasetReference datasetRef = new DatasetReference().setProjectId(projectId).setDatasetId(datasetId);
        datasets.insert(projectId, new Dataset().setDatasetReference(datasetRef)).execute();
    }

    // Step 2: create the table when the lookup comes back empty.
    Tables tables = bigQueryClient.tables();
    Table existing = executeNullIfNotFound(tables.get(projectId, datasetId, tableId));
    if (existing == null) {
        TableReference tableRef = new TableReference().setProjectId(projectId).setDatasetId(datasetId).setTableId(tableId);
        Table created = new Table().setSchema(schema).setTableReference(tableRef);
        tables.insert(projectId, datasetId, created).execute();
        return;
    }

    // Step 3: the table already exists, so it is only acceptable with a matching schema.
    if (existing.getSchema().equals(schema)) {
        return;
    }
    throw new RuntimeException("Table exists and schemas do not match, expecting: " + schema.toPrettyString() + ", actual: " + existing.getSchema().toPrettyString());
}
Also used : Datasets(com.google.api.services.bigquery.Bigquery.Datasets) DatasetReference(com.google.api.services.bigquery.model.DatasetReference) TableReference(com.google.api.services.bigquery.model.TableReference) Table(com.google.api.services.bigquery.model.Table) Dataset(com.google.api.services.bigquery.model.Dataset) Tables(com.google.api.services.bigquery.Bigquery.Tables) BigQueryOptions(org.apache.beam.sdk.io.gcp.bigquery.BigQueryOptions)

Example 7 with Dataset

use of com.google.api.services.bigquery.model.Dataset in project google-cloud-java by GoogleCloudPlatform.

the class DatasetInfo method toPb.

/**
 * Builds the API model {@link Dataset} from this object's fields.
 *
 * <p>The access list and labels are copied over only when they are non-null; every other
 * field is passed to its setter as-is.
 *
 * @return a newly created {@code Dataset} populated from this instance
 */
Dataset toPb() {
    Dataset pb = new Dataset();
    pb.setDatasetReference(datasetId.toPb());

    // Identity and bookkeeping fields.
    pb.setId(generatedId);
    pb.setEtag(etag);
    pb.setSelfLink(selfLink);
    pb.setCreationTime(creationTime);
    pb.setLastModifiedTime(lastModified);

    // User-facing properties.
    pb.setFriendlyName(friendlyName);
    pb.setDescription(description);
    pb.setLocation(location);
    pb.setDefaultTableExpirationMs(defaultTableLifetime);

    if (acl != null) {
        // Each Acl entry is mapped to its API model form through its own toPb().
        Function<Acl, Dataset.Access> toAccessPb = new Function<Acl, Dataset.Access>() {

            @Override
            public Dataset.Access apply(Acl entry) {
                return entry.toPb();
            }
        };
        pb.setAccess(Lists.transform(acl, toAccessPb));
    }
    if (labels != null) {
        pb.setLabels(labels);
    }
    return pb;
}
Also used : Function(com.google.common.base.Function) Dataset(com.google.api.services.bigquery.model.Dataset)

Example 8 with Dataset

use of com.google.api.services.bigquery.model.Dataset in project beam by apache.

the class BigQueryTableRowIteratorTest method testReadFromQueryNoTables.

/**
 * Verifies that queries that reference no data can be read.
 *
 * <p>The query selects only literals. The mocked job, schema and table-data calls supply a
 * single row, and the test then checks the row contents and which client calls were made
 * for the temporary dataset, the jobs, the temporary table and the table data.
 */
@Test
public void testReadFromQueryNoTables() throws IOException, InterruptedException {
    // Mock job inserting: the first execute() returns the dry-run job, the second the inserted job.
    Job dryRunJob = new Job().setStatistics(new JobStatistics().setQuery(new JobStatistics2()));
    Job insertedJob = new Job().setJobReference(new JobReference());
    when(mockJobsInsert.execute()).thenReturn(dryRunJob, insertedJob);
    // Mock job polling: the job is reported as DONE with its results in a temporary table.
    JobStatus status = new JobStatus().setState("DONE");
    JobConfigurationQuery resultQueryConfig = new JobConfigurationQuery().setDestinationTable(new TableReference().setProjectId("project").setDatasetId("tempdataset").setTableId("temptable"));
    Job getJob = new Job().setJobReference(new JobReference()).setStatus(status).setConfiguration(new JobConfiguration().setQuery(resultQueryConfig));
    when(mockJobsGet.execute()).thenReturn(getJob);
    // Mock table schema fetch.
    when(mockTablesGet.execute()).thenReturn(noTableQuerySchema());
    // Encode with an explicit charset so the fixture bytes do not depend on the platform default.
    byte[] photoBytes = "photograph".getBytes(java.nio.charset.StandardCharsets.UTF_8);
    String photoBytesEncoded = BaseEncoding.base64().encode(photoBytes);
    // Mock table data fetch.
    when(mockTabledataList.execute()).thenReturn(rawDataList(rawRow("Arthur", 42, photoBytesEncoded)));
    // Run query and verify
    String query = String.format("SELECT \"Arthur\" as name, 42 as count, \"%s\" as photo", photoBytesEncoded);
    JobConfigurationQuery queryConfig = new JobConfigurationQuery().setQuery(query);
    try (BigQueryTableRowIterator iterator = BigQueryTableRowIterator.fromQuery(queryConfig, "project", mockClient)) {
        iterator.open();
        // Exactly one row is expected.
        assertTrue(iterator.advance());
        TableRow row = iterator.getCurrent();
        assertTrue(row.containsKey("name"));
        assertTrue(row.containsKey("count"));
        assertTrue(row.containsKey("photo"));
        assertEquals("Arthur", row.get("name"));
        assertEquals(42, row.get("count"));
        assertEquals(photoBytesEncoded, row.get("photo"));
        assertFalse(iterator.advance());
    }
    // Temp dataset created and later deleted.
    verify(mockClient, times(2)).datasets();
    verify(mockDatasets).insert(anyString(), any(Dataset.class));
    verify(mockDatasetsInsert).execute();
    verify(mockDatasets).delete(anyString(), anyString());
    verify(mockDatasetsDelete).execute();
    // Job inserted to run the query, polled once.
    verify(mockClient, times(3)).jobs();
    verify(mockJobs, times(2)).insert(anyString(), any(Job.class));
    verify(mockJobsInsert, times(2)).execute();
    verify(mockJobs).get(anyString(), anyString());
    verify(mockJobsGet).execute();
    // Temp table get after query finish, deleted after reading.
    verify(mockClient, times(2)).tables();
    verify(mockTables, times(1)).get(anyString(), anyString(), anyString());
    verify(mockTablesGet, times(1)).execute();
    verify(mockTables).delete(anyString(), anyString(), anyString());
    verify(mockTablesDelete).execute();
    // Table data read.
    verify(mockClient).tabledata();
    verify(mockTabledata).list("project", "tempdataset", "temptable");
    verify(mockTabledataList).execute();
}
Also used : JobStatistics(com.google.api.services.bigquery.model.JobStatistics) JobStatistics2(com.google.api.services.bigquery.model.JobStatistics2) JobReference(com.google.api.services.bigquery.model.JobReference) JobConfigurationQuery(com.google.api.services.bigquery.model.JobConfigurationQuery) Dataset(com.google.api.services.bigquery.model.Dataset) Matchers.anyString(org.mockito.Matchers.anyString) Matchers.containsString(org.hamcrest.Matchers.containsString) JobStatus(com.google.api.services.bigquery.model.JobStatus) TableReference(com.google.api.services.bigquery.model.TableReference) TableRow(com.google.api.services.bigquery.model.TableRow) Job(com.google.api.services.bigquery.model.Job) JobConfiguration(com.google.api.services.bigquery.model.JobConfiguration) Test(org.junit.Test)

Example 9 with Dataset

use of com.google.api.services.bigquery.model.Dataset in project beam by apache.

the class BigQueryTableRowIterator method createDataset.

/**
 * Creates a new BigQuery dataset named {@code datasetId} in this iterator's project.
 *
 * @param datasetId id of the dataset to create
 * @param location location to set on the dataset; left unset when {@code null}
 */
private void createDataset(String datasetId, @Nullable String location) throws IOException, InterruptedException {
    DatasetReference datasetRef = new DatasetReference().setProjectId(projectId).setDatasetId(datasetId);
    Dataset toCreate = new Dataset().setDatasetReference(datasetRef);
    if (location != null) {
        toCreate.setLocation(location);
    }
    // The insert request goes through executeWithBackOff together with the error text to use.
    executeWithBackOff(
        client.datasets().insert(projectId, toCreate),
        String.format("Error when trying to create the temporary dataset %s in project %s.", datasetId, projectId));
}
Also used : DatasetReference(com.google.api.services.bigquery.model.DatasetReference) Dataset(com.google.api.services.bigquery.model.Dataset)

Aggregations

Dataset (com.google.api.services.bigquery.model.Dataset): 9; TableReference (com.google.api.services.bigquery.model.TableReference): 4; Test (org.junit.Test): 4; DatasetReference (com.google.api.services.bigquery.model.DatasetReference): 3; Datasets (com.google.api.services.bigquery.Bigquery.Datasets): 2; Tables (com.google.api.services.bigquery.Bigquery.Tables): 2; Job (com.google.api.services.bigquery.model.Job): 2; JobConfiguration (com.google.api.services.bigquery.model.JobConfiguration): 2; JobConfigurationQuery (com.google.api.services.bigquery.model.JobConfigurationQuery): 2; JobReference (com.google.api.services.bigquery.model.JobReference): 2; JobStatistics (com.google.api.services.bigquery.model.JobStatistics): 2; JobStatistics2 (com.google.api.services.bigquery.model.JobStatistics2): 2; JobStatus (com.google.api.services.bigquery.model.JobStatus): 2; Table (com.google.api.services.bigquery.model.Table): 2; TableRow (com.google.api.services.bigquery.model.TableRow): 2; View (com.google.cloud.bigquery.Acl.View): 2; Function (com.google.common.base.Function): 2; BigQueryOptions (org.apache.beam.sdk.io.gcp.bigquery.BigQueryOptions): 2; Matchers.containsString (org.hamcrest.Matchers.containsString): 2; Matchers.anyString (org.mockito.Matchers.anyString): 2