Search in sources :

Example 31 with Dataset

Use of Dataset in project java-automl by googleapis.

the class DatasetApi method importData.

// [START automl_translate_import_data]
 * Import sentence pairs to the dataset.
 * @param projectId the Google Cloud Project ID.
 * @param computeRegion the Region name. (e.g., "us-central1").
 * @param datasetId the Id of the dataset.
 * @param path the remote Path of the training data csv file.
public static void importData(String projectId, String computeRegion, String datasetId, String path) throws IOException, InterruptedException, ExecutionException {
    // Instantiates a client
    try (AutoMlClient client = AutoMlClient.create()) {
        // Get the complete path of the dataset.
        DatasetName datasetFullId = DatasetName.of(projectId, computeRegion, datasetId);
        GcsSource.Builder gcsSource = GcsSource.newBuilder();
        // Get multiple Google Cloud Storage URIs to import data from
        String[] inputUris = path.split(",");
        for (String inputUri : inputUris) {
        // Import data from the input URI
        InputConfig inputConfig = InputConfig.newBuilder().setGcsSource(gcsSource).build();
        System.out.println("Processing import...");
        Empty response = client.importDataAsync(datasetFullId, inputConfig).get();
        System.out.println(String.format("Dataset imported. %s", response));
Also used: Empty, GcsSource, DatasetName, InputConfig, AutoMlClient

Example 32 with Dataset

Use of Dataset in project java-automl by googleapis.

the class DeleteDatasetTest method setUp.

public void setUp() throws IOException {
    // Create a fake dataset to be deleted
    // Create a random dataset name with a length of 32 characters (max allowed by AutoML)
    // To prevent name collisions when running tests in multiple java versions at once.
    // AutoML doesn't allow "-", but accepts "_"
    String datasetName = String.format("test_%s", UUID.randomUUID().toString().replace("-", "_").substring(0, 26));
    try (AutoMlClient client = AutoMlClient.create()) {
        LocationName projectLocation = LocationName.of(PROJECT_ID, "us-central1");
        TextExtractionDatasetMetadata metadata = TextExtractionDatasetMetadata.newBuilder().build();
        Dataset dataset = Dataset.newBuilder().setDisplayName(datasetName).setTextExtractionDatasetMetadata(metadata).build();
        Dataset createdDataset = client.createDataset(projectLocation, dataset);
        String[] names = createdDataset.getName().split("/");
        datasetId = names[names.length - 1];
    bout = new ByteArrayOutputStream();
    out = new PrintStream(bout);
    originalPrintStream = System.out;
Also used: PrintStream, Dataset, TextExtractionDatasetMetadata, ByteArrayOutputStream, AutoMlClient, LocationName, Before (org.junit.Before)

Example 33 with Dataset

Use of Dataset in project java-automl by googleapis.

the class VisionClassificationCreateDataset method createDataset.

// Create a dataset
static void createDataset(String projectId, String displayName) throws IOException, ExecutionException, InterruptedException {
    // the "close" method on the client to safely clean up any remaining background resources.
    try (AutoMlClient client = AutoMlClient.create()) {
        // A resource that represents Google Cloud Platform location.
        LocationName projectLocation = LocationName.of(projectId, "us-central1");
        // Specify the classification type
        // Types:
        // MultiLabel: Multiple labels are allowed for one example.
        // MultiClass: At most one label is allowed per example.
        ClassificationType classificationType = ClassificationType.MULTILABEL;
        ImageClassificationDatasetMetadata metadata = ImageClassificationDatasetMetadata.newBuilder().setClassificationType(classificationType).build();
        Dataset dataset = Dataset.newBuilder().setDisplayName(displayName).setImageClassificationDatasetMetadata(metadata).build();
        OperationFuture<Dataset, OperationMetadata> future = client.createDatasetAsync(projectLocation, dataset);
        Dataset createdDataset = future.get();
        // Display the dataset information.
        System.out.format("Dataset name: %s\n", createdDataset.getName());
        // To get the dataset id, you have to parse it out of the `name` field. As dataset Ids are
        // required for other methods.
        // Name Form: `projects/{project_id}/locations/{location_id}/datasets/{dataset_id}`
        String[] names = createdDataset.getName().split("/");
        String datasetId = names[names.length - 1];
        System.out.format("Dataset id: %s\n", datasetId);
Also used: ImageClassificationDatasetMetadata, Dataset, OperationMetadata, ClassificationType, AutoMlClient, LocationName

Example 34 with Dataset

Use of Dataset in project java-automl by googleapis.

the class SetEndpoint method setEndpoint.

// Change your endpoint
static void setEndpoint(String projectId) throws IOException {
    // [START automl_set_endpoint]
    AutoMlSettings settings = AutoMlSettings.newBuilder().setEndpoint("").build();
    // Initialize client that will be used to send requests. This client only needs to be created
    // once, and can be reused for multiple requests. After completing all of your requests, call
    // the "close" method on the client to safely clean up any remaining background resources.
    AutoMlClient client = AutoMlClient.create(settings);
    // A resource that represents Google Cloud Platform location.
    LocationName projectLocation = LocationName.of(projectId, "eu");
    // [END automl_set_endpoint]
    ListDatasetsRequest request = ListDatasetsRequest.newBuilder().setParent(projectLocation.toString()).setFilter("translation_dataset_metadata:*").build();
    // List all the datasets available
    System.out.println("List of datasets:");
    for (Dataset dataset : client.listDatasets(request).iterateAll()) {
Also used: Dataset, AutoMlSettings, AutoMlClient, LocationName, ListDatasetsRequest

Example 35 with Dataset

Use of Dataset in project java-automl by googleapis.

the class TablesCreateDataset method createDataset.

// Create a dataset
static void createDataset(String projectId, String displayName) throws IOException {
    // the "close" method on the client to safely clean up any remaining background resources.
    try (AutoMlClient client = AutoMlClient.create()) {
        // A resource that represents Google Cloud Platform location.
        LocationName projectLocation = LocationName.of(projectId, "us-central1");
        TablesDatasetMetadata metadata = TablesDatasetMetadata.newBuilder().build();
        Dataset dataset = Dataset.newBuilder().setDisplayName(displayName).setTablesDatasetMetadata(metadata).build();
        Dataset createdDataset = client.createDataset(projectLocation, dataset);
        // Display the dataset information.
        System.out.format("Dataset name: %s%n", createdDataset.getName());
        // To get the dataset id, you have to parse it out of the `name` field. As dataset Ids are
        // required for other methods.
        // Name Form: `projects/{project_id}/locations/{location_id}/datasets/{dataset_id}`
        String[] names = createdDataset.getName().split("/");
        String datasetId = names[names.length - 1];
        System.out.format("Dataset id: %s%n", datasetId);
Also used: TablesDatasetMetadata, Dataset, AutoMlClient, LocationName


IOException ( AutoMlClient ( ByteArrayOutputStream ( PrintStream ( Before (org.junit.Before)10 Dataset ( ArrayList (java.util.ArrayList)9 Dataset ( LocationName ( OperationMetadata ( DataLabelingServiceClient ( ProjectName ( CreateDatasetOperationMetadata ( Dataset ( DatasetServiceClient ( DatasetServiceSettings ( LocationName ( AutoMlClient ( Dataset ( LocationName (