Search in sources :

Example 1 with MappingInspector

use of com.datastax.oss.dsbulk.mapping.MappingInspector in project dsbulk by datastax.

the class SchemaSettings method init.

public void init(CqlSession session, ConvertingCodecFactory codecFactory, boolean indexedMappingSupported, boolean mappedMappingSupported) {
    this.codecFactory = codecFactory;
    try {
        if (config.hasPath(KEYSPACE) && config.hasPath(GRAPH)) {
            throw new IllegalArgumentException("Settings schema.keyspace and schema.graph are mutually exclusive");
        }
        if (config.hasPath(TABLE) && config.hasPath(VERTEX)) {
            throw new IllegalArgumentException("Settings schema.table and schema.vertex are mutually exclusive");
        }
        if (config.hasPath(TABLE) && config.hasPath(EDGE)) {
            throw new IllegalArgumentException("Settings schema.table and schema.edge are mutually exclusive");
        }
        if (config.hasPath(VERTEX) && config.hasPath(EDGE)) {
            throw new IllegalArgumentException("Settings schema.vertex and schema.edge are mutually exclusive");
        }
        if (config.hasPath(EDGE)) {
            if (!config.hasPath(FROM)) {
                throw new IllegalArgumentException("Setting schema.from is required when schema.edge is specified");
            }
            if (!config.hasPath(TO)) {
                throw new IllegalArgumentException("Setting schema.to is required when schema.edge is specified");
            }
        }
        if (config.hasPath(QUERY) && (config.hasPath(TABLE) || config.hasPath(VERTEX) || config.hasPath(EDGE))) {
            throw new IllegalArgumentException("Setting schema.query must not be defined if schema.table, schema.vertex or schema.edge are defined");
        }
        if ((!config.hasPath(KEYSPACE) && !config.hasPath(GRAPH)) && (config.hasPath(TABLE) || config.hasPath(VERTEX) || config.hasPath(EDGE))) {
            throw new IllegalArgumentException("Settings schema.keyspace or schema.graph must be defined if schema.table, schema.vertex or schema.edge are defined");
        }
        if (config.hasPath(KEYSPACE)) {
            keyspace = locateKeyspace(session.getMetadata(), config.getString(KEYSPACE));
        } else if (config.hasPath(GRAPH)) {
            keyspace = locateKeyspace(session.getMetadata(), config.getString(GRAPH));
        }
        if (keyspace != null) {
            if (config.hasPath(TABLE)) {
                table = locateTable(keyspace, config.getString(TABLE));
            } else if (config.hasPath(VERTEX)) {
                table = locateVertexTable(keyspace, config.getString(VERTEX));
            } else if (config.hasPath(EDGE)) {
                table = locateEdgeTable(keyspace, config.getString(EDGE), config.getString(FROM), config.getString(TO));
            }
        }
        // Timestamp and TTL
        ttlSeconds = config.getInt(QUERY_TTL);
        if (config.hasPath(QUERY_TIMESTAMP)) {
            String timestampStr = config.getString(QUERY_TIMESTAMP);
            try {
                ConvertingCodec<String, Instant> codec = codecFactory.createConvertingCodec(DataTypes.TIMESTAMP, GenericType.STRING, true);
                Instant instant = codec.externalToInternal(timestampStr);
                this.timestampMicros = instantToNumber(instant, MICROSECONDS, EPOCH);
            } catch (Exception e) {
                Object format = codecFactory.getContext().getAttribute(TIMESTAMP_PATTERN);
                throw new IllegalArgumentException(String.format("Expecting schema.queryTimestamp to be in %s format but got '%s'", format, timestampStr));
            }
        } else {
            this.timestampMicros = -1L;
        }
        preserveTimestamp = config.getBoolean(PRESERVE_TIMESTAMP);
        preserveTtl = config.getBoolean(PRESERVE_TTL);
        if (config.hasPath(QUERY)) {
            query = config.getString(QUERY);
            queryInspector = new QueryInspector(query);
            if (queryInspector.getKeyspaceName().isPresent()) {
                if (keyspace != null) {
                    throw new IllegalArgumentException("Setting schema.keyspace must not be provided when schema.query contains a keyspace-qualified statement");
                }
                CQLWord keyspaceName = queryInspector.getKeyspaceName().get();
                keyspace = session.getMetadata().getKeyspace(keyspaceName.asIdentifier()).orElse(null);
                if (keyspace == null) {
                    throw new IllegalArgumentException(String.format("Value for schema.query references a non-existent keyspace: %s", keyspaceName.render(VARIABLE)));
                }
            } else if (keyspace == null) {
                throw new IllegalArgumentException("Setting schema.keyspace must be provided when schema.query does not contain a keyspace-qualified statement");
            }
            CQLWord tableName = queryInspector.getTableName();
            table = keyspace.getTable(tableName.asIdentifier()).orElse(null);
            if (table == null) {
                table = keyspace.getView(tableName.asIdentifier()).orElse(null);
                if (table == null) {
                    throw new IllegalArgumentException(String.format("Value for schema.query references a non-existent table or materialized view: %s", tableName.render(VARIABLE)));
                }
            }
            // If a query is provided, ttl and timestamp must not be.
            if (timestampMicros != -1 || ttlSeconds != -1) {
                throw new IllegalArgumentException("Setting schema.query must not be defined if schema.queryTtl or schema.queryTimestamp is defined");
            }
            if (preserveTimestamp || preserveTtl) {
                throw new IllegalArgumentException("Setting schema.query must not be defined if schema.preserveTimestamp or schema.preserveTtl is defined");
            }
        } else {
            if (keyspace == null || table == null) {
                // Either the keyspace and table must be present, or the query must be present.
                throw new IllegalArgumentException("When schema.query is not defined, " + "then either schema.keyspace or schema.graph must be defined, " + "and either schema.table, schema.vertex or schema.edge must be defined");
            }
        }
        assert keyspace != null;
        assert table != null;
        keyspaceName = CQLWord.fromCqlIdentifier(keyspace.getName());
        tableName = CQLWord.fromCqlIdentifier(table.getName());
        if (indexedMappingSupported && mappedMappingSupported) {
            mappingPreference = MAPPED_OR_INDEXED;
        } else if (indexedMappingSupported) {
            mappingPreference = INDEXED_ONLY;
        } else if (mappedMappingSupported) {
            mappingPreference = MAPPED_ONLY;
        } else if (schemaGenerationStrategy.isMapping()) {
            throw new IllegalArgumentException("Connector must support at least one of indexed or mapped mappings");
        }
        if (config.hasPath(MAPPING)) {
            if (!schemaGenerationStrategy.isMapping()) {
                throw new IllegalArgumentException("Setting schema.mapping must not be defined when counting rows in a table");
            }
            Supplier<CQLWord> usingTimestampVariable = null;
            Supplier<CQLWord> usingTTLVariable = null;
            if (queryInspector != null) {
                usingTimestampVariable = queryInspector.getUsingTimestampVariable()::get;
                usingTTLVariable = queryInspector.getUsingTTLVariable()::get;
            }
            // TODO remove support for providing external variable names for the deprecated
            // __ttl and __timestamp mapping tokens.
            @SuppressWarnings("deprecation") MappingInspector mapping = new MappingInspector(config.getString(MAPPING), schemaGenerationStrategy.isWriting(), mappingPreference, usingTimestampVariable, usingTTLVariable);
            this.mapping = mapping;
            Set<MappingField> fields = mapping.getExplicitMappings().keySet();
            Collection<CQLFragment> variables = mapping.getExplicitMappings().values();
            if (schemaGenerationStrategy.isWriting()) {
                // now() = c1 only allowed if schema.query not present
                if (containsFunctionCalls(variables, WRITETIME_OR_TTL.negate())) {
                    throw new IllegalArgumentException("Misplaced function call detected on the right side of a mapping entry; " + "please review your schema.mapping setting");
                }
                if (query != null && containsFunctionCalls(variables, WRITETIME_OR_TTL)) {
                    throw new IllegalArgumentException("Setting schema.query must not be defined when loading if schema.mapping " + "contains a writetime or ttl function on the right side of a mapping entry");
                }
                if (query != null && containsFunctionCalls(fields)) {
                    throw new IllegalArgumentException("Setting schema.query must not be defined when loading if schema.mapping " + "contains a function on the left side of a mapping entry");
                }
                if (containsWritetimeOrTTLFunctionCalls(mapping.getExplicitMappings())) {
                    throw new IllegalArgumentException("Misplaced function call detected on the left side of a writetime or TTL mapping entry; " + "please review your schema.mapping setting");
                }
                // (text)'abc' = c1 only allowed if schema.query not present
                if (containsConstantExpressions(variables)) {
                    throw new IllegalArgumentException("Misplaced constant expression detected on the right side of a mapping entry; " + "please review your schema.mapping setting");
                }
                if (query != null && containsConstantExpressions(fields)) {
                    throw new IllegalArgumentException("Setting schema.query must not be defined when loading if schema.mapping " + "contains a constant expression on the left side of a mapping entry");
                }
            }
            if (schemaGenerationStrategy.isReading()) {
                // f1 = now() only allowed if schema.query not present
                if (containsFunctionCalls(fields)) {
                    throw new IllegalArgumentException("Misplaced function call detected on the left side of a mapping entry; " + "please review your schema.mapping setting");
                }
                if (query != null && containsFunctionCalls(variables)) {
                    throw new IllegalArgumentException("Setting schema.query must not be defined when unloading if schema.mapping " + "contains a function on the right side of a mapping entry");
                }
                // supported
                if (containsConstantExpressions(fields)) {
                    throw new IllegalArgumentException("Misplaced constant expression detected on the left side of a mapping entry; " + "please review your schema.mapping setting");
                }
                if (containsConstantExpressions(variables)) {
                    if (query != null) {
                        throw new IllegalArgumentException("Setting schema.query must not be defined when unloading if schema.mapping " + "contains a constant expression on the right side of a mapping entry");
                    }
                    if (!checkLiteralSelectorsSupported(session)) {
                        throw new IllegalStateException("At least one constant expression appears on the right side of a mapping entry, " + "but the cluster does not support CQL literals in the SELECT clause; " + " please review your schema.mapping setting");
                    }
                }
            }
            if ((preserveTimestamp || preserveTtl) && !mapping.isInferring()) {
                throw new IllegalStateException("Setting schema.mapping must contain an inferring entry (e.g. '*=*') " + "when schema.preserveTimestamp or schema.preserveTtl is enabled");
            }
        } else {
            mapping = new MappingInspector("*=*", schemaGenerationStrategy.isWriting(), mappingPreference);
        }
        // Misc
        nullToUnset = config.getBoolean(NULL_TO_UNSET);
        allowExtraFields = config.getBoolean(ALLOW_EXTRA_FIELDS);
        allowMissingFields = config.getBoolean(ALLOW_MISSING_FIELDS);
        splits = ConfigUtils.getThreads(config, SPLITS);
        if (hasGraphOptions(config)) {
            GraphUtils.checkGraphCompatibility(session);
            if (!isGraph(keyspace)) {
                throw new IllegalStateException("Graph operations requested but provided keyspace is not a graph: " + keyspaceName);
            }
            if (!isSupportedGraph(keyspace)) {
                assert ((DseGraphKeyspaceMetadata) keyspace).getGraphEngine().isPresent();
                throw new IllegalStateException(String.format("Graph operations requested but provided graph %s was created with an unsupported graph engine: %s", keyspaceName, ((DseGraphKeyspaceMetadata) keyspace).getGraphEngine().get()));
            }
        } else if (isGraph(keyspace)) {
            if (isSupportedGraph(keyspace)) {
                if (config.hasPath(KEYSPACE) || config.hasPath(TABLE)) {
                    LOGGER.warn("Provided keyspace is a graph; " + "instead of schema.keyspace and schema.table, please use graph-specific options " + "such as schema.graph, schema.vertex, schema.edge, schema.from and schema.to.");
                }
            } else {
                if (schemaGenerationStrategy == SchemaGenerationStrategy.MAP_AND_WRITE) {
                    LOGGER.warn("Provided keyspace is a graph created with a legacy graph engine: " + ((DseGraphKeyspaceMetadata) keyspace).getGraphEngine().get() + "; attempting to load data into such a keyspace is not supported and " + "may put the graph in an inconsistent state.");
                }
            }
        }
    } catch (ConfigException e) {
        throw ConfigUtils.convertConfigException(e, "dsbulk.schema");
    }
}
Also used : Instant(java.time.Instant) ConfigException(com.typesafe.config.ConfigException) CQLFragment(com.datastax.oss.dsbulk.mapping.CQLFragment) IndexedMappingField(com.datastax.oss.dsbulk.mapping.IndexedMappingField) MappingField(com.datastax.oss.dsbulk.mapping.MappingField) MappedMappingField(com.datastax.oss.dsbulk.mapping.MappedMappingField) ConfigException(com.typesafe.config.ConfigException) NestedBatchException(com.datastax.oss.dsbulk.workflow.commons.schema.NestedBatchException) QueryInspector(com.datastax.oss.dsbulk.workflow.commons.schema.QueryInspector) DseGraphKeyspaceMetadata(com.datastax.dse.driver.api.core.metadata.schema.DseGraphKeyspaceMetadata) MappingInspector(com.datastax.oss.dsbulk.mapping.MappingInspector) CQLWord(com.datastax.oss.dsbulk.mapping.CQLWord)

Aggregations

DseGraphKeyspaceMetadata (com.datastax.dse.driver.api.core.metadata.schema.DseGraphKeyspaceMetadata)1 CQLFragment (com.datastax.oss.dsbulk.mapping.CQLFragment)1 CQLWord (com.datastax.oss.dsbulk.mapping.CQLWord)1 IndexedMappingField (com.datastax.oss.dsbulk.mapping.IndexedMappingField)1 MappedMappingField (com.datastax.oss.dsbulk.mapping.MappedMappingField)1 MappingField (com.datastax.oss.dsbulk.mapping.MappingField)1 MappingInspector (com.datastax.oss.dsbulk.mapping.MappingInspector)1 NestedBatchException (com.datastax.oss.dsbulk.workflow.commons.schema.NestedBatchException)1 QueryInspector (com.datastax.oss.dsbulk.workflow.commons.schema.QueryInspector)1 ConfigException (com.typesafe.config.ConfigException)1 Instant (java.time.Instant)1