use of de.lmu.ifi.dbs.elki.utilities.ELKIBuilder in project elki by elki-project.
the class FastMultidimensionalScalingTransformTest method parameters.
/**
* Test with parameters.
*/
@Test
public void parameters() {
int pdim = 2;
String filename = UNITTEST + "transformation-test-1.csv";
FastMultidimensionalScalingTransform<DoubleVector, DoubleVector> filter = //
new ELKIBuilder<FastMultidimensionalScalingTransform<DoubleVector, DoubleVector>>(FastMultidimensionalScalingTransform.class).with(ClassicMultidimensionalScalingTransform.Parameterizer.DIM_ID, //
pdim).with(FastMultidimensionalScalingTransform.Parameterizer.RANDOM_ID, //
0L).with(ClassicMultidimensionalScalingTransform.Parameterizer.DISTANCE_ID, //
EuclideanDistanceFunction.class).build();
MultipleObjectsBundle filteredBundle = readBundle(filename, filter);
// Load the test data again without a filter.
MultipleObjectsBundle unfilteredBundle = readBundle(filename);
int dimu = getFieldDimensionality(unfilteredBundle, 0, TypeUtil.NUMBER_VECTOR_FIELD);
int dimf = getFieldDimensionality(filteredBundle, 0, TypeUtil.NUMBER_VECTOR_FIELD);
assertEquals("Dimensionality not as requested", pdim, dimf);
// Verify that the Euclidean distance between any two points is identical
// before and after the MDS transform is performed - O(n^2)!
// Calculate the covariance matricies of the filtered and unfiltered
// bundles.
CovarianceMatrix cmUnfil = new CovarianceMatrix(dimu);
CovarianceMatrix cmFil = new CovarianceMatrix(dimf);
for (int outer = 0; outer < filteredBundle.dataLength(); outer++) {
DoubleVector dFil_1 = get(filteredBundle, outer, 0, DoubleVector.class);
DoubleVector dUnfil_1 = get(unfilteredBundle, outer, 0, DoubleVector.class);
cmUnfil.put(dUnfil_1);
cmFil.put(dFil_1);
for (int row = outer + 1; row < filteredBundle.dataLength(); row++) {
DoubleVector dFil_2 = get(filteredBundle, row, 0, DoubleVector.class);
DoubleVector dUnfil_2 = get(unfilteredBundle, row, 0, DoubleVector.class);
final double distF = EuclideanDistanceFunction.STATIC.distance(dFil_1, dFil_2);
final double distU = EuclideanDistanceFunction.STATIC.distance(dUnfil_1, dUnfil_2);
assertEquals("Expected same distance", distU, distF, 1e-10);
}
}
// Calculate the SVD of the covariance matrix of the unfiltered data.
// Verify that this SVD represents the diagonals of the covariance matrix of
// the filtered data.
double[][] ncmUnfil = cmUnfil.destroyToPopulationMatrix();
double[][] ncmFil = cmFil.destroyToPopulationMatrix();
SingularValueDecomposition svd = new SingularValueDecomposition(ncmUnfil);
double[] dia = svd.getSingularValues();
for (int ii = 0; ii < dia.length; ii++) {
assertEquals("Unexpected covariance", dia[ii], ncmFil[ii][ii], 1e-8);
}
}
use of de.lmu.ifi.dbs.elki.utilities.ELKIBuilder in project elki by elki-project.
the class ExternalIDFilterTest method parameters.
/**
* Test with parameter c as the column whose label is to be extacted.
*/
@Test
public void parameters() {
final int c = 2;
String filename = UNITTEST + "external-id-test-1.csv";
ExternalIDFilter filter = //
new ELKIBuilder<>(ExternalIDFilter.class).with(ExternalIDFilter.Parameterizer.EXTERNALID_INDEX_ID, c).build();
MultipleObjectsBundle bundle = readBundle(filename, filter);
// Ensure that the filter has correctly formed the bundle.
// We expect that the bundle's first column is a number vector field.
// We expect that the bundle's second column is an ExternalID
// We expect that the bundle's third column is a LabelList object.
// Ensure the first column are the vectors.
assertTrue("Test file not as expected", TypeUtil.NUMBER_VECTOR_FIELD.isAssignableFromType(bundle.meta(0)));
// Ensure that the second column are the ExternalID objects.
Object obj = bundle.data(0, 1);
assertEquals("Unexpected data type", ExternalID.class, obj.getClass());
// Ensure that the length of the list of ExternalID objects has the correct
// length.
assertEquals("Unexpected data length", bundle.dataLength(), bundle.getColumn(1).size());
// Ensure that the third column are the LabelList objects.
obj = bundle.data(0, 2);
assertEquals("Unexpected data type", LabelList.class, obj.getClass());
}
use of de.lmu.ifi.dbs.elki.utilities.ELKIBuilder in project elki by elki-project.
the class VectorDimensionalityFilterTest method parameters.
/**
* Test with parameter dim_keep as the dimensionality of the vectors to leave.
*/
@Test
public void parameters() {
final int dim_keep = 10;
String filename = UNITTEST + "dimensionality-test-2.csv";
VectorDimensionalityFilter<DoubleVector> filter = //
new ELKIBuilder<VectorDimensionalityFilter<DoubleVector>>(VectorDimensionalityFilter.class).with(VectorDimensionalityFilter.Parameterizer.DIM_P, dim_keep).build();
MultipleObjectsBundle filteredBundle = readBundle(filename, filter);
// Load the test data again without a filter.
MultipleObjectsBundle unfilteredBundle = readBundle(filename);
// Verify that the filter has removed the vectors of the wrong
// dimensionality.
boolean foundTooSmall = false;
for (int row = 0; row < unfilteredBundle.dataLength(); row++) {
Object obj = unfilteredBundle.data(row, 0);
assertEquals("Unexpected data type", DoubleVector.class, obj.getClass());
DoubleVector d = (DoubleVector) obj;
if (d.getDimensionality() != dim_keep) {
foundTooSmall = true;
break;
}
}
assertTrue("Expected a vector with filterable dimensionality", foundTooSmall);
assertTrue("Expected smaller data length", filteredBundle.dataLength() < unfilteredBundle.dataLength());
}
use of de.lmu.ifi.dbs.elki.utilities.ELKIBuilder in project elki by elki-project.
the class SampleKMeansInitializationTest method testSampleKMeansInitialization.
/**
* Run KMeans with fixed parameters and compare the result to a golden
* standard.
*/
@Test
public void testSampleKMeansInitialization() {
Database db = makeSimpleDatabase(UNITTEST + "different-densities-2d-no-noise.ascii", 1000);
Clustering<?> result = //
new ELKIBuilder<SingleAssignmentKMeans<DoubleVector>>(SingleAssignmentKMeans.class).with(KMeans.K_ID, //
5).with(KMeans.SEED_ID, //
8).with(KMeans.INIT_ID, //
SampleKMeansInitialization.class).with(SampleKMeansInitialization.Parameterizer.KMEANS_ID, //
KMeansHamerly.class).with(KMeans.SEED_ID, //
8).with(SampleKMeansInitialization.Parameterizer.SAMPLE_ID, //
100).build().run(db);
testFMeasure(db, result, 0.99601);
testClusterSizes(result, new int[] { 199, 199, 200, 201, 201 });
}
use of de.lmu.ifi.dbs.elki.utilities.ELKIBuilder in project elki by elki-project.
the class CLIQUETest method testCLIQUEResults.
/**
* Run CLIQUE with fixed parameters and compare the result to a golden
* standard.
*/
@Test
public void testCLIQUEResults() {
Database db = makeSimpleDatabase(UNITTEST + "subspace-simple.csv", 600);
Clustering<SubspaceModel> result = //
new ELKIBuilder<CLIQUE<DoubleVector>>(CLIQUE.class).with(CLIQUE.Parameterizer.TAU_ID, //
"0.1").with(CLIQUE.Parameterizer.XSI_ID, //
20).build().run(db);
// PairCounting is not appropriate here: overlapping clusterings!
// testFMeasure(db, result, 0.9882);
testClusterSizes(result, new int[] { 200, 200, 216, 400 });
}
Aggregations