package de.lmu.ifi.dbs.elki.datasource.filter; /* This file is part of ELKI: Environment for Developing KDD-Applications Supported by Index-Structures Copyright (C) 2011 Ludwig-Maximilians-Universität München Lehr- und Forschungseinheit für Datenbanksysteme ELKI Development Team This program is free software: you can redistribute it and/or modify it under the terms of the GNU Affero General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public License for more details. You should have received a copy of the GNU Affero General Public License along with this program. If not, see . */ import java.util.BitSet; import java.util.Random; import de.lmu.ifi.dbs.elki.data.FeatureVector; import de.lmu.ifi.dbs.elki.data.NumberVector; import de.lmu.ifi.dbs.elki.data.type.SimpleTypeInformation; import de.lmu.ifi.dbs.elki.data.type.VectorFieldTypeInformation; import de.lmu.ifi.dbs.elki.utilities.Util; import de.lmu.ifi.dbs.elki.utilities.optionhandling.AbstractParameterizer; import de.lmu.ifi.dbs.elki.utilities.optionhandling.OptionID; import de.lmu.ifi.dbs.elki.utilities.optionhandling.constraints.GreaterEqualConstraint; import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameterization.Parameterization; import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameters.IntParameter; /** *

* A RandomProjectionParser selects a subset of attributes randomly for * projection of a ParsingResult. *

* * The cardinality of the subset of attributes is specified as a parameter. * * * @author Arthur Zimek * @author Erich Schubert * * @param the type of FeatureVector contained in both the original data of * the base parser and the projected data of this ProjectionParser */ public abstract class AbstractRandomFeatureSelectionFilter> extends AbstractConversionFilter { /** * The selected attributes */ protected BitSet selectedAttributes = null; /** * Parameter for the desired cardinality of the subset of attributes selected * for projection. * *

* Key: -randomprojection.numberselected *

*

* Default: 1 *

*

* Constraint: ≥1 *

*/ public static final OptionID NUMBER_SELECTED_ATTRIBUTES_ID = OptionID.getOrCreateOptionID("randomprojection.numberselected", "number of selected attributes"); /** * Holds the desired cardinality of the subset of attributes selected for * projection. */ protected int k; /** * Holds a random object. */ protected final Random random = new Random(); /** * Constructor. * * @param dim dimensionality */ public AbstractRandomFeatureSelectionFilter(int dim) { super(); this.k = dim; } @Override protected boolean prepareStart(SimpleTypeInformation in) { int d = ((VectorFieldTypeInformation) in).dimensionality(); selectedAttributes = Util.randomBitSet(k, d, random); // We don't need the full loop, so return false. return false; } /** * Parameterization class. * * @author Erich Schubert * * @apiviz.exclude */ public static abstract class Parameterizer> extends AbstractParameterizer { protected int k = 0; @Override protected void makeOptions(Parameterization config) { super.makeOptions(config); IntParameter kP = new IntParameter(NUMBER_SELECTED_ATTRIBUTES_ID, new GreaterEqualConstraint(1), 1); if(config.grab(kP)) { k = kP.getValue(); } } } }