diff options
author | Andrej Shadura <andrewsh@debian.org> | 2019-03-09 22:30:40 +0000 |
---|---|---|
committer | Andrej Shadura <andrewsh@debian.org> | 2019-03-09 22:30:40 +0000 |
commit | 337087b668d3a54f3afee3a9adb597a32e9f7e94 (patch) | |
tree | d860094269622472f8079d497ac7af02dbb4e038 /src/de/lmu/ifi/dbs/elki/datasource/filter/selection/RandomSamplingStreamFilter.java | |
parent | 14a486343aef55f97f54082d6b542dedebf6f3ba (diff) |
Import Upstream version 0.6.5~20141030
Diffstat (limited to 'src/de/lmu/ifi/dbs/elki/datasource/filter/selection/RandomSamplingStreamFilter.java')
-rw-r--r-- | src/de/lmu/ifi/dbs/elki/datasource/filter/selection/RandomSamplingStreamFilter.java | 144 |
1 files changed, 144 insertions, 0 deletions
diff --git a/src/de/lmu/ifi/dbs/elki/datasource/filter/selection/RandomSamplingStreamFilter.java b/src/de/lmu/ifi/dbs/elki/datasource/filter/selection/RandomSamplingStreamFilter.java new file mode 100644 index 00000000..3e1a3d89 --- /dev/null +++ b/src/de/lmu/ifi/dbs/elki/datasource/filter/selection/RandomSamplingStreamFilter.java @@ -0,0 +1,144 @@ +package de.lmu.ifi.dbs.elki.datasource.filter.selection; + +/* + This file is part of ELKI: + Environment for Developing KDD-Applications Supported by Index-Structures + + Copyright (C) 2014 + Ludwig-Maximilians-Universität München + Lehr- und Forschungseinheit für Datenbanksysteme + ELKI Development Team + + This program is free software: you can redistribute it and/or modify + it under the terms of the GNU Affero General Public License as published by + the Free Software Foundation, either version 3 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU Affero General Public License for more details. + + You should have received a copy of the GNU Affero General Public License + along with this program. If not, see <http://www.gnu.org/licenses/>. + */ + +import java.util.Random; + +import de.lmu.ifi.dbs.elki.datasource.bundle.BundleMeta; +import de.lmu.ifi.dbs.elki.datasource.filter.AbstractStreamFilter; +import de.lmu.ifi.dbs.elki.math.random.RandomFactory; +import de.lmu.ifi.dbs.elki.utilities.Alias; +import de.lmu.ifi.dbs.elki.utilities.optionhandling.AbstractParameterizer; +import de.lmu.ifi.dbs.elki.utilities.optionhandling.OptionID; +import de.lmu.ifi.dbs.elki.utilities.optionhandling.constraints.CommonConstraints; +import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameterization.Parameterization; +import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameters.DoubleParameter; +import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameters.RandomParameter; + +/** + * Subsampling stream filter. + * + * @author Erich Schubert + */ +@Alias({ "de.lmu.ifi.dbs.elki.datasource.filter.normalization.RandomSamplingStreamFilter" }) +public class RandomSamplingStreamFilter extends AbstractStreamFilter { + /** + * Probability + */ + protected double prob; + + /** + * Random generator + */ + protected Random random; + + /** + * Constructor. + * + * @param prob Probability + * @param rnd Random generator + */ + public RandomSamplingStreamFilter(double prob, RandomFactory rnd) { + super(); + this.prob = prob; + this.random = rnd.getSingleThreadedRandom(); + } + + @Override + public BundleMeta getMeta() { + return source.getMeta(); + } + + @Override + public Object data(int rnum) { + return source.data(rnum); + } + + @Override + public Event nextEvent() { + while(true) { + Event ev = source.nextEvent(); + switch(ev){ + case END_OF_STREAM: + return ev; + case META_CHANGED: + return ev; + case NEXT_OBJECT: + if(random.nextDouble() < prob) { + return ev; + } + continue; + } + } + } + + /** + * Parameterization class + * + * @author Erich Schubert + * + * @apiviz.exclude + */ + public static class Parameterizer extends AbstractParameterizer { + /** + * Option ID for sampling probability + */ + private static final OptionID PROB_ID = new OptionID("sampling.p", "Sampling probability. Each object has a chance of being samples with this probability."); + + /** + * Option ID for random seed + */ + private static final OptionID SEED_ID = new OptionID("sampling.seed", "Random generator seed for sampling."); + + /** + * Probability + */ + protected double prob; + + /** + * Random generator + */ + protected RandomFactory rnd; + + @Override + protected void makeOptions(Parameterization config) { + super.makeOptions(config); + DoubleParameter probP = new DoubleParameter(PROB_ID); + probP.addConstraint(CommonConstraints.GREATER_EQUAL_ZERO_DOUBLE); + probP.addConstraint(CommonConstraints.LESS_EQUAL_ONE_DOUBLE); + if(config.grab(probP)) { + prob = probP.getValue().doubleValue(); + } + RandomParameter rndP = new RandomParameter(SEED_ID); + if(config.grab(rndP)) { + rnd = rndP.getValue(); + } + } + + @Override + protected RandomSamplingStreamFilter makeInstance() { + return new RandomSamplingStreamFilter(prob, rnd); + } + } +} |