package de.lmu.ifi.dbs.elki.algorithm.outlier; /* This file is part of ELKI: Environment for Developing KDD-Applications Supported by Index-Structures Copyright (C) 2011 Ludwig-Maximilians-Universität München Lehr- und Forschungseinheit für Datenbanksysteme ELKI Development Team This program is free software: you can redistribute it and/or modify it under the terms of the GNU Affero General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public License for more details. You should have received a copy of the GNU Affero General Public License along with this program. If not, see <http://www.gnu.org/licenses/>. */ import de.lmu.ifi.dbs.elki.algorithm.AbstractDistanceBasedAlgorithm; import de.lmu.ifi.dbs.elki.data.type.TypeInformation; import de.lmu.ifi.dbs.elki.data.type.TypeUtil; import de.lmu.ifi.dbs.elki.database.Database; import de.lmu.ifi.dbs.elki.database.datastore.DataStore; import de.lmu.ifi.dbs.elki.database.relation.MaterializedRelation; import de.lmu.ifi.dbs.elki.database.relation.Relation; import de.lmu.ifi.dbs.elki.distance.distancefunction.DistanceFunction; import de.lmu.ifi.dbs.elki.distance.distancevalue.Distance; import de.lmu.ifi.dbs.elki.result.outlier.OutlierResult; import de.lmu.ifi.dbs.elki.result.outlier.OutlierScoreMeta; import de.lmu.ifi.dbs.elki.result.outlier.ProbabilisticOutlierScore; import de.lmu.ifi.dbs.elki.utilities.optionhandling.OptionID; import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameterization.Parameterization; import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameters.DistanceParameter; /** * Simple distance based outlier detection algorithms. * *

* Reference: E.M. Knorr, R. T. Ng: Algorithms for Mining Distance-Based
* Outliers in Large Datasets, In: Procs Int. Conf. on Very Large Databases
* (VLDB'98), New York, USA, 1998.
*
* @author Lisa Reichert
*
* @param <O> the type of DatabaseObjects handled by this Algorithm
* @param <D> the type of Distance used by this Algorithm
*/
public abstract class AbstractDBOutlier<O, D extends Distance<D>> extends AbstractDistanceBasedAlgorithm<O, D, OutlierResult> implements OutlierAlgorithm {
  // NOTE(review): the generic type arguments in this class were reconstructed
  // after an extraction step removed everything between angle brackets.
  // Confirm them against the declarations of AbstractDistanceBasedAlgorithm,
  // DistanceFunction and DistanceParameter.

  /**
   * Parameter to specify the size of the D-neighborhood
   */
  public static final OptionID D_ID = OptionID.getOrCreateOptionID("dbod.d", "size of the D-neighborhood");

  /**
   * Holds the value of {@link #D_ID}. Assigned once in the constructor.
   */
  private final D d;

  /**
   * Constructor with actual parameters.
   *
   * @param distanceFunction distance function to use
   * @param d d value
   */
  public AbstractDBOutlier(DistanceFunction<? super O, D> distanceFunction, D d) {
    super(distanceFunction);
    this.d = d;
  }

  /**
   * Runs the algorithm in the timed evaluation part.
   *
   * Delegates the scoring to
   * {@link #computeOutlierScores(Database, Relation, Distance)} using the
   * configured {@code d}, then wraps the scores into an {@link OutlierResult}
   * that carries a {@link ProbabilisticOutlierScore} as score meta data.
   *
   * @param database Database, passed on to the score computation
   * @param relation Relation to process; also supplies the DBIDs of the result
   * @return outlier result holding the computed scores
   * @throws IllegalStateException declared by the original signature; this
   *         method does not throw it directly
   */
  public OutlierResult run(Database database, Relation<O> relation) throws IllegalStateException {
    // Run the actual score process
    DataStore<Double> dbodscore = computeOutlierScores(database, relation, d);

    // Build result representation.
    // NOTE(review): the label below reads "Density-Based" although this class
    // is documented as distance-based outlier detection. The string is emitted
    // at runtime and is therefore left unchanged here.
    Relation<Double> scoreResult = new MaterializedRelation<Double>("Density-Based Outlier Detection", "db-outlier", TypeUtil.DOUBLE, dbodscore, relation.getDBIDs());
    OutlierScoreMeta scoreMeta = new ProbabilisticOutlierScore();
    return new OutlierResult(scoreMeta, scoreResult);
  }

  /**
   * computes an outlier score for each object of the database.
   *
   * @param database Database
   * @param relation Relation
   * @param d distance
   * @return computed scores
   */
  protected abstract DataStore<Double> computeOutlierScores(Database database, Relation<O> relation, D d);

  @Override
  public TypeInformation[] getInputTypeRestriction() {
    return TypeUtil.array(getDistanceFunction().getInputTypeRestriction());
  }

  /**
   * Parameterization class.
   *
   * @author Erich Schubert
   *
   * @apiviz.exclude
   *
   * @param <O> the type of DatabaseObjects handled
   * @param <D> the type of Distance used
   */
  public static abstract class Parameterizer<O, D extends Distance<D>> extends AbstractDistanceBasedAlgorithm.Parameterizer<O, D> {
    /**
     * Query radius
     */
    protected D d = null;

    @Override
    protected void makeOptions(Parameterization config) {
      super.makeOptions(config);
      configD(config, distanceFunction);
    }

    /**
     * Grab the 'd' configuration option.
     *
     * The option is registered under {@link #D_ID}. When it can be grabbed
     * from the configuration, its value is stored in {@link #d}; otherwise
     * {@link #d} is left untouched.
     *
     * @param config Parameterization
     * @param distanceFunction distance function supplying the distance
     *        factory for the parameter; may be {@code null}, in which case a
     *        {@code null} factory is passed on
     */
    protected void configD(Parameterization config, DistanceFunction<?, D> distanceFunction) {
      final D distanceFactory = (distanceFunction != null) ? distanceFunction.getDistanceFactory() : null;
      final DistanceParameter<D> param = new DistanceParameter<D>(D_ID, distanceFactory);
      if(config.grab(param)) {
        d = param.getValue();
      }
    }
  }
}