package de.lmu.ifi.dbs.elki.algorithm.outlier;
/*
This file is part of ELKI:
Environment for Developing KDD-Applications Supported by Index-Structures
Copyright (C) 2011
Ludwig-Maximilians-Universität München
Lehr- und Forschungseinheit für Datenbanksysteme
ELKI Development Team
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU Affero General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU Affero General Public License for more details.
You should have received a copy of the GNU Affero General Public License
along with this program. If not, see .
*/
import de.lmu.ifi.dbs.elki.algorithm.AbstractDistanceBasedAlgorithm;
import de.lmu.ifi.dbs.elki.data.type.TypeInformation;
import de.lmu.ifi.dbs.elki.data.type.TypeUtil;
import de.lmu.ifi.dbs.elki.database.Database;
import de.lmu.ifi.dbs.elki.database.datastore.DataStore;
import de.lmu.ifi.dbs.elki.database.relation.MaterializedRelation;
import de.lmu.ifi.dbs.elki.database.relation.Relation;
import de.lmu.ifi.dbs.elki.distance.distancefunction.DistanceFunction;
import de.lmu.ifi.dbs.elki.distance.distancevalue.Distance;
import de.lmu.ifi.dbs.elki.result.outlier.OutlierResult;
import de.lmu.ifi.dbs.elki.result.outlier.OutlierScoreMeta;
import de.lmu.ifi.dbs.elki.result.outlier.ProbabilisticOutlierScore;
import de.lmu.ifi.dbs.elki.utilities.optionhandling.OptionID;
import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameterization.Parameterization;
import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameters.DistanceParameter;
/**
* Simple distance based outlier detection algorithms.
*
*
* Reference: E.M. Knorr, R. T. Ng: Algorithms for Mining Distance-Based
* Outliers in Large Datasets, In: Procs Int. Conf. on Very Large Databases
* (VLDB'98), New York, USA, 1998.
*
* @author Lisa Reichert
*
* @param the type of DatabaseObjects handled by this Algorithm
* @param the type of Distance used by this Algorithm
*/
public abstract class AbstractDBOutlier> extends AbstractDistanceBasedAlgorithm implements OutlierAlgorithm {
/**
* Parameter to specify the size of the D-neighborhood
*/
public static final OptionID D_ID = OptionID.getOrCreateOptionID("dbod.d", "size of the D-neighborhood");
/**
* Holds the value of {@link #D_ID}.
*/
private D d;
/**
* Constructor with actual parameters.
*
* @param distanceFunction distance function to use
* @param d d value
*/
public AbstractDBOutlier(DistanceFunction super O, D> distanceFunction, D d) {
super(distanceFunction);
this.d = d;
}
/**
* Runs the algorithm in the timed evaluation part.
*
*/
public OutlierResult run(Database database, Relation relation) throws IllegalStateException {
// Run the actual score process
DataStore dbodscore = computeOutlierScores(database, relation, d);
// Build result representation.
Relation scoreResult = new MaterializedRelation("Density-Based Outlier Detection", "db-outlier", TypeUtil.DOUBLE, dbodscore, relation.getDBIDs());
OutlierScoreMeta scoreMeta = new ProbabilisticOutlierScore();
return new OutlierResult(scoreMeta, scoreResult);
}
/**
* computes an outlier score for each object of the database.
*
* @param database Database
* @param relation Relation
* @param d distance
* @return computed scores
*/
protected abstract DataStore computeOutlierScores(Database database, Relation relation, D d);
@Override
public TypeInformation[] getInputTypeRestriction() {
return TypeUtil.array(getDistanceFunction().getInputTypeRestriction());
}
/**
* Parameterization class.
*
* @author Erich Schubert
*
* @apiviz.exclude
*/
public static abstract class Parameterizer> extends AbstractDistanceBasedAlgorithm.Parameterizer {
/**
* Query radius
*/
protected D d = null;
@Override
protected void makeOptions(Parameterization config) {
super.makeOptions(config);
configD(config, distanceFunction);
}
/**
* Grab the 'd' configuration option.
*
* @param config Parameterization
*/
protected void configD(Parameterization config, DistanceFunction, D> distanceFunction) {
final D distanceFactory = (distanceFunction != null) ? distanceFunction.getDistanceFactory() : null;
final DistanceParameter param = new DistanceParameter(D_ID, distanceFactory);
if(config.grab(param)) {
d = param.getValue();
}
}
}
}