@Deprecated public class CanopyDriver extends AbstractJob
Modifier and Type | Field and Description |
---|---|
static String |
DEFAULT_CLUSTERED_POINTS_DIRECTORY
Deprecated.
|
argMap, inputFile, inputPath, outputFile, outputPath, tempPath
Constructor and Description |
---|
CanopyDriver()
Deprecated.
|
Modifier and Type | Method and Description |
---|---|
static org.apache.hadoop.fs.Path |
buildClusters(org.apache.hadoop.conf.Configuration conf,
org.apache.hadoop.fs.Path input,
org.apache.hadoop.fs.Path output,
DistanceMeasure measure,
double t1,
double t2,
double t3,
double t4,
int clusterFilter,
boolean runSequential)
Deprecated.
Build a directory of Canopy clusters from the input vectors and other
arguments.
|
static org.apache.hadoop.fs.Path |
buildClusters(org.apache.hadoop.conf.Configuration conf,
org.apache.hadoop.fs.Path input,
org.apache.hadoop.fs.Path output,
DistanceMeasure measure,
double t1,
double t2,
int clusterFilter,
boolean runSequential)
Deprecated.
Convenience method for backwards compatibility
|
static void |
main(String[] args)
Deprecated.
|
static void |
run(org.apache.hadoop.conf.Configuration conf,
org.apache.hadoop.fs.Path input,
org.apache.hadoop.fs.Path output,
DistanceMeasure measure,
double t1,
double t2,
boolean runClustering,
double clusterClassificationThreshold,
boolean runSequential)
Deprecated.
Convenience method to provide backward compatibility
|
static void |
run(org.apache.hadoop.conf.Configuration conf,
org.apache.hadoop.fs.Path input,
org.apache.hadoop.fs.Path output,
DistanceMeasure measure,
double t1,
double t2,
double t3,
double t4,
int clusterFilter,
boolean runClustering,
double clusterClassificationThreshold,
boolean runSequential)
Deprecated.
Build a directory of Canopy clusters from the input arguments and, if
requested, cluster the input vectors using these clusters
|
static void |
run(org.apache.hadoop.fs.Path input,
org.apache.hadoop.fs.Path output,
DistanceMeasure measure,
double t1,
double t2,
boolean runClustering,
double clusterClassificationThreshold,
boolean runSequential)
Deprecated.
Convenience method that creates a new Configuration(). Builds a directory of Canopy
clusters from the input arguments and, if requested, clusters the input
vectors using these clusters.
|
int |
run(String[] args)
Deprecated.
|
addFlag, addInputOption, addOption, addOption, addOption, addOption, addOutputOption, buildOption, buildOption, getAnalyzerClassFromOption, getCLIOption, getConf, getDimensions, getFloat, getFloat, getGroup, getInputFile, getInputPath, getInt, getInt, getOption, getOption, getOption, getOptions, getOutputFile, getOutputPath, getOutputPath, getTempPath, getTempPath, hasOption, keyFor, maybePut, parseArguments, parseArguments, parseDirectories, prepareJob, prepareJob, prepareJob, prepareJob, setConf, setS3SafeCombinedInputPath, shouldRunNextPhase
public static final String DEFAULT_CLUSTERED_POINTS_DIRECTORY
public static void run(org.apache.hadoop.conf.Configuration conf, org.apache.hadoop.fs.Path input, org.apache.hadoop.fs.Path output, DistanceMeasure measure, double t1, double t2, double t3, double t4, int clusterFilter, boolean runClustering, double clusterClassificationThreshold, boolean runSequential) throws IOException, InterruptedException, ClassNotFoundException
Parameters:
conf - the Configuration
input - the Path to the directory containing input vectors
output - the Path for all output directories
measure - the DistanceMeasure
t1 - the double T1 distance metric
t2 - the double T2 distance metric
t3 - the reducer's double T1 distance metric
t4 - the reducer's double T2 distance metric
clusterFilter - the minimum canopy size output by the mappers
runClustering - cluster the input vectors if true
clusterClassificationThreshold - vectors having pdf below this value will not be clustered. Its value should be between 0 and 1.
runSequential - execute sequentially if true
Throws:
IOException
InterruptedException
ClassNotFoundException
public static void run(org.apache.hadoop.conf.Configuration conf, org.apache.hadoop.fs.Path input, org.apache.hadoop.fs.Path output, DistanceMeasure measure, double t1, double t2, boolean runClustering, double clusterClassificationThreshold, boolean runSequential) throws IOException, InterruptedException, ClassNotFoundException
public static void run(org.apache.hadoop.fs.Path input, org.apache.hadoop.fs.Path output, DistanceMeasure measure, double t1, double t2, boolean runClustering, double clusterClassificationThreshold, boolean runSequential) throws IOException, InterruptedException, ClassNotFoundException
Parameters:
input - the Path to the directory containing input vectors
output - the Path for all output directories
t1 - the double T1 distance metric
t2 - the double T2 distance metric
runClustering - cluster the input vectors if true
clusterClassificationThreshold - vectors having pdf below this value will not be clustered. Its value should be between 0 and 1.
runSequential - execute sequentially if true
Throws:
IOException
InterruptedException
ClassNotFoundException
public static org.apache.hadoop.fs.Path buildClusters(org.apache.hadoop.conf.Configuration conf, org.apache.hadoop.fs.Path input, org.apache.hadoop.fs.Path output, DistanceMeasure measure, double t1, double t2, int clusterFilter, boolean runSequential) throws IOException, InterruptedException, ClassNotFoundException
public static org.apache.hadoop.fs.Path buildClusters(org.apache.hadoop.conf.Configuration conf, org.apache.hadoop.fs.Path input, org.apache.hadoop.fs.Path output, DistanceMeasure measure, double t1, double t2, double t3, double t4, int clusterFilter, boolean runSequential) throws IOException, InterruptedException, ClassNotFoundException
Parameters:
conf - the Configuration to use
input - the Path to the directory containing input vectors
output - the Path for all output directories
measure - the DistanceMeasure
t1 - the double T1 distance metric
t2 - the double T2 distance metric
t3 - the reducer's double T1 distance metric
t4 - the reducer's double T2 distance metric
clusterFilter - the int minimum size of canopies produced
runSequential - a boolean indicating whether to run the sequential (reference) algorithm
Throws:
IOException
InterruptedException
ClassNotFoundException
Copyright © 2008–2015 The Apache Software Foundation. All rights reserved.