mahout-user mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From Aleksander Sadecki <aleksander.sade...@pi.esisar.grenoble-inp.fr>
Subject Apache Mahout - KMeans Clustering
Date Wed, 21 May 2014 12:39:31 GMT
Hi,

Thank you for your answer.

I changed my pom.xml:

		<mahout.version>0.7</mahout.version>
		
		<mahout.groupid>org.apache.mahout</mahout.groupid>

	        <dependency>
			<groupId>${mahout.groupid}</groupId>
			<artifactId>mahout-core</artifactId>
			<version>${mahout.version}</version>
		</dependency>
		<dependency>
			<groupId>${mahout.groupid}</groupId>
			<artifactId>mahout-core</artifactId>
			<type>test-jar</type>
			<scope>test</scope>
			<version>${mahout.version}</version>
		</dependency>
		<dependency>
			<groupId>${mahout.groupid}</groupId>
			<artifactId>mahout-math</artifactId>
			<version>${mahout.version}</version>
		</dependency>
		<dependency>
			<groupId>${mahout.groupid}</groupId>
			<artifactId>mahout-math</artifactId>
			<type>test-jar</type>
			<scope>test</scope>
			<version>${mahout.version}</version>
		</dependency>
		<dependency>
			<groupId>${mahout.groupid}</groupId>
			<artifactId>mahout-examples</artifactId>
			<version>${mahout.version}</version>
		</dependency>

I copied the following classes:

mia.clustering.ClusterHelper
mia.clustering.ClustersFilter
mia.clustering.ch07.SimpleKMeansClustering

and finally I can compile it.

When I run it, I get the following error:

DEBUG Configuration - java.io.IOException: config()
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:226)
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:213)
	at com.sicap.targetme.bi.kmeans.KMeansClustering.main(KMeansClustering.java:53)

DEBUG Configuration - java.io.IOException: config()
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:226)
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:213)
	at org.apache.hadoop.security.UserGroupInformation.ensureInitialized(UserGroupInformation.java:159)
	at org.apache.hadoop.security.UserGroupInformation.isSecurityEnabled(UserGroupInformation.java:216)
	at org.apache.hadoop.security.UserGroupInformation.getLoginUser(UserGroupInformation.java:409)
	at org.apache.hadoop.security.UserGroupInformation.getCurrentUser(UserGroupInformation.java:395)
	at org.apache.hadoop.fs.FileSystem$Cache$Key.<init>(FileSystem.java:1418)
	at org.apache.hadoop.fs.FileSystem$Cache.get(FileSystem.java:1319)
	at org.apache.hadoop.fs.FileSystem.get(FileSystem.java:226)
	at org.apache.hadoop.fs.FileSystem.get(FileSystem.java:109)
	at com.sicap.targetme.bi.kmeans.KMeansClustering.main(KMeansClustering.java:54)

DEBUG Groups -  Creating new Groups object
DEBUG Groups - Group mapping impl=org.apache.hadoop.security.ShellBasedUnixGroupsMapping;
cacheTimeout=300000
DEBUG FileSystem - Creating filesystem for file:///
INFO  HadoopUtil - Deleting output
INFO  KMeansDriver - Input: testdata/points Clusters In: testdata/clusters Out: output Distance:
org.apache.mahout.common.distance.EuclideanDistanceMeasure
INFO  KMeansDriver - convergence: 0.001 max Iterations: 10 num Reduce Tasks: org.apache.mahout.math.VectorWritable
Input Vectors: {}
DEBUG KMeansUtil - Read 1 Cluster from testdata/clusters
DEBUG KMeansUtil - Read 1 Cluster from testdata/clusters
DEBUG Configuration - java.io.IOException: config()
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:226)
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:213)
	at org.apache.mahout.clustering.classify.ClusterClassifier.writePolicy(ClusterClassifier.java:232)
	at org.apache.mahout.clustering.classify.ClusterClassifier.writeToSeqFiles(ClusterClassifier.java:185)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.buildClusters(KMeansDriver.java:224)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.run(KMeansDriver.java:149)
	at com.sicap.targetme.bi.kmeans.KMeansClustering.main(KMeansClustering.java:73)

DEBUG Configuration - java.io.IOException: config()
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:226)
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:213)
	at org.apache.mahout.clustering.classify.ClusterClassifier.writeToSeqFiles(ClusterClassifier.java:186)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.buildClusters(KMeansDriver.java:224)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.run(KMeansDriver.java:149)
	at com.sicap.targetme.bi.kmeans.KMeansClustering.main(KMeansClustering.java:73)

DEBUG Configuration - java.io.IOException: config()
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:226)
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:213)
	at org.apache.mahout.clustering.classify.ClusterClassifier.readPolicy(ClusterClassifier.java:221)
	at org.apache.mahout.clustering.iterator.ClusterIterator.iterateMR(ClusterIterator.java:160)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.buildClusters(KMeansDriver.java:229)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.run(KMeansDriver.java:149)
	at com.sicap.targetme.bi.kmeans.KMeansClustering.main(KMeansClustering.java:73)

Cluster Iterator running iteration 1 over priorPath: output/clusters-0
DEBUG Configuration - java.io.IOException: config(config)
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:259)
	at org.apache.hadoop.mapred.JobConf.<init>(JobConf.java:343)
	at org.apache.hadoop.mapreduce.JobContext.<init>(JobContext.java:76)
	at org.apache.hadoop.mapreduce.Job.<init>(Job.java:50)
	at org.apache.hadoop.mapreduce.Job.<init>(Job.java:54)
	at org.apache.mahout.clustering.iterator.ClusterIterator.iterateMR(ClusterIterator.java:168)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.buildClusters(KMeansDriver.java:229)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.run(KMeansDriver.java:149)
	at com.sicap.targetme.bi.kmeans.KMeansClustering.main(KMeansClustering.java:73)

DEBUG Configuration - java.io.IOException: config(config)
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:259)
	at org.apache.hadoop.mapred.JobConf.<init>(JobConf.java:343)
	at org.apache.hadoop.mapred.LocalJobRunner.<init>(LocalJobRunner.java:420)
	at org.apache.hadoop.mapred.JobClient.init(JobClient.java:468)
	at org.apache.hadoop.mapred.JobClient.<init>(JobClient.java:453)
	at org.apache.hadoop.mapreduce.Job$1.run(Job.java:478)
	at java.security.AccessController.doPrivileged(Native Method)
	at javax.security.auth.Subject.doAs(Unknown Source)
	at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1059)
	at org.apache.hadoop.mapreduce.Job.connect(Job.java:476)
	at org.apache.hadoop.mapreduce.Job.submit(Job.java:464)
	at org.apache.hadoop.mapreduce.Job.waitForCompletion(Job.java:495)
	at org.apache.mahout.clustering.iterator.ClusterIterator.iterateMR(ClusterIterator.java:185)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.buildClusters(KMeansDriver.java:229)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.run(KMeansDriver.java:149)
	at com.sicap.targetme.bi.kmeans.KMeansClustering.main(KMeansClustering.java:73)

DEBUG Configuration - java.io.IOException: config(config)
	at org.apache.hadoop.conf.Configuration.<init>(Configuration.java:259)
	at org.apache.hadoop.mapred.JobConf.<init>(JobConf.java:343)
	at org.apache.hadoop.mapred.LocalJobRunner.<init>(LocalJobRunner.java:421)
	at org.apache.hadoop.mapred.JobClient.init(JobClient.java:468)
	at org.apache.hadoop.mapred.JobClient.<init>(JobClient.java:453)
	at org.apache.hadoop.mapreduce.Job$1.run(Job.java:478)
	at java.security.AccessController.doPrivileged(Native Method)
	at javax.security.auth.Subject.doAs(Unknown Source)
	at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1059)
	at org.apache.hadoop.mapreduce.Job.connect(Job.java:476)
	at org.apache.hadoop.mapreduce.Job.submit(Job.java:464)
	at org.apache.hadoop.mapreduce.Job.waitForCompletion(Job.java:495)
	at org.apache.mahout.clustering.iterator.ClusterIterator.iterateMR(ClusterIterator.java:185)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.buildClusters(KMeansDriver.java:229)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.run(KMeansDriver.java:149)
	at com.sicap.targetme.bi.kmeans.KMeansClustering.main(KMeansClustering.java:73)

Exception in thread "main" java.io.IOException: Failed to set permissions of path: \tmp\hadoop-mynamehere\mapred\staging\mynamehere-965149672\.staging
to 0700
	at org.apache.hadoop.fs.FileUtil.checkReturnValue(FileUtil.java:680)
	at org.apache.hadoop.fs.FileUtil.setPermission(FileUtil.java:653)
	at org.apache.hadoop.fs.RawLocalFileSystem.setPermission(RawLocalFileSystem.java:483)
	at org.apache.hadoop.fs.RawLocalFileSystem.mkdirs(RawLocalFileSystem.java:318)
	at org.apache.hadoop.fs.FilterFileSystem.mkdirs(FilterFileSystem.java:183)
	at org.apache.hadoop.mapreduce.JobSubmissionFiles.getStagingDir(JobSubmissionFiles.java:116)
	at org.apache.hadoop.mapred.JobClient$2.run(JobClient.java:813)
	at org.apache.hadoop.mapred.JobClient$2.run(JobClient.java:807)
	at java.security.AccessController.doPrivileged(Native Method)
	at javax.security.auth.Subject.doAs(Unknown Source)
	at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1059)
	at org.apache.hadoop.mapred.JobClient.submitJobInternal(JobClient.java:807)
	at org.apache.hadoop.mapreduce.Job.submit(Job.java:465)
	at org.apache.hadoop.mapreduce.Job.waitForCompletion(Job.java:495)
	at org.apache.mahout.clustering.iterator.ClusterIterator.iterateMR(ClusterIterator.java:185)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.buildClusters(KMeansDriver.java:229)
	at org.apache.mahout.clustering.kmeans.KMeansDriver.run(KMeansDriver.java:149)
	at com.sicap.targetme.bi.kmeans.KMeansClustering.main(KMeansClustering.java:73)
DEBUG FileSystem - Starting clear of FileSystem cache with 1 elements.
DEBUG FileSystem - Removing filesystem for file:///
DEBUG FileSystem - Removing filesystem for file:///
DEBUG FileSystem - Done clearing cache

So, what should I do now? Isn't this a problem with the Windows platform?

Thank you in advance
Aleksander Sadecki

Mime
View raw message