jmannix | 24 May 2013 19:11
Picon
Favicon

svn commit: r1486122 [2/2] - in /mahout/trunk: core/src/main/java/org/apache/mahout/cf/taste/hadoop/als/ core/src/main/java/org/apache/mahout/cf/taste/hadoop/item/ core/src/main/java/org/apache/mahout/cf/taste/hadoop/preparation/ core/src/main/java/org...

Modified: mahout/trunk/core/src/test/java/org/apache/mahout/cf/taste/hadoop/als/ParallelALSFactorizationJobTest.java
URL: http://svn.apache.org/viewvc/mahout/trunk/core/src/test/java/org/apache/mahout/cf/taste/hadoop/als/ParallelALSFactorizationJobTest.java?rev=1486122&r1=1486121&r2=1486122&view=diff
==============================================================================
--- mahout/trunk/core/src/test/java/org/apache/mahout/cf/taste/hadoop/als/ParallelALSFactorizationJobTest.java (original)
+++ mahout/trunk/core/src/test/java/org/apache/mahout/cf/taste/hadoop/als/ParallelALSFactorizationJobTest.java Fri May 24 17:11:20 2013
@@ -27,6 +27,7 @@ import org.apache.mahout.math.Matrix;
 import org.apache.mahout.math.MatrixSlice;
 import org.apache.mahout.math.SparseRowMatrix;
 import org.apache.mahout.math.Vector;
+import org.apache.mahout.math.Vector.Element;
 import org.apache.mahout.math.hadoop.MathHelper;
 import org.junit.Before;
 import org.junit.Test;
@@ -34,7 +35,6 @@ import org.slf4j.Logger;
 import org.slf4j.LoggerFactory;
 
 import java.io.File;
-import java.util.Iterator;
 
 public class ParallelALSFactorizationJobTest extends TasteTestCase {
 
@@ -127,12 +127,8 @@ public class ParallelALSFactorizationJob
     log.info(info.toString());
 
     RunningAverage avg = new FullRunningAverage();
-    Iterator<MatrixSlice> sliceIterator = preferences.iterateAll();
-    while (sliceIterator.hasNext()) {
-      MatrixSlice slice = sliceIterator.next();
-      Iterator<Vector.Element> elementIterator = slice.vector().iterateNonZero();
-      while (elementIterator.hasNext()) {
(Continue reading)

jmannix | 24 May 2013 19:11
Picon
Favicon

svn commit: r1486122 [1/2] - in /mahout/trunk: core/src/main/java/org/apache/mahout/cf/taste/hadoop/als/ core/src/main/java/org/apache/mahout/cf/taste/hadoop/item/ core/src/main/java/org/apache/mahout/cf/taste/hadoop/preparation/ core/src/main/java/org...

Author: jmannix
Date: Fri May 24 17:11:20 2013
New Revision: 1486122

URL: http://svn.apache.org/r1486122
Log:
Removes Iterable and iterateNonZero() from Vector interface, replaces with two Iterable-returning methods; fixes MAHOUT-1227

Modified:
    mahout/trunk/core/src/main/java/org/apache/mahout/cf/taste/hadoop/als/ALS.java
    mahout/trunk/core/src/main/java/org/apache/mahout/cf/taste/hadoop/als/ParallelALSFactorizationJob.java
    mahout/trunk/core/src/main/java/org/apache/mahout/cf/taste/hadoop/als/PredictionMapper.java
    mahout/trunk/core/src/main/java/org/apache/mahout/cf/taste/hadoop/item/AggregateAndRecommendReducer.java
    mahout/trunk/core/src/main/java/org/apache/mahout/cf/taste/hadoop/item/UserVectorSplitterMapper.java
    mahout/trunk/core/src/main/java/org/apache/mahout/cf/taste/hadoop/preparation/ToItemVectorsMapper.java
    mahout/trunk/core/src/main/java/org/apache/mahout/cf/taste/hadoop/similarity/item/ItemSimilarityJob.java
    mahout/trunk/core/src/main/java/org/apache/mahout/classifier/discriminative/WinnowTrainer.java
    mahout/trunk/core/src/main/java/org/apache/mahout/classifier/naivebayes/AbstractNaiveBayesClassifier.java
    mahout/trunk/core/src/main/java/org/apache/mahout/classifier/naivebayes/test/TestNaiveBayesDriver.java
    mahout/trunk/core/src/main/java/org/apache/mahout/classifier/naivebayes/training/ComplementaryThetaTrainer.java
    mahout/trunk/core/src/main/java/org/apache/mahout/classifier/naivebayes/training/StandardThetaTrainer.java
    mahout/trunk/core/src/main/java/org/apache/mahout/classifier/sgd/AbstractOnlineLogisticRegression.java
    mahout/trunk/core/src/main/java/org/apache/mahout/classifier/sgd/ModelDissector.java
    mahout/trunk/core/src/main/java/org/apache/mahout/clustering/AbstractCluster.java
    mahout/trunk/core/src/main/java/org/apache/mahout/clustering/classify/ClusterClassificationDriver.java
    mahout/trunk/core/src/main/java/org/apache/mahout/clustering/classify/ClusterClassificationMapper.java
    mahout/trunk/core/src/main/java/org/apache/mahout/clustering/dirichlet/models/GaussianCluster.java
    mahout/trunk/core/src/main/java/org/apache/mahout/clustering/iterator/CIMapper.java
    mahout/trunk/core/src/main/java/org/apache/mahout/clustering/iterator/ClusterIterator.java
    mahout/trunk/core/src/main/java/org/apache/mahout/clustering/lda/cvb/TopicModel.java
(Continue reading)

srowen | 22 May 2013 18:37
Picon
Favicon

svn commit: r1485277 - in /mahout/trunk: integration/pom.xml integration/src/main/java/org/apache/mahout/cf/taste/impl/model/hbase/HBaseDataModel.java pom.xml

Author: srowen
Date: Wed May 22 16:37:44 2013
New Revision: 1485277

URL: http://svn.apache.org/r1485277
Log:
Update a few plugin and integration-related dependencies, and require Maven 3 for consistency

Modified:
    mahout/trunk/integration/pom.xml
    mahout/trunk/integration/src/main/java/org/apache/mahout/cf/taste/impl/model/hbase/HBaseDataModel.java
    mahout/trunk/pom.xml

Modified: mahout/trunk/integration/pom.xml
URL: http://svn.apache.org/viewvc/mahout/trunk/integration/pom.xml?rev=1485277&r1=1485276&r2=1485277&view=diff
==============================================================================
--- mahout/trunk/integration/pom.xml (original)
+++ mahout/trunk/integration/pom.xml Wed May 22 16:37:44 2013
@@ -78,7 +78,7 @@
       <plugin>
         <groupId>org.mortbay.jetty</groupId>
         <artifactId>maven-jetty-plugin</artifactId>
-        <version>6.1.10</version>
+        <version>6.1.26</version>
       </plugin>
     </plugins>

@@ -149,19 +149,19 @@
     <dependency>
       <groupId>org.mongodb</groupId>
(Continue reading)

dfilimon | 21 May 2013 12:52
Picon
Favicon

svn commit: r1484747 - in /mahout/trunk: CHANGELOG core/src/main/java/org/apache/mahout/clustering/streaming/cluster/StreamingKMeans.java

Author: dfilimon
Date: Tue May 21 10:52:25 2013
New Revision: 1484747

URL: http://svn.apache.org/r1484747
Log:
MAHOUT-1223: Fixed point being skipped in StreamingKMeans when iterating through centroids from a reducer

When calling StreamingKMeans in the reducer (to collapse the number of clusters
so they can fit into memory), the clustering is done on the Hadoop reducer
iterable.
Currently, the first Centroid is added directly as a special case and then is
skipped when iterating through the main loop.
However, Hadoop reducer iterables cannot be rewound, which causes SKM to
skip one point.

Modified:
    mahout/trunk/CHANGELOG
    mahout/trunk/core/src/main/java/org/apache/mahout/clustering/streaming/cluster/StreamingKMeans.java

Modified: mahout/trunk/CHANGELOG
URL: http://svn.apache.org/viewvc/mahout/trunk/CHANGELOG?rev=1484747&r1=1484746&r2=1484747&view=diff
==============================================================================
--- mahout/trunk/CHANGELOG (original)
+++ mahout/trunk/CHANGELOG Tue May 21 10:52:25 2013
@@ -2,6 +2,8 @@ Mahout Change Log

 Release 0.8 - unreleased

+__MAHOUT-1223: Fixed point skipped in StreamingKMeans when iterating through centroids from a reducer (dfilimon)
(Continue reading)

dfilimon | 21 May 2013 10:38
Picon
Favicon

svn commit: r1484697 - in /mahout/trunk: CHANGELOG core/src/main/java/org/apache/mahout/math/neighborhood/FastProjectionSearch.java

Author: dfilimon
Date: Tue May 21 08:38:48 2013
New Revision: 1484697

URL: http://svn.apache.org/r1484697
Log:
MAHOUT-1222: Fix total weight in FastProjectionSearch

Sometimes when removing a Vector that's in pendingAdditions, the wrong Vector
gets removed.
This happens because the closest Vector is removed rather than the one that's
equal to it.

Modified:
    mahout/trunk/CHANGELOG
    mahout/trunk/core/src/main/java/org/apache/mahout/math/neighborhood/FastProjectionSearch.java

Modified: mahout/trunk/CHANGELOG
URL: http://svn.apache.org/viewvc/mahout/trunk/CHANGELOG?rev=1484697&r1=1484696&r2=1484697&view=diff
==============================================================================
--- mahout/trunk/CHANGELOG (original)
+++ mahout/trunk/CHANGELOG Tue May 21 08:38:48 2013
@@ -2,6 +2,8 @@ Mahout Change Log

 Release 0.8 - unreleased

+__MAHOUT-1222: Fix total weight in FastProjectionSearch (dfilimon)
+
 __MAHOUT-1219: Remove LSHSearcher from StreamingKMeansTest. It causes it to sometimes fail (dfilimon)

(Continue reading)

dfilimon | 20 May 2013 16:58
Picon
Favicon

svn commit: r1484495 - in /mahout/trunk: CHANGELOG core/src/test/java/org/apache/mahout/clustering/streaming/cluster/StreamingKMeansTest.java

Author: dfilimon
Date: Mon May 20 14:58:18 2013
New Revision: 1484495

URL: http://svn.apache.org/r1484495
Log:

MAHOUT-1219: Remove LSHSearcher from StreamingKMeansTest.

It causes it to sometimes fail.

Modified:
    mahout/trunk/CHANGELOG
    mahout/trunk/core/src/test/java/org/apache/mahout/clustering/streaming/cluster/StreamingKMeansTest.java

Modified: mahout/trunk/CHANGELOG
URL: http://svn.apache.org/viewvc/mahout/trunk/CHANGELOG?rev=1484495&r1=1484494&r2=1484495&view=diff
==============================================================================
--- mahout/trunk/CHANGELOG (original)
+++ mahout/trunk/CHANGELOG Mon May 20 14:58:18 2013
@@ -2,6 +2,8 @@ Mahout Change Log

 Release 0.8 - unreleased

+__MAHOUT-1219: Remove LSHSearcher from StreamingKMeansTest. It causes it to sometimes fail (dfilimon)
+
   MAHOUT-1221: SparseMatrix.viewRow is sometimes readonly. (Maysam Yabandeh via smarthi)

 __MAHOUT-1219: Remove LSHSearcher from SearchQualityTest. It causes it to fail, but the failure is not
very meaningful (dfilimon)
(Continue reading)

smarthi | 20 May 2013 08:04
Picon
Favicon

svn commit: r1484376 - in /mahout/trunk: CHANGELOG math/src/main/java/org/apache/mahout/math/SparseMatrix.java math/src/test/java/org/apache/mahout/math/TestSparseMatrix.java

Author: smarthi
Date: Mon May 20 06:04:47 2013
New Revision: 1484376

URL: http://svn.apache.org/r1484376
Log:
MAHOUT-1221: SparseMatrix.viewRow is sometimes readonly

Modified:
    mahout/trunk/CHANGELOG
    mahout/trunk/math/src/main/java/org/apache/mahout/math/SparseMatrix.java
    mahout/trunk/math/src/test/java/org/apache/mahout/math/TestSparseMatrix.java

Modified: mahout/trunk/CHANGELOG
URL: http://svn.apache.org/viewvc/mahout/trunk/CHANGELOG?rev=1484376&r1=1484375&r2=1484376&view=diff
==============================================================================
--- mahout/trunk/CHANGELOG (original)
+++ mahout/trunk/CHANGELOG Mon May 20 06:04:47 2013
@@ -2,6 +2,8 @@ Mahout Change Log

 Release 0.8 - unreleased

+  MAHOUT-1221: SparseMatrix.viewRow is sometimes readonly. (Maysam Yabandeh via smarthi)
+
 __MAHOUT-1219: Remove LSHSearcher from SearchQualityTest. It causes it to fail, but the failure is not
very meaningful (dfilimon)

 __MAHOUT-1217: Nearest neighbor searchers sometimes fail to remove points: fix in
FastProjectionSearch's searchFirst (dfilimon)

(Continue reading)

confluence | 19 May 2013 07:24
Picon
Favicon

[CONF] Apache Mahout > BuildingMahout

Space: Apache Mahout (https://cwiki.apache.org/confluence/display/MAHOUT)
Page: BuildingMahout (https://cwiki.apache.org/confluence/display/MAHOUT/BuildingMahout)

Change Comment:
---------------------------------------------------------------------
Added comment to build trunk with Maven 3.x; 2.2 seems not to work, but 3.x does.  See http://comments.gmane.org/gmane.comp.apache.mahout.user/16572

Edited by Chris Bouzek:
---------------------------------------------------------------------
h1. Prerequisites for Building Mahout

* Java JDK *1.6*
* Maven *2.2* or higher ([http://maven.apache.org/]).  Use *3.x* to build from SVN.

h1. Get the Source Code

h2. Latest (Recommended)

Use [Subversion|http://subversion.tigris.org] to check out the code:
{code}
svn co http://svn.apache.org/repos/asf/mahout/trunk
{code}

h2. Release

[Download source |http://www.apache.org/dyn/closer.cgi/mahout/]
Maven artifacts should be in the usual place: [http://repo2.maven.org/maven2/org/apache/mahout/]

h1. Compiling

(Continue reading)

confluence | 19 May 2013 07:21
Picon
Favicon

[CONF] Apache Mahout > System Requirements

Space: Apache Mahout (https://cwiki.apache.org/confluence/display/MAHOUT)
Page: System Requirements (https://cwiki.apache.org/confluence/display/MAHOUT/System+Requirements)

Change Comment:
---------------------------------------------------------------------
Maven 2.2 seems not to work, but 3.x does.  See http://comments.gmane.org/gmane.comp.apache.mahout.user/16572

Edited by Chris Bouzek:
---------------------------------------------------------------------
* Java 1.6.x or greater.
* Maven 3.x to build the source code.

CPU, disk, and memory requirements depend on the many choices made in implementing your application with
Mahout (document size, number of documents, and number of hits retrieved, to name a few).

Several of the Mahout algorithms are implemented to work on Hadoop clusters. Unless stated
otherwise, those implementations work with Hadoop 0.20.0 or greater.

Change your notification preferences:
https://cwiki.apache.org/confluence/users/viewnotifications.action    

dfilimon | 17 May 2013 15:44
Picon
Favicon

svn commit: r1483799 - in /mahout/trunk: CHANGELOG core/src/test/java/org/apache/mahout/math/neighborhood/SearchQualityTest.java

Author: dfilimon
Date: Fri May 17 13:44:32 2013
New Revision: 1483799

URL: http://svn.apache.org/r1483799
Log:
MAHOUT-1219: LSHSearcher not always faster than BruteSearcher

The existing "benchmark" is not conclusive enough as it doesn't take into
account the adaptive nature of the JVM, doesn't run the test multiple times and
should be replaced with something more thorough.
Removing LSHSearcher from the tests for now.

Modified:
    mahout/trunk/CHANGELOG
    mahout/trunk/core/src/test/java/org/apache/mahout/math/neighborhood/SearchQualityTest.java

Modified: mahout/trunk/CHANGELOG
URL: http://svn.apache.org/viewvc/mahout/trunk/CHANGELOG?rev=1483799&r1=1483798&r2=1483799&view=diff
==============================================================================
--- mahout/trunk/CHANGELOG (original)
+++ mahout/trunk/CHANGELOG Fri May 17 13:44:32 2013
@@ -2,6 +2,8 @@ Mahout Change Log

 Release 0.8 - unreleased

+__MAHOUT-1219: Remove LSHSearcher from SearchQualityTest. It causes it to fail, but the failure is not
very meaningful (dfilimon)
+
 __MAHOUT-1217: Nearest neighbor searchers sometimes fail to remove points: fix in
(Continue reading)

dfilimon | 17 May 2013 14:49
Picon
Favicon

svn commit: r1483776 - in /mahout/trunk: CHANGELOG core/src/main/java/org/apache/mahout/math/neighborhood/FastProjectionSearch.java core/src/test/java/org/apache/mahout/math/neighborhood/SearchSanityTest.java

Author: dfilimon
Date: Fri May 17 12:49:52 2013
New Revision: 1483776

URL: http://svn.apache.org/r1483776
Log:
MAHOUT-1217: Nearest neighbor searchers sometimes fail to remove points

This fixes FastProjectionSearch's searchFirst(), which was not searching
through pendingAdditions as well. I think I replicated the bug in the new testRemove()
in SearchSanityTest, which now passes.

Modified:
    mahout/trunk/CHANGELOG
    mahout/trunk/core/src/main/java/org/apache/mahout/math/neighborhood/FastProjectionSearch.java
    mahout/trunk/core/src/test/java/org/apache/mahout/math/neighborhood/SearchSanityTest.java

Modified: mahout/trunk/CHANGELOG
URL: http://svn.apache.org/viewvc/mahout/trunk/CHANGELOG?rev=1483776&r1=1483775&r2=1483776&view=diff
==============================================================================
--- mahout/trunk/CHANGELOG (original)
+++ mahout/trunk/CHANGELOG Fri May 17 12:49:52 2013
@@ -2,6 +2,8 @@ Mahout Change Log

 Release 0.8 - unreleased

+__MAHOUT-1217: Nearest neighbor searchers sometimes fail to remove points: fix in
FastProjectionSearch's searchFirst (dfilimon)
+
 __MAHOUT-1216: Add locality sensitive hashing and a LocalitySensitiveHash searcher (dfilimon)
(Continue reading)


Gmane