Felixhawk
diff --git a/benchmarks/bench_plot_nmf.py b/benchmarks/bench_plot_nmf.py
Lines changed: 21 additions & 15 deletions
@@ -4,10 +4,12 @@
 
 from __future__ import print_function
 
+from collections import defaultdict
 import gc
 from time import time
+
 import numpy as np
-from collections import defaultdict
+from scipy.linalg import norm
 
 from sklearn.decomposition.nmf import NMF, _initialize_nmf
 from sklearn.datasets.samples_generator import make_low_rank_matrix
@@ -27,7 +29,7 @@ def alt_nnmf(V, r, max_iter=1000, tol=1e-3, R=None):
     r : integer
         number of latent features
     max_iter : integer, optional
-        maximum number of iterations (default: 10000)
+        maximum number of iterations (default: 1000)
     tol : double
         tolerance threshold for early exit (when the update factor is within
         tol of 1., the function exits)
@@ -62,25 +64,29 @@ def alt_nnmf(V, r, max_iter=1000, tol=1e-3, R=None):
         H *= updateH
         updateW = np.dot(V, H.T) / (np.dot(W, np.dot(H, H.T)) + eps)
         W *= updateW
-        if True or (i % 10) == 0:
+        if i % 10 == 0:
             max_update = max(updateW.max(), updateH.max())
             if abs(1. - max_update) < tol:
                 break
     return W, H
 
 
-def compute_bench(samples_range, features_range, rank=50, tolerance=1e-7):
+def report(error, time):
+    print("Frobenius loss: %.5f" % error)
+    print("Took: %.2fs" % time)
+    print()
+
+
+def benchmark(samples_range, features_range, rank=50, tolerance=1e-5):
     it = 0
     timeset = defaultdict(lambda: [])
     err = defaultdict(lambda: [])
 
     max_it = len(samples_range) * len(features_range)
     for n_samples in samples_range:
         for n_features in features_range:
-            it += 1
-            print('====================')
-            print('Iteration %03d of %03d' % (it, max_it))
-            print('====================')
+            print("%2d samples, %2d features" % (n_samples, n_features))
+            print('=======================')
             X = np.abs(make_low_rank_matrix(n_samples, n_features,
                        effective_rank=rank,  tail_strength=0.2))
 
@@ -91,7 +97,7 @@ def compute_bench(samples_range, features_range, rank=50, tolerance=1e-7):
             tend = time() - tstart
             timeset['nndsvd-nmf'].append(tend)
             err['nndsvd-nmf'].append(m.reconstruction_err_)
-            print(m.reconstruction_err_, tend)
+            report(m.reconstruction_err_, tend)
 
             gc.collect()
             print("benchmarking nndsvda-nmf: ")
@@ -101,7 +107,7 @@ def compute_bench(samples_range, features_range, rank=50, tolerance=1e-7):
             tend = time() - tstart
             timeset['nndsvda-nmf'].append(tend)
             err['nndsvda-nmf'].append(m.reconstruction_err_)
-            print(m.reconstruction_err_, tend)
+            report(m.reconstruction_err_, tend)
 
             gc.collect()
             print("benchmarking nndsvdar-nmf: ")
@@ -111,7 +117,7 @@ def compute_bench(samples_range, features_range, rank=50, tolerance=1e-7):
             tend = time() - tstart
             timeset['nndsvdar-nmf'].append(tend)
             err['nndsvdar-nmf'].append(m.reconstruction_err_)
-            print(m.reconstruction_err_, tend)
+            report(m.reconstruction_err_, tend)
 
             gc.collect()
             print("benchmarking random-nmf")
@@ -121,7 +127,7 @@ def compute_bench(samples_range, features_range, rank=50, tolerance=1e-7):
             tend = time() - tstart
             timeset['random-nmf'].append(tend)
             err['random-nmf'].append(m.reconstruction_err_)
-            print(m.reconstruction_err_, tend)
+            report(m.reconstruction_err_, tend)
 
             gc.collect()
             print("benchmarking alt-random-nmf")
@@ -130,7 +136,7 @@ def compute_bench(samples_range, features_range, rank=50, tolerance=1e-7):
             tend = time() - tstart
             timeset['alt-random-nmf'].append(tend)
             err['alt-random-nmf'].append(np.linalg.norm(X - np.dot(W, H)))
-            print(np.linalg.norm(X - np.dot(W, H)), tend)
+            report(norm(X - np.dot(W, H)), tend)
 
     return timeset, err
 
@@ -142,10 +148,10 @@ def compute_bench(samples_range, features_range, rank=50, tolerance=1e-7):
 
     samples_range = np.linspace(50, 500, 3).astype(np.int)
     features_range = np.linspace(50, 500, 3).astype(np.int)
-    timeset, err = compute_bench(samples_range, features_range)
+    timeset, err = benchmark(samples_range, features_range)
 
     for i, results in enumerate((timeset, err)):
-        fig = plt.figure('scikit-learn Non-Negative Matrix Factorization benchmkar results')
+        fig = plt.figure('scikit-learn Non-Negative Matrix Factorization benchmark results')
         ax = fig.gca(projection='3d')
         for c, (label, timings) in zip('rbgcm', sorted(results.iteritems())):
             X, Y = np.meshgrid(samples_range, features_range)