Skip to content

Commit 810897a

Browse files
committed
Merge pull request #81 from maciejkula/default_max_sampled
Change default max_sampled to 10.
2 parents 7a9aa38 + a001ff1 commit 810897a

2 files changed

Lines changed: 9 additions & 9 deletions

File tree

changelog.md

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -14,6 +14,7 @@
1414
### Changed
1515
- By default, an OpenMP-less version will be built on OSX. This allows much easier installation at the expense of
1616
performance.
17+
- The default value of the max_sampled argument is now 10. This is a sensible default that allows fast training.
1718

1819
## [1.8][2016-01-14]
1920
### Changed

lightfm/lightfm.py

Lines changed: 8 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -45,9 +45,11 @@ class LightFM(object):
4545
user_alpha: float, optional
4646
L2 penalty on user features.
4747
max_sampled: int, optional
48-
maximum number of negative samples used during WARP fitting. Defaults to
49-
the number of items divided by 10. Setting this to a lower number may improve the speed of
50-
WARP fitting at the expense of some accuracy.
48+
maximum number of negative samples used during WARP fitting. It requires
49+
a lot of sampling to find negative triplets for users that are already
50+
well represented by the model; this can lead to very long training times
51+
and overfitting. Setting this to a higher number will generally lead
52+
to longer training times, but may in some cases improve accuracy.
5153
random_state: int seed, RandomState instance, or None
5254
The seed of the pseudo random number generator to use when shuffling the data and
5355
initializing the parameters.
@@ -116,7 +118,7 @@ def __init__(self, no_components=10, k=5, n=10,
116118
learning_schedule='adagrad',
117119
loss='logistic',
118120
learning_rate=0.05, rho=0.95, epsilon=1e-6,
119-
item_alpha=0.0, user_alpha=0.0, max_sampled=None,
121+
item_alpha=0.0, user_alpha=0.0, max_sampled=10,
120122
random_state=None):
121123

122124
assert item_alpha >= 0.0
@@ -129,7 +131,7 @@ def __init__(self, no_components=10, k=5, n=10,
129131
assert learning_schedule in ('adagrad', 'adadelta')
130132
assert loss in ('logistic', 'warp', 'bpr', 'warp-kos')
131133

132-
if max_sampled is not None and max_sampled < 1:
134+
if max_sampled < 1:
133135
raise ValueError('max_sampled must be a positive integer')
134136

135137
self.loss = loss
@@ -294,9 +296,6 @@ def _process_sample_weight(self, interactions, sample_weight):
294296

295297
def _get_lightfm_data(self):
296298

297-
max_sampled = (self.max_sampled if self.max_sampled is not None
298-
else self.item_embeddings.shape[0] / 10)
299-
300299
lightfm_data = FastLightFM(self.item_embeddings,
301300
self.item_embedding_gradients,
302301
self.item_embedding_momentum,
@@ -314,7 +313,7 @@ def _get_lightfm_data(self):
314313
self.learning_rate,
315314
self.rho,
316315
self.epsilon,
317-
max_sampled)
316+
self.max_sampled)
318317

319318
return lightfm_data
320319

0 commit comments

Comments
 (0)