4 files changed, 104 insertions, 75 deletions
diff --git a/examples/plot_otda_color_images.py b/examples/plot_otda_color_images.py
index e77aec0..62383a2 100644
--- a/examples/plot_otda_color_images.py
+++ b/examples/plot_otda_color_images.py
@@ -4,7 +4,7 @@
 OT for image color adaptation
 =============================
 
-This example presents a way of transferring colors between two image
+This example presents a way of transferring colors between two images
 with Optimal Transport as introduced in [6]
 
 [6] Ferradans, S., Papadakis, N., Peyre, G., & Aujol, J. F. (2014).
@@ -27,7 +27,7 @@ r = np.random.RandomState(42)
 
 
 def im2mat(I):
-    """Converts and image to matrix (one pixel per line)"""
+    """Converts an image to matrix (one pixel per line)"""
     return I.reshape((I.shape[0] * I.shape[1], I.shape[2]))
 
 
@@ -115,8 +115,8 @@ ot_sinkhorn.fit(Xs=Xs, Xt=Xt)
 transp_Xs_emd = ot_emd.transform(Xs=X1)
 transp_Xt_emd = ot_emd.inverse_transform(Xt=X2)
 
-transp_Xs_sinkhorn = ot_emd.transform(Xs=X1)
-transp_Xt_sinkhorn = ot_emd.inverse_transform(Xt=X2)
+transp_Xs_sinkhorn = ot_sinkhorn.transform(Xs=X1)
+transp_Xt_sinkhorn = ot_sinkhorn.inverse_transform(Xt=X2)
 
 I1t = minmax(mat2im(transp_Xs_emd, I1.shape))
 I2t = minmax(mat2im(transp_Xt_emd, I2.shape))
diff --git a/examples/plot_stochastic.py b/examples/plot_stochastic.py
index b9375d4..742f8d9 100644
--- a/examples/plot_stochastic.py
+++ b/examples/plot_stochastic.py
@@ -21,9 +21,9 @@ import ot.plot
 #############################################################################
 # COMPUTE TRANSPORTATION MATRIX FOR SEMI-DUAL PROBLEM
 #############################################################################
-print("------------SEMI-DUAL PROBLEM------------")
 #############################################################################
-# DISCRETE CASE
+# DISCRETE CASE:
+#
 # Sample two discrete measures for the discrete case
 # ---------------------------------------------
 #
@@ -57,7 +57,8 @@ sag_pi = ot.stochastic.solve_semi_dual_entropic(a, b, M, reg, method,
 print(sag_pi)
 
 #############################################################################
-# SEMICONTINOUS CASE
+# SEMICONTINOUS CASE:
+#
 # Sample one general measure a, one discrete measures b for the semicontinous
 # case
 # ---------------------------------------------
@@ -139,9 +140,9 @@ pl.show()
 #############################################################################
 # COMPUTE TRANSPORTATION MATRIX FOR DUAL PROBLEM
 #############################################################################
-print("------------DUAL PROBLEM------------")
 #############################################################################
-# SEMICONTINOUS CASE
+# SEMICONTINOUS CASE:
+#
 # Sample one general measure a, one discrete measures b for the semicontinous
 # case
 # ---------------------------------------------
diff --git a/ot/stochastic.py b/ot/stochastic.py
index 959c6fa..0db39c8 100644
--- a/ot/stochastic.py
+++ b/ot/stochastic.py
@@ -12,16 +12,15 @@ import numpy as np
 
 def coordinate_grad_semi_dual(b, M, reg, beta, i):
     '''
-    Compute the coordinate gradient update for regularized discrete
-        distributions for (i, :)
+    Compute the coordinate gradient update for regularized discrete distributions for (i, :)
 
     The function computes the gradient of the semi dual problem:
 
     .. math::
-        \W_\varepsilon(a, b) = \max_\v \sum_i (\sum_j v_j * b_j
-            - \reg log(\sum_j exp((v_j - M_{i,j})/reg) * b_j)) * a_i
+        \max_v \sum_i (\sum_j v_j * b_j - reg * log(\sum_j exp((v_j - M_{i,j})/reg) * b_j)) * a_i
+
+    Where :
 
-    where :
     - M is the (ns,nt) metric cost matrix
     - v is a dual variable in R^J
     - reg is the regularization term
@@ -34,15 +33,15 @@ def coordinate_grad_semi_dual(b, M, reg, beta, i):
     Parameters
     ----------
 
-    b : np.ndarray(nt,),
+    b : np.ndarray(nt,)
         target measure
-    M : np.ndarray(ns, nt),
+    M : np.ndarray(ns, nt)
         cost matrix
-    reg : float nu,
+    reg : float nu
         Regularization term > 0
-    v : np.ndarray(nt,),
-        optimization vector
-    i : number int,
+    v : np.ndarray(nt,)
+        dual variable
+    i : number int
         picked number i
 
     Returns
@@ -93,14 +92,19 @@ def sag_entropic_transport(a, b, M, reg, numItermax=10000, lr=None):
 
     .. math::
         \gamma = arg\min_\gamma <\gamma,M>_F + reg\cdot\Omega(\gamma)
+
         s.t. \gamma 1 = a
-             \gamma^T 1= b
+
+             \gamma^T 1 = b
+
              \gamma \geq 0
-    where :
+
+    Where :
+
     - M is the (ns,nt) metric cost matrix
-    - :math:`\Omega` is the entropic regularization term
-        :math:`\Omega(\gamma)=\sum_{i,j} \gamma_{i,j}\log(\gamma_{i,j})`
+    - :math:`\Omega` is the entropic regularization term with :math:`\Omega(\gamma)=\sum_{i,j} \gamma_{i,j}\log(\gamma_{i,j})`
     - a and b are source and target weights (sum to 1)
+
     The algorithm used for solving the problem is the SAG algorithm
     as proposed in [18]_ [alg.1]
 
@@ -173,21 +177,25 @@ def sag_entropic_transport(a, b, M, reg, numItermax=10000, lr=None):
 
 def averaged_sgd_entropic_transport(a, b, M, reg, numItermax=300000, lr=None):
     '''
-    Compute the ASGD algorithm to solve the regularized semi contibous measures
-        optimal transport max problem
+    Compute the ASGD algorithm to solve the regularized semi continous measures optimal transport max problem
 
     The function solves the following optimization problem:
 
     .. math::
         \gamma = arg\min_\gamma <\gamma,M>_F + reg\cdot\Omega(\gamma)
+
         s.t. \gamma 1 = a
+
              \gamma^T 1= b
+
              \gamma \geq 0
-    where :
+
+    Where :
+
     - M is the (ns,nt) metric cost matrix
-    - :math:`\Omega` is the entropic regularization term
-        :math:`\Omega(\gamma)=\sum_{i,j} \gamma_{i,j}\log(\gamma_{i,j})`
+    - :math:`\Omega` is the entropic regularization term with :math:`\Omega(\gamma)=\sum_{i,j} \gamma_{i,j}\log(\gamma_{i,j})`
     - a and b are source and target weights (sum to 1)
+
     The algorithm used for solving the problem is the ASGD algorithm
     as proposed in [18]_ [alg.2]
 
@@ -195,11 +203,11 @@ def averaged_sgd_entropic_transport(a, b, M, reg, numItermax=300000, lr=None):
     Parameters
     ----------
 
-    b : np.ndarray(nt,),
+    b : np.ndarray(nt,)
         target measure
-    M : np.ndarray(ns, nt),
+    M : np.ndarray(ns, nt)
         cost matrix
-    reg : float number,
+    reg : float number
         Regularization term > 0
     numItermax : int number
         number of iteration
@@ -211,7 +219,7 @@ def averaged_sgd_entropic_transport(a, b, M, reg, numItermax=300000, lr=None):
     -------
 
     ave_v : np.ndarray(nt,)
-        optimization vector
+        dual variable
 
     Examples
     --------
@@ -265,7 +273,8 @@ def c_transform_entropic(b, M, reg, beta):
     .. math::
         u = v^{c,reg} = -reg \sum_j exp((v - M)/reg) b_j
 
-    where :
+    Where :
+
     - M is the (ns,nt) metric cost matrix
     - u, v are dual variables in R^IxR^J
     - reg is the regularization term
@@ -290,6 +299,7 @@ def c_transform_entropic(b, M, reg, beta):
     -------
 
     u : np.ndarray(ns,)
+        dual variable
 
     Examples
     --------
@@ -341,10 +351,11 @@ def solve_semi_dual_entropic(a, b, M, reg, method, numItermax=10000, lr=None,
         s.t. \gamma 1 = a
              \gamma^T 1= b
              \gamma \geq 0
-    where :
+
+    Where :
+
     - M is the (ns,nt) metric cost matrix
-    - :math:`\Omega` is the entropic regularization term
-        :math:`\Omega(\gamma)=\sum_{i,j} \gamma_{i,j}\log(\gamma_{i,j})`
+    - :math:`\Omega` is the entropic regularization term with :math:`\Omega(\gamma)=\sum_{i,j} \gamma_{i,j}\log(\gamma_{i,j})`
     - a and b are source and target weights (sum to 1)
     The algorithm used for solving the problem is the SAG or ASGD algorithms
     as proposed in [18]_
@@ -353,15 +364,15 @@ def solve_semi_dual_entropic(a, b, M, reg, method, numItermax=10000, lr=None,
     Parameters
     ----------
 
-    a : np.ndarray(ns,),
+    a : np.ndarray(ns,)
         source measure
-    b : np.ndarray(nt,),
+    b : np.ndarray(nt,)
         target measure
-    M : np.ndarray(ns, nt),
+    M : np.ndarray(ns, nt)
         cost matrix
-    reg : float number,
+    reg : float number
         Regularization term > 0
-    methode : str,
+    methode : str
         used method (SAG or ASGD)
     numItermax : int number
         number of iteration
@@ -438,40 +449,40 @@ def solve_semi_dual_entropic(a, b, M, reg, method, numItermax=10000, lr=None,
 def batch_grad_dual(a, b, M, reg, alpha, beta, batch_size, batch_alpha,
                     batch_beta):
     '''
-    Computes the partial gradient of F_\W_varepsilon
+    Computes the partial gradient of the dual optimal transport problem.
+
+    For each (i,j) in a batch of coordinates, the partial gradients are :
 
-    Compute the partial gradient of the dual problem:
+    .. math::
+        \partial_{u_i} F = u_i * b_s/l_{v} - \sum_{j \in B_v} exp((u_i + v_j - M_{i,j})/reg) * a_i * b_j
 
-    ..math:
-        \forall i in batch_alpha,
-            grad_alpha_i = alpha_i * batch_size/len(beta) -
-                sum_{j in batch_beta} exp((alpha_i + beta_j - M_{i,j})/reg)
-                    * a_i * b_j
+        \partial_{v_j} F = v_j * b_s/l_{u} - \sum_{i \in B_u} exp((u_i + v_j - M_{i,j})/reg) * a_i * b_j
+
+    Where :
 
-        \forall j in batch_alpha,
-            grad_beta_j = beta_j * batch_size/len(alpha) -
-                sum_{i in batch_alpha} exp((alpha_i + beta_j - M_{i,j})/reg)
-                    * a_i * b_j
-    where :
     - M is the (ns,nt) metric cost matrix
-    - alpha, beta are dual variables in R^ixR^J
+    - u, v are dual variables in R^ixR^J
     - reg is the regularization term
-    - batch_alpha and batch_beta are lists of index
+    - :math:`B_u` and :math:`B_v` are lists of index
+    - :math:`b_s` is the size of the batchs :math:`B_u` and :math:`B_v`
+    - :math:`l_u` and :math:`l_v` are the lenghts of :math:`B_u` and :math:`B_v`
     - a and b are source and target weights (sum to 1)
 
 
     The algorithm used for solving the dual problem is the SGD algorithm
     as proposed in [19]_ [alg.1]
 
+
     Parameters
     ----------
-    a : np.ndarray(ns,),
+
+    a : np.ndarray(ns,)
         source measure
-    b : np.ndarray(nt,),
+    b : np.ndarray(nt,)
         target measure
-    M : np.ndarray(ns, nt),
+    M : np.ndarray(ns, nt)
         cost matrix
-    reg : float number,
+    reg : float number
         Regularization term > 0
     alpha : np.ndarray(ns,)
         dual variable
@@ -542,24 +553,29 @@ def sgd_entropic_regularization(a, b, M, reg, batch_size, numItermax, lr):
 
     .. math::
         \gamma = arg\min_\gamma <\gamma,M>_F + reg\cdot\Omega(\gamma)
+
         s.t. \gamma 1 = a
+
              \gamma^T 1= b
+
              \gamma \geq 0
-    where :
+
+    Where :
+
     - M is the (ns,nt) metric cost matrix
-    - :math:`\Omega` is the entropic regularization term
-        :math:`\Omega(\gamma)=\sum_{i,j} \gamma_{i,j}\log(\gamma_{i,j})`
+    - :math:`\Omega` is the entropic regularization term with :math:`\Omega(\gamma)=\sum_{i,j} \gamma_{i,j}\log(\gamma_{i,j})`
     - a and b are source and target weights (sum to 1)
 
     Parameters
     ----------
-    a : np.ndarray(ns,),
+
+    a : np.ndarray(ns,)
         source measure
-    b : np.ndarray(nt,),
+    b : np.ndarray(nt,)
         target measure
-    M : np.ndarray(ns, nt),
+    M : np.ndarray(ns, nt)
         cost matrix
-    reg : float number,
+    reg : float number
         Regularization term > 0
     batch_size : int number
         size of the batch
@@ -633,25 +649,29 @@ def solve_dual_entropic(a, b, M, reg, batch_size, numItermax=10000, lr=1,
 
     .. math::
         \gamma = arg\min_\gamma <\gamma,M>_F + reg\cdot\Omega(\gamma)
+
         s.t. \gamma 1 = a
+
              \gamma^T 1= b
+
              \gamma \geq 0
-    where :
+
+    Where :
+
     - M is the (ns,nt) metric cost matrix
-    - :math:`\Omega` is the entropic regularization term
-        :math:`\Omega(\gamma)=\sum_{i,j} \gamma_{i,j}\log(\gamma_{i,j})`
+    - :math:`\Omega` is the entropic regularization term :math:`\Omega(\gamma)=\sum_{i,j} \gamma_{i,j}\log(\gamma_{i,j})`
     - a and b are source and target weights (sum to 1)
 
     Parameters
     ----------
 
-    a : np.ndarray(ns,),
+    a : np.ndarray(ns,)
         source measure
-    b : np.ndarray(nt,),
+    b : np.ndarray(nt,)
         target measure
-    M : np.ndarray(ns, nt),
+    M : np.ndarray(ns, nt)
         cost matrix
-    reg : float number,
+    reg : float number
         Regularization term > 0
     batch_size : int number
         size of the batch
diff --git a/setup.py b/setup.py
index c895034..bbcaf04 100755
--- a/setup.py
+++ b/setup.py
@@ -24,6 +24,12 @@ ROOT = os.path.abspath(os.path.dirname(__file__))
 with open(os.path.join(ROOT, 'README.md'), encoding="utf-8") as f:
     README = f.read()
 
+# add platform dependant optional compilation argument
+opt_arg=["-O3"]
+import platform
+if platform.system()=='Darwin':
+  if platform.release()=='18.0.0':
+      opt_arg.append("-stdlib=libc++") # correspond to a compilation problem with Mojave and XCode 10
 
 setup(name='POT',
       version=__version__,
@@ -39,7 +45,9 @@ setup(name='POT',
                  sources=["ot/lp/emd_wrap.pyx", "ot/lp/EMD_wrapper.cpp"], # the Cython source and
                                                         # additional C++ source files
                  language="c++",                        # generate and compile C++ code,
-                 include_dirs=[numpy.get_include(),os.path.join(ROOT,'ot/lp')])),
+                 include_dirs=[numpy.get_include(),os.path.join(ROOT,'ot/lp')],
+                 extra_compile_args=opt_arg
+                 )),
       platforms=['linux','macosx','windows'],
       download_url='https://github.com/rflamary/POT/archive/{}.tar.gz'.format(__version__),
       license = 'MIT',