From 3007f1da1094f93fa4216386666085cf60316b04 Mon Sep 17 00:00:00 2001
From: Nicolas Courty <Nico@pc-mna-08.univ-ubs.fr>
Date: Thu, 31 Aug 2017 16:44:18 +0200
Subject: Minor corrections suggested by @agramfort + new barycenter example +
 test function

---
 test/test_gromov.py | 38 ++++++++++++++++++++++++++++++++++++++
 1 file changed, 38 insertions(+)
 create mode 100644 test/test_gromov.py

(limited to 'test')

diff --git a/test/test_gromov.py b/test/test_gromov.py
new file mode 100644
index 0000000..75eeaab
--- /dev/null
+++ b/test/test_gromov.py
@@ -0,0 +1,38 @@
+"""Tests for module gromov  """
+
+# Author: Erwan Vautier <erwan.vautier@gmail.com>
+#         Nicolas Courty <ncourty@irisa.fr>
+#
+# License: MIT License
+
+import numpy as np
+import ot
+
+
+def test_gromov():
+    n = 50  # nb samples
+
+    mu_s = np.array([0, 0])
+    cov_s = np.array([[1, 0], [0, 1]])
+
+    xs = ot.datasets.get_2D_samples_gauss(n, mu_s, cov_s)
+
+    xt = [xs[n - (i + 1)] for i in range(n)]
+    xt = np.array(xt)
+
+    p = ot.unif(n)
+    q = ot.unif(n)
+
+    C1 = ot.dist(xs, xs)
+    C2 = ot.dist(xt, xt)
+
+    C1 /= C1.max()
+    C2 /= C2.max()
+
+    G = ot.gromov_wasserstein(C1, C2, p, q, 'square_loss', epsilon=5e-4)
+
+    # check constraints
+    np.testing.assert_allclose(
+        p, G.sum(1), atol=1e-04)  # cf convergence gromov
+    np.testing.assert_allclose(
+        q, G.sum(0), atol=1e-04)  # cf convergence gromov
-- 
cgit v1.2.3


From c7eaaf4caa03d759c4255bdf8b6eebd10ee539a5 Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Tue, 1 Aug 2017 10:42:09 +0200
Subject: update SinkhornTransport class + added test for class

---
 ot/da.py        | 56 +++++++++++++++++++++-----------------------------------
 test/test_da.py | 51 +++++++++++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 72 insertions(+), 35 deletions(-)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index d30c821..6b98a17 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -15,6 +15,7 @@ from .lp import emd
 from .utils import unif, dist, kernel
 from .optim import cg
 from .optim import gcg
+import warnings
 
 
 def sinkhorn_lpl1_mm(a, labels_a, b, M, reg, eta=0.1, numItermax=10,
@@ -921,15 +922,8 @@ class OTDA_mapping_kernel(OTDA_mapping_linear):
 # proposal
 ##############################################################################
 
-# from sklearn.base import BaseEstimator
-# from sklearn.metrics import pairwise_distances
-
-##############################################################################
-# adapted from scikit-learn
-
-import warnings
-# from .externals.six import string_types, iteritems
 
+# adapted from sklearn
 
 class BaseEstimator(object):
     """Base class for all estimators in scikit-learn
@@ -1067,7 +1061,7 @@ def distribution_estimation_uniform(X):
         The uniform distribution estimated from X
     """
 
-    return np.ones(X.shape[0]) / float(X.shape[0])
+    return unif(X.shape[0])
 
 
 class BaseTransport(BaseEstimator):
@@ -1092,29 +1086,20 @@ class BaseTransport(BaseEstimator):
         """
 
         # pairwise distance
-        Cost = dist(Xs, Xt, metric=self.metric)
+        self.Cost = dist(Xs, Xt, metric=self.metric)
 
         if self.mode == "semisupervised":
             print("TODO: modify cost matrix accordingly")
             pass
 
         # distribution estimation
-        mu_s = self.distribution_estimation(Xs)
-        mu_t = self.distribution_estimation(Xt)
+        self.mu_s = self.distribution_estimation(Xs)
+        self.mu_t = self.distribution_estimation(Xt)
 
         # store arrays of samples
         self.Xs = Xs
         self.Xt = Xt
 
-        # coupling estimation
-        if self.method == "sinkhorn":
-            self.gamma_ = sinkhorn(
-                a=mu_s, b=mu_t, M=Cost, reg=self.reg_e,
-                numItermax=self.max_iter, stopThr=self.tol,
-                verbose=self.verbose, log=self.log)
-        else:
-            print("TODO: implement the other methods")
-
         return self
 
     def fit_transform(self, Xs=None, ys=None, Xt=None, yt=None):
@@ -1157,8 +1142,7 @@ class BaseTransport(BaseEstimator):
             The transport source samples.
         """
 
-        # TODO: check whether Xs is new or not
-        if self.Xs == Xs:
+        if np.array_equal(self.Xs, Xs):
             # perform standard barycentric mapping
             transp = self.gamma_ / np.sum(self.gamma_, 1)[:, None]
 
@@ -1169,7 +1153,9 @@ class BaseTransport(BaseEstimator):
             transp_Xs = np.dot(transp, self.Xt)
         else:
             # perform out of sample mapping
-            print("out of sample mapping not yet implemented")
+            print("Warning: out of sample mapping not yet implemented")
+            print("input data will be returned")
+            transp_Xs = Xs
 
         return transp_Xs
 
@@ -1191,8 +1177,7 @@ class BaseTransport(BaseEstimator):
             The transported target samples.
         """
 
-        # TODO: check whether Xt is new or not
-        if self.Xt == Xt:
+        if np.array_equal(self.Xt, Xt):
             # perform standard barycentric mapping
             transp_ = self.gamma_.T / np.sum(self.gamma_, 0)[:, None]
 
@@ -1203,7 +1188,9 @@ class BaseTransport(BaseEstimator):
             transp_Xt = np.dot(transp_, self.Xs)
         else:
             # perform out of sample mapping
-            print("out of sample mapping not yet implemented")
+            print("Warning: out of sample mapping not yet implemented")
+            print("input data will be returned")
+            transp_Xt = Xt
 
         return transp_Xt
 
@@ -1254,7 +1241,7 @@ class SinkhornTransport(BaseTransport):
     """
 
     def __init__(self, reg_e=1., mode="unsupervised", max_iter=1000,
-                 tol=10e-9, verbose=False, log=False, mapping="barycentric",
+                 tol=10e-9, verbose=False, log=False,
                  metric="sqeuclidean",
                  distribution_estimation=distribution_estimation_uniform,
                  out_of_sample_map='ferradans'):
@@ -1265,7 +1252,6 @@ class SinkhornTransport(BaseTransport):
         self.tol = tol
         self.verbose = verbose
         self.log = log
-        self.mapping = mapping
         self.metric = metric
         self.distribution_estimation = distribution_estimation
         self.method = "sinkhorn"
@@ -1290,10 +1276,10 @@ class SinkhornTransport(BaseTransport):
             Returns self.
         """
 
-        return super(SinkhornTransport, self).fit(Xs, ys, Xt, yt)
-
+        self = super(SinkhornTransport, self).fit(Xs, ys, Xt, yt)
 
-if __name__ == "__main__":
-    print("Small test")
-
-    st = SinkhornTransport()
+        # coupling estimation
+        self.gamma_ = sinkhorn(
+            a=self.mu_s, b=self.mu_t, M=self.Cost, reg=self.reg_e,
+            numItermax=self.max_iter, stopThr=self.tol,
+            verbose=self.verbose, log=self.log)
diff --git a/test/test_da.py b/test/test_da.py
index dfba83f..e7b4ed1 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -6,6 +6,57 @@
 
 import numpy as np
 import ot
+from numpy.testing.utils import assert_allclose, assert_equal
+from ot.datasets import get_data_classif
+from ot.utils import unif
+
+np.random.seed(42)
+
+
+def test_sinkhorn_transport():
+    """test_sinkhorn_transport
+    """
+
+    ns = 150
+    nt = 200
+
+    Xs, ys = get_data_classif('3gauss', ns)
+    Xt, yt = get_data_classif('3gauss2', nt)
+
+    clf = ot.da.SinkhornTransport()
+
+    # test its computed
+    clf.fit(Xs=Xs, Xt=Xt)
+
+    # test dimensions of coupling
+    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.gamma_.shape, ((Xs.shape[0], Xt.shape[0])))
+
+    # test margin constraints
+    mu_s = unif(ns)
+    mu_t = unif(nt)
+    assert_allclose(np.sum(clf.gamma_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.gamma_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+
+    # test transform
+    transp_Xs = clf.transform(Xs=Xs)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
+    Xs_new, _ = get_data_classif('3gauss', ns + 1)
+    transp_Xs_new = clf.transform(Xs_new)
+
+    # check that the oos method is not working
+    assert_equal(transp_Xs_new, Xs_new)
+
+    # test inverse transform
+    transp_Xt = clf.inverse_transform(Xt=Xt)
+    assert_equal(transp_Xt.shape, Xt.shape)
+
+    Xt_new, _ = get_data_classif('3gauss2', nt + 1)
+    transp_Xt_new = clf.inverse_transform(Xt=Xt_new)
+
+    # check that the oos method is not working and returns the input data
+    assert_equal(transp_Xt_new, Xt_new)
 
 
 def test_otda():
-- 
cgit v1.2.3


From d5c6cc178a731d955e5eb85e9f477805fa086518 Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Tue, 1 Aug 2017 13:13:50 +0200
Subject: added EMDTransport Class from NG's code + added dedicated test

---
 ot/da.py        | 86 +++++++++++++++++++++++++++++++++++++++++++++++++++++----
 test/test_da.py | 59 ++++++++++++++++++++++++++++++++++++---
 2 files changed, 135 insertions(+), 10 deletions(-)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index 6b98a17..fb2fd36 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -1144,7 +1144,7 @@ class BaseTransport(BaseEstimator):
 
         if np.array_equal(self.Xs, Xs):
             # perform standard barycentric mapping
-            transp = self.gamma_ / np.sum(self.gamma_, 1)[:, None]
+            transp = self.Coupling_ / np.sum(self.Coupling_, 1)[:, None]
 
             # set nans to 0
             transp[~ np.isfinite(transp)] = 0
@@ -1179,7 +1179,7 @@ class BaseTransport(BaseEstimator):
 
         if np.array_equal(self.Xt, Xt):
             # perform standard barycentric mapping
-            transp_ = self.gamma_.T / np.sum(self.gamma_, 0)[:, None]
+            transp_ = self.Coupling_.T / np.sum(self.Coupling_, 0)[:, None]
 
             # set nans to 0
             transp_[~ np.isfinite(transp_)] = 0
@@ -1228,7 +1228,7 @@ class SinkhornTransport(BaseTransport):
         Controls the logs of the optimization algorithm
     Attributes
     ----------
-    gamma_ : the optimal coupling
+    Coupling_ : the optimal coupling
 
     References
     ----------
@@ -1254,7 +1254,6 @@ class SinkhornTransport(BaseTransport):
         self.log = log
         self.metric = metric
         self.distribution_estimation = distribution_estimation
-        self.method = "sinkhorn"
         self.out_of_sample_map = out_of_sample_map
 
     def fit(self, Xs=None, ys=None, Xt=None, yt=None):
@@ -1276,10 +1275,85 @@ class SinkhornTransport(BaseTransport):
             Returns self.
         """
 
-        self = super(SinkhornTransport, self).fit(Xs, ys, Xt, yt)
+        super(SinkhornTransport, self).fit(Xs, ys, Xt, yt)
 
         # coupling estimation
-        self.gamma_ = sinkhorn(
+        self.Coupling_ = sinkhorn(
             a=self.mu_s, b=self.mu_t, M=self.Cost, reg=self.reg_e,
             numItermax=self.max_iter, stopThr=self.tol,
             verbose=self.verbose, log=self.log)
+
+
+class EMDTransport(BaseTransport):
+    """Domain Adapatation OT method based on Earth Mover's Distance
+    Parameters
+    ----------
+    mode : string, optional (default="unsupervised")
+        The DA mode. If "unsupervised" no target labels are taken into account
+        to modify the cost matrix. If "semisupervised" the target labels
+        are taken into account to set coefficients of the pairwise distance
+        matrix to 0 for row and columns indices that correspond to source and
+        target samples which share the same labels.
+    mapping : string, optional (default="barycentric")
+        The kind of mapping to apply to transport samples from a domain into
+        another one.
+        if "barycentric" only the samples used to estimate the coupling can
+        be transported from a domain to another one.
+    metric : string, optional (default="sqeuclidean")
+        The ground metric for the Wasserstein problem
+    distribution : string, optional (default="uniform")
+        The kind of distribution estimation to employ
+    verbose : int, optional (default=0)
+        Controls the verbosity of the optimization algorithm
+    log : int, optional (default=0)
+        Controls the logs of the optimization algorithm
+    Attributes
+    ----------
+    Coupling_ : the optimal coupling
+
+    References
+    ----------
+    .. [1] N. Courty; R. Flamary; D. Tuia; A. Rakotomamonjy,
+           "Optimal Transport for Domain Adaptation," in IEEE Transactions
+           on Pattern Analysis and Machine Intelligence , vol.PP, no.99, pp.1-1
+    """
+
+    def __init__(self, mode="unsupervised", verbose=False,
+                 log=False, metric="sqeuclidean",
+                 distribution_estimation=distribution_estimation_uniform,
+                 out_of_sample_map='ferradans'):
+
+        self.mode = mode
+        self.verbose = verbose
+        self.log = log
+        self.metric = metric
+        self.distribution_estimation = distribution_estimation
+        self.out_of_sample_map = out_of_sample_map
+
+    def fit(self, Xs, ys=None, Xt=None, yt=None):
+        """Build a coupling matrix from source and target sets of samples
+        (Xs, ys) and (Xt, yt)
+        Parameters
+        ----------
+        Xs : array-like of shape = [n_source_samples, n_features]
+            The training input samples.
+        ys : array-like, shape = [n_source_samples]
+            The class labels
+        Xt : array-like of shape = [n_target_samples, n_features]
+            The training input samples.
+        yt : array-like, shape = [n_labeled_target_samples]
+            The class labels
+        Returns
+        -------
+        self : object
+            Returns self.
+        """
+
+        super(EMDTransport, self).fit(Xs, ys, Xt, yt)
+
+        # coupling estimation
+        self.Coupling_ = emd(
+            a=self.mu_s, b=self.mu_t, M=self.Cost,
+            # verbose=self.verbose,
+            # log=self.log
+        )
diff --git a/test/test_da.py b/test/test_da.py
index e7b4ed1..33b3695 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -13,7 +13,7 @@ from ot.utils import unif
 np.random.seed(42)
 
 
-def test_sinkhorn_transport():
+def test_sinkhorn_transport_class():
     """test_sinkhorn_transport
     """
 
@@ -30,13 +30,59 @@ def test_sinkhorn_transport():
 
     # test dimensions of coupling
     assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
-    assert_equal(clf.gamma_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.Coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
 
     # test margin constraints
     mu_s = unif(ns)
     mu_t = unif(nt)
-    assert_allclose(np.sum(clf.gamma_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
-    assert_allclose(np.sum(clf.gamma_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.Coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.Coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+
+    # test transform
+    transp_Xs = clf.transform(Xs=Xs)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
+    Xs_new, _ = get_data_classif('3gauss', ns + 1)
+    transp_Xs_new = clf.transform(Xs_new)
+
+    # check that the oos method is not working
+    assert_equal(transp_Xs_new, Xs_new)
+
+    # test inverse transform
+    transp_Xt = clf.inverse_transform(Xt=Xt)
+    assert_equal(transp_Xt.shape, Xt.shape)
+
+    Xt_new, _ = get_data_classif('3gauss2', nt + 1)
+    transp_Xt_new = clf.inverse_transform(Xt=Xt_new)
+
+    # check that the oos method is not working and returns the input data
+    assert_equal(transp_Xt_new, Xt_new)
+
+
+def test_emd_transport_class():
+    """test_sinkhorn_transport
+    """
+
+    ns = 150
+    nt = 200
+
+    Xs, ys = get_data_classif('3gauss', ns)
+    Xt, yt = get_data_classif('3gauss2', nt)
+
+    clf = ot.da.EMDTransport()
+
+    # test its computed
+    clf.fit(Xs=Xs, Xt=Xt)
+
+    # test dimensions of coupling
+    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.Coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
+
+    # test margin constraints
+    mu_s = unif(ns)
+    mu_t = unif(nt)
+    assert_allclose(np.sum(clf.Coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.Coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
 
     # test transform
     transp_Xs = clf.transform(Xs=Xs)
@@ -119,3 +165,8 @@ def test_otda():
     da_emd = ot.da.OTDA_mapping_kernel()     # init class
     da_emd.fit(xs, xt, numItermax=10)       # fit distributions
     da_emd.predict(xs)    # interpolation of source samples
+
+
+if __name__ == "__main__":
+    test_sinkhorn_transport_class()
+    test_emd_transport_class()
-- 
cgit v1.2.3


From cd4fa7275dc65e04f7b256dec4208d68006abc25 Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Fri, 4 Aug 2017 11:16:30 +0200
Subject: added test for fit_transform + correction of fit_transform bug
 (missing return self)

---
 ot/da.py        |  4 ++++
 test/test_da.py | 13 ++++++++-----
 2 files changed, 12 insertions(+), 5 deletions(-)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index fb2fd36..80649a7 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -1283,6 +1283,8 @@ class SinkhornTransport(BaseTransport):
             numItermax=self.max_iter, stopThr=self.tol,
             verbose=self.verbose, log=self.log)
 
+        return self
+
 
 class EMDTransport(BaseTransport):
     """Domain Adapatation OT method based on Earth Mover's Distance
@@ -1357,3 +1359,5 @@ class EMDTransport(BaseTransport):
             # verbose=self.verbose,
             # log=self.log
         )
+
+        return self
diff --git a/test/test_da.py b/test/test_da.py
index 33b3695..68807ec 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -58,6 +58,10 @@ def test_sinkhorn_transport_class():
     # check that the oos method is not working and returns the input data
     assert_equal(transp_Xt_new, Xt_new)
 
+    # test fit_transform
+    transp_Xs = clf.fit_transform(Xs=Xs, Xt=Xt)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
 
 def test_emd_transport_class():
     """test_sinkhorn_transport
@@ -104,6 +108,10 @@ def test_emd_transport_class():
     # check that the oos method is not working and returns the input data
     assert_equal(transp_Xt_new, Xt_new)
 
+    # test fit_transform
+    transp_Xs = clf.fit_transform(Xs=Xs, Xt=Xt)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
 
 def test_otda():
 
@@ -165,8 +173,3 @@ def test_otda():
     da_emd = ot.da.OTDA_mapping_kernel()     # init class
     da_emd.fit(xs, xt, numItermax=10)       # fit distributions
     da_emd.predict(xs)    # interpolation of source samples
-
-
-if __name__ == "__main__":
-    test_sinkhorn_transport_class()
-    test_emd_transport_class()
-- 
cgit v1.2.3


From 0659abe79c15f786a017b62e2a1313f0625af329 Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Fri, 4 Aug 2017 11:34:21 +0200
Subject: added new class SinkhornLpl1Transport() + dedicated test

---
 ot/da.py        | 91 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++
 test/test_da.py | 50 +++++++++++++++++++++++++++++++
 2 files changed, 141 insertions(+)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index 80649a7..3031f63 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -1361,3 +1361,94 @@ class EMDTransport(BaseTransport):
         )
 
         return self
+
+
+class SinkhornLpl1Transport(BaseTransport):
+    """Domain Adapatation OT method based on sinkhorn algorithm +
+    LpL1 class regularization.
+
+    Parameters
+    ----------
+    mode : string, optional (default="unsupervised")
+        The DA mode. If "unsupervised" no target labels are taken into account
+        to modify the cost matrix. If "semisupervised" the target labels
+        are taken into account to set coefficients of the pairwise distance
+        matrix to 0 for row and columns indices that correspond to source and
+        target samples which share the same labels.
+    mapping : string, optional (default="barycentric")
+        The kind of mapping to apply to transport samples from a domain into
+        another one.
+        if "barycentric" only the samples used to estimate the coupling can
+        be transported from a domain to another one.
+    metric : string, optional (default="sqeuclidean")
+        The ground metric for the Wasserstein problem
+    distribution : string, optional (default="uniform")
+        The kind of distribution estimation to employ
+    verbose : int, optional (default=0)
+        Controls the verbosity of the optimization algorithm
+    log : int, optional (default=0)
+        Controls the logs of the optimization algorithm
+    Attributes
+    ----------
+    Coupling_ : the optimal coupling
+
+    References
+    ----------
+
+    .. [1] N. Courty; R. Flamary; D. Tuia; A. Rakotomamonjy,
+       "Optimal Transport for Domain Adaptation," in IEEE
+       Transactions on Pattern Analysis and Machine Intelligence ,
+       vol.PP, no.99, pp.1-1
+    .. [2] Rakotomamonjy, A., Flamary, R., & Courty, N. (2015).
+       Generalized conditional gradient: analysis of convergence
+       and applications. arXiv preprint arXiv:1510.06567.
+
+    """
+
+    def __init__(self, reg_e=1., reg_cl=0.1, mode="unsupervised",
+                 max_iter=10, max_inner_iter=200,
+                 tol=10e-9, verbose=False, log=False,
+                 metric="sqeuclidean",
+                 distribution_estimation=distribution_estimation_uniform,
+                 out_of_sample_map='ferradans'):
+
+        self.reg_e = reg_e
+        self.reg_cl = reg_cl
+        self.mode = mode
+        self.max_iter = max_iter
+        self.max_inner_iter = max_inner_iter
+        self.tol = tol
+        self.verbose = verbose
+        self.log = log
+        self.metric = metric
+        self.distribution_estimation = distribution_estimation
+        self.out_of_sample_map = out_of_sample_map
+
+    def fit(self, Xs, ys=None, Xt=None, yt=None):
+        """Build a coupling matrix from source and target sets of samples
+        (Xs, ys) and (Xt, yt)
+        Parameters
+        ----------
+        Xs : array-like of shape = [n_source_samples, n_features]
+            The training input samples.
+        ys : array-like, shape = [n_source_samples]
+            The class labels
+        Xt : array-like of shape = [n_target_samples, n_features]
+            The training input samples.
+        yt : array-like, shape = [n_labeled_target_samples]
+            The class labels
+        Returns
+        -------
+        self : object
+            Returns self.
+        """
+
+        super(SinkhornLpl1Transport, self).fit(Xs, ys, Xt, yt)
+
+        self.Coupling_ = sinkhorn_lpl1_mm(
+            a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.Cost,
+            reg=self.reg_e, eta=self.reg_cl, numItermax=self.max_iter,
+            numInnerItermax=self.max_inner_iter, stopInnerThr=self.tol,
+            verbose=self.verbose, log=self.log)
+
+        return self
diff --git a/test/test_da.py b/test/test_da.py
index 68807ec..7d00cfb 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -13,6 +13,56 @@ from ot.utils import unif
 np.random.seed(42)
 
 
+def test_sinkhorn_lpl1_transport_class():
+    """test_sinkhorn_transport
+    """
+
+    ns = 150
+    nt = 200
+
+    Xs, ys = get_data_classif('3gauss', ns)
+    Xt, yt = get_data_classif('3gauss2', nt)
+
+    clf = ot.da.SinkhornLpl1Transport()
+
+    # test its computed
+    clf.fit(Xs=Xs, ys=ys, Xt=Xt)
+
+    # test dimensions of coupling
+    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.Coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
+
+    # test margin constraints
+    mu_s = unif(ns)
+    mu_t = unif(nt)
+    assert_allclose(np.sum(clf.Coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.Coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+
+    # test transform
+    transp_Xs = clf.transform(Xs=Xs)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
+    Xs_new, _ = get_data_classif('3gauss', ns + 1)
+    transp_Xs_new = clf.transform(Xs_new)
+
+    # check that the oos method is not working
+    assert_equal(transp_Xs_new, Xs_new)
+
+    # test inverse transform
+    transp_Xt = clf.inverse_transform(Xt=Xt)
+    assert_equal(transp_Xt.shape, Xt.shape)
+
+    Xt_new, _ = get_data_classif('3gauss2', nt + 1)
+    transp_Xt_new = clf.inverse_transform(Xt=Xt_new)
+
+    # check that the oos method is not working and returns the input data
+    assert_equal(transp_Xt_new, Xt_new)
+
+    # test fit_transform
+    transp_Xs = clf.fit_transform(Xs=Xs, ys=ys, Xt=Xt)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
+
 def test_sinkhorn_transport_class():
     """test_sinkhorn_transport
     """
-- 
cgit v1.2.3


From 2005a09548a6f6d42cd9aafadbb4583e4029936c Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Fri, 4 Aug 2017 11:40:44 +0200
Subject: added new class SinkhornL1l2Transport() + dedicated test

---
 ot/da.py        | 109 ++++++++++++++++++++++++++++++++++++++++++++++++++++++++
 test/test_da.py |  50 ++++++++++++++++++++++++++
 2 files changed, 159 insertions(+)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index 3031f63..6100d15 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -1369,6 +1369,10 @@ class SinkhornLpl1Transport(BaseTransport):
 
     Parameters
     ----------
+    reg_e : float, optional (default=1)
+        Entropic regularization parameter
+    reg_cl : float, optional (default=0.1)
+        Class regularization parameter
     mode : string, optional (default="unsupervised")
         The DA mode. If "unsupervised" no target labels are taken into account
         to modify the cost matrix. If "semisupervised" the target labels
@@ -1384,6 +1388,11 @@ class SinkhornLpl1Transport(BaseTransport):
         The ground metric for the Wasserstein problem
     distribution : string, optional (default="uniform")
         The kind of distribution estimation to employ
+    max_iter : int, float, optional (default=10)
+        The maximum number of iterations before stopping the optimization
+        algorithm if it has not converged
+    max_inner_iter : int, float, optional (default=200)
+        The number of iterations in the inner loop
     verbose : int, optional (default=0)
         Controls the verbosity of the optimization algorithm
     log : int, optional (default=0)
@@ -1452,3 +1461,103 @@ class SinkhornLpl1Transport(BaseTransport):
             verbose=self.verbose, log=self.log)
 
         return self
+
+
+class SinkhornL1l2Transport(BaseTransport):
+    """Domain Adapatation OT method based on sinkhorn algorithm +
+    l1l2 class regularization.
+
+    Parameters
+    ----------
+    reg_e : float, optional (default=1)
+        Entropic regularization parameter
+    reg_cl : float, optional (default=0.1)
+        Class regularization parameter
+    mode : string, optional (default="unsupervised")
+        The DA mode. If "unsupervised" no target labels are taken into account
+        to modify the cost matrix. If "semisupervised" the target labels
+        are taken into account to set coefficients of the pairwise distance
+        matrix to 0 for row and columns indices that correspond to source and
+        target samples which share the same labels.
+    mapping : string, optional (default="barycentric")
+        The kind of mapping to apply to transport samples from a domain into
+        another one.
+        if "barycentric" only the samples used to estimate the coupling can
+        be transported from a domain to another one.
+    metric : string, optional (default="sqeuclidean")
+        The ground metric for the Wasserstein problem
+    distribution : string, optional (default="uniform")
+        The kind of distribution estimation to employ
+    max_iter : int, float, optional (default=10)
+        The maximum number of iterations before stopping the optimization
+        algorithm if it has not converged
+    max_inner_iter : int, float, optional (default=200)
+        The number of iterations in the inner loop
+    verbose : int, optional (default=0)
+        Controls the verbosity of the optimization algorithm
+    log : int, optional (default=0)
+        Controls the logs of the optimization algorithm
+    Attributes
+    ----------
+    Coupling_ : the optimal coupling
+
+    References
+    ----------
+
+    .. [1] N. Courty; R. Flamary; D. Tuia; A. Rakotomamonjy,
+       "Optimal Transport for Domain Adaptation," in IEEE
+       Transactions on Pattern Analysis and Machine Intelligence ,
+       vol.PP, no.99, pp.1-1
+    .. [2] Rakotomamonjy, A., Flamary, R., & Courty, N. (2015).
+       Generalized conditional gradient: analysis of convergence
+       and applications. arXiv preprint arXiv:1510.06567.
+
+    """
+
+    def __init__(self, reg_e=1., reg_cl=0.1, mode="unsupervised",
+                 max_iter=10, max_inner_iter=200,
+                 tol=10e-9, verbose=False, log=False,
+                 metric="sqeuclidean",
+                 distribution_estimation=distribution_estimation_uniform,
+                 out_of_sample_map='ferradans'):
+
+        self.reg_e = reg_e
+        self.reg_cl = reg_cl
+        self.mode = mode
+        self.max_iter = max_iter
+        self.max_inner_iter = max_inner_iter
+        self.tol = tol
+        self.verbose = verbose
+        self.log = log
+        self.metric = metric
+        self.distribution_estimation = distribution_estimation
+        self.out_of_sample_map = out_of_sample_map
+
+    def fit(self, Xs, ys=None, Xt=None, yt=None):
+        """Build a coupling matrix from source and target sets of samples
+        (Xs, ys) and (Xt, yt)
+        Parameters
+        ----------
+        Xs : array-like of shape = [n_source_samples, n_features]
+            The training input samples.
+        ys : array-like, shape = [n_source_samples]
+            The class labels
+        Xt : array-like of shape = [n_target_samples, n_features]
+            The training input samples.
+        yt : array-like, shape = [n_labeled_target_samples]
+            The class labels
+        Returns
+        -------
+        self : object
+            Returns self.
+        """
+
+        super(SinkhornL1l2Transport, self).fit(Xs, ys, Xt, yt)
+
+        self.Coupling_ = sinkhorn_l1l2_gl(
+            a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.Cost,
+            reg=self.reg_e, eta=self.reg_cl, numItermax=self.max_iter,
+            numInnerItermax=self.max_inner_iter, stopInnerThr=self.tol,
+            verbose=self.verbose, log=self.log)
+
+        return self
diff --git a/test/test_da.py b/test/test_da.py
index 7d00cfb..68d1958 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -63,6 +63,56 @@ def test_sinkhorn_lpl1_transport_class():
     assert_equal(transp_Xs.shape, Xs.shape)
 
 
+def test_sinkhorn_l1l2_transport_class():
+    """test_sinkhorn_transport
+    """
+
+    ns = 150
+    nt = 200
+
+    Xs, ys = get_data_classif('3gauss', ns)
+    Xt, yt = get_data_classif('3gauss2', nt)
+
+    clf = ot.da.SinkhornL1l2Transport()
+
+    # test its computed
+    clf.fit(Xs=Xs, ys=ys, Xt=Xt)
+
+    # test dimensions of coupling
+    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.Coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
+
+    # test margin constraints
+    mu_s = unif(ns)
+    mu_t = unif(nt)
+    assert_allclose(np.sum(clf.Coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.Coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+
+    # test transform
+    transp_Xs = clf.transform(Xs=Xs)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
+    Xs_new, _ = get_data_classif('3gauss', ns + 1)
+    transp_Xs_new = clf.transform(Xs_new)
+
+    # check that the oos method is not working
+    assert_equal(transp_Xs_new, Xs_new)
+
+    # test inverse transform
+    transp_Xt = clf.inverse_transform(Xt=Xt)
+    assert_equal(transp_Xt.shape, Xt.shape)
+
+    Xt_new, _ = get_data_classif('3gauss2', nt + 1)
+    transp_Xt_new = clf.inverse_transform(Xt=Xt_new)
+
+    # check that the oos method is not working and returns the input data
+    assert_equal(transp_Xt_new, Xt_new)
+
+    # test fit_transform
+    transp_Xs = clf.fit_transform(Xs=Xs, ys=ys, Xt=Xt)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
+
 def test_sinkhorn_transport_class():
     """test_sinkhorn_transport
     """
-- 
cgit v1.2.3


From 4e562a1ce24119b8c9c1efb9d078762904c5d78a Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Fri, 4 Aug 2017 12:04:04 +0200
Subject: semi supervised mode supported

---
 ot/da.py        | 21 +++++++++++++++++++--
 test/test_da.py | 52 ++++++++++++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 71 insertions(+), 2 deletions(-)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index 6100d15..8294e8d 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -1089,8 +1089,25 @@ class BaseTransport(BaseEstimator):
         self.Cost = dist(Xs, Xt, metric=self.metric)
 
         if self.mode == "semisupervised":
-            print("TODO: modify cost matrix accordingly")
-            pass
+
+            if (ys is not None) and (yt is not None):
+
+                # assumes labeled source samples occupy the first rows
+                # and labeled target samples occupy the first columns
+                classes = np.unique(ys)
+                for c in classes:
+                    ids = np.where(ys == c)
+                    idt = np.where(yt == c)
+
+                    # all the coefficients corresponding to a source sample
+                    # and a target sample with the same label gets a 0
+                    # transport cost
+                    for j in idt[0]:
+                        self.Cost[ids[0], j] = 0
+            else:
+                print("Warning: using unsupervised mode\
+                       \nto use semisupervised mode, please provide ys and yt")
+                pass
 
         # distribution estimation
         self.mu_s = self.distribution_estimation(Xs)
diff --git a/test/test_da.py b/test/test_da.py
index 68d1958..497a8ee 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -62,6 +62,19 @@ def test_sinkhorn_lpl1_transport_class():
     transp_Xs = clf.fit_transform(Xs=Xs, ys=ys, Xt=Xt)
     assert_equal(transp_Xs.shape, Xs.shape)
 
+    # test semi supervised mode
+    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf.fit(Xs=Xs, Xt=Xt)
+    n_unsup = np.sum(clf.Cost)
+
+    # test semi supervised mode
+    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
+    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
+    n_semisup = np.sum(clf.Cost)
+
+    assert n_unsup != n_semisup, "semisupervised mode not working"
+
 
 def test_sinkhorn_l1l2_transport_class():
     """test_sinkhorn_transport
@@ -112,6 +125,19 @@ def test_sinkhorn_l1l2_transport_class():
     transp_Xs = clf.fit_transform(Xs=Xs, ys=ys, Xt=Xt)
     assert_equal(transp_Xs.shape, Xs.shape)
 
+    # test semi supervised mode
+    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf.fit(Xs=Xs, Xt=Xt)
+    n_unsup = np.sum(clf.Cost)
+
+    # test semi supervised mode
+    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
+    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
+    n_semisup = np.sum(clf.Cost)
+
+    assert n_unsup != n_semisup, "semisupervised mode not working"
+
 
 def test_sinkhorn_transport_class():
     """test_sinkhorn_transport
@@ -162,6 +188,19 @@ def test_sinkhorn_transport_class():
     transp_Xs = clf.fit_transform(Xs=Xs, Xt=Xt)
     assert_equal(transp_Xs.shape, Xs.shape)
 
+    # test semi supervised mode
+    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf.fit(Xs=Xs, Xt=Xt)
+    n_unsup = np.sum(clf.Cost)
+
+    # test semi supervised mode
+    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
+    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
+    n_semisup = np.sum(clf.Cost)
+
+    assert n_unsup != n_semisup, "semisupervised mode not working"
+
 
 def test_emd_transport_class():
     """test_sinkhorn_transport
@@ -212,6 +251,19 @@ def test_emd_transport_class():
     transp_Xs = clf.fit_transform(Xs=Xs, Xt=Xt)
     assert_equal(transp_Xs.shape, Xs.shape)
 
+    # test semi supervised mode
+    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf.fit(Xs=Xs, Xt=Xt)
+    n_unsup = np.sum(clf.Cost)
+
+    # test semi supervised mode
+    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
+    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
+    n_semisup = np.sum(clf.Cost)
+
+    assert n_unsup != n_semisup, "semisupervised mode not working"
+
 
 def test_otda():
 
-- 
cgit v1.2.3


From 62b40a9993e9ccca27d1677aa1294fff6246e904 Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Fri, 4 Aug 2017 13:56:51 +0200
Subject: correction of semi supervised mode

---
 ot/da.py        | 77 +++++++++++++++++++++++++++++++++------------------------
 test/test_da.py | 20 +++++++--------
 2 files changed, 55 insertions(+), 42 deletions(-)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index 8294e8d..08e8a8d 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -1088,26 +1088,23 @@ class BaseTransport(BaseEstimator):
         # pairwise distance
         self.Cost = dist(Xs, Xt, metric=self.metric)
 
-        if self.mode == "semisupervised":
-
-            if (ys is not None) and (yt is not None):
-
-                # assumes labeled source samples occupy the first rows
-                # and labeled target samples occupy the first columns
-                classes = np.unique(ys)
-                for c in classes:
-                    ids = np.where(ys == c)
-                    idt = np.where(yt == c)
-
-                    # all the coefficients corresponding to a source sample
-                    # and a target sample with the same label gets a 0
-                    # transport cost
-                    for j in idt[0]:
-                        self.Cost[ids[0], j] = 0
-            else:
-                print("Warning: using unsupervised mode\
-                       \nto use semisupervised mode, please provide ys and yt")
-                pass
+        if (ys is not None) and (yt is not None):
+
+            if self.limit_max != np.infty:
+                self.limit_max = self.limit_max * np.max(self.Cost)
+
+            # assumes labeled source samples occupy the first rows
+            # and labeled target samples occupy the first columns
+            classes = np.unique(ys)
+            for c in classes:
+                idx_s = np.where((ys != c) & (ys != -1))
+                idx_t = np.where(yt == c)
+
+                # all the coefficients corresponding to a source sample
+                # and a target sample :
+                # with different labels get a infinite
+                for j in idx_t[0]:
+                    self.Cost[idx_s[0], j] = self.limit_max
 
         # distribution estimation
         self.mu_s = self.distribution_estimation(Xs)
@@ -1243,6 +1240,9 @@ class SinkhornTransport(BaseTransport):
         Controls the verbosity of the optimization algorithm
     log : int, optional (default=0)
         Controls the logs of the optimization algorithm
+    limit_max: float, optional (defaul=np.infty)
+        Controls the semi supervised mode. Transport between labeled source
+        and target samples of different classes will exhibit an infinite cost
     Attributes
     ----------
     Coupling_ : the optimal coupling
@@ -1257,19 +1257,19 @@ class SinkhornTransport(BaseTransport):
            26, 2013
     """
 
-    def __init__(self, reg_e=1., mode="unsupervised", max_iter=1000,
+    def __init__(self, reg_e=1., max_iter=1000,
                  tol=10e-9, verbose=False, log=False,
                  metric="sqeuclidean",
                  distribution_estimation=distribution_estimation_uniform,
-                 out_of_sample_map='ferradans'):
+                 out_of_sample_map='ferradans', limit_max=np.infty):
 
         self.reg_e = reg_e
-        self.mode = mode
         self.max_iter = max_iter
         self.tol = tol
         self.verbose = verbose
         self.log = log
         self.metric = metric
+        self.limit_max = limit_max
         self.distribution_estimation = distribution_estimation
         self.out_of_sample_map = out_of_sample_map
 
@@ -1326,6 +1326,10 @@ class EMDTransport(BaseTransport):
         Controls the verbosity of the optimization algorithm
     log : int, optional (default=0)
         Controls the logs of the optimization algorithm
+    limit_max: float, optional (default=10)
+        Controls the semi supervised mode. Transport between labeled source
+        and target samples of different classes will exhibit an infinite cost
+        (10 times the maximum value of the cost matrix)
     Attributes
     ----------
     Coupling_ : the optimal coupling
@@ -1337,15 +1341,15 @@ class EMDTransport(BaseTransport):
            on Pattern Analysis and Machine Intelligence , vol.PP, no.99, pp.1-1
     """
 
-    def __init__(self, mode="unsupervised", verbose=False,
+    def __init__(self, verbose=False,
                  log=False, metric="sqeuclidean",
                  distribution_estimation=distribution_estimation_uniform,
-                 out_of_sample_map='ferradans'):
+                 out_of_sample_map='ferradans', limit_max=10):
 
-        self.mode = mode
         self.verbose = verbose
         self.log = log
         self.metric = metric
+        self.limit_max = limit_max
         self.distribution_estimation = distribution_estimation
         self.out_of_sample_map = out_of_sample_map
 
@@ -1414,6 +1418,10 @@ class SinkhornLpl1Transport(BaseTransport):
         Controls the verbosity of the optimization algorithm
     log : int, optional (default=0)
         Controls the logs of the optimization algorithm
+    limit_max: float, optional (defaul=np.infty)
+        Controls the semi supervised mode. Transport between labeled source
+        and target samples of different classes will exhibit an infinite cost
+
     Attributes
     ----------
     Coupling_ : the optimal coupling
@@ -1431,16 +1439,15 @@ class SinkhornLpl1Transport(BaseTransport):
 
     """
 
-    def __init__(self, reg_e=1., reg_cl=0.1, mode="unsupervised",
+    def __init__(self, reg_e=1., reg_cl=0.1,
                  max_iter=10, max_inner_iter=200,
                  tol=10e-9, verbose=False, log=False,
                  metric="sqeuclidean",
                  distribution_estimation=distribution_estimation_uniform,
-                 out_of_sample_map='ferradans'):
+                 out_of_sample_map='ferradans', limit_max=np.infty):
 
         self.reg_e = reg_e
         self.reg_cl = reg_cl
-        self.mode = mode
         self.max_iter = max_iter
         self.max_inner_iter = max_inner_iter
         self.tol = tol
@@ -1449,6 +1456,7 @@ class SinkhornLpl1Transport(BaseTransport):
         self.metric = metric
         self.distribution_estimation = distribution_estimation
         self.out_of_sample_map = out_of_sample_map
+        self.limit_max = limit_max
 
     def fit(self, Xs, ys=None, Xt=None, yt=None):
         """Build a coupling matrix from source and target sets of samples
@@ -1514,6 +1522,11 @@ class SinkhornL1l2Transport(BaseTransport):
         Controls the verbosity of the optimization algorithm
     log : int, optional (default=0)
         Controls the logs of the optimization algorithm
+    limit_max: float, optional (default=10)
+        Controls the semi supervised mode. Transport between labeled source
+        and target samples of different classes will exhibit an infinite cost
+        (10 times the maximum value of the cost matrix)
+
     Attributes
     ----------
     Coupling_ : the optimal coupling
@@ -1531,16 +1544,15 @@ class SinkhornL1l2Transport(BaseTransport):
 
     """
 
-    def __init__(self, reg_e=1., reg_cl=0.1, mode="unsupervised",
+    def __init__(self, reg_e=1., reg_cl=0.1,
                  max_iter=10, max_inner_iter=200,
                  tol=10e-9, verbose=False, log=False,
                  metric="sqeuclidean",
                  distribution_estimation=distribution_estimation_uniform,
-                 out_of_sample_map='ferradans'):
+                 out_of_sample_map='ferradans', limit_max=10):
 
         self.reg_e = reg_e
         self.reg_cl = reg_cl
-        self.mode = mode
         self.max_iter = max_iter
         self.max_inner_iter = max_inner_iter
         self.tol = tol
@@ -1549,6 +1561,7 @@ class SinkhornL1l2Transport(BaseTransport):
         self.metric = metric
         self.distribution_estimation = distribution_estimation
         self.out_of_sample_map = out_of_sample_map
+        self.limit_max = limit_max
 
     def fit(self, Xs, ys=None, Xt=None, yt=None):
         """Build a coupling matrix from source and target sets of samples
diff --git a/test/test_da.py b/test/test_da.py
index 497a8ee..ecd2a3a 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -63,12 +63,12 @@ def test_sinkhorn_lpl1_transport_class():
     assert_equal(transp_Xs.shape, Xs.shape)
 
     # test semi supervised mode
-    clf = ot.da.SinkhornTransport(mode="semisupervised")
-    clf.fit(Xs=Xs, Xt=Xt)
+    clf = ot.da.SinkhornLpl1Transport()
+    clf.fit(Xs=Xs, ys=ys, Xt=Xt)
     n_unsup = np.sum(clf.Cost)
 
     # test semi supervised mode
-    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf = ot.da.SinkhornLpl1Transport()
     clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
     assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
     n_semisup = np.sum(clf.Cost)
@@ -126,12 +126,12 @@ def test_sinkhorn_l1l2_transport_class():
     assert_equal(transp_Xs.shape, Xs.shape)
 
     # test semi supervised mode
-    clf = ot.da.SinkhornTransport(mode="semisupervised")
-    clf.fit(Xs=Xs, Xt=Xt)
+    clf = ot.da.SinkhornL1l2Transport()
+    clf.fit(Xs=Xs, ys=ys, Xt=Xt)
     n_unsup = np.sum(clf.Cost)
 
     # test semi supervised mode
-    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf = ot.da.SinkhornL1l2Transport()
     clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
     assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
     n_semisup = np.sum(clf.Cost)
@@ -189,12 +189,12 @@ def test_sinkhorn_transport_class():
     assert_equal(transp_Xs.shape, Xs.shape)
 
     # test semi supervised mode
-    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf = ot.da.SinkhornTransport()
     clf.fit(Xs=Xs, Xt=Xt)
     n_unsup = np.sum(clf.Cost)
 
     # test semi supervised mode
-    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf = ot.da.SinkhornTransport()
     clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
     assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
     n_semisup = np.sum(clf.Cost)
@@ -252,12 +252,12 @@ def test_emd_transport_class():
     assert_equal(transp_Xs.shape, Xs.shape)
 
     # test semi supervised mode
-    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf = ot.da.EMDTransport()
     clf.fit(Xs=Xs, Xt=Xt)
     n_unsup = np.sum(clf.Cost)
 
     # test semi supervised mode
-    clf = ot.da.SinkhornTransport(mode="semisupervised")
+    clf = ot.da.EMDTransport()
     clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
     assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
     n_semisup = np.sum(clf.Cost)
-- 
cgit v1.2.3


From b8672f67639e9daa3f91e555581256f984115f56 Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Fri, 4 Aug 2017 14:55:54 +0200
Subject: out of samples by Ferradans supported for transform and
 inverse_transform

---
 ot/da.py        | 29 +++++++++++++++++++++++------
 test/test_da.py | 32 ++++++++++++++++----------------
 2 files changed, 39 insertions(+), 22 deletions(-)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index 92a8f12..87d056d 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -1167,9 +1167,18 @@ class BaseTransport(BaseEstimator):
             transp_Xs = np.dot(transp, self.Xt)
         else:
             # perform out of sample mapping
-            print("Warning: out of sample mapping not yet implemented")
-            print("input data will be returned")
-            transp_Xs = Xs
+
+            # get the nearest neighbor in the source domain
+            D0 = dist(Xs, self.Xs)
+            idx = np.argmin(D0, axis=1)
+
+            # transport the source samples
+            transp = self.Coupling_ / np.sum(self.Coupling_, 1)[:, None]
+            transp[~ np.isfinite(transp)] = 0
+            transp_Xs_ = np.dot(transp, self.Xt)
+
+            # define the transported points
+            transp_Xs = transp_Xs_[idx, :] + Xs - self.Xs[idx, :]
 
         return transp_Xs
 
@@ -1202,9 +1211,17 @@ class BaseTransport(BaseEstimator):
             transp_Xt = np.dot(transp_, self.Xs)
         else:
             # perform out of sample mapping
-            print("Warning: out of sample mapping not yet implemented")
-            print("input data will be returned")
-            transp_Xt = Xt
+
+            D0 = dist(Xt, self.Xt)
+            idx = np.argmin(D0, axis=1)
+
+            # transport the target samples
+            transp_ = self.Coupling_.T / np.sum(self.Coupling_, 0)[:, None]
+            transp_[~ np.isfinite(transp_)] = 0
+            transp_Xt_ = np.dot(transp_, self.Xs)
+
+            # define the transported points
+            transp_Xt = transp_Xt_[idx, :] + Xt - self.Xt[idx, :]
 
         return transp_Xt
 
diff --git a/test/test_da.py b/test/test_da.py
index ecd2a3a..aed9f61 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -45,8 +45,8 @@ def test_sinkhorn_lpl1_transport_class():
     Xs_new, _ = get_data_classif('3gauss', ns + 1)
     transp_Xs_new = clf.transform(Xs_new)
 
-    # check that the oos method is not working
-    assert_equal(transp_Xs_new, Xs_new)
+    # check that the oos method is working
+    assert_equal(transp_Xs_new.shape, Xs_new.shape)
 
     # test inverse transform
     transp_Xt = clf.inverse_transform(Xt=Xt)
@@ -55,8 +55,8 @@ def test_sinkhorn_lpl1_transport_class():
     Xt_new, _ = get_data_classif('3gauss2', nt + 1)
     transp_Xt_new = clf.inverse_transform(Xt=Xt_new)
 
-    # check that the oos method is not working and returns the input data
-    assert_equal(transp_Xt_new, Xt_new)
+    # check that the oos method is working
+    assert_equal(transp_Xt_new.shape, Xt_new.shape)
 
     # test fit_transform
     transp_Xs = clf.fit_transform(Xs=Xs, ys=ys, Xt=Xt)
@@ -108,8 +108,8 @@ def test_sinkhorn_l1l2_transport_class():
     Xs_new, _ = get_data_classif('3gauss', ns + 1)
     transp_Xs_new = clf.transform(Xs_new)
 
-    # check that the oos method is not working
-    assert_equal(transp_Xs_new, Xs_new)
+    # check that the oos method is working
+    assert_equal(transp_Xs_new.shape, Xs_new.shape)
 
     # test inverse transform
     transp_Xt = clf.inverse_transform(Xt=Xt)
@@ -118,8 +118,8 @@ def test_sinkhorn_l1l2_transport_class():
     Xt_new, _ = get_data_classif('3gauss2', nt + 1)
     transp_Xt_new = clf.inverse_transform(Xt=Xt_new)
 
-    # check that the oos method is not working and returns the input data
-    assert_equal(transp_Xt_new, Xt_new)
+    # check that the oos method is working
+    assert_equal(transp_Xt_new.shape, Xt_new.shape)
 
     # test fit_transform
     transp_Xs = clf.fit_transform(Xs=Xs, ys=ys, Xt=Xt)
@@ -171,8 +171,8 @@ def test_sinkhorn_transport_class():
     Xs_new, _ = get_data_classif('3gauss', ns + 1)
     transp_Xs_new = clf.transform(Xs_new)
 
-    # check that the oos method is not working
-    assert_equal(transp_Xs_new, Xs_new)
+    # check that the oos method is working
+    assert_equal(transp_Xs_new.shape, Xs_new.shape)
 
     # test inverse transform
     transp_Xt = clf.inverse_transform(Xt=Xt)
@@ -181,8 +181,8 @@ def test_sinkhorn_transport_class():
     Xt_new, _ = get_data_classif('3gauss2', nt + 1)
     transp_Xt_new = clf.inverse_transform(Xt=Xt_new)
 
-    # check that the oos method is not working and returns the input data
-    assert_equal(transp_Xt_new, Xt_new)
+    # check that the oos method is working
+    assert_equal(transp_Xt_new.shape, Xt_new.shape)
 
     # test fit_transform
     transp_Xs = clf.fit_transform(Xs=Xs, Xt=Xt)
@@ -234,8 +234,8 @@ def test_emd_transport_class():
     Xs_new, _ = get_data_classif('3gauss', ns + 1)
     transp_Xs_new = clf.transform(Xs_new)
 
-    # check that the oos method is not working
-    assert_equal(transp_Xs_new, Xs_new)
+    # check that the oos method is working
+    assert_equal(transp_Xs_new.shape, Xs_new.shape)
 
     # test inverse transform
     transp_Xt = clf.inverse_transform(Xt=Xt)
@@ -244,8 +244,8 @@ def test_emd_transport_class():
     Xt_new, _ = get_data_classif('3gauss2', nt + 1)
     transp_Xt_new = clf.inverse_transform(Xt=Xt_new)
 
-    # check that the oos method is not working and returns the input data
-    assert_equal(transp_Xt_new, Xt_new)
+    # check that the oos method is working
+    assert_equal(transp_Xt_new.shape, Xt_new.shape)
 
     # test fit_transform
     transp_Xs = clf.fit_transform(Xs=Xs, Xt=Xt)
-- 
cgit v1.2.3


From d20a067f91dcca318e2841ac52a8c578c78b89b2 Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Wed, 23 Aug 2017 11:45:06 +0200
Subject: make doc strings compliant with numpy / modif according to AG review

---
 ot/da.py        | 139 +++++++++++++++++++++++++++++++++-----------------------
 test/test_da.py |  13 ++++--
 2 files changed, 93 insertions(+), 59 deletions(-)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index 0616d17..044d567 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -967,11 +967,13 @@ class BaseEstimator(object):
 
     def get_params(self, deep=True):
         """Get parameters for this estimator.
+
         Parameters
         ----------
         deep : boolean, optional
             If True, will return the parameters for this estimator and
             contained subobjects that are estimators.
+
         Returns
         -------
         params : mapping of string to any
@@ -1002,10 +1004,12 @@ class BaseEstimator(object):
 
     def set_params(self, **params):
         """Set the parameters of this estimator.
+
         The method works on simple estimators as well as on nested objects
         (such as pipelines). The latter have parameters of the form
         ``<component>__<parameter>`` so that it's possible to update each
         component of a nested object.
+
         Returns
         -------
         self
@@ -1053,11 +1057,12 @@ def distribution_estimation_uniform(X):
 
     Parameters
     ----------
-    X : array-like of shape = (n_samples, n_features)
+    X : array-like, shape (n_samples, n_features)
         The array of samples
+
     Returns
     -------
-    mu : array-like, shape = (n_samples,)
+    mu : array-like, shape (n_samples,)
         The uniform distribution estimated from X
     """
 
@@ -1069,16 +1074,18 @@ class BaseTransport(BaseEstimator):
     def fit(self, Xs=None, ys=None, Xt=None, yt=None):
         """Build a coupling matrix from source and target sets of samples
         (Xs, ys) and (Xt, yt)
+
         Parameters
         ----------
-        Xs : array-like of shape = (n_source_samples, n_features)
+        Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
-        ys : array-like, shape = (n_source_samples,)
+        ys : array-like, shape (n_source_samples,)
             The class labels
-        Xt : array-like of shape = (n_target_samples, n_features)
+        Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
-        yt : array-like, shape = (n_labeled_target_samples,)
+        yt : array-like, shape (n_labeled_target_samples,)
             The class labels
+
         Returns
         -------
         self : object
@@ -1086,12 +1093,12 @@ class BaseTransport(BaseEstimator):
         """
 
         # pairwise distance
-        self.Cost = dist(Xs, Xt, metric=self.metric)
+        self.cost_ = dist(Xs, Xt, metric=self.metric)
 
         if (ys is not None) and (yt is not None):
 
             if self.limit_max != np.infty:
-                self.limit_max = self.limit_max * np.max(self.Cost)
+                self.limit_max = self.limit_max * np.max(self.cost_)
 
             # assumes labeled source samples occupy the first rows
             # and labeled target samples occupy the first columns
@@ -1104,7 +1111,7 @@ class BaseTransport(BaseEstimator):
                 # and a target sample :
                 # with different labels get a infinite
                 for j in idx_t[0]:
-                    self.Cost[idx_s[0], j] = self.limit_max
+                    self.cost_[idx_s[0], j] = self.limit_max
 
         # distribution estimation
         self.mu_s = self.distribution_estimation(Xs)
@@ -1120,19 +1127,21 @@ class BaseTransport(BaseEstimator):
         """Build a coupling matrix from source and target sets of samples
         (Xs, ys) and (Xt, yt) and transports source samples Xs onto target
         ones Xt
+
         Parameters
         ----------
-        Xs : array-like of shape = (n_source_samples, n_features)
+        Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
-        ys : array-like, shape = (n_source_samples,)
+        ys : array-like, shape (n_source_samples,)
             The class labels
-        Xt : array-like of shape = (n_target_samples, n_features)
+        Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
-        yt : array-like, shape = (n_labeled_target_samples,)
+        yt : array-like, shape (n_labeled_target_samples,)
             The class labels
+
         Returns
         -------
-        transp_Xs : array-like of shape = (n_source_samples, n_features)
+        transp_Xs : array-like, shape (n_source_samples, n_features)
             The source samples samples.
         """
 
@@ -1140,25 +1149,27 @@ class BaseTransport(BaseEstimator):
 
     def transform(self, Xs=None, ys=None, Xt=None, yt=None):
         """Transports source samples Xs onto target ones Xt
+
         Parameters
         ----------
-        Xs : array-like of shape = (n_source_samples, n_features)
+        Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
-        ys : array-like, shape = (n_source_samples,)
+        ys : array-like, shape (n_source_samples,)
             The class labels
-        Xt : array-like of shape = (n_target_samples, n_features)
+        Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
-        yt : array-like, shape = (n_labeled_target_samples,)
+        yt : array-like, shape (n_labeled_target_samples,)
             The class labels
+
         Returns
         -------
-        transp_Xs : array-like of shape = (n_source_samples, n_features)
+        transp_Xs : array-like, shape (n_source_samples, n_features)
             The transport source samples.
         """
 
         if np.array_equal(self.Xs, Xs):
             # perform standard barycentric mapping
-            transp = self.Coupling_ / np.sum(self.Coupling_, 1)[:, None]
+            transp = self.coupling_ / np.sum(self.coupling_, 1)[:, None]
 
             # set nans to 0
             transp[~ np.isfinite(transp)] = 0
@@ -1173,7 +1184,7 @@ class BaseTransport(BaseEstimator):
             idx = np.argmin(D0, axis=1)
 
             # transport the source samples
-            transp = self.Coupling_ / np.sum(self.Coupling_, 1)[:, None]
+            transp = self.coupling_ / np.sum(self.coupling_, 1)[:, None]
             transp[~ np.isfinite(transp)] = 0
             transp_Xs_ = np.dot(transp, self.Xt)
 
@@ -1184,25 +1195,27 @@ class BaseTransport(BaseEstimator):
 
     def inverse_transform(self, Xs=None, ys=None, Xt=None, yt=None):
         """Transports target samples Xt onto target samples Xs
+
         Parameters
         ----------
-        Xs : array-like of shape = (n_source_samples, n_features)
+        Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
         ys : array-like, shape = (n_source_samples,)
             The class labels
-        Xt : array-like of shape = (n_target_samples, n_features)
+        Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
         yt : array-like, shape = (n_labeled_target_samples,)
             The class labels
+
         Returns
         -------
-        transp_Xt : array-like of shape = (n_source_samples, n_features)
+        transp_Xt : array-like, shape (n_source_samples, n_features)
             The transported target samples.
         """
 
         if np.array_equal(self.Xt, Xt):
             # perform standard barycentric mapping
-            transp_ = self.Coupling_.T / np.sum(self.Coupling_, 0)[:, None]
+            transp_ = self.coupling_.T / np.sum(self.coupling_, 0)[:, None]
 
             # set nans to 0
             transp_[~ np.isfinite(transp_)] = 0
@@ -1216,7 +1229,7 @@ class BaseTransport(BaseEstimator):
             idx = np.argmin(D0, axis=1)
 
             # transport the target samples
-            transp_ = self.Coupling_.T / np.sum(self.Coupling_, 0)[:, None]
+            transp_ = self.coupling_.T / np.sum(self.coupling_, 0)[:, None]
             transp_[~ np.isfinite(transp_)] = 0
             transp_Xt_ = np.dot(transp_, self.Xs)
 
@@ -1254,9 +1267,10 @@ class SinkhornTransport(BaseTransport):
     limit_max: float, optional (defaul=np.infty)
         Controls the semi supervised mode. Transport between labeled source
         and target samples of different classes will exhibit an infinite cost
+
     Attributes
     ----------
-    Coupling_ : the optimal coupling
+    coupling_ : the optimal coupling
 
     References
     ----------
@@ -1287,16 +1301,18 @@ class SinkhornTransport(BaseTransport):
     def fit(self, Xs=None, ys=None, Xt=None, yt=None):
         """Build a coupling matrix from source and target sets of samples
         (Xs, ys) and (Xt, yt)
+
         Parameters
         ----------
-        Xs : array-like of shape = (n_source_samples, n_features)
+        Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
         ys : array-like, shape = (n_source_samples,)
             The class labels
-        Xt : array-like of shape = (n_target_samples, n_features)
+        Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
         yt : array-like, shape = (n_labeled_target_samples,)
             The class labels
+
         Returns
         -------
         self : object
@@ -1306,8 +1322,8 @@ class SinkhornTransport(BaseTransport):
         super(SinkhornTransport, self).fit(Xs, ys, Xt, yt)
 
         # coupling estimation
-        self.Coupling_ = sinkhorn(
-            a=self.mu_s, b=self.mu_t, M=self.Cost, reg=self.reg_e,
+        self.coupling_ = sinkhorn(
+            a=self.mu_s, b=self.mu_t, M=self.cost_, reg=self.reg_e,
             numItermax=self.max_iter, stopThr=self.tol,
             verbose=self.verbose, log=self.log)
 
@@ -1316,6 +1332,7 @@ class SinkhornTransport(BaseTransport):
 
 class EMDTransport(BaseTransport):
     """Domain Adapatation OT method based on Earth Mover's Distance
+
     Parameters
     ----------
     mapping : string, optional (default="barycentric")
@@ -1335,9 +1352,10 @@ class EMDTransport(BaseTransport):
         Controls the semi supervised mode. Transport between labeled source
         and target samples of different classes will exhibit an infinite cost
         (10 times the maximum value of the cost matrix)
+
     Attributes
     ----------
-    Coupling_ : the optimal coupling
+    coupling_ : the optimal coupling
 
     References
     ----------
@@ -1358,16 +1376,18 @@ class EMDTransport(BaseTransport):
     def fit(self, Xs, ys=None, Xt=None, yt=None):
         """Build a coupling matrix from source and target sets of samples
         (Xs, ys) and (Xt, yt)
+
         Parameters
         ----------
-        Xs : array-like of shape = (n_source_samples, n_features)
+        Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
         ys : array-like, shape = (n_source_samples,)
             The class labels
-        Xt : array-like of shape = (n_target_samples, n_features)
+        Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
         yt : array-like, shape = (n_labeled_target_samples,)
             The class labels
+
         Returns
         -------
         self : object
@@ -1377,8 +1397,8 @@ class EMDTransport(BaseTransport):
         super(EMDTransport, self).fit(Xs, ys, Xt, yt)
 
         # coupling estimation
-        self.Coupling_ = emd(
-            a=self.mu_s, b=self.mu_t, M=self.Cost,
+        self.coupling_ = emd(
+            a=self.mu_s, b=self.mu_t, M=self.cost_,
         )
 
         return self
@@ -1418,7 +1438,7 @@ class SinkhornLpl1Transport(BaseTransport):
 
     Attributes
     ----------
-    Coupling_ : the optimal coupling
+    coupling_ : the optimal coupling
 
     References
     ----------
@@ -1455,16 +1475,18 @@ class SinkhornLpl1Transport(BaseTransport):
     def fit(self, Xs, ys=None, Xt=None, yt=None):
         """Build a coupling matrix from source and target sets of samples
         (Xs, ys) and (Xt, yt)
+
         Parameters
         ----------
-        Xs : array-like of shape = (n_source_samples, n_features)
+        Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
         ys : array-like, shape = (n_source_samples,)
             The class labels
-        Xt : array-like of shape = (n_target_samples, n_features)
+        Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
         yt : array-like, shape = (n_labeled_target_samples,)
             The class labels
+
         Returns
         -------
         self : object
@@ -1473,8 +1495,8 @@ class SinkhornLpl1Transport(BaseTransport):
 
         super(SinkhornLpl1Transport, self).fit(Xs, ys, Xt, yt)
 
-        self.Coupling_ = sinkhorn_lpl1_mm(
-            a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.Cost,
+        self.coupling_ = sinkhorn_lpl1_mm(
+            a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.cost_,
             reg=self.reg_e, eta=self.reg_cl, numItermax=self.max_iter,
             numInnerItermax=self.max_inner_iter, stopInnerThr=self.tol,
             verbose=self.verbose, log=self.log)
@@ -1517,7 +1539,7 @@ class SinkhornL1l2Transport(BaseTransport):
 
     Attributes
     ----------
-    Coupling_ : the optimal coupling
+    coupling_ : the optimal coupling
 
     References
     ----------
@@ -1554,16 +1576,18 @@ class SinkhornL1l2Transport(BaseTransport):
     def fit(self, Xs, ys=None, Xt=None, yt=None):
         """Build a coupling matrix from source and target sets of samples
         (Xs, ys) and (Xt, yt)
+
         Parameters
         ----------
-        Xs : array-like of shape = (n_source_samples, n_features)
+        Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
         ys : array-like, shape = (n_source_samples,)
             The class labels
-        Xt : array-like of shape = (n_target_samples, n_features)
+        Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
         yt : array-like, shape = (n_labeled_target_samples,)
             The class labels
+
         Returns
         -------
         self : object
@@ -1572,8 +1596,8 @@ class SinkhornL1l2Transport(BaseTransport):
 
         super(SinkhornL1l2Transport, self).fit(Xs, ys, Xt, yt)
 
-        self.Coupling_ = sinkhorn_l1l2_gl(
-            a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.Cost,
+        self.coupling_ = sinkhorn_l1l2_gl(
+            a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.cost_,
             reg=self.reg_e, eta=self.reg_cl, numItermax=self.max_iter,
             numInnerItermax=self.max_inner_iter, stopInnerThr=self.tol,
             verbose=self.verbose, log=self.log)
@@ -1614,8 +1638,8 @@ class MappingTransport(BaseEstimator):
 
     Attributes
     ----------
-    Coupling_ : the optimal coupling
-    Mapping_ : the mapping associated
+    coupling_ : the optimal coupling
+    mapping_ : the mapping associated
 
     References
     ----------
@@ -1646,16 +1670,18 @@ class MappingTransport(BaseEstimator):
     def fit(self, Xs=None, ys=None, Xt=None, yt=None):
         """Builds an optimal coupling and estimates the associated mapping
         from source and target sets of samples (Xs, ys) and (Xt, yt)
+
         Parameters
         ----------
-        Xs : array-like of shape = (n_source_samples, n_features)
+        Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
         ys : array-like, shape = (n_source_samples,)
             The class labels
-        Xt : array-like of shape = (n_target_samples, n_features)
+        Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
         yt : array-like, shape = (n_labeled_target_samples,)
             The class labels
+
         Returns
         -------
         self : object
@@ -1666,14 +1692,14 @@ class MappingTransport(BaseEstimator):
         self.Xt = Xt
 
         if self.kernel == "linear":
-            self.Coupling_, self.Mapping_ = joint_OT_mapping_linear(
+            self.coupling_, self.mapping_ = joint_OT_mapping_linear(
                 Xs, Xt, mu=self.mu, eta=self.eta, bias=self.bias,
                 verbose=self.verbose, verbose2=self.verbose2,
                 numItermax=self.max_iter, numInnerItermax=self.max_inner_iter,
                 stopThr=self.tol, stopInnerThr=self.inner_tol, log=self.log)
 
         elif self.kernel == "gaussian":
-            self.Coupling_, self.Mapping_ = joint_OT_mapping_kernel(
+            self.coupling_, self.mapping_ = joint_OT_mapping_kernel(
                 Xs, Xt, mu=self.mu, eta=self.eta, bias=self.bias,
                 sigma=self.sigma, verbose=self.verbose, verbose2=self.verbose,
                 numItermax=self.max_iter, numInnerItermax=self.max_inner_iter,
@@ -1683,20 +1709,21 @@ class MappingTransport(BaseEstimator):
 
     def transform(self, Xs):
         """Transports source samples Xs onto target ones Xt
+
         Parameters
         ----------
-        Xs : array-like of shape = (n_source_samples, n_features)
+        Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
 
         Returns
         -------
-        transp_Xs : array-like of shape = (n_source_samples, n_features)
+        transp_Xs : array-like, shape (n_source_samples, n_features)
             The transport source samples.
         """
 
         if np.array_equal(self.Xs, Xs):
             # perform standard barycentric mapping
-            transp = self.Coupling_ / np.sum(self.Coupling_, 1)[:, None]
+            transp = self.coupling_ / np.sum(self.coupling_, 1)[:, None]
 
             # set nans to 0
             transp[~ np.isfinite(transp)] = 0
@@ -1710,6 +1737,6 @@ class MappingTransport(BaseEstimator):
                 K = Xs
             if self.bias:
                 K = np.hstack((K, np.ones((Xs.shape[0], 1))))
-            transp_Xs = K.dot(self.Mapping_)
+            transp_Xs = K.dot(self.mapping_)
 
         return transp_Xs
diff --git a/test/test_da.py b/test/test_da.py
index aed9f61..93f7e83 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -5,13 +5,12 @@
 # License: MIT License
 
 import numpy as np
-import ot
 from numpy.testing.utils import assert_allclose, assert_equal
+
+import ot
 from ot.datasets import get_data_classif
 from ot.utils import unif
 
-np.random.seed(42)
-
 
 def test_sinkhorn_lpl1_transport_class():
     """test_sinkhorn_transport
@@ -325,3 +324,11 @@ def test_otda():
     da_emd = ot.da.OTDA_mapping_kernel()     # init class
     da_emd.fit(xs, xt, numItermax=10)       # fit distributions
     da_emd.predict(xs)    # interpolation of source samples
+
+
+if __name__ == "__main__":
+
+    test_sinkhorn_transport_class()
+    test_emd_transport_class()
+    test_sinkhorn_l1l2_transport_class()
+    test_sinkhorn_lpl1_transport_class()
-- 
cgit v1.2.3


From 8d19d365446efc00d8443c6ddb5b93fded3fa5ab Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Wed, 23 Aug 2017 13:50:24 +0200
Subject: out of samples transform and inverse transform by batch

---
 ot/da.py        | 89 +++++++++++++++++++++++++++++++++++++--------------------
 test/test_da.py | 66 +++++++++++++++++++++---------------------
 2 files changed, 91 insertions(+), 64 deletions(-)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index 044d567..0c83ae6 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -1147,7 +1147,7 @@ class BaseTransport(BaseEstimator):
 
         return self.fit(Xs, ys, Xt, yt).transform(Xs, ys, Xt, yt)
 
-    def transform(self, Xs=None, ys=None, Xt=None, yt=None):
+    def transform(self, Xs=None, ys=None, Xt=None, yt=None, batch_size=128):
         """Transports source samples Xs onto target ones Xt
 
         Parameters
@@ -1160,6 +1160,8 @@ class BaseTransport(BaseEstimator):
             The training input samples.
         yt : array-like, shape (n_labeled_target_samples,)
             The class labels
+        batch_size : int, optional (default=128)
+            The batch size for out of sample transform
 
         Returns
         -------
@@ -1178,34 +1180,48 @@ class BaseTransport(BaseEstimator):
             transp_Xs = np.dot(transp, self.Xt)
         else:
             # perform out of sample mapping
+            indices = np.arange(Xs.shape[0])
+            batch_ind = [
+                indices[i:i + batch_size]
+                for i in range(0, len(indices), batch_size)]
 
-            # get the nearest neighbor in the source domain
-            D0 = dist(Xs, self.Xs)
-            idx = np.argmin(D0, axis=1)
+            transp_Xs = []
+            for bi in batch_ind:
 
-            # transport the source samples
-            transp = self.coupling_ / np.sum(self.coupling_, 1)[:, None]
-            transp[~ np.isfinite(transp)] = 0
-            transp_Xs_ = np.dot(transp, self.Xt)
+                # get the nearest neighbor in the source domain
+                D0 = dist(Xs[bi], self.Xs)
+                idx = np.argmin(D0, axis=1)
+
+                # transport the source samples
+                transp = self.coupling_ / np.sum(self.coupling_, 1)[:, None]
+                transp[~ np.isfinite(transp)] = 0
+                transp_Xs_ = np.dot(transp, self.Xt)
 
-            # define the transported points
-            transp_Xs = transp_Xs_[idx, :] + Xs - self.Xs[idx, :]
+                # define the transported points
+                transp_Xs_ = transp_Xs_[idx, :] + Xs[bi] - self.Xs[idx, :]
+
+                transp_Xs.append(transp_Xs_)
+
+            transp_Xs = np.concatenate(transp_Xs, axis=0)
 
         return transp_Xs
 
-    def inverse_transform(self, Xs=None, ys=None, Xt=None, yt=None):
+    def inverse_transform(self, Xs=None, ys=None, Xt=None, yt=None,
+                          batch_size=128):
         """Transports target samples Xt onto target samples Xs
 
         Parameters
         ----------
         Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
-        ys : array-like, shape = (n_source_samples,)
+        ys : array-like, shape (n_source_samples,)
             The class labels
         Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
-        yt : array-like, shape = (n_labeled_target_samples,)
+        yt : array-like, shape (n_labeled_target_samples,)
             The class labels
+        batch_size : int, optional (default=128)
+            The batch size for out of sample inverse transform
 
         Returns
         -------
@@ -1224,17 +1240,28 @@ class BaseTransport(BaseEstimator):
             transp_Xt = np.dot(transp_, self.Xs)
         else:
             # perform out of sample mapping
+            indices = np.arange(Xt.shape[0])
+            batch_ind = [
+                indices[i:i + batch_size]
+                for i in range(0, len(indices), batch_size)]
 
-            D0 = dist(Xt, self.Xt)
-            idx = np.argmin(D0, axis=1)
+            transp_Xt = []
+            for bi in batch_ind:
 
-            # transport the target samples
-            transp_ = self.coupling_.T / np.sum(self.coupling_, 0)[:, None]
-            transp_[~ np.isfinite(transp_)] = 0
-            transp_Xt_ = np.dot(transp_, self.Xs)
+                D0 = dist(Xt[bi], self.Xt)
+                idx = np.argmin(D0, axis=1)
+
+                # transport the target samples
+                transp_ = self.coupling_.T / np.sum(self.coupling_, 0)[:, None]
+                transp_[~ np.isfinite(transp_)] = 0
+                transp_Xt_ = np.dot(transp_, self.Xs)
+
+                # define the transported points
+                transp_Xt_ = transp_Xt_[idx, :] + Xt[bi] - self.Xt[idx, :]
 
-            # define the transported points
-            transp_Xt = transp_Xt_[idx, :] + Xt - self.Xt[idx, :]
+                transp_Xt.append(transp_Xt_)
+
+            transp_Xt = np.concatenate(transp_Xt, axis=0)
 
         return transp_Xt
 
@@ -1306,11 +1333,11 @@ class SinkhornTransport(BaseTransport):
         ----------
         Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
-        ys : array-like, shape = (n_source_samples,)
+        ys : array-like, shape (n_source_samples,)
             The class labels
         Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
-        yt : array-like, shape = (n_labeled_target_samples,)
+        yt : array-like, shape (n_labeled_target_samples,)
             The class labels
 
         Returns
@@ -1381,11 +1408,11 @@ class EMDTransport(BaseTransport):
         ----------
         Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
-        ys : array-like, shape = (n_source_samples,)
+        ys : array-like, shape (n_source_samples,)
             The class labels
         Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
-        yt : array-like, shape = (n_labeled_target_samples,)
+        yt : array-like, shape (n_labeled_target_samples,)
             The class labels
 
         Returns
@@ -1480,11 +1507,11 @@ class SinkhornLpl1Transport(BaseTransport):
         ----------
         Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
-        ys : array-like, shape = (n_source_samples,)
+        ys : array-like, shape (n_source_samples,)
             The class labels
         Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
-        yt : array-like, shape = (n_labeled_target_samples,)
+        yt : array-like, shape (n_labeled_target_samples,)
             The class labels
 
         Returns
@@ -1581,11 +1608,11 @@ class SinkhornL1l2Transport(BaseTransport):
         ----------
         Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
-        ys : array-like, shape = (n_source_samples,)
+        ys : array-like, shape (n_source_samples,)
             The class labels
         Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
-        yt : array-like, shape = (n_labeled_target_samples,)
+        yt : array-like, shape (n_labeled_target_samples,)
             The class labels
 
         Returns
@@ -1675,11 +1702,11 @@ class MappingTransport(BaseEstimator):
         ----------
         Xs : array-like, shape (n_source_samples, n_features)
             The training input samples.
-        ys : array-like, shape = (n_source_samples,)
+        ys : array-like, shape (n_source_samples,)
             The class labels
         Xt : array-like, shape (n_target_samples, n_features)
             The training input samples.
-        yt : array-like, shape = (n_labeled_target_samples,)
+        yt : array-like, shape (n_labeled_target_samples,)
             The class labels
 
         Returns
diff --git a/test/test_da.py b/test/test_da.py
index 93f7e83..196f4c4 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -28,14 +28,14 @@ def test_sinkhorn_lpl1_transport_class():
     clf.fit(Xs=Xs, ys=ys, Xt=Xt)
 
     # test dimensions of coupling
-    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
-    assert_equal(clf.Coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
 
     # test margin constraints
     mu_s = unif(ns)
     mu_t = unif(nt)
-    assert_allclose(np.sum(clf.Coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
-    assert_allclose(np.sum(clf.Coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
 
     # test transform
     transp_Xs = clf.transform(Xs=Xs)
@@ -64,13 +64,13 @@ def test_sinkhorn_lpl1_transport_class():
     # test semi supervised mode
     clf = ot.da.SinkhornLpl1Transport()
     clf.fit(Xs=Xs, ys=ys, Xt=Xt)
-    n_unsup = np.sum(clf.Cost)
+    n_unsup = np.sum(clf.cost_)
 
     # test semi supervised mode
     clf = ot.da.SinkhornLpl1Transport()
     clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
-    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
-    n_semisup = np.sum(clf.Cost)
+    assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
+    n_semisup = np.sum(clf.cost_)
 
     assert n_unsup != n_semisup, "semisupervised mode not working"
 
@@ -91,14 +91,14 @@ def test_sinkhorn_l1l2_transport_class():
     clf.fit(Xs=Xs, ys=ys, Xt=Xt)
 
     # test dimensions of coupling
-    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
-    assert_equal(clf.Coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
 
     # test margin constraints
     mu_s = unif(ns)
     mu_t = unif(nt)
-    assert_allclose(np.sum(clf.Coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
-    assert_allclose(np.sum(clf.Coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
 
     # test transform
     transp_Xs = clf.transform(Xs=Xs)
@@ -127,13 +127,13 @@ def test_sinkhorn_l1l2_transport_class():
     # test semi supervised mode
     clf = ot.da.SinkhornL1l2Transport()
     clf.fit(Xs=Xs, ys=ys, Xt=Xt)
-    n_unsup = np.sum(clf.Cost)
+    n_unsup = np.sum(clf.cost_)
 
     # test semi supervised mode
     clf = ot.da.SinkhornL1l2Transport()
     clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
-    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
-    n_semisup = np.sum(clf.Cost)
+    assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
+    n_semisup = np.sum(clf.cost_)
 
     assert n_unsup != n_semisup, "semisupervised mode not working"
 
@@ -154,14 +154,14 @@ def test_sinkhorn_transport_class():
     clf.fit(Xs=Xs, Xt=Xt)
 
     # test dimensions of coupling
-    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
-    assert_equal(clf.Coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
 
     # test margin constraints
     mu_s = unif(ns)
     mu_t = unif(nt)
-    assert_allclose(np.sum(clf.Coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
-    assert_allclose(np.sum(clf.Coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
 
     # test transform
     transp_Xs = clf.transform(Xs=Xs)
@@ -190,13 +190,13 @@ def test_sinkhorn_transport_class():
     # test semi supervised mode
     clf = ot.da.SinkhornTransport()
     clf.fit(Xs=Xs, Xt=Xt)
-    n_unsup = np.sum(clf.Cost)
+    n_unsup = np.sum(clf.cost_)
 
     # test semi supervised mode
     clf = ot.da.SinkhornTransport()
     clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
-    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
-    n_semisup = np.sum(clf.Cost)
+    assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
+    n_semisup = np.sum(clf.cost_)
 
     assert n_unsup != n_semisup, "semisupervised mode not working"
 
@@ -217,14 +217,14 @@ def test_emd_transport_class():
     clf.fit(Xs=Xs, Xt=Xt)
 
     # test dimensions of coupling
-    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
-    assert_equal(clf.Coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
 
     # test margin constraints
     mu_s = unif(ns)
     mu_t = unif(nt)
-    assert_allclose(np.sum(clf.Coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
-    assert_allclose(np.sum(clf.Coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
 
     # test transform
     transp_Xs = clf.transform(Xs=Xs)
@@ -253,13 +253,13 @@ def test_emd_transport_class():
     # test semi supervised mode
     clf = ot.da.EMDTransport()
     clf.fit(Xs=Xs, Xt=Xt)
-    n_unsup = np.sum(clf.Cost)
+    n_unsup = np.sum(clf.cost_)
 
     # test semi supervised mode
     clf = ot.da.EMDTransport()
     clf.fit(Xs=Xs, ys=ys, Xt=Xt, yt=yt)
-    assert_equal(clf.Cost.shape, ((Xs.shape[0], Xt.shape[0])))
-    n_semisup = np.sum(clf.Cost)
+    assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
+    n_semisup = np.sum(clf.cost_)
 
     assert n_unsup != n_semisup, "semisupervised mode not working"
 
@@ -326,9 +326,9 @@ def test_otda():
     da_emd.predict(xs)    # interpolation of source samples
 
 
-if __name__ == "__main__":
+# if __name__ == "__main__":
 
-    test_sinkhorn_transport_class()
-    test_emd_transport_class()
-    test_sinkhorn_l1l2_transport_class()
-    test_sinkhorn_lpl1_transport_class()
+#     test_sinkhorn_transport_class()
+#     test_emd_transport_class()
+#     test_sinkhorn_l1l2_transport_class()
+#     test_sinkhorn_lpl1_transport_class()
-- 
cgit v1.2.3


From c8ae5843ae64dbf841deb3ad8c10024a94a93eec Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Wed, 23 Aug 2017 14:11:13 +0200
Subject: test functions for MappingTransport Class

---
 ot/da.py        |  18 ++++++---
 test/test_da.py | 117 +++++++++++++++++++++++++++++++++++++++++++++++++++++---
 2 files changed, 125 insertions(+), 10 deletions(-)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index 0c83ae6..3ccb1b3 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -1665,8 +1665,14 @@ class MappingTransport(BaseEstimator):
 
     Attributes
     ----------
-    coupling_ : the optimal coupling
-    mapping_ : the mapping associated
+    coupling_ : array-like, shape (n_source_samples, n_target_samples)
+        The optimal coupling
+    mapping_ : array-like
+        The associated mapping. Its shape depends on the kernel, with the
+        extra (+ 1) row present only if bias is True:
+
+        shape (n_features (+ 1), n_features) for kernel == linear
+        shape (n_source_samples (+ 1), n_features) for kernel == gaussian
 
     References
     ----------
@@ -1679,20 +1685,22 @@ class MappingTransport(BaseEstimator):
 
     def __init__(self, mu=1, eta=0.001, bias=False, metric="sqeuclidean",
                  kernel="linear", sigma=1, max_iter=100, tol=1e-5,
-                 max_inner_iter=10, inner_tol=1e-6, log=False, verbose=False):
+                 max_inner_iter=10, inner_tol=1e-6, log=False, verbose=False,
+                 verbose2=False):
 
         self.metric = metric
         self.mu = mu
         self.eta = eta
         self.bias = bias
         self.kernel = kernel
-        self.sigma
+        self.sigma = sigma
         self.max_iter = max_iter
         self.tol = tol
         self.max_inner_iter = max_inner_iter
         self.inner_tol = inner_tol
         self.log = log
         self.verbose = verbose
+        self.verbose2 = verbose2
 
     def fit(self, Xs=None, ys=None, Xt=None, yt=None):
         """Builds an optimal coupling and estimates the associated mapping
@@ -1712,7 +1720,7 @@ class MappingTransport(BaseEstimator):
         Returns
         -------
         self : object
-            Returns self.
+            Returns self
         """
 
         self.Xs = Xs
diff --git a/test/test_da.py b/test/test_da.py
index 196f4c4..162f681 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -264,6 +264,112 @@ def test_emd_transport_class():
     assert n_unsup != n_semisup, "semisupervised mode not working"
 
 
+def test_mapping_transport_class():
+    """test_mapping_transport
+    """
+
+    ns = 150
+    nt = 200
+
+    Xs, ys = get_data_classif('3gauss', ns)
+    Xt, yt = get_data_classif('3gauss2', nt)
+    Xs_new, _ = get_data_classif('3gauss', ns + 1)
+
+    ##########################################################################
+    # kernel == linear mapping tests
+    ##########################################################################
+
+    # check computation and dimensions if bias == False
+    clf = ot.da.MappingTransport(kernel="linear", bias=False)
+    clf.fit(Xs=Xs, Xt=Xt)
+
+    assert_equal(clf.coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.mapping_.shape, ((Xs.shape[1], Xt.shape[1])))
+
+    # test margin constraints
+    mu_s = unif(ns)
+    mu_t = unif(nt)
+    assert_allclose(np.sum(clf.coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+
+    # test transform
+    transp_Xs = clf.transform(Xs=Xs)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
+    transp_Xs_new = clf.transform(Xs_new)
+
+    # check that the oos method is working
+    assert_equal(transp_Xs_new.shape, Xs_new.shape)
+
+    # check computation and dimensions if bias == True
+    clf = ot.da.MappingTransport(kernel="linear", bias=True)
+    clf.fit(Xs=Xs, Xt=Xt)
+    assert_equal(clf.coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.mapping_.shape, ((Xs.shape[1] + 1, Xt.shape[1])))
+
+    # test margin constraints
+    mu_s = unif(ns)
+    mu_t = unif(nt)
+    assert_allclose(np.sum(clf.coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+
+    # test transform
+    transp_Xs = clf.transform(Xs=Xs)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
+    transp_Xs_new = clf.transform(Xs_new)
+
+    # check that the oos method is working
+    assert_equal(transp_Xs_new.shape, Xs_new.shape)
+
+    ##########################################################################
+    # kernel == gaussian mapping tests
+    ##########################################################################
+
+    # check computation and dimensions if bias == False
+    clf = ot.da.MappingTransport(kernel="gaussian", bias=False)
+    clf.fit(Xs=Xs, Xt=Xt)
+
+    assert_equal(clf.coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.mapping_.shape, ((Xs.shape[0], Xt.shape[1])))
+
+    # test margin constraints
+    mu_s = unif(ns)
+    mu_t = unif(nt)
+    assert_allclose(np.sum(clf.coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+
+    # test transform
+    transp_Xs = clf.transform(Xs=Xs)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
+    transp_Xs_new = clf.transform(Xs_new)
+
+    # check that the oos method is working
+    assert_equal(transp_Xs_new.shape, Xs_new.shape)
+
+    # check computation and dimensions if bias == True
+    clf = ot.da.MappingTransport(kernel="gaussian", bias=True)
+    clf.fit(Xs=Xs, Xt=Xt)
+    assert_equal(clf.coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
+    assert_equal(clf.mapping_.shape, ((Xs.shape[0] + 1, Xt.shape[1])))
+
+    # test margin constraints
+    mu_s = unif(ns)
+    mu_t = unif(nt)
+    assert_allclose(np.sum(clf.coupling_, axis=0), mu_t, rtol=1e-3, atol=1e-3)
+    assert_allclose(np.sum(clf.coupling_, axis=1), mu_s, rtol=1e-3, atol=1e-3)
+
+    # test transform
+    transp_Xs = clf.transform(Xs=Xs)
+    assert_equal(transp_Xs.shape, Xs.shape)
+
+    transp_Xs_new = clf.transform(Xs_new)
+
+    # check that the oos method is working
+    assert_equal(transp_Xs_new.shape, Xs_new.shape)
+
+
 def test_otda():
 
     n_samples = 150  # nb samples
@@ -326,9 +432,10 @@ def test_otda():
     da_emd.predict(xs)    # interpolation of source samples
 
 
-# if __name__ == "__main__":
+if __name__ == "__main__":
 
-#     test_sinkhorn_transport_class()
-#     test_emd_transport_class()
-#     test_sinkhorn_l1l2_transport_class()
-#     test_sinkhorn_lpl1_transport_class()
+    # test_sinkhorn_transport_class()
+    # test_emd_transport_class()
+    # test_sinkhorn_l1l2_transport_class()
+    # test_sinkhorn_lpl1_transport_class()
+    test_mapping_transport_class()
-- 
cgit v1.2.3


From fc58f39fc730a9e1bb2215ef063e37c50f0ebc1f Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Wed, 23 Aug 2017 15:09:08 +0200
Subject: added deprecation warning on old classes

---
 ot/da.py          |  22 ++++++++++--
 ot/deprecation.py | 103 ++++++++++++++++++++++++++++++++++++++++++++++++++++++
 test/test_da.py   |   5 +--
 3 files changed, 126 insertions(+), 4 deletions(-)
 create mode 100644 ot/deprecation.py

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index 3ccb1b3..8fa1895 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -10,12 +10,14 @@ Domain adaptation with optimal transport
 # License: MIT License
 
 import numpy as np
+import warnings
+
 from .bregman import sinkhorn
 from .lp import emd
 from .utils import unif, dist, kernel
 from .optim import cg
 from .optim import gcg
-import warnings
+from .deprecation import deprecated
 
 
 def sinkhorn_lpl1_mm(a, labels_a, b, M, reg, eta=0.1, numItermax=10,
@@ -632,6 +634,9 @@ def joint_OT_mapping_kernel(xs, xt, mu=1, eta=0.001, kerneltype='gaussian',
         return G, L
 
 
+@deprecated("The class OTDA is deprecated in 0.3.1 and will be "
+            "removed in 0.5"
+            "\n\tfor standard transport use class EMDTransport instead.")
 class OTDA(object):
 
     """Class for domain adaptation with optimal transport as proposed in [5]
@@ -758,10 +763,15 @@ class OTDA(object):
             self.M = np.log(1 + np.log(1 + self.M))
 
 
+@deprecated("The class OTDA_sinkhorn is deprecated in 0.3.1 and will be"
+            " removed in 0.5 \nUse class SinkhornTransport instead.")
 class OTDA_sinkhorn(OTDA):
 
     """Class for domain adaptation with optimal transport with entropic
-    regularization"""
+    regularization
+
+
+    """
 
     def fit(self, xs, xt, reg=1, ws=None, wt=None, norm=None, **kwargs):
         """Fit regularized domain adaptation between samples is xs and xt
@@ -783,6 +793,8 @@ class OTDA_sinkhorn(OTDA):
         self.computed = True
 
 
+@deprecated("The class OTDA_lpl1 is deprecated in 0.3.1 and will be"
+            " removed in 0.5 \nUse class SinkhornLpl1Transport instead.")
 class OTDA_lpl1(OTDA):
 
     """Class for domain adaptation with optimal transport with entropic and
@@ -810,6 +822,8 @@ class OTDA_lpl1(OTDA):
         self.computed = True
 
 
+@deprecated("The class OTDA_l1L2 is deprecated in 0.3.1 and will be"
+            " removed in 0.5 \nUse class SinkhornL1l2Transport instead.")
 class OTDA_l1l2(OTDA):
 
     """Class for domain adaptation with optimal transport with entropic
@@ -837,6 +851,8 @@ class OTDA_l1l2(OTDA):
         self.computed = True
 
 
+@deprecated("The class OTDA_mapping_linear is deprecated in 0.3.1 and will be"
+            " removed in 0.5 \nUse class MappingTransport instead.")
 class OTDA_mapping_linear(OTDA):
 
     """Class for optimal transport with joint linear mapping estimation as in
@@ -882,6 +898,8 @@ class OTDA_mapping_linear(OTDA):
             return None
 
 
+@deprecated("The class OTDA_mapping_kernel is deprecated in 0.3.1 and will be"
+            " removed in 0.5 \nUse class MappingTransport instead.")
 class OTDA_mapping_kernel(OTDA_mapping_linear):
 
     """Class for optimal transport with joint nonlinear mapping
diff --git a/ot/deprecation.py b/ot/deprecation.py
new file mode 100644
index 0000000..2b16427
--- /dev/null
+++ b/ot/deprecation.py
@@ -0,0 +1,103 @@
+"""
+    deprecated class from scikit-learn package
+    https://github.com/scikit-learn/scikit-learn/blob/master/sklearn/utils/deprecation.py
+"""
+
+import sys
+import warnings
+
+__all__ = ["deprecated", ]
+
+
+class deprecated(object):
+    """Decorator to mark a function or class as deprecated.
+    Issue a warning when the function is called/the class is instantiated and
+    adds a warning to the docstring.
+    The optional extra argument will be appended to the deprecation message
+    and the docstring. Note: to use this with the default value for extra, put
+    in an empty pair of parentheses:
+    >>> from ot.deprecation import deprecated
+    >>> @deprecated()
+    ... def some_function(): pass
+
+    Parameters
+    ----------
+    extra : string
+          to be added to the deprecation messages
+    """
+
+    # Adapted from http://wiki.python.org/moin/PythonDecoratorLibrary,
+    # but with many changes.
+
+    def __init__(self, extra=''):
+        self.extra = extra
+
+    def __call__(self, obj):
+        """Call method
+        Parameters
+        ----------
+        obj : object
+        """
+        if isinstance(obj, type):
+            return self._decorate_class(obj)
+        else:
+            return self._decorate_fun(obj)
+
+    def _decorate_class(self, cls):
+        msg = "Class %s is deprecated" % cls.__name__
+        if self.extra:
+            msg += "; %s" % self.extra
+
+        # FIXME: we should probably reset __new__ for full generality
+        init = cls.__init__
+
+        def wrapped(*args, **kwargs):
+            warnings.warn(msg, category=DeprecationWarning)
+            return init(*args, **kwargs)
+
+        cls.__init__ = wrapped
+
+        wrapped.__name__ = '__init__'
+        wrapped.__doc__ = self._update_doc(init.__doc__)
+        wrapped.deprecated_original = init
+
+        return cls
+
+    def _decorate_fun(self, fun):
+        """Decorate function fun"""
+
+        msg = "Function %s is deprecated" % fun.__name__
+        if self.extra:
+            msg += "; %s" % self.extra
+
+        def wrapped(*args, **kwargs):
+            warnings.warn(msg, category=DeprecationWarning)
+            return fun(*args, **kwargs)
+
+        wrapped.__name__ = fun.__name__
+        wrapped.__dict__ = fun.__dict__
+        wrapped.__doc__ = self._update_doc(fun.__doc__)
+
+        return wrapped
+
+    def _update_doc(self, olddoc):
+        newdoc = "DEPRECATED"
+        if self.extra:
+            newdoc = "%s: %s" % (newdoc, self.extra)
+        if olddoc:
+            newdoc = "%s\n\n%s" % (newdoc, olddoc)
+        return newdoc
+
+
+def _is_deprecated(func):
+    """Helper to check if func is wrapped by our deprecated decorator"""
+    if sys.version_info < (3, 5):
+        raise NotImplementedError("This is only available for python3.5 "
+                                  "or above")
+    closures = getattr(func, '__closure__', [])
+    if closures is None:
+        closures = []
+    is_deprecated = ('deprecated' in ''.join([c.cell_contents
+                                              for c in closures
+                     if isinstance(c.cell_contents, str)]))
+    return is_deprecated
diff --git a/test/test_da.py b/test/test_da.py
index 162f681..9578b3d 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -432,10 +432,11 @@ def test_otda():
     da_emd.predict(xs)    # interpolation of source samples
 
 
-if __name__ == "__main__":
+# if __name__ == "__main__":
 
+    # test_otda()
     # test_sinkhorn_transport_class()
     # test_emd_transport_class()
     # test_sinkhorn_l1l2_transport_class()
     # test_sinkhorn_lpl1_transport_class()
-    test_mapping_transport_class()
+    # test_mapping_transport_class()
-- 
cgit v1.2.3


From 6167f34a721886d4b9038a8b1746a2c8c81132ce Mon Sep 17 00:00:00 2001
From: Slasnista <stan.chambon@gmail.com>
Date: Fri, 25 Aug 2017 10:29:41 +0200
Subject: solving log issues to avoid errors and adding further tests

---
 ot/da.py        | 57 ++++++++++++++++++++++++++++++++++++++++++---------------
 test/test_da.py | 39 +++++++++++++++++++++++++++++++++------
 2 files changed, 75 insertions(+), 21 deletions(-)

(limited to 'test')

diff --git a/ot/da.py b/ot/da.py
index 8fa1895..5a34979 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -1315,7 +1315,10 @@ class SinkhornTransport(BaseTransport):
 
     Attributes
     ----------
-    coupling_ : the optimal coupling
+    coupling_ : array-like, shape (n_source_samples, n_target_samples)
+        The optimal coupling
+    log_ : dictionary
+        The dictionary of log, empty dict if parameter log is not True
 
     References
     ----------
@@ -1367,11 +1370,18 @@ class SinkhornTransport(BaseTransport):
         super(SinkhornTransport, self).fit(Xs, ys, Xt, yt)
 
         # coupling estimation
-        self.coupling_ = sinkhorn(
+        returned_ = sinkhorn(
             a=self.mu_s, b=self.mu_t, M=self.cost_, reg=self.reg_e,
             numItermax=self.max_iter, stopThr=self.tol,
             verbose=self.verbose, log=self.log)
 
+        # deal with the value of log
+        if self.log:
+            self.coupling_, self.log_ = returned_
+        else:
+            self.coupling_ = returned_
+            self.log_ = dict()
+
         return self
 
 
@@ -1400,7 +1410,8 @@ class EMDTransport(BaseTransport):
 
     Attributes
     ----------
-    coupling_ : the optimal coupling
+    coupling_ : array-like, shape (n_source_samples, n_target_samples)
+        The optimal coupling
 
     References
     ----------
@@ -1475,15 +1486,14 @@ class SinkhornLpl1Transport(BaseTransport):
         The number of iteration in the inner loop
     verbose : int, optional (default=0)
         Controls the verbosity of the optimization algorithm
-    log : int, optional (default=0)
-        Controls the logs of the optimization algorithm
     limit_max: float, optional (defaul=np.infty)
         Controls the semi supervised mode. Transport between labeled source
         and target samples of different classes will exhibit an infinite cost
 
     Attributes
     ----------
-    coupling_ : the optimal coupling
+    coupling_ : array-like, shape (n_source_samples, n_target_samples)
+        The optimal coupling
 
     References
     ----------
@@ -1500,7 +1510,7 @@ class SinkhornLpl1Transport(BaseTransport):
 
     def __init__(self, reg_e=1., reg_cl=0.1,
                  max_iter=10, max_inner_iter=200,
-                 tol=10e-9, verbose=False, log=False,
+                 tol=10e-9, verbose=False,
                  metric="sqeuclidean",
                  distribution_estimation=distribution_estimation_uniform,
                  out_of_sample_map='ferradans', limit_max=np.infty):
@@ -1511,7 +1521,6 @@ class SinkhornLpl1Transport(BaseTransport):
         self.max_inner_iter = max_inner_iter
         self.tol = tol
         self.verbose = verbose
-        self.log = log
         self.metric = metric
         self.distribution_estimation = distribution_estimation
         self.out_of_sample_map = out_of_sample_map
@@ -1544,7 +1553,7 @@ class SinkhornLpl1Transport(BaseTransport):
             a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.cost_,
             reg=self.reg_e, eta=self.reg_cl, numItermax=self.max_iter,
             numInnerItermax=self.max_inner_iter, stopInnerThr=self.tol,
-            verbose=self.verbose, log=self.log)
+            verbose=self.verbose)
 
         return self
 
@@ -1584,7 +1593,10 @@ class SinkhornL1l2Transport(BaseTransport):
 
     Attributes
     ----------
-    coupling_ : the optimal coupling
+    coupling_ : array-like, shape (n_source_samples, n_target_samples)
+        The optimal coupling
+    log_ : dictionary
+        The dictionary of log, empty dict if parameter log is not True
 
     References
     ----------
@@ -1641,12 +1653,19 @@ class SinkhornL1l2Transport(BaseTransport):
 
         super(SinkhornL1l2Transport, self).fit(Xs, ys, Xt, yt)
 
-        self.coupling_ = sinkhorn_l1l2_gl(
+        returned_ = sinkhorn_l1l2_gl(
             a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.cost_,
             reg=self.reg_e, eta=self.reg_cl, numItermax=self.max_iter,
             numInnerItermax=self.max_inner_iter, stopInnerThr=self.tol,
             verbose=self.verbose, log=self.log)
 
+        # deal with the value of log
+        if self.log:
+            self.coupling_, self.log_ = returned_
+        else:
+            self.coupling_ = returned_
+            self.log_ = dict()
+
         return self
 
 
@@ -1683,14 +1702,15 @@ class MappingTransport(BaseEstimator):
 
     Attributes
     ----------
-    coupling_ : array-like, shape (n_source_samples, n_features)
+    coupling_ : array-like, shape (n_source_samples, n_target_samples)
         The optimal coupling
     mapping_ : array-like, shape (n_features (+ 1), n_features)
         (if bias) for kernel == linear
         The associated mapping
-
         array-like, shape (n_source_samples (+ 1), n_features)
         (if bias) for kernel == gaussian
+    log_ : dictionary
+        The dictionary of log, empty dict if parameter log is not True
 
     References
     ----------
@@ -1745,19 +1765,26 @@ class MappingTransport(BaseEstimator):
         self.Xt = Xt
 
         if self.kernel == "linear":
-            self.coupling_, self.mapping_ = joint_OT_mapping_linear(
+            returned_ = joint_OT_mapping_linear(
                 Xs, Xt, mu=self.mu, eta=self.eta, bias=self.bias,
                 verbose=self.verbose, verbose2=self.verbose2,
                 numItermax=self.max_iter, numInnerItermax=self.max_inner_iter,
                 stopThr=self.tol, stopInnerThr=self.inner_tol, log=self.log)
 
         elif self.kernel == "gaussian":
-            self.coupling_, self.mapping_ = joint_OT_mapping_kernel(
+            returned_ = joint_OT_mapping_kernel(
                 Xs, Xt, mu=self.mu, eta=self.eta, bias=self.bias,
                 sigma=self.sigma, verbose=self.verbose, verbose2=self.verbose,
                 numItermax=self.max_iter, numInnerItermax=self.max_inner_iter,
                 stopInnerThr=self.inner_tol, stopThr=self.tol, log=self.log)
 
+        # deal with the value of log
+        if self.log:
+            self.coupling_, self.mapping_, self.log_ = returned_
+        else:
+            self.coupling_, self.mapping_ = returned_
+            self.log_ = dict()
+
         return self
 
     def transform(self, Xs):
diff --git a/test/test_da.py b/test/test_da.py
index 9578b3d..104a798 100644
--- a/test/test_da.py
+++ b/test/test_da.py
@@ -26,6 +26,8 @@ def test_sinkhorn_lpl1_transport_class():
 
     # test its computed
     clf.fit(Xs=Xs, ys=ys, Xt=Xt)
+    assert hasattr(clf, "cost_")
+    assert hasattr(clf, "coupling_")
 
     # test dimensions of coupling
     assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
@@ -89,6 +91,9 @@ def test_sinkhorn_l1l2_transport_class():
 
     # test its computed
     clf.fit(Xs=Xs, ys=ys, Xt=Xt)
+    assert hasattr(clf, "cost_")
+    assert hasattr(clf, "coupling_")
+    assert hasattr(clf, "log_")
 
     # test dimensions of coupling
     assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
@@ -137,6 +142,11 @@ def test_sinkhorn_l1l2_transport_class():
 
     assert n_unsup != n_semisup, "semisupervised mode not working"
 
+    # check everything runs well with log=True
+    clf = ot.da.SinkhornL1l2Transport(log=True)
+    clf.fit(Xs=Xs, ys=ys, Xt=Xt)
+    assert len(clf.log_.keys()) != 0
+
 
 def test_sinkhorn_transport_class():
     """test_sinkhorn_transport
@@ -152,6 +162,9 @@ def test_sinkhorn_transport_class():
 
     # test its computed
     clf.fit(Xs=Xs, Xt=Xt)
+    assert hasattr(clf, "cost_")
+    assert hasattr(clf, "coupling_")
+    assert hasattr(clf, "log_")
 
     # test dimensions of coupling
     assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
@@ -200,6 +213,11 @@ def test_sinkhorn_transport_class():
 
     assert n_unsup != n_semisup, "semisupervised mode not working"
 
+    # check everything runs well with log=True
+    clf = ot.da.SinkhornTransport(log=True)
+    clf.fit(Xs=Xs, ys=ys, Xt=Xt)
+    assert len(clf.log_.keys()) != 0
+
 
 def test_emd_transport_class():
     """test_sinkhorn_transport
@@ -215,6 +233,8 @@ def test_emd_transport_class():
 
     # test its computed
     clf.fit(Xs=Xs, Xt=Xt)
+    assert hasattr(clf, "cost_")
+    assert hasattr(clf, "coupling_")
 
     # test dimensions of coupling
     assert_equal(clf.cost_.shape, ((Xs.shape[0], Xt.shape[0])))
@@ -282,6 +302,9 @@ def test_mapping_transport_class():
     # check computation and dimensions if bias == False
     clf = ot.da.MappingTransport(kernel="linear", bias=False)
     clf.fit(Xs=Xs, Xt=Xt)
+    assert hasattr(clf, "coupling_")
+    assert hasattr(clf, "mapping_")
+    assert hasattr(clf, "log_")
 
     assert_equal(clf.coupling_.shape, ((Xs.shape[0], Xt.shape[0])))
     assert_equal(clf.mapping_.shape, ((Xs.shape[1], Xt.shape[1])))
@@ -369,6 +392,11 @@ def test_mapping_transport_class():
     # check that the oos method is working
     assert_equal(transp_Xs_new.shape, Xs_new.shape)
 
+    # check everything runs well with log=True
+    clf = ot.da.MappingTransport(kernel="gaussian", log=True)
+    clf.fit(Xs=Xs, Xt=Xt)
+    assert len(clf.log_.keys()) != 0
+
 
 def test_otda():
 
@@ -434,9 +462,8 @@ def test_otda():
 
 # if __name__ == "__main__":
 
-    # test_otda()
-    # test_sinkhorn_transport_class()
-    # test_emd_transport_class()
-    # test_sinkhorn_l1l2_transport_class()
-    # test_sinkhorn_lpl1_transport_class()
-    # test_mapping_transport_class()
+#     test_sinkhorn_transport_class()
+#     test_emd_transport_class()
+#     test_sinkhorn_l1l2_transport_class()
+#     test_sinkhorn_lpl1_transport_class()
+#     test_mapping_transport_class()
-- 
cgit v1.2.3


From 8c525174bb664cafa98dfff73dce9d42d7818f71 Mon Sep 17 00:00:00 2001
From: Nicolas Courty <Nico@pc-mna-08.univ-ubs.fr>
Date: Thu, 31 Aug 2017 16:44:18 +0200
Subject: Minor corrections suggested by @agramfort + new barycenter example +
 test function

---
 README.md                          |   2 +-
 data/carre.png                     | Bin 0 -> 168 bytes
 data/coeur.png                     | Bin 0 -> 225 bytes
 data/rond.png                      | Bin 0 -> 230 bytes
 data/triangle.png                  | Bin 0 -> 254 bytes
 examples/plot_gromov.py            |  14 +--
 examples/plot_gromov_barycenter.py | 240 +++++++++++++++++++++++++++++++++++++
 ot/gromov.py                       |  36 +++---
 test/test_gromov.py                |  38 ++++++
 9 files changed, 302 insertions(+), 28 deletions(-)
 create mode 100755 data/carre.png
 create mode 100755 data/coeur.png
 create mode 100755 data/rond.png
 create mode 100755 data/triangle.png
 create mode 100755 examples/plot_gromov_barycenter.py
 create mode 100644 test/test_gromov.py

(limited to 'test')

diff --git a/README.md b/README.md
index 257244b..22b20a4 100644
--- a/README.md
+++ b/README.md
@@ -185,4 +185,4 @@ You can also post bug reports and feature requests in Github issues. Make sure t
 
 [11] Flamary, R., Cuturi, M., Courty, N., & Rakotomamonjy, A. (2016). [Wasserstein Discriminant Analysis](https://arxiv.org/pdf/1608.08063.pdf). arXiv preprint arXiv:1608.08063.
 
-[12] Peyré, Gabriel, Marco Cuturi, and Justin Solomon, [Gromov-Wasserstein averaging of kernel and distance matrices](http://proceedings.mlr.press/v48/peyre16.html)  International Conference on Machine Learning (ICML). 2016.
+[12] Gabriel Peyré, Marco Cuturi, and Justin Solomon, [Gromov-Wasserstein averaging of kernel and distance matrices](http://proceedings.mlr.press/v48/peyre16.html)  International Conference on Machine Learning (ICML). 2016.
diff --git a/data/carre.png b/data/carre.png
new file mode 100755
index 0000000..45ff0ef
Binary files /dev/null and b/data/carre.png differ
diff --git a/data/coeur.png b/data/coeur.png
new file mode 100755
index 0000000..3f511a6
Binary files /dev/null and b/data/coeur.png differ
diff --git a/data/rond.png b/data/rond.png
new file mode 100755
index 0000000..1c1a068
Binary files /dev/null and b/data/rond.png differ
diff --git a/data/triangle.png b/data/triangle.png
new file mode 100755
index 0000000..ca36d09
Binary files /dev/null and b/data/triangle.png differ
diff --git a/examples/plot_gromov.py b/examples/plot_gromov.py
index a33fde1..9bbdbde 100644
--- a/examples/plot_gromov.py
+++ b/examples/plot_gromov.py
@@ -1,8 +1,8 @@
 # -*- coding: utf-8 -*-
 """
-====================
+==========================
 Gromov-Wasserstein example
-====================
+==========================
 This example is designed to show how to use the Gromov-Wassertsein distance
 computation in POT.
 """
@@ -14,14 +14,14 @@ computation in POT.
 
 import scipy as sp
 import numpy as np
+import matplotlib.pylab as pl
 
 import ot
-import matplotlib.pylab as pl
 
 
 """
 Sample two Gaussian distributions (2D and 3D)
-====================
+=============================================
 The Gromov-Wasserstein distance allows to compute distances with samples that do not belong to the same metric space.
 For demonstration purpose, we sample two Gaussian distributions in 2- and 3-dimensional spaces.
 """
@@ -42,7 +42,7 @@ xt = np.random.randn(n, 3).dot(P) + mu_t
 
 """
 Plotting the distributions
-====================
+==========================
 """
 fig = pl.figure()
 ax1 = fig.add_subplot(121)
@@ -54,7 +54,7 @@ pl.show()
 
 """
 Compute distance kernels, normalize them and then display
-====================
+=========================================================
 """
 
 C1 = sp.spatial.distance.cdist(xs, xs)
@@ -72,7 +72,7 @@ pl.show()
 
 """
 Compute Gromov-Wasserstein plans and distance
-====================
+=============================================
 """
 
 p = ot.unif(n)
diff --git a/examples/plot_gromov_barycenter.py b/examples/plot_gromov_barycenter.py
new file mode 100755
index 0000000..6a72b3b
--- /dev/null
+++ b/examples/plot_gromov_barycenter.py
@@ -0,0 +1,240 @@
+# -*- coding: utf-8 -*-
+"""
+=====================================
+Gromov-Wasserstein Barycenter example
+=====================================
+This example is designed to show how to use the Gromov-Wasserstein barycenter
+computation in POT.
+"""
+
+# Author: Erwan Vautier <erwan.vautier@gmail.com>
+#         Nicolas Courty <ncourty@irisa.fr>
+#
+# License: MIT License
+
+
+import numpy as np
+import scipy as sp
+
+import scipy.ndimage as spi
+import matplotlib.pylab as pl
+from sklearn import manifold
+from sklearn.decomposition import PCA
+
+import ot
+
+"""
+
+Smacof MDS
+==========
+This function allows to find an embedding of points given a dissimilarity matrix
+that will be given by the output of the algorithm
+"""
+
+
+def smacof_mds(C, dim, maxIter=3000, eps=1e-9):
+    """
+    Returns an interpolated point cloud following the dissimilarity matrix C using SMACOF
+    multidimensional scaling (MDS) in a target space of the specified dimension
+
+    Parameters
+    ----------
+    C : np.ndarray(ns,ns)
+        dissimilarity matrix
+    dim : Integer
+          dimension of the targeted space
+    maxIter : Maximum number of iterations of the SMACOF algorithm for a single run
+
+    eps : relative tolerance w.r.t. stress to declare convergence
+
+
+    Returns
+    -------
+    npos : R**dim ndarray
+           Embedded coordinates of the interpolated point cloud (defined up to an isometry)
+
+
+    """
+
+    seed = np.random.RandomState(seed=3)
+
+    mds = manifold.MDS(
+        dim,
+        max_iter=3000,
+        eps=1e-9,
+        dissimilarity='precomputed',
+        n_init=1)
+    pos = mds.fit(C).embedding_
+
+    nmds = manifold.MDS(
+        2,
+        max_iter=3000,
+        eps=1e-9,
+        dissimilarity="precomputed",
+        random_state=seed,
+        n_init=1)
+    npos = nmds.fit_transform(C, init=pos)
+
+    return npos
+
+
+"""
+Data preparation
+================
+The four distributions are constructed from 4 simple images
+"""
+
+
+def im2mat(I):
+    """Converts an image to matrix (one pixel per line)"""
+    return I.reshape((I.shape[0] * I.shape[1], I.shape[2]))
+
+
+carre = spi.imread('../data/carre.png').astype(np.float64) / 256
+rond = spi.imread('../data/rond.png').astype(np.float64) / 256
+triangle = spi.imread('../data/triangle.png').astype(np.float64) / 256
+fleche = spi.imread('../data/coeur.png').astype(np.float64) / 256
+
+shapes = [carre, rond, triangle, fleche]
+
+S = 4
+xs = [[] for i in range(S)]
+
+
+for nb in range(4):
+    for i in range(8):
+        for j in range(8):
+            if shapes[nb][i, j] < 0.95:
+                xs[nb].append([j, 8 - i])
+
+xs = np.array([np.array(xs[0]), np.array(xs[1]),
+               np.array(xs[2]), np.array(xs[3])])
+
+
+"""
+Barycenter computation
+======================
+The four distributions are constructed from 4 simple images
+"""
+ns = [len(xs[s]) for s in range(S)]
+N = 30
+
+"""Compute all distances matrices for the four shapes"""
+Cs = [sp.spatial.distance.cdist(xs[s], xs[s]) for s in range(S)]
+Cs = [cs / cs.max() for cs in Cs]
+
+ps = [ot.unif(ns[s]) for s in range(S)]
+p = ot.unif(N)
+
+
+lambdast = [[float(i) / 3, float(3 - i) / 3] for i in [1, 2]]
+
+Ct01 = [0 for i in range(2)]
+for i in range(2):
+    Ct01[i] = ot.gromov.gromov_barycenters(N, [Cs[0], Cs[1]], [
+                                           ps[0], ps[1]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
+
+Ct02 = [0 for i in range(2)]
+for i in range(2):
+    Ct02[i] = ot.gromov.gromov_barycenters(N, [Cs[0], Cs[2]], [
+                                           ps[0], ps[2]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
+
+Ct13 = [0 for i in range(2)]
+for i in range(2):
+    Ct13[i] = ot.gromov.gromov_barycenters(N, [Cs[1], Cs[3]], [
+                                           ps[1], ps[3]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
+
+Ct23 = [0 for i in range(2)]
+for i in range(2):
+    Ct23[i] = ot.gromov.gromov_barycenters(N, [Cs[2], Cs[3]], [
+                                           ps[2], ps[3]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
+
+"""
+Visualization
+=============
+"""
+
+"""The PCA helps in getting consistency between the rotations"""
+
+clf = PCA(n_components=2)
+npos = [0, 0, 0, 0]
+npos = [smacof_mds(Cs[s], 2) for s in range(S)]
+
+npost01 = [0, 0]
+npost01 = [smacof_mds(Ct01[s], 2) for s in range(2)]
+npost01 = [clf.fit_transform(npost01[s]) for s in range(2)]
+
+npost02 = [0, 0]
+npost02 = [smacof_mds(Ct02[s], 2) for s in range(2)]
+npost02 = [clf.fit_transform(npost02[s]) for s in range(2)]
+
+npost13 = [0, 0]
+npost13 = [smacof_mds(Ct13[s], 2) for s in range(2)]
+npost13 = [clf.fit_transform(npost13[s]) for s in range(2)]
+
+npost23 = [0, 0]
+npost23 = [smacof_mds(Ct23[s], 2) for s in range(2)]
+npost23 = [clf.fit_transform(npost23[s]) for s in range(2)]
+
+
+fig = pl.figure(figsize=(10, 10))
+
+ax1 = pl.subplot2grid((4, 4), (0, 0))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax1.scatter(npos[0][:, 0], npos[0][:, 1], color='r')
+
+ax2 = pl.subplot2grid((4, 4), (0, 1))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax2.scatter(npost01[1][:, 0], npost01[1][:, 1], color='b')
+
+ax3 = pl.subplot2grid((4, 4), (0, 2))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax3.scatter(npost01[0][:, 0], npost01[0][:, 1], color='b')
+
+ax4 = pl.subplot2grid((4, 4), (0, 3))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax4.scatter(npos[1][:, 0], npos[1][:, 1], color='r')
+
+ax5 = pl.subplot2grid((4, 4), (1, 0))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax5.scatter(npost02[1][:, 0], npost02[1][:, 1], color='b')
+
+ax6 = pl.subplot2grid((4, 4), (1, 3))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax6.scatter(npost13[1][:, 0], npost13[1][:, 1], color='b')
+
+ax7 = pl.subplot2grid((4, 4), (2, 0))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax7.scatter(npost02[0][:, 0], npost02[0][:, 1], color='b')
+
+ax8 = pl.subplot2grid((4, 4), (2, 3))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax8.scatter(npost13[0][:, 0], npost13[0][:, 1], color='b')
+
+ax9 = pl.subplot2grid((4, 4), (3, 0))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax9.scatter(npos[2][:, 0], npos[2][:, 1], color='r')
+
+ax10 = pl.subplot2grid((4, 4), (3, 1))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax10.scatter(npost23[1][:, 0], npost23[1][:, 1], color='b')
+
+ax11 = pl.subplot2grid((4, 4), (3, 2))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax11.scatter(npost23[0][:, 0], npost23[0][:, 1], color='b')
+
+ax12 = pl.subplot2grid((4, 4), (3, 3))
+pl.xlim((-1, 1))
+pl.ylim((-1, 1))
+ax12.scatter(npos[3][:, 0], npos[3][:, 1], color='r')
diff --git a/ot/gromov.py b/ot/gromov.py
index 7cf3b42..421ed3f 100644
--- a/ot/gromov.py
+++ b/ot/gromov.py
@@ -23,7 +23,7 @@ def square_loss(a, b):
     Returns the value of L(a,b)=(1/2)*|a-b|^2
     """
 
-    return (1 / 2) * (a - b)**2
+    return 0.5 * (a - b)**2
 
 
 def kl_loss(a, b):
@@ -54,9 +54,9 @@ def tensor_square_loss(C1, C2, T):
 
     Parameters
     ----------
-    C1 : np.ndarray(ns,ns)
+    C1 : ndarray, shape (ns, ns)
          Metric cost matrix in the source space
-    C2 : np.ndarray(nt,nt)
+    C2 : ndarray, shape (nt, nt)
          Metric costfr matrix in the target space
     T :  np.ndarray(ns,nt)
          Coupling between source and target spaces
@@ -87,7 +87,7 @@ def tensor_square_loss(C1, C2, T):
         return b
 
     tens = -np.dot(h1(C1), T).dot(h2(C2).T)
-    tens = tens - tens.min()
+    tens -= tens.min()
 
     return np.array(tens)
 
@@ -112,9 +112,9 @@ def tensor_kl_loss(C1, C2, T):
 
     Parameters
     ----------
-    C1 : np.ndarray(ns,ns)
+    C1 : ndarray, shape (ns, ns)
          Metric cost matrix in the source space
-    C2 : np.ndarray(nt,nt)
+    C2 : ndarray, shape (nt, nt)
          Metric costfr matrix in the target space
     T :  np.ndarray(ns,nt)
          Coupling between source and target spaces
@@ -149,7 +149,7 @@ def tensor_kl_loss(C1, C2, T):
         return np.log(b + 1e-15)
 
     tens = -np.dot(h1(C1), T).dot(h2(C2).T)
-    tens = tens - tens.min()
+    tens -= tens.min()
 
     return np.array(tens)
 
@@ -175,9 +175,8 @@ def update_square_loss(p, lambdas, T, Cs):
 
 
     """
-    tmpsum = np.sum([lambdas[s] * np.dot(T[s].T, Cs[s]).dot(T[s])
-                     for s in range(len(T))])
-    ppt = np.dot(p, p.T)
+    tmpsum = sum([lambdas[s] * np.dot(T[s].T, Cs[s]).dot(T[s]) for s in range(len(T))])
+    ppt = np.outer(p, p)
 
     return(np.divide(tmpsum, ppt))
 
@@ -203,9 +202,8 @@ def update_kl_loss(p, lambdas, T, Cs):
 
 
     """
-    tmpsum = np.sum([lambdas[s] * np.dot(T[s].T, Cs[s]).dot(T[s])
-                     for s in range(len(T))])
-    ppt = np.dot(p, p.T)
+    tmpsum = sum([lambdas[s] * np.dot(T[s].T, Cs[s]).dot(T[s]) for s in range(len(T))])
+    ppt = np.outer(p, p)
 
     return(np.exp(np.divide(tmpsum, ppt)))
 
@@ -239,9 +237,9 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr
 
     Parameters
     ----------
-    C1 : np.ndarray(ns,ns)
+    C1 : ndarray, shape (ns, ns)
          Metric cost matrix in the source space
-    C2 : np.ndarray(nt,nt)
+    C2 : ndarray, shape (nt, nt)
          Metric costfr matrix in the target space
     p :  np.ndarray(ns,)
          distribution in the source space
@@ -271,7 +269,7 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr
     C1 = np.asarray(C1, dtype=np.float64)
     C2 = np.asarray(C2, dtype=np.float64)
 
-    T = np.dot(p, q.T)  # Initialization
+    T = np.outer(p, q)  # Initialization
 
     cpt = 0
     err = 1
@@ -333,9 +331,9 @@ def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopTh
 
     Parameters
     ----------
-    C1 : np.ndarray(ns,ns)
+    C1 : ndarray, shape (ns, ns)
          Metric cost matrix in the source space
-    C2 : np.ndarray(nt,nt)
+    C2 : ndarray, shape (nt, nt)
          Metric costfr matrix in the target space
     p :  np.ndarray(ns,)
          distribution in the source space
@@ -434,8 +432,6 @@ def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, numItermax=1000
     Cs = [np.asarray(Cs[s], dtype=np.float64) for s in range(S)]
     lambdas = np.asarray(lambdas, dtype=np.float64)
 
-    T = [0 for s in range(S)]
-
     # Initialization of C : random SPD matrix
     xalea = np.random.randn(N, 2)
     C = dist(xalea, xalea)
diff --git a/test/test_gromov.py b/test/test_gromov.py
new file mode 100644
index 0000000..75eeaab
--- /dev/null
+++ b/test/test_gromov.py
@@ -0,0 +1,38 @@
+"""Tests for module gromov  """
+
+# Author: Erwan Vautier <erwan.vautier@gmail.com>
+#         Nicolas Courty <ncourty@irisa.fr>
+#
+# License: MIT License
+
+import numpy as np
+import ot
+
+
+def test_gromov():
+    n = 50  # nb samples
+
+    mu_s = np.array([0, 0])
+    cov_s = np.array([[1, 0], [0, 1]])
+
+    xs = ot.datasets.get_2D_samples_gauss(n, mu_s, cov_s)
+
+    xt = [xs[n - (i + 1)] for i in range(n)]
+    xt = np.array(xt)
+
+    p = ot.unif(n)
+    q = ot.unif(n)
+
+    C1 = ot.dist(xs, xs)
+    C2 = ot.dist(xt, xt)
+
+    C1 /= C1.max()
+    C2 /= C2.max()
+
+    G = ot.gromov_wasserstein(C1, C2, p, q, 'square_loss', epsilon=5e-4)
+
+    # check constraints
+    np.testing.assert_allclose(
+        p, G.sum(1), atol=1e-04)  # cf convergence gromov
+    np.testing.assert_allclose(
+        q, G.sum(0), atol=1e-04)  # cf convergence gromov
-- 
cgit v1.2.3


From ab6ed1df93cd78bb7f1a54282103d4d830e68bcb Mon Sep 17 00:00:00 2001
From: Nicolas Courty <Nico@MacBook-Pro-de-Nicolas.local>
Date: Fri, 1 Sep 2017 11:20:34 +0200
Subject: docstrings and naming

---
 examples/plot_gromov.py            | 10 +++++-----
 examples/plot_gromov_barycenter.py | 20 ++++++++++----------
 ot/gromov.py                       | 18 +++++++++---------
 test/test_gromov.py                | 10 +++++-----
 4 files changed, 29 insertions(+), 29 deletions(-)

(limited to 'test')

diff --git a/examples/plot_gromov.py b/examples/plot_gromov.py
index 9bbdbde..92312ae 100644
--- a/examples/plot_gromov.py
+++ b/examples/plot_gromov.py
@@ -26,7 +26,7 @@ The Gromov-Wasserstein distance allows to compute distances with samples that do
 For demonstration purpose, we sample two Gaussian distributions in 2- and 3-dimensional spaces.
 """
 
-n = 30  # nb samples
+n_samples = 30  # nb samples
 
 mu_s = np.array([0, 0])
 cov_s = np.array([[1, 0], [0, 1]])
@@ -35,9 +35,9 @@ mu_t = np.array([4, 4, 4])
 cov_t = np.array([[1, 0, 0], [0, 1, 0], [0, 0, 1]])
 
 
-xs = ot.datasets.get_2D_samples_gauss(n, mu_s, cov_s)
+xs = ot.datasets.get_2D_samples_gauss(n_samples, mu_s, cov_s)
 P = sp.linalg.sqrtm(cov_t)
-xt = np.random.randn(n, 3).dot(P) + mu_t
+xt = np.random.randn(n_samples, 3).dot(P) + mu_t
 
 
 """
@@ -75,8 +75,8 @@ Compute Gromov-Wasserstein plans and distance
 =============================================
 """
 
-p = ot.unif(n)
-q = ot.unif(n)
+p = ot.unif(n_samples)
+q = ot.unif(n_samples)
 
 gw = ot.gromov_wasserstein(C1, C2, p, q, 'square_loss', epsilon=5e-4)
 gw_dist = ot.gromov_wasserstein2(C1, C2, p, q, 'square_loss', epsilon=5e-4)
diff --git a/examples/plot_gromov_barycenter.py b/examples/plot_gromov_barycenter.py
index da52768..f0657e1 100755
--- a/examples/plot_gromov_barycenter.py
+++ b/examples/plot_gromov_barycenter.py
@@ -91,12 +91,12 @@ def im2mat(I):
     return I.reshape((I.shape[0] * I.shape[1], I.shape[2]))
 
 
-carre = spi.imread('../data/carre.png').astype(np.float64) / 256
-rond = spi.imread('../data/rond.png').astype(np.float64) / 256
+square = spi.imread('../data/carre.png').astype(np.float64) / 256
+circle = spi.imread('../data/rond.png').astype(np.float64) / 256
 triangle = spi.imread('../data/triangle.png').astype(np.float64) / 256
-fleche = spi.imread('../data/coeur.png').astype(np.float64) / 256
+arrow = spi.imread('../data/coeur.png').astype(np.float64) / 256
 
-shapes = [carre, rond, triangle, fleche]
+shapes = [square, circle, triangle, arrow]
 
 S = 4
 xs = [[] for i in range(S)]
@@ -118,36 +118,36 @@ Barycenter computation
 The four distributions are constructed from 4 simple images
 """
 ns = [len(xs[s]) for s in range(S)]
-N = 30
+n_samples = 30
 
 """Compute all distances matrices for the four shapes"""
 Cs = [sp.spatial.distance.cdist(xs[s], xs[s]) for s in range(S)]
 Cs = [cs / cs.max() for cs in Cs]
 
 ps = [ot.unif(ns[s]) for s in range(S)]
-p = ot.unif(N)
+p = ot.unif(n_samples)
 
 
 lambdast = [[float(i) / 3, float(3 - i) / 3] for i in [1, 2]]
 
 Ct01 = [0 for i in range(2)]
 for i in range(2):
-    Ct01[i] = ot.gromov.gromov_barycenters(N, [Cs[0], Cs[1]], [
+    Ct01[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[0], Cs[1]], [
                                            ps[0], ps[1]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
 
 Ct02 = [0 for i in range(2)]
 for i in range(2):
-    Ct02[i] = ot.gromov.gromov_barycenters(N, [Cs[0], Cs[2]], [
+    Ct02[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[0], Cs[2]], [
                                            ps[0], ps[2]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
 
 Ct13 = [0 for i in range(2)]
 for i in range(2):
-    Ct13[i] = ot.gromov.gromov_barycenters(N, [Cs[1], Cs[3]], [
+    Ct13[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[1], Cs[3]], [
                                            ps[1], ps[3]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
 
 Ct23 = [0 for i in range(2)]
 for i in range(2):
-    Ct23[i] = ot.gromov.gromov_barycenters(N, [Cs[2], Cs[3]], [
+    Ct23[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[2], Cs[3]], [
                                            ps[2], ps[3]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
 
 """
diff --git a/ot/gromov.py b/ot/gromov.py
index 421ed3f..ad85fcd 100644
--- a/ot/gromov.py
+++ b/ot/gromov.py
@@ -208,7 +208,7 @@ def update_kl_loss(p, lambdas, T, Cs):
     return(np.exp(np.divide(tmpsum, ppt)))
 
 
-def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr=1e-9, verbose=False, log=False):
+def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=1e-9, verbose=False, log=False):
     """
     Returns the gromov-wasserstein coupling between the two measured similarity matrices
 
@@ -248,7 +248,7 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr
     loss_fun :  loss function used for the solver either 'square_loss' or 'kl_loss'
     epsilon : float
         Regularization term >0
-    numItermax : int, optional
+    max_iter : int, optional
         Max number of iterations
     stopThr : float, optional
         Stop threshold on error (>0)
@@ -274,7 +274,7 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr
     cpt = 0
     err = 1
 
-    while (err > stopThr and cpt < numItermax):
+    while (err > stopThr and cpt < max_iter):
 
         Tprev = T
 
@@ -307,7 +307,7 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr
         return T
 
 
-def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr=1e-9, verbose=False, log=False):
+def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=1e-9, verbose=False, log=False):
     """
     Returns the gromov-wasserstein discrepancy between the two measured similarity matrices
 
@@ -362,10 +362,10 @@ def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopTh
 
     if log:
         gw, logv = gromov_wasserstein(
-            C1, C2, p, q, loss_fun, epsilon, numItermax, stopThr, verbose, log)
+            C1, C2, p, q, loss_fun, epsilon, max_iter, stopThr, verbose, log)
     else:
         gw = gromov_wasserstein(C1, C2, p, q, loss_fun,
-                                epsilon, numItermax, stopThr, verbose, log)
+                                epsilon, max_iter, stopThr, verbose, log)
 
     if loss_fun == 'square_loss':
         gw_dist = np.sum(gw * tensor_square_loss(C1, C2, gw))
@@ -379,7 +379,7 @@ def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopTh
         return gw_dist
 
 
-def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, numItermax=1000, stopThr=1e-9, verbose=False, log=False):
+def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, max_iter=1000, stopThr=1e-9, verbose=False, log=False):
     """
     Returns the gromov-wasserstein barycenters of S measured similarity matrices
 
@@ -442,12 +442,12 @@ def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, numItermax=1000
 
     error = []
 
-    while(err > stopThr and cpt < numItermax):
+    while(err > stopThr and cpt < max_iter):
 
         Cprev = C
 
         T = [gromov_wasserstein(Cs[s], C, ps[s], p, loss_fun, epsilon,
-                                numItermax, 1e-5, verbose, log) for s in range(S)]
+                                max_iter, 1e-5, verbose, log) for s in range(S)]
 
         if loss_fun == 'square_loss':
             C = update_square_loss(p, lambdas, T, Cs)
diff --git a/test/test_gromov.py b/test/test_gromov.py
index 75eeaab..c26d898 100644
--- a/test/test_gromov.py
+++ b/test/test_gromov.py
@@ -10,18 +10,18 @@ import ot
 
 
 def test_gromov():
-    n = 50  # nb samples
+    n_samples = 50  # nb samples
 
     mu_s = np.array([0, 0])
     cov_s = np.array([[1, 0], [0, 1]])
 
-    xs = ot.datasets.get_2D_samples_gauss(n, mu_s, cov_s)
+    xs = ot.datasets.get_2D_samples_gauss(n_samples, mu_s, cov_s)
 
-    xt = [xs[n - (i + 1)] for i in range(n)]
+    xt = [xs[n_samples - (i + 1)] for i in range(n_samples)]
     xt = np.array(xt)
 
-    p = ot.unif(n)
-    q = ot.unif(n)
+    p = ot.unif(n_samples)
+    q = ot.unif(n_samples)
 
     C1 = ot.dist(xs, xs)
     C2 = ot.dist(xt, xt)
-- 
cgit v1.2.3


From 46fc12a298c49b715ac953cff391b18b54dab0f0 Mon Sep 17 00:00:00 2001
From: Nicolas Courty <Nico@MacBook-Pro-de-Nicolas.local>
Date: Fri, 1 Sep 2017 11:43:51 +0200
Subject: solving conflicts :/

---
 examples/plot_gromov.py            | 15 -------------
 examples/plot_gromov_barycenter.py | 33 -----------------------------
 ot/gromov.py                       | 43 +++++---------------------------------
 test/test_gromov.py                | 14 -------------
 4 files changed, 5 insertions(+), 100 deletions(-)

(limited to 'test')

diff --git a/examples/plot_gromov.py b/examples/plot_gromov.py
index 99aaf81..92312ae 100644
--- a/examples/plot_gromov.py
+++ b/examples/plot_gromov.py
@@ -26,11 +26,7 @@ The Gromov-Wasserstein distance allows to compute distances with samples that do
 For demonstration purpose, we sample two Gaussian distributions in 2- and 3-dimensional spaces.
 """
 
-<<<<<<< HEAD
 n_samples = 30  # nb samples
-=======
-n = 30  # nb samples
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
 
 mu_s = np.array([0, 0])
 cov_s = np.array([[1, 0], [0, 1]])
@@ -39,15 +35,9 @@ mu_t = np.array([4, 4, 4])
 cov_t = np.array([[1, 0, 0], [0, 1, 0], [0, 0, 1]])
 
 
-<<<<<<< HEAD
 xs = ot.datasets.get_2D_samples_gauss(n_samples, mu_s, cov_s)
 P = sp.linalg.sqrtm(cov_t)
 xt = np.random.randn(n_samples, 3).dot(P) + mu_t
-=======
-xs = ot.datasets.get_2D_samples_gauss(n, mu_s, cov_s)
-P = sp.linalg.sqrtm(cov_t)
-xt = np.random.randn(n, 3).dot(P) + mu_t
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
 
 
 """
@@ -85,13 +75,8 @@ Compute Gromov-Wasserstein plans and distance
 =============================================
 """
 
-<<<<<<< HEAD
 p = ot.unif(n_samples)
 q = ot.unif(n_samples)
-=======
-p = ot.unif(n)
-q = ot.unif(n)
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
 
 gw = ot.gromov_wasserstein(C1, C2, p, q, 'square_loss', epsilon=5e-4)
 gw_dist = ot.gromov_wasserstein2(C1, C2, p, q, 'square_loss', epsilon=5e-4)
diff --git a/examples/plot_gromov_barycenter.py b/examples/plot_gromov_barycenter.py
index 46ec4bc..f0657e1 100755
--- a/examples/plot_gromov_barycenter.py
+++ b/examples/plot_gromov_barycenter.py
@@ -91,21 +91,12 @@ def im2mat(I):
     return I.reshape((I.shape[0] * I.shape[1], I.shape[2]))
 
 
-<<<<<<< HEAD
 square = spi.imread('../data/carre.png').astype(np.float64) / 256
 circle = spi.imread('../data/rond.png').astype(np.float64) / 256
 triangle = spi.imread('../data/triangle.png').astype(np.float64) / 256
 arrow = spi.imread('../data/coeur.png').astype(np.float64) / 256
 
 shapes = [square, circle, triangle, arrow]
-=======
-carre = spi.imread('../data/carre.png').astype(np.float64) / 256
-rond = spi.imread('../data/rond.png').astype(np.float64) / 256
-triangle = spi.imread('../data/triangle.png').astype(np.float64) / 256
-fleche = spi.imread('../data/coeur.png').astype(np.float64) / 256
-
-shapes = [carre, rond, triangle, fleche]
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
 
 S = 4
 xs = [[] for i in range(S)]
@@ -127,60 +118,36 @@ Barycenter computation
 The four distributions are constructed from 4 simple images
 """
 ns = [len(xs[s]) for s in range(S)]
-<<<<<<< HEAD
 n_samples = 30
-=======
-N = 30
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
 
 """Compute all distances matrices for the four shapes"""
 Cs = [sp.spatial.distance.cdist(xs[s], xs[s]) for s in range(S)]
 Cs = [cs / cs.max() for cs in Cs]
 
 ps = [ot.unif(ns[s]) for s in range(S)]
-<<<<<<< HEAD
 p = ot.unif(n_samples)
-=======
-p = ot.unif(N)
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
 
 
 lambdast = [[float(i) / 3, float(3 - i) / 3] for i in [1, 2]]
 
 Ct01 = [0 for i in range(2)]
 for i in range(2):
-<<<<<<< HEAD
     Ct01[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[0], Cs[1]], [
-=======
-    Ct01[i] = ot.gromov.gromov_barycenters(N, [Cs[0], Cs[1]], [
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
                                            ps[0], ps[1]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
 
 Ct02 = [0 for i in range(2)]
 for i in range(2):
-<<<<<<< HEAD
     Ct02[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[0], Cs[2]], [
-=======
-    Ct02[i] = ot.gromov.gromov_barycenters(N, [Cs[0], Cs[2]], [
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
                                            ps[0], ps[2]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
 
 Ct13 = [0 for i in range(2)]
 for i in range(2):
-<<<<<<< HEAD
     Ct13[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[1], Cs[3]], [
-=======
-    Ct13[i] = ot.gromov.gromov_barycenters(N, [Cs[1], Cs[3]], [
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
                                            ps[1], ps[3]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
 
 Ct23 = [0 for i in range(2)]
 for i in range(2):
-<<<<<<< HEAD
     Ct23[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[2], Cs[3]], [
-=======
-    Ct23[i] = ot.gromov.gromov_barycenters(N, [Cs[2], Cs[3]], [
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
                                            ps[2], ps[3]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
 
 """
diff --git a/ot/gromov.py b/ot/gromov.py
index 197e3ea..9dbf463 100644
--- a/ot/gromov.py
+++ b/ot/gromov.py
@@ -208,11 +208,7 @@ def update_kl_loss(p, lambdas, T, Cs):
     return(np.exp(np.divide(tmpsum, ppt)))
 
 
-<<<<<<< HEAD
 def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=1e-9, verbose=False, log=False):
-=======
-def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr=1e-9, verbose=False, log=False):
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
     """
     Returns the gromov-wasserstein coupling between the two measured similarity matrices
 
@@ -252,11 +248,11 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr
     loss_fun :  loss function used for the solver either 'square_loss' or 'kl_loss'
     epsilon : float
         Regularization term >0
-<<<<<<< HEAD
+<<<<<<< HEAD
     max_iter : int, optional
-=======
+=======
     numItermax : int, optional
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
+>>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
         Max number of iterations
     stopThr : float, optional
         Stop threshold on error (>0)
@@ -282,11 +278,7 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr
     cpt = 0
     err = 1
 
-<<<<<<< HEAD
     while (err > stopThr and cpt < max_iter):
-=======
-    while (err > stopThr and cpt < numItermax):
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
 
         Tprev = T
 
@@ -319,11 +311,7 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr
         return T
 
 
-<<<<<<< HEAD
 def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=1e-9, verbose=False, log=False):
-=======
-def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopThr=1e-9, verbose=False, log=False):
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
     """
     Returns the gromov-wasserstein discrepancy between the two measured similarity matrices
 
@@ -358,7 +346,7 @@ def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopTh
     loss_fun :  loss function used for the solver either 'square_loss' or 'kl_loss'
     epsilon : float
         Regularization term >0
-    numItermax : int, optional
+    max_iter : int, optional
         Max number of iterations
     stopThr : float, optional
         Stop threshold on error (>0)
@@ -378,17 +366,10 @@ def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopTh
 
     if log:
         gw, logv = gromov_wasserstein(
-<<<<<<< HEAD
             C1, C2, p, q, loss_fun, epsilon, max_iter, stopThr, verbose, log)
     else:
         gw = gromov_wasserstein(C1, C2, p, q, loss_fun,
                                 epsilon, max_iter, stopThr, verbose, log)
-=======
-            C1, C2, p, q, loss_fun, epsilon, numItermax, stopThr, verbose, log)
-    else:
-        gw = gromov_wasserstein(C1, C2, p, q, loss_fun,
-                                epsilon, numItermax, stopThr, verbose, log)
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
 
     if loss_fun == 'square_loss':
         gw_dist = np.sum(gw * tensor_square_loss(C1, C2, gw))
@@ -402,11 +383,7 @@ def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, numItermax=1000, stopTh
         return gw_dist
 
 
-<<<<<<< HEAD
 def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, max_iter=1000, stopThr=1e-9, verbose=False, log=False):
-=======
-def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, numItermax=1000, stopThr=1e-9, verbose=False, log=False):
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
     """
     Returns the gromov-wasserstein barycenters of S measured similarity matrices
 
@@ -439,7 +416,7 @@ def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, numItermax=1000
              with the S Ts couplings calculated at each iteration
     epsilon : float
         Regularization term >0
-    numItermax : int, optional
+    max_iter : int, optional
         Max number of iterations
     stopThr : float, optional
         Stop threshol on error (>0)
@@ -469,21 +446,11 @@ def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, numItermax=1000
 
     error = []
 
-<<<<<<< HEAD
     while(err > stopThr and cpt < max_iter):
-=======
-    while(err > stopThr and cpt < numItermax):
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
-
         Cprev = C
 
         T = [gromov_wasserstein(Cs[s], C, ps[s], p, loss_fun, epsilon,
-<<<<<<< HEAD
                                 max_iter, 1e-5, verbose, log) for s in range(S)]
-=======
-                                numItermax, 1e-5, verbose, log) for s in range(S)]
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
-
         if loss_fun == 'square_loss':
             C = update_square_loss(p, lambdas, T, Cs)
 
diff --git a/test/test_gromov.py b/test/test_gromov.py
index a6c89f2..c26d898 100644
--- a/test/test_gromov.py
+++ b/test/test_gromov.py
@@ -10,16 +10,11 @@ import ot
 
 
 def test_gromov():
-<<<<<<< HEAD
     n_samples = 50  # nb samples
-=======
-    n = 50  # nb samples
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
 
     mu_s = np.array([0, 0])
     cov_s = np.array([[1, 0], [0, 1]])
 
-<<<<<<< HEAD
     xs = ot.datasets.get_2D_samples_gauss(n_samples, mu_s, cov_s)
 
     xt = [xs[n_samples - (i + 1)] for i in range(n_samples)]
@@ -27,15 +22,6 @@ def test_gromov():
 
     p = ot.unif(n_samples)
     q = ot.unif(n_samples)
-=======
-    xs = ot.datasets.get_2D_samples_gauss(n, mu_s, cov_s)
-
-    xt = [xs[n - (i + 1)] for i in range(n)]
-    xt = np.array(xt)
-
-    p = ot.unif(n)
-    q = ot.unif(n)
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
 
     C1 = ot.dist(xs, xs)
     C2 = ot.dist(xt, xt)
-- 
cgit v1.2.3


From 53e1115349ddbdff83b74c5dd15fc4b258c46cd4 Mon Sep 17 00:00:00 2001
From: Nicolas Courty <Nico@MacBook-Pro-de-Nicolas.local>
Date: Fri, 1 Sep 2017 15:37:09 +0200
Subject: docstrings + naming

---
 examples/plot_gromov_barycenter.py | 34 ++++++++------
 ot/gromov.py                       | 92 +++++++++++++++++++-------------------
 test/test_gromov.py                |  2 +-
 3 files changed, 68 insertions(+), 60 deletions(-)

(limited to 'test')

diff --git a/examples/plot_gromov_barycenter.py b/examples/plot_gromov_barycenter.py
index f0657e1..4f17117 100755
--- a/examples/plot_gromov_barycenter.py
+++ b/examples/plot_gromov_barycenter.py
@@ -45,19 +45,19 @@ def smacof_mds(C, dim, max_iter=3000, eps=1e-9):
           dimension of the targeted space
     max_iter :  int
         Maximum number of iterations of the SMACOF algorithm for a single run
-
-    eps : relative tolerance w.r.t stress to declare converge
+    eps : float
+        relative tolerance w.r.t stress to declare converge
 
 
     Returns
     -------
-    npos : R**dim ndarray
+    npos : ndarray, shape (R, dim)
            Embedded coordinates of the interpolated point cloud (defined with one isometry)
 
 
     """
 
-    seed = np.random.RandomState(seed=3)
+    rng = np.random.RandomState(seed=3)
 
     mds = manifold.MDS(
         dim,
@@ -72,7 +72,7 @@ def smacof_mds(C, dim, max_iter=3000, eps=1e-9):
         max_iter=max_iter,
         eps=1e-9,
         dissimilarity="precomputed",
-        random_state=seed,
+        random_state=rng,
         n_init=1)
     npos = nmds.fit_transform(C, init=pos)
 
@@ -132,23 +132,31 @@ lambdast = [[float(i) / 3, float(3 - i) / 3] for i in [1, 2]]
 
 Ct01 = [0 for i in range(2)]
 for i in range(2):
-    Ct01[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[0], Cs[1]], [
-                                           ps[0], ps[1]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
+    Ct01[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[0], Cs[1]],
+                                           [ps[0], ps[1]
+                                            ], p, lambdast[i], 'square_loss', 5e-4,
+                                           max_iter=100, stopThr=1e-3)
 
 Ct02 = [0 for i in range(2)]
 for i in range(2):
-    Ct02[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[0], Cs[2]], [
-                                           ps[0], ps[2]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
+    Ct02[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[0], Cs[2]],
+                                           [ps[0], ps[2]
+                                            ], p, lambdast[i], 'square_loss', 5e-4,
+                                           max_iter=100, stopThr=1e-3)
 
 Ct13 = [0 for i in range(2)]
 for i in range(2):
-    Ct13[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[1], Cs[3]], [
-                                           ps[1], ps[3]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
+    Ct13[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[1], Cs[3]],
+                                           [ps[1], ps[3]
+                                            ], p, lambdast[i], 'square_loss', 5e-4,
+                                           max_iter=100, stopThr=1e-3)
 
 Ct23 = [0 for i in range(2)]
 for i in range(2):
-    Ct23[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[2], Cs[3]], [
-                                           ps[2], ps[3]], p, lambdast[i], 'square_loss', 5e-4, numItermax=100, stopThr=1e-3)
+    Ct23[i] = ot.gromov.gromov_barycenters(n_samples, [Cs[2], Cs[3]],
+                                           [ps[2], ps[3]
+                                            ], p, lambdast[i], 'square_loss', 5e-4,
+                                           max_iter=100, stopThr=1e-3)
 
 """
 Visualization
diff --git a/ot/gromov.py b/ot/gromov.py
index 9dbf463..cf9c4da 100644
--- a/ot/gromov.py
+++ b/ot/gromov.py
@@ -58,13 +58,13 @@ def tensor_square_loss(C1, C2, T):
          Metric cost matrix in the source space
     C2 : ndarray, shape (nt, nt)
          Metric costfr matrix in the target space
-    T :  np.ndarray(ns,nt)
+    T : ndarray, shape (ns, nt)
          Coupling between source and target spaces
 
 
     Returns
     -------
-    tens : (ns*nt) ndarray
+    tens : ndarray, shape (ns, nt)
            \mathcal{L}(C1,C2) \otimes T tensor-matrix multiplication result
 
 
@@ -89,7 +89,7 @@ def tensor_square_loss(C1, C2, T):
     tens = -np.dot(h1(C1), T).dot(h2(C2).T)
     tens -= tens.min()
 
-    return np.array(tens)
+    return tens
 
 
 def tensor_kl_loss(C1, C2, T):
@@ -116,13 +116,13 @@ def tensor_kl_loss(C1, C2, T):
          Metric cost matrix in the source space
     C2 : ndarray, shape (nt, nt)
          Metric costfr matrix in the target space
-    T :  np.ndarray(ns,nt)
+    T :  ndarray, shape (ns, nt)
          Coupling between source and target spaces
 
 
     Returns
     -------
-    tens : (ns*nt) ndarray
+    tens : ndarray, shape (ns, nt)
            \mathcal{L}(C1,C2) \otimes T tensor-matrix multiplication result
 
     References
@@ -151,34 +151,36 @@ def tensor_kl_loss(C1, C2, T):
     tens = -np.dot(h1(C1), T).dot(h2(C2).T)
     tens -= tens.min()
 
-    return np.array(tens)
+    return tens
 
 
 def update_square_loss(p, lambdas, T, Cs):
     """
-    Updates C according to the L2 Loss kernel with the S Ts couplings calculated at each iteration
+    Updates C according to the L2 Loss kernel with the S Ts couplings
+    calculated at each iteration
 
 
     Parameters
     ----------
-    p  : np.ndarray(N,)
+    p  : ndarray, shape (N,)
          weights in the targeted barycenter
     lambdas : list of the S spaces' weights
     T : list of S np.ndarray(ns,N)
         the S Ts couplings calculated at each iteration
-    Cs : Cs : list of S np.ndarray(ns,ns)
+    Cs : list of S ndarray, shape(ns,ns)
          Metric cost matrices
 
     Returns
     ----------
-    C updated
+    C : ndarray, shape (nt,nt)
+        updated C matrix
 
 
     """
     tmpsum = sum([lambdas[s] * np.dot(T[s].T, Cs[s]).dot(T[s]) for s in range(len(T))])
     ppt = np.outer(p, p)
 
-    return(np.divide(tmpsum, ppt))
+    return np.divide(tmpsum, ppt)
 
 
 def update_kl_loss(p, lambdas, T, Cs):
@@ -188,27 +190,28 @@ def update_kl_loss(p, lambdas, T, Cs):
 
     Parameters
     ----------
-    p  : np.ndarray(N,)
+    p  : ndarray, shape (N,)
          weights in the targeted barycenter
     lambdas : list of the S spaces' weights
     T : list of S np.ndarray(ns,N)
         the S Ts couplings calculated at each iteration
-    Cs : Cs : list of S np.ndarray(ns,ns)
+    Cs : list of S ndarray, shape(ns,ns)
          Metric cost matrices
 
     Returns
     ----------
-    C updated
+    C : ndarray, shape (ns,ns)
+        updated C matrix
 
 
     """
     tmpsum = sum([lambdas[s] * np.dot(T[s].T, Cs[s]).dot(T[s]) for s in range(len(T))])
     ppt = np.outer(p, p)
 
-    return(np.exp(np.divide(tmpsum, ppt)))
+    return np.exp(np.divide(tmpsum, ppt))
 
 
-def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=1e-9, verbose=False, log=False):
+def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, tol=1e-9, verbose=False, log=False):
     """
     Returns the gromov-wasserstein coupling between the two measured similarity matrices
 
@@ -241,31 +244,28 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=1
          Metric cost matrix in the source space
     C2 : ndarray, shape (nt, nt)
          Metric costfr matrix in the target space
-    p :  np.ndarray(ns,)
+    p :  ndarray, shape (ns,)
          distribution in the source space
-    q :  np.ndarray(nt)
+    q :  ndarray, shape (nt,)
          distribution in the target space
-    loss_fun :  loss function used for the solver either 'square_loss' or 'kl_loss'
+    loss_fun :  string
+        loss function used for the solver either 'square_loss' or 'kl_loss'
     epsilon : float
         Regularization term >0
-<<<<<<< HEAD
     max_iter : int, optional
-=======
-    numItermax : int, optional
->>>>>>> 986f46ddde3ce2f550cb56f66620df377326423d
-        Max number of iterations
-    stopThr : float, optional
+       Max number of iterations
+    tol : float, optional
         Stop threshold on error (>0)
     verbose : bool, optional
         Print information along iterations
     log : bool, optional
         record log if True
-    forcing : np.ndarray(N,2)
-        list of forced couplings (where N is the number of forcing)
+
 
     Returns
     -------
-    T : coupling between the two spaces that minimizes :
+    T : ndarray, shape (ns, nt)
+        coupling between the two spaces that minimizes :
             \sum_{i,j,k,l} L(C1_{i,k},C2_{j,l})*T_{i,j}*T_{k,l}-\epsilon(H(T))
 
     """
@@ -278,7 +278,7 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=1
     cpt = 0
     err = 1
 
-    while (err > stopThr and cpt < max_iter):
+    while (err > tol and cpt < max_iter):
 
         Tprev = T
 
@@ -303,7 +303,7 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=1
                         'It.', 'Err') + '\n' + '-' * 19)
                 print('{:5d}|{:8e}|'.format(cpt, err))
 
-        cpt = cpt + 1
+        cpt += 1
 
     if log:
         return T, log
@@ -311,7 +311,7 @@ def gromov_wasserstein(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=1
         return T
 
 
-def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=1e-9, verbose=False, log=False):
+def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, tol=1e-9, verbose=False, log=False):
     """
     Returns the gromov-wasserstein discrepancy between the two measured similarity matrices
 
@@ -339,37 +339,36 @@ def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=
          Metric cost matrix in the source space
     C2 : ndarray, shape (nt, nt)
          Metric costfr matrix in the target space
-    p :  np.ndarray(ns,)
+    p :  ndarray, shape (ns,)
          distribution in the source space
-    q :  np.ndarray(nt)
+    q :  ndarray, shape (nt,)
          distribution in the target space
-    loss_fun :  loss function used for the solver either 'square_loss' or 'kl_loss'
+    loss_fun :  string
+        loss function used for the solver either 'square_loss' or 'kl_loss'
     epsilon : float
         Regularization term >0
     max_iter : int, optional
         Max number of iterations
-    stopThr : float, optional
+    tol : float, optional
         Stop threshold on error (>0)
     verbose : bool, optional
         Print information along iterations
     log : bool, optional
         record log if True
-    forcing : np.ndarray(N,2)
-        list of forced couplings (where N is the number of forcing)
 
     Returns
     -------
-    T : coupling between the two spaces that minimizes :
-            \sum_{i,j,k,l} L(C1_{i,k},C2_{j,l})*T_{i,j}*T_{k,l}-\epsilon(H(T))
+    gw_dist : float
+        Gromov-Wasserstein distance
 
     """
 
     if log:
         gw, logv = gromov_wasserstein(
-            C1, C2, p, q, loss_fun, epsilon, max_iter, stopThr, verbose, log)
+            C1, C2, p, q, loss_fun, epsilon, max_iter, tol, verbose, log)
     else:
         gw = gromov_wasserstein(C1, C2, p, q, loss_fun,
-                                epsilon, max_iter, stopThr, verbose, log)
+                                epsilon, max_iter, tol, verbose, log)
 
     if loss_fun == 'square_loss':
         gw_dist = np.sum(gw * tensor_square_loss(C1, C2, gw))
@@ -383,7 +382,7 @@ def gromov_wasserstein2(C1, C2, p, q, loss_fun, epsilon, max_iter=1000, stopThr=
         return gw_dist
 
 
-def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, max_iter=1000, stopThr=1e-9, verbose=False, log=False):
+def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, max_iter=1000, tol=1e-9, verbose=False, log=False):
     """
     Returns the gromov-wasserstein barycenters of S measured similarity matrices
 
@@ -408,7 +407,7 @@ def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, max_iter=1000,
          Metric cost matrices
     ps : list of S np.ndarray(ns,)
          sample weights in the S spaces
-    p  : np.ndarray(N,)
+    p  : ndarray, shape(N,)
          weights in the targeted barycenter
     lambdas : list of the S spaces' weights
     L :  tensor-matrix multiplication function based on specific loss function
@@ -418,7 +417,7 @@ def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, max_iter=1000,
         Regularization term >0
     max_iter : int, optional
         Max number of iterations
-    stopThr : float, optional
+    tol : float, optional
         Stop threshol on error (>0)
     verbose : bool, optional
         Print information along iterations
@@ -427,7 +426,8 @@ def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, max_iter=1000,
 
     Returns
     -------
-    C : Similarity matrix in the barycenter space (permutated arbitrarily)
+    C : ndarray, shape (N, N)
+        Similarity matrix in the barycenter space (permutated arbitrarily)
 
     """
 
@@ -446,7 +446,7 @@ def gromov_barycenters(N, Cs, ps, p, lambdas, loss_fun, epsilon, max_iter=1000,
 
     error = []
 
-    while(err > stopThr and cpt < max_iter):
+    while(err > tol and cpt < max_iter):
         Cprev = C
 
         T = [gromov_wasserstein(Cs[s], C, ps[s], p, loss_fun, epsilon,
diff --git a/test/test_gromov.py b/test/test_gromov.py
index c26d898..28495e1 100644
--- a/test/test_gromov.py
+++ b/test/test_gromov.py
@@ -17,7 +17,7 @@ def test_gromov():
 
     xs = ot.datasets.get_2D_samples_gauss(n_samples, mu_s, cov_s)
 
-    xt = [xs[n_samples - (i + 1)] for i in range(n_samples)]
+    xt = xs[::-1]
     xt = np.array(xt)
 
     p = ot.unif(n_samples)
-- 
cgit v1.2.3


From 36bf599552ff15d1ca1c6b505507e65a333fa55e Mon Sep 17 00:00:00 2001
From: Nicolas Courty <Nico@pc-mna-08.univ-ubs.fr>
Date: Tue, 12 Sep 2017 18:07:17 +0200
Subject: Corrections on Gromov

---
 data/carre.png                     | Bin 168 -> 0 bytes
 data/coeur.png                     | Bin 225 -> 0 bytes
 data/cross.png                     | Bin 0 -> 230 bytes
 data/rond.png                      | Bin 230 -> 0 bytes
 data/square.png                    | Bin 0 -> 168 bytes
 data/star.png                      | Bin 0 -> 225 bytes
 examples/plot_gromov.py            |   5 +++--
 examples/plot_gromov_barycenter.py |  13 +++++--------
 test/test_gromov.py                |   3 +--
 9 files changed, 9 insertions(+), 12 deletions(-)
 delete mode 100755 data/carre.png
 delete mode 100755 data/coeur.png
 create mode 100755 data/cross.png
 delete mode 100755 data/rond.png
 create mode 100755 data/square.png
 create mode 100755 data/star.png

(limited to 'test')

diff --git a/data/carre.png b/data/carre.png
deleted file mode 100755
index 45ff0ef..0000000
Binary files a/data/carre.png and /dev/null differ
diff --git a/data/coeur.png b/data/coeur.png
deleted file mode 100755
index 3f511a6..0000000
Binary files a/data/coeur.png and /dev/null differ
diff --git a/data/cross.png b/data/cross.png
new file mode 100755
index 0000000..1c1a068
Binary files /dev/null and b/data/cross.png differ
diff --git a/data/rond.png b/data/rond.png
deleted file mode 100755
index 1c1a068..0000000
Binary files a/data/rond.png and /dev/null differ
diff --git a/data/square.png b/data/square.png
new file mode 100755
index 0000000..45ff0ef
Binary files /dev/null and b/data/square.png differ
diff --git a/data/star.png b/data/star.png
new file mode 100755
index 0000000..3f511a6
Binary files /dev/null and b/data/star.png differ
diff --git a/examples/plot_gromov.py b/examples/plot_gromov.py
index 92312ae..0f839a3 100644
--- a/examples/plot_gromov.py
+++ b/examples/plot_gromov.py
@@ -22,8 +22,9 @@ import ot
 """
 Sample two Gaussian distributions (2D and 3D)
 =============================================
-The Gromov-Wasserstein distance allows to compute distances with samples that do not belong to the same metric space.
-For demonstration purpose, we sample two Gaussian distributions in 2- and 3-dimensional spaces.
+The Gromov-Wasserstein distance allows computing distances between samples that
+do not belong to the same metric space. For demonstration purposes, we sample
+two Gaussian distributions in 2- and 3-dimensional spaces.
 """
 
 n_samples = 30  # nb samples
diff --git a/examples/plot_gromov_barycenter.py b/examples/plot_gromov_barycenter.py
index 4f17117..c138031 100755
--- a/examples/plot_gromov_barycenter.py
+++ b/examples/plot_gromov_barycenter.py
@@ -48,13 +48,10 @@ def smacof_mds(C, dim, max_iter=3000, eps=1e-9):
     eps : float
         relative tolerance w.r.t stress to declare converge
 
-
     Returns
     -------
     npos : ndarray, shape (R, dim)
            Embedded coordinates of the interpolated point cloud (defined with one isometry)
-
-
     """
 
     rng = np.random.RandomState(seed=3)
@@ -91,12 +88,12 @@ def im2mat(I):
     return I.reshape((I.shape[0] * I.shape[1], I.shape[2]))
 
 
-square = spi.imread('../data/carre.png').astype(np.float64) / 256
-circle = spi.imread('../data/rond.png').astype(np.float64) / 256
-triangle = spi.imread('../data/triangle.png').astype(np.float64) / 256
-arrow = spi.imread('../data/coeur.png').astype(np.float64) / 256
+square = spi.imread('../data/square.png').astype(np.float64)[:,:,2] / 256
+cross = spi.imread('../data/cross.png').astype(np.float64)[:,:,2] / 256
+triangle = spi.imread('../data/triangle.png').astype(np.float64)[:,:,2] / 256
+star = spi.imread('../data/star.png').astype(np.float64)[:,:,2] / 256
 
-shapes = [square, circle, triangle, arrow]
+shapes = [square, cross, triangle, star]
 
 S = 4
 xs = [[] for i in range(S)]
diff --git a/test/test_gromov.py b/test/test_gromov.py
index 28495e1..e808292 100644
--- a/test/test_gromov.py
+++ b/test/test_gromov.py
@@ -17,8 +17,7 @@ def test_gromov():
 
     xs = ot.datasets.get_2D_samples_gauss(n_samples, mu_s, cov_s)
 
-    xt = xs[::-1]
-    xt = np.array(xt)
+    xt = xs[::-1].copy()
 
     p = ot.unif(n_samples)
     q = ot.unif(n_samples)
-- 
cgit v1.2.3