summaryrefslogtreecommitdiff
path: root/ot/da.py
diff options
context:
space:
mode:
authorSlasnista <stan.chambon@gmail.com>2017-08-28 11:03:28 +0200
committerSlasnista <stan.chambon@gmail.com>2017-08-28 11:03:28 +0200
commita8fa91bec26caa93329e61a104e0ad6afdf37363 (patch)
tree64a11f115904921afe2b7d249aabc3b6bd43e9fe /ot/da.py
parent55840f6bccadd79caf722d86f06da857e3045453 (diff)
handling input arguments in fit, transform... methods + remove old examples
Diffstat (limited to 'ot/da.py')
-rw-r--r--ot/da.py217
1 files changed, 121 insertions, 96 deletions
diff --git a/ot/da.py b/ot/da.py
index 8c62669..369b6a2 100644
--- a/ot/da.py
+++ b/ot/da.py
@@ -976,36 +976,41 @@ class BaseTransport(BaseEstimator):
Returns self.
"""
- # pairwise distance
- self.cost_ = dist(Xs, Xt, metric=self.metric)
+ if Xs is not None and Xt is not None:
+ # pairwise distance
+ self.cost_ = dist(Xs, Xt, metric=self.metric)
- if (ys is not None) and (yt is not None):
+ if (ys is not None) and (yt is not None):
- if self.limit_max != np.infty:
- self.limit_max = self.limit_max * np.max(self.cost_)
+ if self.limit_max != np.infty:
+ self.limit_max = self.limit_max * np.max(self.cost_)
- # assumes labeled source samples occupy the first rows
- # and labeled target samples occupy the first columns
- classes = np.unique(ys)
- for c in classes:
- idx_s = np.where((ys != c) & (ys != -1))
- idx_t = np.where(yt == c)
+ # assumes labeled source samples occupy the first rows
+ # and labeled target samples occupy the first columns
+ classes = np.unique(ys)
+ for c in classes:
+ idx_s = np.where((ys != c) & (ys != -1))
+ idx_t = np.where(yt == c)
- # all the coefficients corresponding to a source sample
- # and a target sample :
- # with different labels get a infinite
- for j in idx_t[0]:
- self.cost_[idx_s[0], j] = self.limit_max
+ # all the coefficients corresponding to a source sample
+ # and a target sample :
+ # with different labels get a infinite
+ for j in idx_t[0]:
+ self.cost_[idx_s[0], j] = self.limit_max
- # distribution estimation
- self.mu_s = self.distribution_estimation(Xs)
- self.mu_t = self.distribution_estimation(Xt)
+ # distribution estimation
+ self.mu_s = self.distribution_estimation(Xs)
+ self.mu_t = self.distribution_estimation(Xt)
- # store arrays of samples
- self.Xs = Xs
- self.Xt = Xt
+ # store arrays of samples
+ self.Xs = Xs
+ self.Xt = Xt
- return self
+ return self
+ else:
+ print("POT-Warning")
+ print("Please provide both Xs and Xt arguments when calling")
+ print("fit method")
def fit_transform(self, Xs=None, ys=None, Xt=None, yt=None):
"""Build a coupling matrix from source and target sets of samples
@@ -1053,42 +1058,47 @@ class BaseTransport(BaseEstimator):
The transport source samples.
"""
- if np.array_equal(self.Xs, Xs):
- # perform standard barycentric mapping
- transp = self.coupling_ / np.sum(self.coupling_, 1)[:, None]
+ if Xs is not None:
+ if np.array_equal(self.Xs, Xs):
+ # perform standard barycentric mapping
+ transp = self.coupling_ / np.sum(self.coupling_, 1)[:, None]
- # set nans to 0
- transp[~ np.isfinite(transp)] = 0
+ # set nans to 0
+ transp[~ np.isfinite(transp)] = 0
- # compute transported samples
- transp_Xs = np.dot(transp, self.Xt)
- else:
- # perform out of sample mapping
- indices = np.arange(Xs.shape[0])
- batch_ind = [
- indices[i:i + batch_size]
- for i in range(0, len(indices), batch_size)]
+ # compute transported samples
+ transp_Xs = np.dot(transp, self.Xt)
+ else:
+ # perform out of sample mapping
+ indices = np.arange(Xs.shape[0])
+ batch_ind = [
+ indices[i:i + batch_size]
+ for i in range(0, len(indices), batch_size)]
- transp_Xs = []
- for bi in batch_ind:
+ transp_Xs = []
+ for bi in batch_ind:
- # get the nearest neighbor in the source domain
- D0 = dist(Xs[bi], self.Xs)
- idx = np.argmin(D0, axis=1)
+ # get the nearest neighbor in the source domain
+ D0 = dist(Xs[bi], self.Xs)
+ idx = np.argmin(D0, axis=1)
- # transport the source samples
- transp = self.coupling_ / np.sum(self.coupling_, 1)[:, None]
- transp[~ np.isfinite(transp)] = 0
- transp_Xs_ = np.dot(transp, self.Xt)
+ # transport the source samples
+ transp = self.coupling_ / np.sum(
+ self.coupling_, 1)[:, None]
+ transp[~ np.isfinite(transp)] = 0
+ transp_Xs_ = np.dot(transp, self.Xt)
- # define the transported points
- transp_Xs_ = transp_Xs_[idx, :] + Xs[bi] - self.Xs[idx, :]
+ # define the transported points
+ transp_Xs_ = transp_Xs_[idx, :] + Xs[bi] - self.Xs[idx, :]
- transp_Xs.append(transp_Xs_)
+ transp_Xs.append(transp_Xs_)
- transp_Xs = np.concatenate(transp_Xs, axis=0)
+ transp_Xs = np.concatenate(transp_Xs, axis=0)
- return transp_Xs
+ return transp_Xs
+ else:
+ print("POT-Warning")
+ print("Please provide Xs argument when calling transform method")
def inverse_transform(self, Xs=None, ys=None, Xt=None, yt=None,
batch_size=128):
@@ -1113,41 +1123,46 @@ class BaseTransport(BaseEstimator):
The transported target samples.
"""
- if np.array_equal(self.Xt, Xt):
- # perform standard barycentric mapping
- transp_ = self.coupling_.T / np.sum(self.coupling_, 0)[:, None]
+ if Xt is not None:
+ if np.array_equal(self.Xt, Xt):
+ # perform standard barycentric mapping
+ transp_ = self.coupling_.T / np.sum(self.coupling_, 0)[:, None]
- # set nans to 0
- transp_[~ np.isfinite(transp_)] = 0
+ # set nans to 0
+ transp_[~ np.isfinite(transp_)] = 0
- # compute transported samples
- transp_Xt = np.dot(transp_, self.Xs)
- else:
- # perform out of sample mapping
- indices = np.arange(Xt.shape[0])
- batch_ind = [
- indices[i:i + batch_size]
- for i in range(0, len(indices), batch_size)]
+ # compute transported samples
+ transp_Xt = np.dot(transp_, self.Xs)
+ else:
+ # perform out of sample mapping
+ indices = np.arange(Xt.shape[0])
+ batch_ind = [
+ indices[i:i + batch_size]
+ for i in range(0, len(indices), batch_size)]
- transp_Xt = []
- for bi in batch_ind:
+ transp_Xt = []
+ for bi in batch_ind:
- D0 = dist(Xt[bi], self.Xt)
- idx = np.argmin(D0, axis=1)
+ D0 = dist(Xt[bi], self.Xt)
+ idx = np.argmin(D0, axis=1)
- # transport the target samples
- transp_ = self.coupling_.T / np.sum(self.coupling_, 0)[:, None]
- transp_[~ np.isfinite(transp_)] = 0
- transp_Xt_ = np.dot(transp_, self.Xs)
+ # transport the target samples
+ transp_ = self.coupling_.T / np.sum(
+ self.coupling_, 0)[:, None]
+ transp_[~ np.isfinite(transp_)] = 0
+ transp_Xt_ = np.dot(transp_, self.Xs)
- # define the transported points
- transp_Xt_ = transp_Xt_[idx, :] + Xt[bi] - self.Xt[idx, :]
+ # define the transported points
+ transp_Xt_ = transp_Xt_[idx, :] + Xt[bi] - self.Xt[idx, :]
- transp_Xt.append(transp_Xt_)
+ transp_Xt.append(transp_Xt_)
- transp_Xt = np.concatenate(transp_Xt, axis=0)
+ transp_Xt = np.concatenate(transp_Xt, axis=0)
- return transp_Xt
+ return transp_Xt
+ else:
+ print("POT-Warning")
+ print("Please provide Xt argument when calling inverse_transform")
class SinkhornTransport(BaseTransport):
@@ -1413,15 +1428,20 @@ class SinkhornLpl1Transport(BaseTransport):
Returns self.
"""
- super(SinkhornLpl1Transport, self).fit(Xs, ys, Xt, yt)
+ if Xs is not None and Xt is not None and ys is not None:
- self.coupling_ = sinkhorn_lpl1_mm(
- a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.cost_,
- reg=self.reg_e, eta=self.reg_cl, numItermax=self.max_iter,
- numInnerItermax=self.max_inner_iter, stopInnerThr=self.tol,
- verbose=self.verbose)
+ super(SinkhornLpl1Transport, self).fit(Xs, ys, Xt, yt)
- return self
+ self.coupling_ = sinkhorn_lpl1_mm(
+ a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.cost_,
+ reg=self.reg_e, eta=self.reg_cl, numItermax=self.max_iter,
+ numInnerItermax=self.max_inner_iter, stopInnerThr=self.tol,
+ verbose=self.verbose)
+
+ return self
+ else:
+ print("POT-Warning")
+ print("Please provide both Xs, Xt, ys arguments to fit method")
class SinkhornL1l2Transport(BaseTransport):
@@ -1517,22 +1537,27 @@ class SinkhornL1l2Transport(BaseTransport):
Returns self.
"""
- super(SinkhornL1l2Transport, self).fit(Xs, ys, Xt, yt)
+ if Xs is not None and Xt is not None and ys is not None:
- returned_ = sinkhorn_l1l2_gl(
- a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.cost_,
- reg=self.reg_e, eta=self.reg_cl, numItermax=self.max_iter,
- numInnerItermax=self.max_inner_iter, stopInnerThr=self.tol,
- verbose=self.verbose, log=self.log)
+ super(SinkhornL1l2Transport, self).fit(Xs, ys, Xt, yt)
- # deal with the value of log
- if self.log:
- self.coupling_, self.log_ = returned_
- else:
- self.coupling_ = returned_
- self.log_ = dict()
+ returned_ = sinkhorn_l1l2_gl(
+ a=self.mu_s, labels_a=ys, b=self.mu_t, M=self.cost_,
+ reg=self.reg_e, eta=self.reg_cl, numItermax=self.max_iter,
+ numInnerItermax=self.max_inner_iter, stopInnerThr=self.tol,
+ verbose=self.verbose, log=self.log)
- return self
+ # deal with the value of log
+ if self.log:
+ self.coupling_, self.log_ = returned_
+ else:
+ self.coupling_ = returned_
+ self.log_ = dict()
+
+ return self
+ else:
+ print("POT-Warning")
+ print("Please, provide both Xs, Xt and ys argument to fit method")
class MappingTransport(BaseEstimator):