Dual OT solvers for entropic and quadratic regularized OT with PyTorch

# Author: Remi Flamary <remi.flamary@polytechnique.edu>
# License: MIT License

# sphinx_gallery_thumbnail_number = 3

import numpy as np
import matplotlib.pyplot as pl
import torch
import ot
import ot.plot

Data generation


# Number of points drawn for the source and target point clouds.
n_source_samples = 100
n_target_samples = 100
# Angle forwarded as `theta` to the "gaussrot" generator for the target set
# (presumably a rotation in radians -- confirm against the POT docs).
theta = 2 * np.pi / 20
# Value forwarded as `nz` to the generator for both sets.
noise_level = 0.1

Xs, ys = ot.datasets.make_data_classif("gaussrot", n_source_samples, nz=noise_level)
Xt, yt = ot.datasets.make_data_classif(
    "gaussrot", n_target_samples, theta=theta, nz=noise_level
)

# one of the target modes changes its variance (no linear mapping)
Xt[yt == 2] *= 3
# shift the whole target cloud away from the source
Xt = Xt + 4

Plot data

# Show both point clouds on a single figure.
pl.figure(1, (10, 5))
pl.scatter(Xs[:, 0], Xs[:, 1], marker="+", label="Source samples")
pl.scatter(Xt[:, 0], Xt[:, 1], marker="o", label="Target samples")
# The scatter calls set `label=`; without a legend those labels are never shown.
pl.legend(loc=0)
# Keep the title call last so it remains the final expression of the cell.
pl.title("Source and target distributions")
Source and target distributions
Text(0.5, 1.0, 'Source and target distributions')

Convert data to torch tensors

Estimating dual variables for entropic OT

# `xs`/`xt` are used by the loss and plan calls below, but no visible statement
# defines them; build them from the NumPy samples.
xs = torch.tensor(Xs)
xt = torch.tensor(Xt)

# Dual variables optimized by Adam: `u` is sized by the source samples and
# `v` by the target samples (both counts are 100 here, so sizing `v` with the
# source count only worked by coincidence).
u = torch.randn(n_source_samples, requires_grad=True)
v = torch.randn(n_target_samples, requires_grad=True)

# entropic regularization strength
reg = 0.5

optimizer = torch.optim.Adam([u, v], lr=1)

# number of iterations
n_iter = 200

# history of the (negated) dual objective, one value per iteration
losses = []

for i in range(n_iter):
    # minus because we maximize the dual loss
    loss = -ot.stochastic.loss_dual_entropic(u, v, xs, xt, reg=reg)
    # Record the value before it is printed: reading `losses[-1]` from an
    # empty list raises IndexError on the first iteration.
    losses.append(loss.item())

    if i % 10 == 0:
        print("Iter: {:3d}, loss={}".format(i, losses[-1]))

    # Gradient step on (u, v); clear the gradients so they do not accumulate.
    loss.backward()
    optimizer.step()
    optimizer.zero_grad()


# Draw the loss curve on its own figure; without `pl.figure` the title below
# would be applied to the current figure (figure 1) instead.
pl.figure(2)
pl.plot(losses)
pl.grid()
pl.title("Dual objective (negative)")
pl.xlabel("Iterations")

# Transport plan computed from the optimized dual variables.
Ge = ot.stochastic.plan_dual_entropic(u, v, xs, xt, reg=reg)
Dual objective (negative)
Iter:   0, loss=0.202049490022473
Iter:  10, loss=-19.713336352860086
Iter:  20, loss=-31.86816382664472
Iter:  30, loss=-36.46142062960647
Iter:  40, loss=-39.34338827964418
Iter:  50, loss=-40.69761727415776
Iter:  60, loss=-41.315846099087345
Iter:  70, loss=-41.68176560915176
Iter:  80, loss=-41.887343644405426
Iter:  90, loss=-41.994980773784704
Iter: 100, loss=-42.032959385774355
Iter: 110, loss=-42.05008691759669
Iter: 120, loss=-42.0595946246367
Iter: 130, loss=-42.06453550965614
Iter: 140, loss=-42.06773551352124
Iter: 150, loss=-42.069799205033185
Iter: 160, loss=-42.07125381567741
Iter: 170, loss=-42.07228832360748
Iter: 180, loss=-42.07305559053532
Iter: 190, loss=-42.07363263844281

Plot the estimated entropic OT plan

# Overlay the entropic plan `Ge` on the two point clouds.
pl.figure(3, (10, 5))
ot.plot.plot2D_samples_mat(Xs, Xt, Ge.detach().numpy(), alpha=0.1)
# zorder=2 keeps the sample markers above what plot2D_samples_mat draws.
pl.scatter(Xs[:, 0], Xs[:, 1], marker="+", label="Source samples", zorder=2)
pl.scatter(Xt[:, 0], Xt[:, 1], marker="o", label="Target samples", zorder=2)
# The scatter calls set `label=`; without a legend those labels are never shown.
pl.legend(loc=0)
# NOTE(review): this title duplicates figure 1's; the quadratic counterpart uses
# "OT plan with quadratic regularization" -- consider an entropic equivalent.
pl.title("Source and target distributions")
Source and target distributions
Text(0.5, 1.0, 'Source and target distributions')

Estimating dual variables for quadratic OT

# `xs`/`xt` are used by the loss and plan calls below, but no visible statement
# defines them; build them from the NumPy samples.
xs = torch.tensor(Xs)
xt = torch.tensor(Xt)

# Dual variables optimized by Adam: `u` is sized by the source samples and
# `v` by the target samples (both counts are 100 here, so sizing `v` with the
# source count only worked by coincidence).
u = torch.randn(n_source_samples, requires_grad=True)
v = torch.randn(n_target_samples, requires_grad=True)

# quadratic regularization strength
reg = 0.01

optimizer = torch.optim.Adam([u, v], lr=1)

# number of iterations
n_iter = 200

# history of the (negated) dual objective, one value per iteration
losses = []

for i in range(n_iter):
    # minus because we maximize the dual loss
    loss = -ot.stochastic.loss_dual_quadratic(u, v, xs, xt, reg=reg)
    # Record the value before it is printed: reading `losses[-1]` from an
    # empty list raises IndexError on the first iteration.
    losses.append(loss.item())

    if i % 10 == 0:
        print("Iter: {:3d}, loss={}".format(i, losses[-1]))

    # Gradient step on (u, v); clear the gradients so they do not accumulate.
    loss.backward()
    optimizer.step()
    optimizer.zero_grad()


# Draw the loss curve on its own figure; without `pl.figure` the title below
# would be applied to whichever figure is current instead.
pl.figure(4)
pl.plot(losses)
pl.grid()
pl.title("Dual objective (negative)")
pl.xlabel("Iterations")

# Transport plan computed from the optimized dual variables.
Gq = ot.stochastic.plan_dual_quadratic(u, v, xs, xt, reg=reg)
Dual objective (negative)
Iter:   0, loss=-0.0018442196020623663
Iter:  10, loss=-19.719719930536872
Iter:  20, loss=-31.585189332659155
Iter:  30, loss=-36.05779112280298
Iter:  40, loss=-39.08217861417628
Iter:  50, loss=-40.480964035493265
Iter:  60, loss=-41.150977366711615
Iter:  70, loss=-41.57215105371474
Iter:  80, loss=-41.752753364835485
Iter:  90, loss=-41.85012696392124
Iter: 100, loss=-41.88723937279083
Iter: 110, loss=-41.90586248692544
Iter: 120, loss=-41.91580820247772
Iter: 130, loss=-41.92163900076693
Iter: 140, loss=-41.9251554466825
Iter: 150, loss=-41.92776411456393
Iter: 160, loss=-41.92942819907569
Iter: 170, loss=-41.930511591420746
Iter: 180, loss=-41.93119684020832
Iter: 190, loss=-41.931649543287755

Plot the estimated quadratic OT plan

# Overlay the quadratic plan `Gq` on the two point clouds.
pl.figure(5, (10, 5))
ot.plot.plot2D_samples_mat(Xs, Xt, Gq.detach().numpy(), alpha=0.1)
# zorder=2 keeps the sample markers above what plot2D_samples_mat draws.
pl.scatter(Xs[:, 0], Xs[:, 1], marker="+", label="Source samples", zorder=2)
pl.scatter(Xt[:, 0], Xt[:, 1], marker="o", label="Target samples", zorder=2)
# The scatter calls set `label=`; without a legend those labels are never shown.
pl.legend(loc=0)
# Keep the title call last so it remains the final expression of the cell.
pl.title("OT plan with quadratic regularization")
OT plan with quadratic regularization
Text(0.5, 1.0, 'OT plan with quadratic regularization')

Total running time of the script: (0 minutes 11.213 seconds)

Gallery generated by Sphinx-Gallery