Briefly.
I am an assistant professor in statistics at ENSAE/CREST.
Previously, I was a Junior AI fellow at Université PSL and worked as a Courant instructor at New York University. I did my Ph.D. under the supervision of Frédéric Chazal and Pascal Massart at Université Paris-Saclay and Inria Saclay.
I am a theoretical statistician that likes geometry. My current interests include statistical optimal transport, fairness in machine learning, geometric inference, and graph Laplacians.
Contact.
- Email: firstname dot lastname at ensae dot fr
- Address: Office 3022, ENSAE
Publications.
2025
Divol, Yann Chaubet Vincent
Minimax spectral estimation of weighted Laplace operators Miscellaneous
2025.
Abstract | Links | BibTeX | Tags: Differential Geometry, Statistics Theory
@misc{nokey,
title = {Minimax spectral estimation of weighted Laplace operators},
author = {Yann Chaubet
Vincent Divol},
url = {https://arxiv.org/abs/2511.22694},
year = {2025},
date = {2025-11-27},
urldate = {2025-11-27},
abstract = {Given n i.i.d. observations, we study the problem of estimating the spectrum of weighted Laplace operators of the form Delta_f=Delta + alpha nabla log fcdot nabla, where f is a positive probability density on a known compact d-dimensional manifold without boundary and alphain mathbb{R} is a hyperparameter. These operators arise as continuum limits of graph Laplacian matrices and provide valuable geometric information on the underlying data distribution. We establish the exact minimax rates of estimation for this problem, by exhibiting two different rates of convergence for eigenfunctions and eigenvalues. When f belongs to a Hölder-Zygmund class mathscr{C}^s of regularity sgeqslant 2, the eigenfunctions can be estimated with respect to the mathrm{L}^q-norm (qgeqslant 1) via plug-in methods at the minimax rate n^{-frac{s+1}{2s+d}} for dgeqslant 3 (with different rates for dleqslant 2). Moreover, eigenvalues can be estimated at the minimax rate n^{-frac{4s}{4s+d}}+n^{-frac 12}. In the regime s>frac d4, we further show that asymptotically efficient estimators exist.
We also present a general framework for estimating nonlinear functionals over Hölder-Zygmund spaces, with potential applications to a broad class of statistical problems.},
keywords = {Differential Geometry, Statistics Theory},
pubstate = {published},
tppubtype = {misc}
}
We also present a general framework for estimating nonlinear functionals over Hölder-Zygmund spaces, with potential applications to a broad class of statistical problems.
Divol, Vincent; Guérin, Hélène; Nguyen, Dinh-Toan; Tran, Viet Chi
Measure estimation on a manifold explored by a diffusion process Journal Article
In: Probability Theory and Related Fields, 2025, (arXiv:2410.11777 [math]).
Abstract | Links | BibTeX | Tags: Differential Geometry, Geometric Inference, Optimal Transport, Statistics Theory
@article{divol_measure_2025,
title = {Measure estimation on a manifold explored by a diffusion process},
author = {Vincent Divol and Hélène Guérin and Dinh-Toan Nguyen and Viet Chi Tran},
url = {https://link.springer.com/article/10.1007/s00440-025-01437-x
http://arxiv.org/abs/2410.11777},
doi = {10.48550/arXiv.2410.11777},
year = {2025},
date = {2025-10-01},
urldate = {2025-10-01},
journal = {Probability Theory and Related Fields},
publisher = {arXiv},
abstract = {From the observation of a diffusion path (Xt)t∈[0,T ] on a compact connected d-dimensional manifold M without boundary, we consider the problem of estimating the stationary measure µ of the process. Wang and Zhu (2023) showed that for the Wasserstein metric W2 and for d ≥ 5, the convergence rate of T −1/(d−2) is attained by the occupation measure of the path (Xt)t∈[0,T ] when (Xt)t∈[0,T ] is a Langevin diffusion. We extend their result in several directions. First, we show that the rate of convergence holds for a large class of diffusion paths, whose generators are uniformly elliptic. Second, the regularity of the density p of the stationary measure µ with respect to the volume measure of M can be leveraged to obtain faster estimators: when p belongs to a Sobolev space of order ℓ ⩾ 2, smoothing the occupation measure by convolution with a kernel yields an estimator whose rate of convergence is of order T −(ℓ+1)/(2ℓ+d−2). We further show that this rate is the minimax rate of estimation for this problem.},
note = {arXiv:2410.11777 [math]},
keywords = {Differential Geometry, Geometric Inference, Optimal Transport, Statistics Theory},
pubstate = {published},
tppubtype = {article}
}
Divol, Vincent; Niles-Weed, Jonathan; Pooladian, Aram-Alexandre
Optimal transport map estimation in general function spaces Journal Article
In: The Annals of Statistics, vol. 53, no. 3, 2025, ISSN: 0090-5364.
Links | BibTeX | Tags: Optimal Transport, Statistics Theory
@article{divol_optimal_2025,
title = {Optimal transport map estimation in general function spaces},
author = {Vincent Divol and Jonathan Niles-Weed and Aram-Alexandre Pooladian},
url = {https://projecteuclid.org/journals/annals-of-statistics/volume-53/issue-3/Optimal-transport-map-estimation-in-general-function-spaces/10.1214/24-AOS2482.full},
doi = {10.1214/24-AOS2482},
issn = {0090-5364},
year = {2025},
date = {2025-06-01},
urldate = {2025-10-23},
journal = {The Annals of Statistics},
volume = {53},
number = {3},
keywords = {Optimal Transport, Statistics Theory},
pubstate = {published},
tppubtype = {article}
}
Divol, Vincent; Niles-Weed, Jonathan; Pooladian, Aram-Alexandre
Tight Stability Bounds for Entropic Brenier Maps Journal Article
In: International Mathematics Research Notices, vol. 2025, no. 7, pp. rnaf078, 2025, ISSN: 1073-7928, (_eprint: https://academic.oup.com/imrn/article-pdf/2025/7/rnaf078/62862069/rnaf078.pdf).
Abstract | Links | BibTeX | Tags: Optimal Transport
@article{divol_tight_2025,
title = {Tight Stability Bounds for Entropic Brenier Maps},
author = {Vincent Divol and Jonathan Niles-Weed and Aram-Alexandre Pooladian},
url = {https://doi.org/10.1093/imrn/rnaf078},
doi = {10.1093/imrn/rnaf078},
issn = {1073-7928},
year = {2025},
date = {2025-04-01},
journal = {International Mathematics Research Notices},
volume = {2025},
number = {7},
pages = {rnaf078},
abstract = {Entropic Brenier maps are regularized analogues of Brenier maps (optimal transport maps) which converge to Brenier maps as the regularization parameter shrinks. In this work, we prove quantitative stability bounds between entropic Brenier maps under variations of the target measure. In particular, when all measures have bounded support, we establish the optimal Lipschitz constant for the mapping from probability measures to entropic Brenier maps. This provides an exponential improvement to a result of Carlier, Chizat, and Laborde (2024). As an application, we prove near-optimal bounds for the stability of semi-discrete unregularized Brenier maps for a family of discrete target measures.},
note = {_eprint: https://academic.oup.com/imrn/article-pdf/2025/7/rnaf078/62862069/rnaf078.pdf},
keywords = {Optimal Transport},
pubstate = {published},
tppubtype = {article}
}
2024
Divol, Vincent; Gaucher, Solenne
Demographic parity in regression and classification within the unawareness framework Miscellaneous
2024, (arXiv:2409.02471 [stat]).
Abstract | Links | BibTeX | Tags: Fairness, Optimal Transport
@misc{divol_demographic_2024,
title = {Demographic parity in regression and classification within the unawareness framework},
author = {Vincent Divol and Solenne Gaucher},
url = {http://arxiv.org/abs/2409.02471},
doi = {10.48550/arXiv.2409.02471},
year = {2024},
date = {2024-09-01},
urldate = {2025-10-23},
publisher = {arXiv},
abstract = {This paper explores the theoretical foundations of fair regression under the constraint of demographic parity within the unawareness framework, where disparate treatment is prohibited, extending existing results where such treatment is permitted. Specifically, we aim to characterize the optimal fair regression function when minimizing the quadratic loss. Our results reveal that this function is given by the solution to a barycenter problem with optimal transport costs. Additionally, we study the connection between optimal fair cost-sensitive classification, and optimal fair regression. We demonstrate that nestedness of the decision sets of the classifiers is both necessary and sufficient to establish a form of equivalence between classification and regression. Under this nestedness assumption, the optimal classifiers can be derived by applying thresholds to the optimal fair regression function; conversely, the optimal fair regression function is characterized by the family of cost-sensitive classifiers.},
note = {arXiv:2409.02471 [stat]},
keywords = {Fairness, Optimal Transport},
pubstate = {published},
tppubtype = {misc}
}
Arnal, Charles; Cohen-Steiner, David; Divol, Vincent
Critical points of the distance function to a generic submanifold Miscellaneous
2024, (arXiv:2312.13147 [math]).
Abstract | Links | BibTeX | Tags: Differential Geometry, Persistence Diagrams
@misc{arnal_critical_2024,
title = {Critical points of the distance function to a generic submanifold},
author = {Charles Arnal and David Cohen-Steiner and Vincent Divol},
url = {http://arxiv.org/abs/2312.13147},
doi = {10.48550/arXiv.2312.13147},
year = {2024},
date = {2024-05-01},
urldate = {2025-10-23},
publisher = {arXiv},
abstract = {In general, the critical points of the distance function $d_textbackslashmathsfM$ to a compact submanifold $textbackslashmathsfM textbackslashsubset textbackslashmathbbRˆD$ can be poorly behaved. In this article, we show that this is generically not the case by listing regularity conditions on the critical and $textbackslashmu$-critical points of a submanifold and by proving that they are generically satisfied and stable with respect to small $Cˆ2$ perturbations. More specifically, for any compact abstract manifold $M$, the set of embeddings $i:Mtextbackslashrightarrow textbackslashmathbbRˆD$ such that the submanifold $i(M)$ satisfies those conditions is open and dense in the Whitney $Cˆ2$-topology. When those regularity conditions are fulfilled, we prove that the distance function to $i(M)$ satisfies Morse-like conditions and that the critical points of the distance function to an $textbackslashvarepsilon$-dense subset of the submanifold (e.g., obtained via some sampling process) are well-behaved. We also provide many examples that showcase how the absence of these conditions allows for pathological situations.},
note = {arXiv:2312.13147 [math]},
keywords = {Differential Geometry, Persistence Diagrams},
pubstate = {published},
tppubtype = {misc}
}
Arnal, Charles; Cohen-Steiner, David; Divol, Vincent
Wasserstein convergence of Čech persistence diagrams for samplings of submanifolds Proceedings Article
In: Globersons, Amir; Mackey, Lester; Belgrave, Danielle; Fan, Angela; Paquet, Ulrich; Tomczak, Jakub M.; Zhang, Cheng (Ed.): Advances in Neural Information Processing Systems 38: Annual Conference on Neural Information Processing Systems 2024, NeurIPS 2024, Vancouver, BC, Canada, December 10 – 15, 2024, pp. 40651–40698, 2024.
Abstract | Links | BibTeX | Tags: Differential Geometry, Optimal Transport, Persistence Diagrams
@inproceedings{arnal_wasserstein_2024,
title = {Wasserstein convergence of Čech persistence diagrams for samplings of submanifolds},
author = {Charles Arnal and David Cohen-Steiner and Vincent Divol},
editor = {Amir Globersons and Lester Mackey and Danielle Belgrave and Angela Fan and Ulrich Paquet and Jakub M. Tomczak and Cheng Zhang},
url = {http://papers.nips.cc/paper_files/paper/2024/hash/47bb4eff6321ae7a11fb6e3352c63125-Abstract-Conference.html},
year = {2024},
date = {2024-01-01},
booktitle = {Advances in Neural Information Processing Systems 38: Annual Conference
on Neural Information Processing Systems 2024, NeurIPS 2024, Vancouver,
BC, Canada, December 10 - 15, 2024},
pages = {40651–40698},
abstract = {ˇCech Persistence diagrams (PDs) are topological descriptors routinely used to capture the geometry of complex datasets. They are commonly compared using the Wasserstein distances OTp; however, the extent to which PDs are stable with respect to these metrics remains poorly understood. We partially close this gap by focusing on the case where datasets are sampled on an m-dimensional submanifold of Rd. Under this manifold hypothesis, we show that convergence with respect to the OTp metric happens exactly when p > m. We also provide improvements upon the bottleneck stability theorem in this case and prove new laws of large numbers for the total α-persistence of PDs. Finally, we show how these theoretical findings shed new light on the behavior of the feature maps on the space of PDs that are used in ML-oriented applications of Topological Data Analysis.},
keywords = {Differential Geometry, Optimal Transport, Persistence Diagrams},
pubstate = {published},
tppubtype = {inproceedings}
}
2023
Pooladian, Aram-Alexandre; Divol, Vincent; Niles-Weed, Jonathan
Minimax estimation of discontinuous optimal transport maps: The semi-discrete case Proceedings Article
In: Krause, Andreas; Brunskill, Emma; Cho, Kyunghyun; Engelhardt, Barbara; Sabato, Sivan; Scarlett, Jonathan (Ed.): International Conference on Machine Learning, ICML 2023, 23-29 July 2023, Honolulu, Hawaii, USA, pp. 28128–28150, PMLR, 2023.
Abstract | Links | BibTeX | Tags: Optimal Transport, Statistics Theory
@inproceedings{pooladian_minimax_2023,
title = {Minimax estimation of discontinuous optimal transport maps: The semi-discrete case},
author = {Aram-Alexandre Pooladian and Vincent Divol and Jonathan Niles-Weed},
editor = {Andreas Krause and Emma Brunskill and Kyunghyun Cho and Barbara Engelhardt and Sivan Sabato and Jonathan Scarlett},
url = {https://proceedings.mlr.press/v202/pooladian23b.html},
year = {2023},
date = {2023-01-01},
booktitle = {International Conference on Machine Learning, ICML 2023, 23-29 July
2023, Honolulu, Hawaii, USA},
volume = {202},
pages = {28128–28150},
publisher = {PMLR},
series = {Proceedings of Machine Learning Research},
abstract = {We consider the problem of estimating the optimal transport map between two probability distributions, P and Q in Rd, on the basis of i.i.d. samples. All existing statistical analyses of this problem require the assumption that the transport map is Lipschitz, a strong requirement that, in particular, excludes any examples where the transport map is discontinuous. As a first step towards developing estimation procedures for discontinuous maps, we consider the important special case where the data distribution Q is a discrete measure supported on a finite number of points in Rd. We study a computationally efficient estimator initially proposed by Pooladian & Niles-Weed (2021), based on entropic optimal transport, and show in the semi-discrete setting that it converges at the minimax-optimal rate n−1/2, independent of dimension. Other standard map estimation techniques both lack finite-sample guarantees in this setting and provably suffer from the curse of dimensionality. We confirm these results in numerical experiments, and provide experiments for other settings, not covered by our theory, which indicate that the entropic estimator is a promising methodology for other discontinuous transport map estimation problems.},
keywords = {Optimal Transport, Statistics Theory},
pubstate = {published},
tppubtype = {inproceedings}
}
2022
Divol, Vincent
Measure estimation on manifolds: an optimal transport approach Journal Article
In: Probability Theory and Related Fields, vol. 183, no. 1-2, pp. 581–647, 2022, ISSN: 0178-8051, 1432-2064.
Abstract | Links | BibTeX | Tags: Differential Geometry, Geometric Inference, Optimal Transport, Statistics Theory
@article{divol_measure_2022,
title = {Measure estimation on manifolds: an optimal transport approach},
author = {Vincent Divol},
url = {https://link.springer.com/10.1007/s00440-022-01118-z},
doi = {10.1007/s00440-022-01118-z},
issn = {0178-8051, 1432-2064},
year = {2022},
date = {2022-06-01},
urldate = {2025-10-23},
journal = {Probability Theory and Related Fields},
volume = {183},
number = {1-2},
pages = {581–647},
abstract = {Assume that we observe i.i.d. points lying close to some unknown d-dimensional Ck submanifold M in a possibly high-dimensional space. We study the problem of reconstructing the probability distribution generating the sample. After remarking that this problem is degenerate for a large class of standard losses (L p, Hellinger, total variation, etc.), we focus on the Wasserstein loss, for which we build an estimator, based on kernel density estimation, whose rate of convergence depends on d and the regularity s ≤ k − 1 of the underlying density, but not on the ambient dimension. In particular, we show that the estimator is minimax and matches previous rates in the literature in the case where the manifold M is a d-dimensional cube. The related problem of the estimation of the volume measure of M for the Wasserstein loss is also considered, for which a minimax estimator is exhibited.},
keywords = {Differential Geometry, Geometric Inference, Optimal Transport, Statistics Theory},
pubstate = {published},
tppubtype = {article}
}
2021
Divol, Vincent; Lacombe, Théo
Understanding the topology and the geometry of the space of persistence diagrams via optimal partial transport Journal Article
In: Journal of Applied and Computational Topology, vol. 5, no. 1, pp. 1–53, 2021, ISSN: 2367-1726, 2367-1734.
Abstract | Links | BibTeX | Tags: Optimal Transport, Persistence Diagrams
@article{divol_understanding_2021,
title = {Understanding the topology and the geometry of the space of persistence diagrams via optimal partial transport},
author = {Vincent Divol and Théo Lacombe},
url = {https://link.springer.com/10.1007/s41468-020-00061-z},
doi = {10.1007/s41468-020-00061-z},
issn = {2367-1726, 2367-1734},
year = {2021},
date = {2021-03-01},
urldate = {2025-10-23},
journal = {Journal of Applied and Computational Topology},
volume = {5},
number = {1},
pages = {1–53},
abstract = {Despite the obvious similarities between the metrics used in topological data analysis and those of optimal transport, an optimal-transport based formalism to study persistence diagrams and similar topological descriptors has yet to come. In this article, by considering the space of persistence diagrams as a space of discrete measures, and by observing that its metrics can be expressed as optimal partial transport problems, we introduce a generalization of persistence diagrams, namely Radon measures supported on the upper half plane. Such measures naturally appear in topological data analysis when considering continuous representations of persistence diagrams (e.g. persistence surfaces) but also as limits for laws of large numbers on persistence diagrams or as expectations of probability distributions on the space of persistence diagrams. We explore topological properties of this new space, which will also hold for the closed subspace of persistence diagrams. New results include a characterization of convergence with respect to Wasserstein metrics, a geometric description of barycenters (Fréchet means) for any distribution of diagrams, and an exhaustive description of continuous linear representations of persistence diagrams. We also showcase the strength of this framework to study random persistence diagrams by providing several statistical results made meaningful thanks to this new formalism.},
keywords = {Optimal Transport, Persistence Diagrams},
pubstate = {published},
tppubtype = {article}
}
Divol, Vincent
A short proof on the rate of convergence of the empirical measure for the Wasserstein distance Miscellaneous
2021, (arXiv:2101.08126 [math]).
Abstract | Links | BibTeX | Tags: Optimal Transport
@misc{divol_short_2021,
title = {A short proof on the rate of convergence of the empirical measure for the Wasserstein distance},
author = {Vincent Divol},
url = {http://arxiv.org/abs/2101.08126},
doi = {10.48550/arXiv.2101.08126},
year = {2021},
date = {2021-01-01},
urldate = {2025-10-23},
publisher = {arXiv},
abstract = {We provide a short proof that the Wasserstein distance between the empirical measure of a n-sample and the estimated measure is of order n−1/d, if the measure has a lower and upper bounded density on the d-dimensional flat torus.},
note = {arXiv:2101.08126 [math]},
keywords = {Optimal Transport},
pubstate = {published},
tppubtype = {misc}
}
Divol, Vincent; Lacombe, Théo
Estimation and Quantization of Expected Persistence Diagrams Proceedings Article
In: Meila, Marina; Zhang, Tong (Ed.): Proceedings of the 38th International Conference on Machine Learning, ICML 2021, 18-24 July 2021, Virtual Event, pp. 2760–2770, PMLR, 2021.
Abstract | Links | BibTeX | Tags: Persistence Diagrams, Statistics Theory
@inproceedings{divol_estimation_2021,
title = {Estimation and Quantization of Expected Persistence Diagrams},
author = {Vincent Divol and Théo Lacombe},
editor = {Marina Meila and Tong Zhang},
url = {http://proceedings.mlr.press/v139/divol21a.html},
year = {2021},
date = {2021-01-01},
booktitle = {Proceedings of the 38th International Conference on Machine Learning,
ICML 2021, 18-24 July 2021, Virtual Event},
volume = {139},
pages = {2760–2770},
publisher = {PMLR},
series = {Proceedings of Machine Learning Research},
abstract = {Persistence diagrams (PDs) are the most common descriptors used to encode the topology of structured data appearing in challenging learning tasks; think e.g. of graphs, time series or point clouds sampled close to a manifold. Given random objects and the corresponding distribution of PDs, one may want to build a statistical summary—such as a mean—of these random PDs, which is however not a trivial task as the natural geometry of the space of PDs is not linear. In this article, we study two such summaries, the Expected Persistence Diagram (EPD), and its quantization. The EPD is a measure supported on R2, which may be approximated by its empirical counterpart. We prove that this estimator is optimal from a minimax standpoint on a large class of models with a parametric rate of convergence. The empirical EPD is simple and efficient to compute, but possibly has a very large support, hindering its use in practice. To overcome this issue, we propose an algorithm to compute a quantization of the empirical EPD, a measure with small support which is shown to approximate with near-optimal rates a quantization of the theoretical EPD.},
keywords = {Persistence Diagrams, Statistics Theory},
pubstate = {published},
tppubtype = {inproceedings}
}
Divol, Vincent
Minimax adaptive estimation in manifold inference Journal Article
In: Electronic Journal of Statistics, vol. 15, no. 2, 2021, ISSN: 1935-7524.
Abstract | Links | BibTeX | Tags: Differential Geometry, Geometric Inference, Statistics Theory
@article{divol_minimax_2021,
title = {Minimax adaptive estimation in manifold inference},
author = {Vincent Divol},
url = {https://projecteuclid.org/journals/electronic-journal-of-statistics/volume-15/issue-2/Minimax-adaptive-estimation-in-manifold-inference/10.1214/21-EJS1934.full},
doi = {10.1214/21-EJS1934},
issn = {1935-7524},
year = {2021},
date = {2021-01-01},
urldate = {2025-10-23},
journal = {Electronic Journal of Statistics},
volume = {15},
number = {2},
abstract = {We focus on the problem of manifold estimation: given a set of observations sampled close to some unknown submanifold M , one wants to recover information about the geometry of M . Minimax estimators which have been proposed so far all depend crucially on the a priori knowledge of parameters quantifying the underlying distribution generating the sample (such as bounds on its density), whereas those quantities will be unknown in practice. Our contribution to the matter is twofold. First, we introduce a one-parameter family of manifold estimators (Mˆ t)t≥0 based on a localized version of convex hulls, and show that for some choice of t, the corresponding estimator is minimax on the class of models of C2 manifolds introduced in [21]. Second, we propose a completely data-driven selection procedure for the parameter t, leading to a minimax adaptive manifold estimator on this class of models. This selection procedure actually allows us to recover the Hausdorff distance between the set of observations and M , and can therefore be used as a scale parameter in other settings, such as tangent space estimation.},
keywords = {Differential Geometry, Geometric Inference, Statistics Theory},
pubstate = {published},
tppubtype = {article}
}
2019
Divol, Vincent; Polonik, Wolfgang
On the choice of weight functions for linear representations of persistence diagrams Journal Article
In: Journal of Applied and Computational Topology, vol. 3, no. 3, pp. 249–283, 2019, ISSN: 2367-1726, 2367-1734.
Abstract | Links | BibTeX | Tags: Persistence Diagrams
@article{divol_choice_2019,
title = {On the choice of weight functions for linear representations of persistence diagrams},
author = {Vincent Divol and Wolfgang Polonik},
url = {http://link.springer.com/10.1007/s41468-019-00032-z},
doi = {10.1007/s41468-019-00032-z},
issn = {2367-1726, 2367-1734},
year = {2019},
date = {2019-09-01},
urldate = {2025-10-23},
journal = {Journal of Applied and Computational Topology},
volume = {3},
number = {3},
pages = {249–283},
abstract = {Persistence diagrams are efficient descriptors of the topology of a point cloud. As they do not naturally belong to a Hilbert space, standard statistical methods cannot be directly applied to them. Instead, feature maps (or representations) are commonly used for the analysis. A large class of feature maps, which we call linear, depends on some weight functions, the choice of which is a critical issue. An important criterion to choose a weight function is to ensure stability of the feature maps with respect to Wasserstein distances on diagrams. We improve known results on the stability of such maps, and extend it to general weight functions. We also address the choice of the weight function by considering an asymptotic setting; assume that Xn is an i.i.d. sample from a density on [0, 1]d . For the Cˇ ech and Rips filtrations, we characterize the weight functions for which the corresponding feature maps converge as n approaches infinity, and by doing so, we prove laws of large numbers for the total persistences of such diagrams. Those two approaches (stability and convergence) lead to the same simple heuristic for tuning weight functions: if the data lies near a d-dimensional manifold, then a sensible choice of weight function is the persistence to the power α with α ≥ d.},
keywords = {Persistence Diagrams},
pubstate = {published},
tppubtype = {article}
}
Chazal, Frédéric; Divol, Vincent
The density of expected persistence diagrams and its kernel based estimation Journal Article
In: Journal of Computational Geometry, vol. 10, no. 2, pp. 127–153, 2019.
Abstract | Links | BibTeX | Tags: Persistence Diagrams, Statistics Theory
@article{chazal_density_2019,
title = {The density of expected persistence diagrams and its kernel based estimation},
author = {Frédéric Chazal and Vincent Divol},
url = {https://jocg.org/index.php/jocg/article/download/3090/2817/},
year = {2019},
date = {2019-01-01},
journal = {Journal of Computational Geometry},
volume = {10},
number = {2},
pages = {127–153},
abstract = {Persistence diagrams play a fundamental role in Topological Data Analysis where they are used as topological descriptors of filtrations built on top of data. They consist in discrete multisets of points in the plane R2 that can equivalently be seen as discrete measures in R2. When the data is assumed to be random, these discrete measures become random measures whose expectation is studied in this paper. First, we show that for a wide class of filtrations, including the Čech and Vietoris-Rips filtrations, but also the sublevels of a Brownian motion, the expected persistence diagram, that is a deterministic measure on R2, has a density with respect to the Lebesgue measure. Second, building on the previous result we show that the persistence surface recently introduced in Adams et al. [2017] can be seen as a kernel estimator of this density. We propose a cross-validation scheme for selecting an optimal bandwidth, which is proven to be a consistent procedure to estimate the density.},
keywords = {Persistence Diagrams, Statistics Theory},
pubstate = {published},
tppubtype = {article}
}