{ "id": "2310.03398", "version": "v1", "published": "2023-10-05T09:04:53.000Z", "updated": "2023-10-05T09:04:53.000Z", "title": "Interpolating between Clustering and Dimensionality Reduction with Gromov-Wasserstein", "authors": [ "Hugues Van Assel", "Cédric Vincent-Cuaz", "Titouan Vayer", "Rémi Flamary", "Nicolas Courty" ], "categories": [ "cs.LG", "stat.ML" ], "abstract": "We present a versatile adaptation of existing dimensionality reduction (DR) objectives, enabling the simultaneous reduction of both sample and feature sizes. Correspondences between input and embedding samples are computed through a semi-relaxed Gromov-Wasserstein optimal transport (OT) problem. When the embedding sample size matches that of the input, our model recovers classical popular DR models. When the embedding's dimensionality is unconstrained, we show that the OT plan delivers a competitive hard clustering. We emphasize the importance of intermediate stages that blend DR and clustering for summarizing real data and apply our method to visualize datasets of images.", "revisions": [ { "version": "v1", "updated": "2023-10-05T09:04:53.000Z" } ], "analyses": { "keywords": [ "dimensionality reduction", "clustering", "semi-relaxed gromov-wasserstein optimal transport", "ot plan delivers", "classical popular dr models" ], "note": { "typesetting": "TeX", "pages": 0, "language": "en", "license": "arXiv", "status": "editable" } } }