{ "id": "2310.20053", "version": "v1", "published": "2023-10-30T22:16:51.000Z", "updated": "2023-10-30T22:16:51.000Z", "title": "Estimating optimal PAC-Bayes bounds with Hamiltonian Monte Carlo", "authors": [ "Szilvia Ujváry", "Gergely Flamich", "Vincent Fortuin", "José Miguel Hernández Lobato" ], "comment": "Mathematics of Modern Machine Learning Workshop at NeurIPS 2023", "categories": [ "stat.ML", "cs.LG" ], "abstract": "An important yet underexplored question in the PAC-Bayes literature is how much tightness we lose by restricting the posterior family to factorized Gaussian distributions when optimizing a PAC-Bayes bound. We investigate this issue by estimating data-independent PAC-Bayes bounds using the optimal posteriors, comparing them to bounds obtained using MFVI. Concretely, we (1) sample from the optimal Gibbs posterior using Hamiltonian Monte Carlo, (2) estimate its KL divergence from the prior with thermodynamic integration, and (3) propose three methods to obtain high-probability bounds under different assumptions. Our experiments on the MNIST dataset reveal significant tightness gaps, as much as 5-6\\% in some cases.", "revisions": [ { "version": "v1", "updated": "2023-10-30T22:16:51.000Z" } ], "analyses": { "subjects": [ "G.3" ], "keywords": [ "estimating optimal pac-bayes bounds", "hamiltonian monte carlo", "dataset reveal significant tightness gaps", "mnist dataset reveal significant tightness" ], "note": { "typesetting": "TeX", "pages": 0, "language": "en", "license": "arXiv", "status": "editable" } } }