@phdthesis{12366,
  abstract     = {Recent substantial advances in the feld of superconducting circuits have shown its
potential as a leading platform for future quantum computing. In contrast to classical
computers based on bits that are represented by a single binary value, 0 or 1, quantum
bits (or qubits) can be in a superposition of both. Thus, quantum computers can store
and handle more information at the same time and a quantum advantage has already
been demonstrated for two types of computational tasks. Rapid progress in academic
and industry labs accelerates the development of superconducting processors which may
soon fnd applications in complex computations, chemical simulations, cryptography, and
optimization. Now that these machines are scaled up to tackle such problems the questions
of qubit interconnects and networks becomes very relevant. How to route signals on-chip
between diferent processor components? What is the most efcient way to entangle
qubits? And how to then send and process entangled signals between distant cryostats
hosting superconducting processors?
In this thesis, we are looking for solutions to these problems by studying the collective
behavior of superconducting qubit ensembles. We frst demonstrate on-demand tunable
directional scattering of microwave photons from a pair of qubits in a waveguide. Such a
device can route microwave photons on-chip with a high diode efciency. Then we focus
on studying ultra-strong coupling regimes between light (microwave photons) and matter
(superconducting qubits), a regime that could be promising for extremely fast multi-qubit
entanglement generation. Finally, we show coherent pulse storage and periodic revivals
in a fve qubit ensemble strongly coupled to a resonator. Such a reconfgurable storage
device could be used as part of a quantum repeater that is needed for longer-distance
quantum communication.
The achieved high degree of control over multi-qubit ensembles highlights not only the
beautiful physics of circuit quantum electrodynamics, it also represents the frst step
toward new quantum simulation and communication methods, and certain techniques
may also fnd applications in future superconducting quantum computing hardware.
},
  author       = {Redchenko, Elena},
  isbn         = {978-3-99078-024-4},
  issn         = {2663-337X},
  pages        = {168},
  publisher    = {Institute of Science and Technology Austria},
  title        = {{Controllable states of superconducting Qubit ensembles}},
  doi          = {10.15479/at:ista:12132},
  year         = {2022},
}

@phdthesis{12368,
  abstract     = {Metazoan development relies on the formation and remodeling of cell-cell contacts. The 
binding of adhesion receptors and remodeling of the actomyosin cell cortex at cell-cell 
interaction sites have been implicated in cell-cell contact formation. Yet, how these two 
processes functionally interact to drive cell-cell contact expansion and strengthening 
remains unclear. Here, we study how primary germ layer progenitor cells from zebrafish 
bind to supported lipid bilayers (SLB) functionalized with E-cadherin ectodomains as an 
assay system for monitoring cell-cell contact formation at high spatiotemporal resolution. 
We show that cell-cell contact formation represents a two-tiered process: E-cadherinmediated downregulation of the small GTPase RhoA at the forming contact leads to both 
depletion of Myosin-2 and decrease of F-actin. This is followed by centrifugal actin 
network flows at the contact triggered by a sharp gradient of Myosin-2 at the rim of the 
contact zone, with Myosin-2 displaying higher cortical localization outside than inside of 
the contact. These centrifugal cortical actin flows, in turn, not only further dilute the actin 
network at the contact disc, but also lead to an accumulation of both F-actin and Ecadherin at the contact rim. Eventually, this combination of actomyosin downregulation 
and flows at the contact contribute to the characteristic molecular organization implicated 
in contact formation and maintenance: depletion of cortical actomyosin at the contact disc, 
driving contact expansion by lowering interfacial tension at the contact, and accumulation 
of both E-cadherin and F-actin at the contact rim, mechanically linking the contractile 
cortices of the adhering cells. Thus, using a biomimetic assay, we exemplify how 
adhesion signaling and cell mechanics function together to modulate the spatial 
organization of cell-cell contacts.},
  author       = {Arslan, Feyza N},
  isbn         = { 978-3-99078-025-1 },
  issn         = {2663-337X},
  pages        = {113},
  publisher    = {Institute of Science and Technology Austria},
  title        = {{Remodeling of E-cadherin-mediated contacts via cortical  flows}},
  doi          = {10.15479/at:ista:12153},
  year         = {2022},
}

@phdthesis{12378,
  abstract     = {Environmental cues influence the highly dynamic morphology of microglia. Strategies to 
characterize these changes usually involve user-selected morphometric features, which 
preclude the identification of a spectrum of context-dependent morphological phenotypes. 
Here, we develop MorphOMICs, a topological data analysis approach, which enables semiautomatic mapping of microglial morphology into an atlas of cue-dependent phenotypes,
overcomes feature-selection bias and minimizes biological variability. 
First, with MorphOMICs we derive the morphological spectrum of microglia across seven 
brain regions during postnatal development and in two distinct Alzheimer’s disease 
degeneration mouse models. We uncover region-specific and sexually dimorphic
morphological trajectories, with females showing an earlier morphological shift than males in 
the degenerating brain. Overall, we demonstrate that both long primary- and short terminal 
processes provide distinct insights to morphological phenotypes. Moreover, using machine 
learning to map novel condition on the spectrum, we observe that microglia morphologies 
reflect a dose-dependent adaptation upon ketamine anesthesia and do not recover to control 
morphologies.
Next, we took advantage of MorphOMICs to build a high-resolution and layer-specific map of 
microglial morphological spectrum in the retina, covering postnatal development and rd10 
degeneration. Here, following photoreceptor death, microglia assume an early developmentlike morphology. Finally, we map microglial morphology following optic nerve crush on the 
retinal spectrum and observe a layer- and sex-dependent response. 
Overall, MorphOMICs opens a new perspective to analyze microglial morphology across 
multiple conditions, and provides a novel tool to characterize microglial morphology beyond 
the traditionally dichotomized view of microglia.},
  author       = {Colombo, Gloria},
  issn         = {2663-337X},
  pages        = {142},
  publisher    = {Institute of Science and Technology Austria},
  title        = {{MorphOMICs, a tool for mapping microglial morphology, reveals brain region- and sex-dependent phenotypes}},
  doi          = {10.15479/at:ista:12378},
  year         = {2022},
}

@phdthesis{12390,
  abstract     = {The scope of this thesis is to study quantum systems exhibiting a continuous symmetry that
is broken on the level of the corresponding effective theory. In particular we are going to
investigate translation-invariant Bose gases in the mean field limit, effectively described by
the Hartree functional, and the Fröhlich Polaron in the regime of strong coupling, effectively
described by the Pekar functional. The latter is a model describing the interaction between a
charged particle and the optical modes of a polar crystal. Regarding the former, we assume in
addition that the particles in the gas are unconfined, and typically we will consider particles
that are subject to an attractive interaction. In both cases the ground state energy of the
Hamiltonian is not a proper eigenvalue due to the underlying translation-invariance, while on
the contrary there exists a whole invariant orbit of minimizers for the corresponding effective
functionals. Both, the absence of proper eigenstates and the broken symmetry of the effective
theory, make the study significantly more involved and it is the content of this thesis to
develop a frameworks which allows for a systematic way to circumvent these issues.
It is a well-established result that the ground state energy of Bose gases in the mean field limit,
as well as the ground state energy of the Fröhlich Polaron in the regime of strong coupling, is
to leading order given by the minimal energy of the corresponding effective theory. As part
of this thesis we identify the sub-leading term in the expansion of the ground state energy,
which can be interpreted as the quantum correction to the classical energy, since the effective
theories under consideration can be seen as classical counterparts.
We are further going to establish an asymptotic expression for the energy-momentum relation
of the Fröhlich Polaron in the strong coupling limit. In the regime of suitably small momenta,
this asymptotic expression agrees with the energy-momentum relation of a free particle having
an effectively increased mass, and we find that this effectively increased mass agrees with the
conjectured value in the physics literature.
In addition we will discuss two unrelated papers written by the author during his stay at ISTA
in the appendix. The first one concerns the realization of anyons, which are quasi-particles
acquiring a non-trivial phase under the exchange of two particles, as molecular impurities.
The second one provides a classification of those vector fields defined on a given manifold
that can be written as the gradient of a given functional with respect to a suitable metric,
provided that some mild smoothness assumptions hold. This classification is subsequently
used to identify those quantum Markov semigroups that can be written as a gradient flow of
the relative entropy.
},
  author       = {Brooks, Morris},
  issn         = {2663-337X},
  pages        = {196},
  publisher    = {Institute of Science and Technology Austria},
  title        = {{Translation-invariant quantum systems with effectively broken symmetry}},
  doi          = {10.15479/at:ista:12390},
  year         = {2022},
}

@phdthesis{12401,
  abstract     = {Detachment of the cancer cells from the bulk of the tumor is the first step of metastasis, which
is the primary cause of cancer related deaths. It is unclear, which factors contribute to this step.
Recent studies indicate a crucial role of the tumor microenvironment in malignant
transformation and metastasis. Studying cancer cell invasion and detachments quantitatively in
the context of its physiological microenvironment is technically challenging. Especially, precise
control of microenvironmental properties in vivo is currently not possible. Here, I studied the
role of microenvironment geometry in the invasion and detachment of cancer cells from the
bulk with a simplistic and reductionist approach. In this approach, I engineered microfluidic
devices to mimic a pseudo 3D extracellular matrix environment, where I was able to
quantitatively tune the geometrical configuration of the microenvironment and follow tumor
cells with fluorescence live imaging. To aid quantitative analysis I developed a widely applicable
software application to automatically analyze and visualize particle tracking data.
Quantitative analysis of tumor cell invasion in isotropic and anisotropic microenvironments
showed that heterogeneity in the microenvironment promotes faster invasion and more
frequent detachment of cells. These observations correlated with overall higher speed of cells at
the edge of the bulk of the cells. In heterogeneous microenvironments cells preferentially
passed through larger pores, thus invading areas of least resistance and generating finger-like
invasive structures. The detachments occurred mostly at the tips of these structures.
To investigate the potential mechanism, we established a two dimensional model to simulate
active Brownian particles representing the cell nuclei dynamics. These simulations backed our in
vitro observations without the need of precise fitting the simulation parameters. Our model
suggests the importance of the pore heterogeneity in the direction perpendicular to the
orientation of bias field (lateral heterogeneity), which causes the interface roughening.},
  author       = {Tasciyan, Saren},
  issn         = {2663-337X},
  pages        = {105},
  publisher    = {Institute of Science and Technology Austria},
  title        = {{Role of microenvironment heterogeneity in cancer cell invasion}},
  doi          = {10.15479/at:ista:12401},
  year         = {2022},
}

@article{12431,
  abstract     = {This paper presents a new representation of curve dynamics, with applications to vortex filaments in fluid dynamics. Instead of representing these filaments with explicit curve geometry and Lagrangian equations of motion, we represent curves implicitly with a new co-dimensional 2 level set description. Our implicit representation admits several redundant mathematical degrees of freedom in both the configuration and the dynamics of the curves, which can be tailored specifically to improve numerical robustness, in contrast to naive approaches for implicit curve dynamics that suffer from overwhelming numerical stability problems. Furthermore, we note how these hidden degrees of freedom perfectly map to a Clebsch representation in fluid dynamics. Motivated by these observations, we introduce untwisted level set functions and non-swirling dynamics which successfully regularize sources of numerical instability, particularly in the twisting modes around curve filaments. A consequence is a novel simulation method which produces stable dynamics for large numbers of interacting vortex filaments and effortlessly handles topological changes and re-connection events.},
  author       = {Ishida, Sadashige and Wojtan, Christopher J and Chern, Albert},
  issn         = {1557-7368},
  journal      = {ACM Transactions on Graphics},
  number       = {6},
  publisher    = {Association for Computing Machinery},
  title        = {{Hidden degrees of freedom in implicit vortex filaments}},
  doi          = {10.1145/3550454.3555459},
  volume       = {41},
  year         = {2022},
}

@inproceedings{12432,
  abstract     = {We present CertifyHAM, a deterministic algorithm that takes a graph G as input and either finds a Hamilton cycle of G or outputs that such a cycle does not exist. If G ∼ G(n, p) and p ≥
100 log n/n then the expected running time of CertifyHAM is O(n/p) which is best possible. This improves upon previous results due to Gurevich and Shelah, Thomason and Alon, and
Krivelevich, who proved analogous results for p being constant, p ≥ 12n −1/3 and p ≥ 70n
−1/2 respectively.},
  author       = {Anastos, Michael},
  booktitle    = {63rd Annual IEEE Symposium on Foundations of Computer Science},
  isbn         = {9781665455190},
  issn         = {0272-5428},
  location     = {Denver, CO, United States},
  pages        = {919--930},
  publisher    = {Institute of Electrical and Electronics Engineers},
  title        = {{Solving the Hamilton cycle problem fast on average}},
  doi          = {10.1109/FOCS54457.2022.00091},
  volume       = {2022-October},
  year         = {2022},
}

@inproceedings{12452,
  abstract     = {Portrait viewpoint and illumination editing is an important problem with several applications in VR/AR, movies, and photography. Comprehensive knowledge of geometry and illumination is critical for obtaining photorealistic results. Current methods are unable to explicitly model in 3D while handing both viewpoint and illumination editing from a single image. In this paper, we propose VoRF, a novel approach that can take even a single portrait image as input and relight human heads under novel illuminations that can be viewed from arbitrary viewpoints. VoRF represents a human head as a continuous volumetric field and learns a prior model of human heads using a coordinate-based MLP with separate latent spaces for identity and illumination. The prior model is learnt in an auto-decoder manner over a diverse class of head shapes and appearances, allowing VoRF to generalize to novel test identities from a single input image. Additionally, VoRF has a reflectance MLP that uses the intermediate features of the prior model for rendering One-Light-at-A-Time (OLAT) images under novel views. We synthesize novel illuminations by combining these OLAT images with target environment maps. Qualitative and quantitative evaluations demonstrate the effectiveness of VoRF for relighting and novel view synthesis even when applied to unseen subjects under uncontrolled illuminations.},
  author       = {Rao, Pramod and B R, Mallikarjun and Fox, Gereon and Weyrich, Tim and Bickel, Bernd and Seidel, Hans-Peter and Pfister, Hanspeter and Matusik, Wojciech and Tewari, Ayush and Theobalt, Christian and Elgharib, Mohamed},
  booktitle    = {33rd British Machine Vision Conference},
  location     = {London, United Kingdom},
  publisher    = {British Machine Vision Association and Society for Pattern Recognition},
  title        = {{VoRF: Volumetric Relightable Faces}},
  year         = {2022},
}

@article{12480,
  abstract     = {We consider the problem of estimating a signal from measurements obtained via a generalized linear model. We focus on estimators based on approximate message passing (AMP), a family of iterative algorithms with many appealing features: the performance of AMP in the high-dimensional limit can be succinctly characterized under suitable model assumptions; AMP can also be tailored to the empirical distribution of the signal entries, and for a wide class of estimation problems, AMP is conjectured to be optimal among all polynomial-time algorithms. However, a major issue of AMP is that in many models (such as phase retrieval), it requires an initialization correlated with the ground-truth signal and independent from the measurement matrix. Assuming that such an initialization is available is typically not realistic. In this paper, we solve this problem by proposing an AMP algorithm initialized with a spectral estimator. With such an initialization, the standard AMP analysis fails since the spectral estimator depends in a complicated way on the design matrix. Our main contribution is a rigorous characterization of the performance of AMP with spectral initialization in the high-dimensional limit. The key technical idea is to define and analyze a two-phase artificial AMP algorithm that first produces the spectral estimator, and then closely approximates the iterates of the true AMP. We also provide numerical results that demonstrate the validity of the proposed approach.},
  author       = {Mondelli, Marco and Venkataramanan, Ramji},
  issn         = {1742-5468},
  journal      = {Journal of Statistical Mechanics: Theory and Experiment},
  keywords     = {Statistics, Probability and Uncertainty, Statistics and Probability, Statistical and Nonlinear Physics},
  number       = {11},
  publisher    = {IOP Publishing},
  title        = {{Approximate message passing with spectral initialization for generalized linear models}},
  doi          = {10.1088/1742-5468/ac9828},
  volume       = {2022},
  year         = {2022},
}

@article{12495,
  abstract     = {Fairness-aware learning aims at constructing classifiers that not only make accurate predictions, but also do not discriminate against specific groups. It is a fast-growing area of
machine learning with far-reaching societal impact. However, existing fair learning methods
are vulnerable to accidental or malicious artifacts in the training data, which can cause
them to unknowingly produce unfair classifiers. In this work we address the problem of
fair learning from unreliable training data in the robust multisource setting, where the
available training data comes from multiple sources, a fraction of which might not be representative of the true data distribution. We introduce FLEA, a filtering-based algorithm
that identifies and suppresses those data sources that would have a negative impact on
fairness or accuracy if they were used for training. As such, FLEA is not a replacement of
prior fairness-aware learning methods but rather an augmentation that makes any of them
robust against unreliable training data. We show the effectiveness of our approach by a
diverse range of experiments on multiple datasets. Additionally, we prove formally that
–given enough data– FLEA protects the learner against corruptions as long as the fraction of
affected data sources is less than half. Our source code and documentation are available at
https://github.com/ISTAustria-CVML/FLEA.},
  author       = {Iofinova, Eugenia B and Konstantinov, Nikola H and Lampert, Christoph},
  issn         = {2835-8856},
  journal      = {Transactions on Machine Learning Research},
  publisher    = {ML Research Press},
  title        = {{FLEA: Provably robust fair multisource learning from unreliable training data}},
  year         = {2022},
}

@inproceedings{12508,
  abstract     = {We explore the notion of history-determinism in the context of timed automata (TA). History-deterministic automata are those in which nondeterminism can be resolved on the fly, based on the run constructed thus far. History-determinism is a robust property that admits different game-based characterisations, and history-deterministic specifications allow for game-based verification without an expensive determinization step.
We show yet another characterisation of history-determinism in terms of fair simulation, at the general level of labelled transition systems: a system is history-deterministic precisely if and only if it fairly simulates all language smaller systems.
For timed automata over infinite timed words it is known that universality is undecidable for Büchi TA. We show that for history-deterministic TA with arbitrary parity acceptance, timed universality, inclusion, and synthesis all remain decidable and are ExpTime-complete.
For the subclass of TA with safety or reachability acceptance, we show that checking whether such an automaton is history-deterministic is decidable (in ExpTime), and history-deterministic TA with safety acceptance are effectively determinizable without introducing new automata states.},
  author       = {Henzinger, Thomas A and Lehtinen, Karoliina and Totzke, Patrick},
  booktitle    = {33rd International Conference on Concurrency Theory},
  isbn         = {9783959772464},
  issn         = {1868-8969},
  location     = {Warsaw, Poland},
  pages        = {14:1--14:21},
  publisher    = {Schloss Dagstuhl - Leibniz-Zentrum für Informatik},
  title        = {{History-deterministic timed automata}},
  doi          = {10.4230/LIPIcs.CONCUR.2022.14},
  volume       = {243},
  year         = {2022},
}

@inproceedings{12509,
  abstract     = {A graph game is a two-player zero-sum game in which the players move a token throughout a graph to produce an infinite path, which determines the winner or payoff of the game. In bidding games, both players have budgets, and in each turn, we hold an "auction" (bidding) to determine which player moves the token. In this survey, we consider several bidding mechanisms and their effect on the properties of the game. Specifically, bidding games, and in particular bidding games of infinite duration, have an intriguing equivalence with random-turn games in which in each turn, the player who moves is chosen randomly. We summarize how minor changes in the bidding mechanism lead to unexpected differences in the equivalence with random-turn games.},
  author       = {Avni, Guy and Henzinger, Thomas A},
  booktitle    = {47th International Symposium on Mathematical Foundations of Computer Science},
  isbn         = {9783959772563},
  issn         = {1868-8969},
  location     = {Vienna, Austria},
  pages        = {3:1--3:6},
  publisher    = {Schloss Dagstuhl - Leibniz-Zentrum für Informatik},
  title        = {{An updated survey of bidding games on graphs}},
  doi          = {10.4230/LIPIcs.MFCS.2022.3},
  volume       = {241},
  year         = {2022},
}

@article{12510,
  abstract     = {We introduce a new statistical verification algorithm that formally quantifies the behavioral robustness of any time-continuous process formulated as a continuous-depth model. Our algorithm solves a set of global optimization (Go) problems over a given time horizon to construct a tight enclosure (Tube) of the set of all process executions starting from a ball of initial states. We call our algorithm GoTube. Through its construction, GoTube ensures that the bounding tube is conservative up to a desired probability and up to a desired tightness.
 GoTube is implemented in JAX and optimized to scale to complex continuous-depth neural network models. Compared to advanced reachability analysis tools for time-continuous neural networks, GoTube does not accumulate overapproximation errors between time steps and avoids the infamous wrapping effect inherent in symbolic techniques. We show that GoTube substantially outperforms state-of-the-art verification tools in terms of the size of the initial ball, speed, time-horizon, task completion, and scalability on a large set of experiments.
 GoTube is stable and sets the state-of-the-art in terms of its ability to scale to time horizons well beyond what has been previously possible.},
  author       = {Gruenbacher, Sophie A. and Lechner, Mathias and Hasani, Ramin and Rus, Daniela and Henzinger, Thomas A and Smolka, Scott A. and Grosu, Radu},
  isbn         = {978577358350},
  issn         = {2374-3468},
  journal      = {Proceedings of the AAAI Conference on Artificial Intelligence},
  keywords     = {General Medicine},
  number       = {6},
  pages        = {6755--6764},
  publisher    = {Association for the Advancement of Artificial Intelligence},
  title        = {{GoTube: Scalable statistical verification of continuous-depth models}},
  doi          = {10.1609/aaai.v36i6.20631},
  volume       = {36},
  year         = {2022},
}

@article{12511,
  abstract     = {We consider the problem of formally verifying almost-sure (a.s.) asymptotic stability in discrete-time nonlinear stochastic control systems. While verifying stability in deterministic control systems is extensively studied in the literature, verifying stability in stochastic control systems is an open problem. The few existing works on this topic either consider only specialized forms of stochasticity or make restrictive assumptions on the system, rendering them inapplicable to learning algorithms with neural network policies. 
 In this work, we present an approach for general nonlinear stochastic control problems with two novel aspects: (a) instead of classical stochastic extensions of Lyapunov functions, we use ranking supermartingales (RSMs) to certify a.s. asymptotic stability, and (b) we present a method for learning neural network RSMs. 
 We prove that our approach guarantees a.s. asymptotic stability of the system and
 provides the first method to obtain bounds on the stabilization time, which stochastic Lyapunov functions do not.
 Finally, we validate our approach experimentally on a set of nonlinear stochastic reinforcement learning environments with neural network policies.},
  author       = {Lechner, Mathias and Zikelic, Dorde and Chatterjee, Krishnendu and Henzinger, Thomas A},
  isbn         = {9781577358350},
  issn         = {2374-3468},
  journal      = {Proceedings of the AAAI Conference on Artificial Intelligence},
  keywords     = {General Medicine},
  number       = {7},
  pages        = {7326--7336},
  publisher    = {Association for the Advancement of Artificial Intelligence},
  title        = {{Stability verification in stochastic control systems via neural network supermartingales}},
  doi          = {10.1609/aaai.v36i7.20695},
  volume       = {36},
  year         = {2022},
}

@inproceedings{12516,
  abstract     = {The homogeneous continuous LWE (hCLWE) problem is to distinguish samples of a specific high-dimensional Gaussian mixture from standard normal samples. It was shown to be at least as hard as Learning with Errors, but no reduction in the other direction is currently known.
We present four new public-key encryption schemes based on the hardness of hCLWE, with varying tradeoffs between decryption and security errors, and different discretization techniques. Our schemes yield a polynomial-time algorithm for solving hCLWE using a Statistical Zero-Knowledge oracle.},
  author       = {Bogdanov, Andrej and Cueto Noval, Miguel and Hoffmann, Charlotte and Rosen, Alon},
  booktitle    = {Theory of Cryptography},
  isbn         = {9783031223648},
  issn         = {1611-3349},
  location     = {Chicago, IL, United States},
  pages        = {565--592},
  publisher    = {Springer Nature},
  title        = {{Public-Key Encryption from Homogeneous CLWE}},
  doi          = {10.1007/978-3-031-22365-5_20},
  volume       = {13748},
  year         = {2022},
}

@misc{12522,
  abstract     = {This .zip File contains the transport data, the codes for the data analysis, the microscopy analysis and the codes for the theoretical simulations for "Majorana-like Coulomb spectroscopy in the absence of zero bias peaks" by M. Valentini, et. al. The transport data are saved with hdf5 file format. The files can be open with the log browser of Labber.},
  author       = {Valentini, Marco and San-Jose, Pablo and Arbiol, Jordi and Marti-Sanchez, Sara and Botifoll, Marc},
  publisher    = {Institute of Science and Technology Austria},
  title        = {{Data for "Majorana-like Coulomb spectroscopy in the absence of zero bias peaks"}},
  doi          = {10.15479/AT:ISTA:12102},
  year         = {2022},
}

@unpublished{12536,
  abstract     = {We consider the problem of estimating a rank-1 signal corrupted by structured rotationally invariant noise, and address the following question: how well do inference algorithms perform when the noise statistics is unknown and hence Gaussian noise is assumed? While the matched Bayes-optimal setting with unstructured noise is well understood, the analysis of this mismatched problem is only at its premises. In this paper, we make a step towards understanding the effect of the strong source of mismatch which is the noise statistics. Our main technical contribution is the rigorous analysis of a Bayes estimator and of an approximate message passing (AMP) algorithm, both of which incorrectly assume a Gaussian setup. The first result exploits the theory of spherical integrals and of low-rank matrix perturbations; the idea behind the second one is to design and analyze an artificial AMP which, by taking advantage of the flexibility in the denoisers, is able to "correct" the mismatch. Armed with these sharp asymptotic characterizations, we unveil a rich and often unexpected phenomenology. For example, despite AMP is in principle designed to efficiently compute the Bayes estimator, the former is outperformed by the latter in terms of mean-square error. We show that this performance gap is due to an incorrect estimation of the signal norm. In fact, when the SNR is large enough, the overlaps of the AMP and the Bayes estimator coincide, and they even match those of optimal estimators taking into account the structure of the noise.},
  author       = {Barbier, Jean and Hou, TianQi and Mondelli, Marco and Saenz, Manuel},
  booktitle    = {arXiv},
  title        = {{The price of ignorance: How much does it cost to forget noise structure in low-rank matrix estimation?}},
  doi          = {10.48550/arXiv.2205.10009},
  year         = {2022},
}

@inproceedings{12537,
  abstract     = {The Neural Tangent Kernel (NTK) has emerged as a powerful tool to provide memorization, optimization and generalization guarantees in deep neural networks. A line of work has studied the NTK spectrum for two-layer and deep networks with at least a layer with Ω(N) neurons, N being the number of training samples. Furthermore, there is increasing evidence suggesting that deep networks with sub-linear layer widths are powerful memorizers and optimizers, as long as the number of parameters exceeds the number of samples. Thus, a natural open question is whether the NTK is well conditioned in such a challenging sub-linear setup. In this paper, we answer this question in the affirmative. Our key technical contribution is a lower bound on the smallest NTK eigenvalue for deep networks with the minimum possible over-parameterization: the number of parameters is roughly Ω(N) and, hence, the number of neurons is as little as Ω(N−−√). To showcase the applicability of our NTK bounds, we provide two results concerning memorization capacity and optimization guarantees for gradient descent training.},
  author       = {Bombari, Simone and Amani, Mohammad Hossein and Mondelli, Marco},
  booktitle    = {36th Conference on Neural Information Processing Systems},
  isbn         = {9781713871088},
  pages        = {7628--7640},
  publisher    = {Curran Associates},
  title        = {{Memorization and optimization in deep neural networks with minimum over-parameterization}},
  volume       = {35},
  year         = {2022},
}

@article{12538,
  abstract     = {In this paper, we study the compression of a target two-layer neural network with N nodes into a compressed network with M<N nodes. More precisely, we consider the setting in which the weights of the target network are i.i.d. sub-Gaussian, and we minimize the population L_2 loss between the outputs of the target and of the compressed network, under the assumption of Gaussian inputs. By using tools from high-dimensional probability, we show that this non-convex problem can be simplified when the target network is sufficiently over-parameterized, and provide the error rate of this approximation as a function of the input dimension and N. In this mean-field limit, the simplified objective, as well as the optimal weights of the compressed network, does not depend on the realization of the target network, but only on expected scaling factors. Furthermore, for networks with ReLU activation, we conjecture that the optimum of the simplified optimization problem is achieved by taking weights on the Equiangular Tight Frame (ETF), while the scaling of the weights and the orientation of the ETF depend on the parameters of the target network. Numerical evidence is provided to support this conjecture.},
  author       = {Amani, Mohammad Hossein and Bombari, Simone and Mondelli, Marco and Pukdee, Rattana and Rini, Stefano},
  isbn         = {9781665483414},
  journal      = {IEEE Information Theory Workshop},
  location     = {Mumbai, India},
  pages        = {588--593},
  publisher    = {IEEE},
  title        = {{Sharp asymptotics on the compression of two-layer neural networks}},
  doi          = {10.1109/ITW54588.2022.9965870},
  year         = {2022},
}

@inproceedings{12540,
  abstract     = {We consider the problem of signal estimation in generalized linear models defined via rotationally invariant design matrices. Since these matrices can have an arbitrary spectral distribution, this model is well suited for capturing complex correlation structures which often arise in applications. We propose a novel family of approximate message passing (AMP) algorithms for signal estimation, and rigorously characterize their performance in the high-dimensional limit via a state evolution recursion. Our rotationally invariant AMP has complexity of the same order as the existing AMP derived under the restrictive assumption of a Gaussian design; our algorithm also recovers this existing AMP as a special case. Numerical results showcase a performance close to Vector AMP (which is conjectured to be Bayes-optimal in some settings), but obtained with a much lower complexity, as the proposed algorithm does not require a computationally expensive singular value decomposition.},
  author       = {Venkataramanan, Ramji and Kögler, Kevin and Mondelli, Marco},
  booktitle    = {Proceedings of the 39th International Conference on Machine Learning},
  location     = {Baltimore, MD, United States},
  publisher    = {ML Research Press},
  title        = {{Estimation in rotationally invariant generalized linear models via approximate message passing}},
  volume       = {162},
  year         = {2022},
}