@phdthesis{15020,
  abstract     = {This thesis consists of four distinct pieces of work within theoretical biology, with two themes in common: the concept of optimization in biological systems, and the use of information-theoretic tools to quantify biological stochasticity and statistical uncertainty.
Chapter 2 develops a statistical framework for studying biological systems which we believe to be optimized for a particular utility function, such as retinal neurons conveying information about visual stimuli. We formalize such beliefs as maximum-entropy Bayesian priors, constrained by the expected utility. We explore how such priors aid inference of system parameters with limited data and enable optimality hypothesis testing: is the utility higher than by chance?
Chapter 3 examines the ultimate biological optimization process: evolution by natural selection. As some individuals survive and reproduce more successfully than others, populations evolve towards fitter genotypes and phenotypes. We formalize this as accumulation of genetic information, and use population genetics theory to study how much such information can be accumulated per generation and maintained in the face of random mutation and genetic drift. We identify the population size and fitness variance as the key quantities that control information accumulation and maintenance.
Chapter 4 reuses the concept of genetic information from Chapter 3, but from a different perspective: we ask how much genetic information organisms actually need, in particular in the context of gene regulation. For example, how much information is needed to bind transcription factors at correct locations within the genome? Population genetics provides us with a refined answer: with an increasing population size, populations achieve higher fitness by maintaining more genetic information. Moreover, regulatory parameters experience selection pressure to optimize the fitness-information trade-off, i.e. minimize the information needed for a given fitness. This provides an evolutionary derivation of the optimization priors introduced in Chapter 2.
Chapter 5 proves an upper bound on mutual information between a signal and a communication channel output (such as neural activity). Mutual information is an important utility measure for biological systems, but its practical use can be difficult due to the large dimensionality of many biological channels. Sometimes, a lower bound on mutual information is computed by replacing the high-dimensional channel outputs with decodes (signal estimates). Our result provides a corresponding upper bound, provided that the decodes are the maximum posterior estimates of the signal.},
  author       = {Hledik, Michal},
  issn         = {2663 - 337X},
  keywords     = {Theoretical biology, Optimality, Evolution, Information},
  pages        = {158},
  publisher    = {Institute of Science and Technology Austria},
  title        = {{Genetic information and biological optimization}},
  doi          = {10.15479/at:ista:15020},
  year         = {2024},
}

@article{14751,
  abstract     = {We consider zero-error communication over a two-transmitter deterministic adversarial multiple access channel (MAC) governed by an adversary who has access to the transmissions of both senders (hence called omniscient ) and aims to maliciously corrupt the communication. None of the encoders, jammer and decoder is allowed to randomize using private or public randomness. This enforces a combinatorial nature of the problem. Our model covers a large family of channels studied in the literature, including all deterministic discrete memoryless noisy or noiseless MACs. In this work, given an arbitrary two-transmitter deterministic omniscient adversarial MAC, we characterize when the capacity region: 1) has nonempty interior (in particular, is two-dimensional); 2) consists of two line segments (in particular, has empty interior); 3) consists of one line segment (in particular, is one-dimensional); 4) or only contains (0,0) (in particular, is zero-dimensional). This extends a recent result by Wang et al. (201 9) from the point-to-point setting to the multiple access setting. Indeed, our converse arguments build upon their generalized Plotkin bound and involve delicate case analysis. One of the technical challenges is to take care of both “joint confusability” and “marginal confusability”. In particular, the treatment of marginal confusability does not follow from the point-to-point results by Wang et al. Our achievability results follow from random coding with expurgation.},
  author       = {Zhang, Yihan},
  issn         = {1557-9654},
  journal      = {IEEE Transactions on Information Theory},
  keywords     = {Computer Science Applications, Information Systems},
  number       = {7},
  pages        = {4093--4127},
  publisher    = {Institute of Electrical and Electronics Engineers},
  title        = {{Zero-error communication over adversarial MACs}},
  doi          = {10.1109/tit.2023.3257239},
  volume       = {69},
  year         = {2023},
}

@article{10602,
  abstract     = {Transforming ω-automata into parity automata is traditionally done using appearance records. We present an efficient variant of this idea, tailored to Rabin automata, and several optimizations applicable to all appearance records. We compare the methods experimentally and show that our method produces significantly smaller automata than previous approaches.},
  author       = {Kretinsky, Jan and Meggendorfer, Tobias and Waldmann, Clara and Weininger, Maximilian},
  issn         = {1432-0525},
  journal      = {Acta Informatica},
  keywords     = {computer networks and communications, information systems, software},
  pages        = {585--618},
  publisher    = {Springer Nature},
  title        = {{Index appearance record with preorders}},
  doi          = {10.1007/s00236-021-00412-y},
  volume       = {59},
  year         = {2022},
}

@article{12134,
  abstract     = {Standard epidemic models exhibit one continuous, second order phase transition to macroscopic outbreaks. However, interventions to control outbreaks may fundamentally alter epidemic dynamics. Here we reveal how such interventions modify the type of phase transition. In particular, we uncover three distinct types of explosive phase transitions for epidemic dynamics with capacity-limited interventions. Depending on the capacity limit, interventions may (i) leave the standard second order phase transition unchanged but exponentially suppress the probability of large outbreaks, (ii) induce a first-order discontinuous transition to macroscopic outbreaks, or (iii) cause a secondary explosive yet continuous third-order transition. These insights highlight inherent limitations in predicting and containing epidemic outbreaks. More generally our study offers a cornerstone example of a third-order explosive phase transition in complex systems.},
  author       = {Börner, Georg and Schröder, Malte and Scarselli, Davide and Budanur, Nazmi B and Hof, Björn and Timme, Marc},
  issn         = {2632-072X},
  journal      = {Journal of Physics: Complexity},
  keywords     = {Artificial Intelligence, Computer Networks and Communications, Computer Science Applications, Information Systems},
  number       = {4},
  publisher    = {IOP Publishing},
  title        = {{Explosive transitions in epidemic dynamics}},
  doi          = {10.1088/2632-072x/ac99cd},
  volume       = {3},
  year         = {2022},
}

@article{12261,
  abstract     = {Dose–response relationships are a general concept for quantitatively describing biological systems across multiple scales, from the molecular to the whole-cell level. A clinically relevant example is the bacterial growth response to antibiotics, which is routinely characterized by dose–response curves. The shape of the dose–response curve varies drastically between antibiotics and plays a key role in treatment, drug interactions, and resistance evolution. However, the mechanisms shaping the dose–response curve remain largely unclear. Here, we show in Escherichia coli that the distinctively shallow dose–response curve of the antibiotic trimethoprim is caused by a negative growth-mediated feedback loop: Trimethoprim slows growth, which in turn weakens the effect of this antibiotic. At the molecular level, this feedback is caused by the upregulation of the drug target dihydrofolate reductase (FolA/DHFR). We show that this upregulation is not a specific response to trimethoprim but follows a universal trend line that depends primarily on the growth rate, irrespective of its cause. Rewiring the feedback loop alters the dose–response curve in a predictable manner, which we corroborate using a mathematical model of cellular resource allocation and growth. Our results indicate that growth-mediated feedback loops may shape drug responses more generally and could be exploited to design evolutionary traps that enable selection against drug resistance.},
  author       = {Angermayr, Andreas and Pang, Tin Yau and Chevereau, Guillaume and Mitosch, Karin and Lercher, Martin J and Bollenbach, Mark Tobias},
  issn         = {1744-4292},
  journal      = {Molecular Systems Biology},
  keywords     = {Applied Mathematics, Computational Theory and Mathematics, General Agricultural and Biological Sciences, General Immunology and Microbiology, General Biochemistry, Genetics and Molecular Biology, Information Systems},
  number       = {9},
  publisher    = {Embo Press},
  title        = {{Growth‐mediated negative feedback shapes quantitative antibiotic response}},
  doi          = {10.15252/msb.202110490},
  volume       = {18},
  year         = {2022},
}

@article{10861,
  abstract     = {We introduce in this paper AMT2.0, a tool for qualitative and quantitative analysis of hybrid continuous and Boolean signals that combine numerical values and discrete events. The evaluation of the signals is based on rich temporal specifications expressed in extended signal temporal logic, which integrates timed regular expressions within signal temporal logic. The tool features qualitative monitoring (property satisfaction checking), trace diagnostics for explaining and justifying property violations and specification-driven measurement of quantitative features of the signal. We demonstrate the tool functionality on several running examples and case studies, and evaluate its performance.},
  author       = {Nickovic, Dejan and Lebeltel, Olivier and Maler, Oded and Ferrere, Thomas and Ulus, Dogan},
  issn         = {1433-2787},
  journal      = {International Journal on Software Tools for Technology Transfer},
  keywords     = {Information Systems, Software},
  number       = {6},
  pages        = {741--758},
  publisher    = {Springer Nature},
  title        = {{AMT 2.0: Qualitative and quantitative trace analysis with extended signal temporal logic}},
  doi          = {10.1007/s10009-020-00582-z},
  volume       = {22},
  year         = {2020},
}

@article{7369,
  abstract     = {Neuronal responses to complex stimuli and tasks can encompass a wide range of time scales. Understanding these responses requires measures that characterize how the information on these response patterns are represented across multiple temporal resolutions. In this paper we propose a metric – which we call multiscale relevance (MSR) – to capture the dynamical variability of the activity of single neurons across different time scales. The MSR is a non-parametric, fully featureless indicator in that it uses only the time stamps of the firing activity without resorting to any a priori covariate or invoking any specific structure in the tuning curve for neural activity. When applied to neural data from the mEC and from the ADn and PoS regions of freely-behaving rodents, we found that neurons having low MSR tend to have low mutual information and low firing sparsity across the correlates that are believed to be encoded by the region of the brain where the recordings were made. In addition, neurons with high MSR contain significant information on spatial navigation and allow to decode spatial position or head direction as efficiently as those neurons whose firing activity has high mutual information with the covariate to be decoded and significantly better than the set of neurons with high local variations in their interspike intervals. Given these results, we propose that the MSR can be used as a measure to rank and select neurons for their information content without the need to appeal to any a priori covariate.},
  author       = {Cubero, Ryan J and Marsili, Matteo and Roudi, Yasser},
  issn         = {1573-6873},
  journal      = {Journal of Computational Neuroscience},
  keywords     = {Time series analysis, Multiple time scale analysis, Spike train data, Information theory, Bayesian decoding},
  pages        = {85--102},
  publisher    = {Springer Nature},
  title        = {{Multiscale relevance and informative encoding in neuronal spike trains}},
  doi          = {10.1007/s10827-020-00740-x},
  volume       = {48},
  year         = {2020},
}

@phdthesis{6473,
  abstract     = {Single cells are constantly interacting with their environment and each other, more importantly, the accurate perception of environmental cues is crucial for growth, survival, and reproduction. This communication between cells and their environment can be formalized in mathematical terms and be quantified as the information flow between them, as prescribed by information theory. 
The recent availability of real–time dynamical patterns of signaling molecules in single cells has allowed us to identify encoding about the identity of the environment in the time–series. However, efficient estimation of the information transmitted by these signals has been a data–analysis challenge due to the high dimensionality of the trajectories and the limited number of samples. In the first part of this thesis, we develop and evaluate decoding–based estimation methods to lower bound the mutual information and derive model–based precise information estimates for biological reaction networks governed by the chemical master equation. This is followed by applying the decoding-based methods to study the intracellular representation of extracellular changes in budding yeast, by observing the transient dynamics of nuclear translocation of 10 transcription factors in response to 3 stress conditions. Additionally, we apply these estimators to previously published data on ERK and Ca2+ signaling and yeast stress response. We argue that this single cell decoding-based measure of information provides an unbiased, quantitative and interpretable measure for the fidelity of biological signaling processes. 
Finally, in the last section, we deal with gene regulation which is primarily controlled by transcription factors (TFs) that bind to the DNA to activate gene expression. The possibility that non-cognate TFs activate transcription diminishes the accuracy of regulation with potentially disastrous effects for the cell. This ’crosstalk’ acts as a previously unexplored source of noise in biochemical networks and puts a strong constraint on their performance. To mitigate erroneous initiation we propose an out of equilibrium scheme that implements kinetic proofreading. We show that such architectures are favored  over their equilibrium counterparts for complex organisms despite introducing noise in gene expression. },
  author       = {Cepeda Humerez, Sarah A},
  issn         = {2663-337X},
  keywords     = {Information estimation, Time-series, data analysis},
  pages        = {135},
  publisher    = {Institute of Science and Technology Austria},
  title        = {{Estimating information flow in single cells}},
  doi          = {10.15479/AT:ISTA:6473},
  year         = {2019},
}

