@article{9658,
  abstract     = {Macroscopic models of nucleation provide powerful tools for understanding activated phase transition processes. These models do not provide atomistic insights and can thus sometimes lack material-specific descriptions. Here, we provide a comprehensive framework for constructing a continuum picture from an atomistic simulation of homogeneous nucleation. We use this framework to determine the equilibrium shape of the solid nucleus that forms inside bulk liquid for a Lennard-Jones potential. From this shape, we then extract the anisotropy of the solid-liquid interfacial free energy, by performing a reverse Wulff construction in the space of spherical harmonic expansions. We find that the shape of the nucleus is nearly spherical and that its anisotropy can be perfectly described using classical models.},
  author       = {Cheng, Bingqing and Ceriotti, Michele and Tribello, Gareth A.},
  issn         = {1089-7690},
  journal      = {The Journal of Chemical Physics},
  number       = {4},
  publisher    = {AIP Publishing},
  title        = {{Classical nucleation theory predicts the shape of the nucleus in homogeneous solidification}},
  doi          = {10.1063/1.5134461},
  volume       = {152},
  year         = {2020},
}

@article{9664,
  abstract     = {Equilibrium molecular dynamics simulations, in combination with the Green-Kubo (GK) method, have been extensively used to compute the thermal conductivity of liquids. However, the GK method relies on an ambiguous definition of the microscopic heat flux, which depends on how one chooses to distribute energies over atoms. This ambiguity makes it problematic to employ the GK method for systems with nonpairwise interactions. In this work, we show that the hydrodynamic description of thermally driven density fluctuations can be used to obtain the thermal conductivity of a bulk fluid unambiguously, thereby bypassing the need to define the heat flux. We verify that, for a model fluid with only pairwise interactions, our method yields estimates of thermal conductivity consistent with the GK approach. We apply our approach to compute the thermal conductivity of a nonpairwise additive water model at supercritical conditions, and of a liquid hydrogen system described by a machine-learning interatomic potential, at 33 GPa and 2000 K.},
  author       = {Cheng, Bingqing and Frenkel, Daan},
  issn         = {1079-7114},
  journal      = {Physical Review Letters},
  number       = {13},
  publisher    = {American Physical Society},
  title        = {{Computing the heat conductivity of fluids from density fluctuations}},
  doi          = {10.1103/physrevlett.125.130602},
  volume       = {125},
  year         = {2020},
}

@article{9666,
  abstract     = {Predicting phase stabilities of crystal polymorphs is central to computational materials science and chemistry. Such predictions are challenging because they first require searching for potential energy minima and then performing arduous free-energy calculations to account for entropic effects at finite temperatures. Here, we develop a framework that facilitates such predictions by exploiting all the information obtained from random searches of crystal structures. This framework combines automated clustering, classification and visualisation of crystal structures with machine-learning estimation of their enthalpy and entropy. We demonstrate the framework on the technologically important system of TiO2, which has many polymorphs, without relying on prior knowledge of known phases. We find a number of new phases and predict the phase diagram and metastabilities of crystal polymorphs at 1600 K, benchmarking the results against full free-energy calculations.},
  author       = {Reinhardt, Aleks and Pickard, Chris J. and Cheng, Bingqing},
  issn         = {1463-9084},
  journal      = {Physical Chemistry Chemical Physics},
  number       = {22},
  pages        = {12697--12705},
  publisher    = {Royal Society of Chemistry},
  title        = {{Predicting the phase diagram of titanium dioxide with random search and pattern recognition}},
  doi          = {10.1039/d0cp02513e},
  volume       = {22},
  year         = {2020},
}

@article{9671,
  abstract     = {Water molecules can arrange into a liquid with complex hydrogen-bond networks and at least 17 experimentally confirmed ice phases with enormous structural diversity. It remains a puzzle how or whether this multitude of arrangements in different phases of water are related. Here we investigate the structural similarities between liquid water and a comprehensive set of 54 ice phases in simulations, by directly comparing their local environments using general atomic descriptors, and also by demonstrating that a machine-learning potential trained on liquid water alone can predict the densities, lattice energies, and vibrational properties of the ices. The finding that the local environments characterising the different ice phases are found in water sheds light on the phase behavior of water, and rationalizes the transferability of water models between different phases.},
  author       = {Monserrat, Bartomeu and Brandenburg, Jan Gerit and Engel, Edgar A. and Cheng, Bingqing},
  issn         = {2041-1723},
  journal      = {Nature Communications},
  number       = {1},
  publisher    = {Springer Nature},
  title        = {{Liquid water contains the building blocks of diverse ice phases}},
  doi          = {10.1038/s41467-020-19606-y},
  volume       = {11},
  year         = {2020},
}

@article{9675,
  abstract     = {The visualization of data is indispensable in scientific research, from the early stages when human insight forms to the final step of communicating results. In computational physics, chemistry and materials science, it can be as simple as making a scatter plot or as straightforward as looking through the snapshots of atomic positions manually. However, as a result of the "big data" revolution, these conventional approaches are often inadequate. The widespread adoption of high-throughput computation for materials discovery and the associated community-wide repositories have given rise to data sets that contain an enormous number of compounds and atomic configurations. A typical data set contains thousands to millions of atomic structures, along with a diverse range of properties such as formation energies, band gaps, or bioactivities.It would thus be desirable to have a data-driven and automated framework for visualizing and analyzing such structural data sets. The key idea is to construct a low-dimensional representation of the data, which facilitates navigation, reveals underlying patterns, and helps to identify data points with unusual attributes. Such data-intensive maps, often employing machine learning methods, are appearing more and more frequently in the literature. However, to the wider community, it is not always transparent how these maps are made and how they should be interpreted. Furthermore, while these maps undoubtedly serve a decorative purpose in academic publications, it is not always apparent what extra information can be garnered from reading or making them.This Account attempts to answer such questions. We start with a concise summary of the theory of representing chemical environments, followed by the introduction of a simple yet practical conceptual approach for generating structure maps in a generic and automated manner. Such analysis and mapping is made nearly effortless by employing the newly developed software tool ASAP. To showcase the applicability to a wide variety of systems in chemistry and materials science, we provide several illustrative examples, including crystalline and amorphous materials, interfaces, and organic molecules. In these examples, the maps not only help to sift through large data sets but also reveal hidden patterns that could be easily missed using conventional analyses.The explosion in the amount of computed information in chemistry and materials science has made visualization into a science in itself. Not only have we benefited from exploiting these visualization methods in previous works, we also believe that the automated mapping of data sets will in turn stimulate further creativity and exploration, as well as ultimately feed back into future advances in the respective fields.},
  author       = {Cheng, Bingqing and Griffiths, Ryan-Rhys and Wengert, Simon and Kunkel, Christian and Stenczel, Tamas and Zhu, Bonan and Deringer, Volker L. and Bernstein, Noam and Margraf, Johannes T. and Reuter, Karsten and Csanyi, Gabor},
  issn         = {1520-4898},
  journal      = {Accounts of Chemical Research},
  number       = {9},
  pages        = {1981--1991},
  publisher    = {American Chemical Society},
  title        = {{Mapping materials and molecules}},
  doi          = {10.1021/acs.accounts.0c00403},
  volume       = {53},
  year         = {2020},
}

@article{9685,
  abstract     = {Hydrogen, the simplest and most abundant element in the Universe, develops a remarkably complex behaviour upon compression^1. Since Wigner predicted the dissociation and metallization of solid hydrogen at megabar pressures almost a century ago^2, several efforts have been made to explain the many unusual properties of dense hydrogen, including a rich and poorly understood solid polymorphism^1,3-5, an anomalous melting line6 and the possible transition to a superconducting state^7. Experiments at such extreme conditions are challenging and often lead to hard-to-interpret and controversial observations, whereas theoretical investigations are constrained by the huge computational cost of sufficiently accurate quantum mechanical calculations. Here we present a theoretical study of the phase diagram of dense hydrogen that uses machine learning to 'learn' potential-energy surfaces and interatomic forces from reference calculations and then predict them at low computational cost, overcoming length- and timescale limitations. We reproduce both the re-entrant melting behaviour and the polymorphism of the solid phase. Simulations using our machine-learning-based potentials provide evidence for a continuous molecular-to-atomic transition in the liquid, with no first-order transition observed above the melting line. This suggests a smooth transition between insulating and metallic layers in giant gas planets, and reconciles existing discrepancies between experiments as a manifestation of supercritical behaviour.},
  author       = {Cheng, Bingqing and Mazzola, Guglielmo and Pickard, Chris J. and Ceriotti, Michele},
  issn         = {1476-4687},
  journal      = {Nature},
  number       = {7824},
  pages        = {217--220},
  publisher    = {Springer Nature},
  title        = {{Evidence for supercritical behaviour of high-pressure liquid hydrogen}},
  doi          = {10.1038/s41586-020-2677-y},
  volume       = {585},
  year         = {2020},
}

@unpublished{9699,
  abstract     = {We investigate the structural similarities between liquid water and 53 ices, including 20 known crystalline phases. We base such similarity comparison on the local environments that consist of atoms within a certain cutoff radius of a central atom. We reveal that liquid water explores the local environments of the diverse ice phases, by directly comparing the environments in these phases using general atomic descriptors, and also by demonstrating that a machine-learning potential trained on liquid water alone can predict the densities, the lattice energies, and vibrational properties of the
ices. The finding that the local environments characterising the different ice phases are found in water sheds light on water phase behaviors, and rationalizes the transferability of water models between different phases.},
  author       = {Monserrat, Bartomeu and Brandenburg, Jan Gerit and Engel, Edgar A. and Cheng, Bingqing},
  booktitle    = {arXiv},
  title        = {{Extracting ice phases from liquid water: Why a machine-learning water model generalizes so well}},
  doi          = {10.48550/arXiv.2006.13316},
  year         = {2020},
}

@misc{9706,
  abstract     = {Additional file 2: Supplementary Tables. The association of pre-adjusted protein levels with biological and technical covariates. Protein levels were adjusted for age, sex, array plate and four genetic principal components (population structure) prior to analyses. Significant associations are emboldened. (Table S1). pQTLs associated with inflammatory biomarker levels from Bayesian penalised regression model (Posterior Inclusion Probability > 95%). (Table S2). All pQTLs associated with inflammatory biomarker levels from ordinary least squares regression model (P < 7.14 × 10− 10). (Table S3). Summary of lambda values relating to ordinary least squares GWAS and EWAS performed on inflammatory protein levels (n = 70) in Lothian Birth Cohort 1936 study. (Table S4). Conditionally significant pQTLs associated with inflammatory biomarker levels from ordinary least squares regression model (P < 7.14 × 10− 10). (Table S5). Comparison of variance explained by ordinary least squares and Bayesian penalised regression models for concordantly identified SNPs. (Table S6). Estimate of heritability for blood protein levels as well as proportion of variance explained attributable to different prior mixtures. (Table S7). Comparison of heritability estimates from Ahsan et al. (maximum likelihood) and Hillary et al. (Bayesian penalised regression). (Table S8). List of concordant SNPs identified by linear model and Bayesian penalised regression and whether they have been previously identified as eQTLs. (Table S9). Bayesian tests of colocalisation for cis pQTLs and cis eQTLs. (Table S10). Sherlock algorithm: Genes whose expression are putatively associated with circulating inflammatory proteins that harbour pQTLs. (Table S11). CpGs associated with inflammatory protein biomarkers as identified by Bayesian model (Bayesian model; Posterior Inclusion Probability > 95%). (Table S12). CpGs associated with inflammatory protein biomarkers as identified by linear model (limma) at P < 5.14 × 10− 10. (Table S13). CpGs associated with inflammatory protein biomarkers as identified by mixed linear model (OSCA) at P < 5.14 × 10− 10. (Table S14). Estimate of variance explained for blood protein levels by DNA methylation as well as proportion of explained attributable to different prior mixtures - BayesR+. (Table S15). Comparison of variance in protein levels explained by genome-wide DNA methylation data by mixed linear model (OSCA) and Bayesian penalised regression model (BayesR+). (Table S16). Variance in circulating inflammatory protein biomarker levels explained by common genetic and methylation data (joint and conditional estimates from BayesR+). Ordered by combined variance explained by genetic and epigenetic data - smallest to largest. Significant results from t-tests comparing distributions for variance explained by methylation or genetics alone versus combined estimate are emboldened. (Table S17). Genetic and epigenetic factors identified by BayesR+ when conditioning on all SNPs and CpGs together. (Table S18). Mendelian Randomisation analyses to assess whether proteins with concordantly identified genetic signals are causally associated with Alzheimer’s disease risk. (Table S19).},
  author       = {Hillary, Robert F. and Trejo-Banos, Daniel and Kousathanas, Athanasios and McCartney, Daniel L. and Harris, Sarah E. and Stevenson, Anna J. and Patxot, Marion and Ojavee, Sven Erik and Zhang, Qian and Liewald, David C. and Ritchie, Craig W. and Evans, Kathryn L. and Tucker-Drob, Elliot M. and Wray, Naomi R. and McRae, Allan F.  and Visscher, Peter M. and Deary, Ian J. and Robinson, Matthew Richard and Marioni, Riccardo E. },
  publisher    = {Springer Nature},
  title        = {{Additional file 2 of multi-method genome- and epigenome-wide studies of inflammatory protein levels in healthy older adults}},
  doi          = {10.6084/m9.figshare.12629697.v1},
  year         = {2020},
}

@misc{9708,
  abstract     = {This research data supports 'Hard antinodal gap revealed by quantum oscillations in the pseudogap regime of underdoped high-Tc superconductors'. A Readme file for plotting each figure is provided.},
  author       = {Hartstein, Mate and Hsu, Yu-Te and Modic, Kimberly A and Porras, Juan and Loew, Toshinao and Le Tacon, Matthieu and Zuo, Huakun and Wang, Jinhua and Zhu, Zengwei and Chan, Mun and McDonald, Ross and Lonzarich, Gilbert and Keimer, Bernhard and Sebastian, Suchitra and Harrison, Neil},
  publisher    = {Apollo - University of Cambridge},
  title        = {{Accompanying dataset for 'Hard antinodal gap revealed by quantum oscillations in the pseudogap regime of underdoped high-Tc superconductors'}},
  doi          = {10.17863/cam.50169},
  year         = {2020},
}

@misc{9713,
  abstract     = {Additional analyses of the trajectories},
  author       = {Gupta, Chitrak and Khaniya, Umesh and Chan, Chun Kit and Dehez, Francois and Shekhar, Mrinal and Gunner, M.R. and Sazanov, Leonid A and Chipot, Christophe and Singharoy, Abhishek},
  publisher    = {American Chemical Society },
  title        = {{Supporting information}},
  doi          = {10.1021/jacs.9b13450.s001},
  year         = {2020},
}

@unpublished{9750,
  abstract     = {Tension of the actomyosin cell cortex plays a key role in determining cell-cell contact growth and size. The level of cortical tension outside of the cell-cell contact, when pulling at the contact edge, scales with the total size to which a cell-cell contact can grow1,2. Here we show in zebrafish primary germ layer progenitor cells that this monotonic relationship only applies to a narrow range of cortical tension increase, and that above a critical threshold, contact size inversely scales with cortical tension. This switch from cortical tension increasing to decreasing progenitor cell-cell contact size is caused by cortical tension promoting E-cadherin anchoring to the actomyosin cytoskeleton, thereby increasing clustering and stability of E-cadherin at the contact. Once tension-mediated E-cadherin stabilization at the contact exceeds a critical threshold level, the rate by which the contact expands in response to pulling forces from the cortex sharply drops, leading to smaller contacts at physiologically relevant timescales of contact formation. Thus, the activity of cortical tension in expanding cell-cell contact size is limited by tension stabilizing E-cadherin-actin complexes at the contact.},
  author       = {Slovakova, Jana and Sikora, Mateusz K and Caballero Mancebo, Silvia and Krens, Gabriel and Kaufmann, Walter and Huljev, Karla and Heisenberg, Carl-Philipp J},
  booktitle    = {bioRxiv},
  pages        = {41},
  publisher    = {Cold Spring Harbor Laboratory},
  title        = {{Tension-dependent stabilization of E-cadherin limits cell-cell contact expansion}},
  doi          = {10.1101/2020.11.20.391284},
  year         = {2020},
}

@misc{9776,
  author       = {Grah, Rok and Friedlander, Tamar},
  publisher    = {Public Library of Science},
  title        = {{Supporting information}},
  doi          = {10.1371/journal.pcbi.1007642.s001},
  year         = {2020},
}

@misc{9777,
  author       = {Grah, Rok and Friedlander, Tamar},
  publisher    = {Public Library of Science},
  title        = {{Maximizing crosstalk}},
  doi          = {10.1371/journal.pcbi.1007642.s002},
  year         = {2020},
}

@misc{9779,
  author       = {Grah, Rok and Friedlander, Tamar},
  publisher    = {Public Library of Science},
  title        = {{Distribution of crosstalk values}},
  doi          = {10.1371/journal.pcbi.1007642.s003},
  year         = {2020},
}

@misc{9780,
  abstract     = {PADREV : 4,4'-dimethoxy[1,1'-biphenyl]-2,2',5,5'-tetrol
Space Group: C 2 (5), Cell: a 24.488(16)Å b 5.981(4)Å c 3.911(3)Å, α 90° β 91.47(3)° γ 90°},
  author       = {Schlemmer, Werner and Nothdurft, Philipp and Petzold, Alina and Riess, Gisbert and Frühwirt, Philipp and Schmallegger, Max and Gescheidt-Demner, Georg and Fischer, Roland and Freunberger, Stefan Alexander and Kern, Wolfgang and Spirk, Stefan},
  publisher    = {CCDC},
  title        = {{CCDC 1991959: Experimental Crystal Structure Determination}},
  doi          = {10.5517/ccdc.csd.cc24vsrk},
  year         = {2020},
}

@article{9781,
  abstract     = {We consider the Pekar functional on a ball in ℝ3. We prove uniqueness of minimizers, and a quadratic lower bound in terms of the distance to the minimizer. The latter follows from nondegeneracy of the Hessian at the minimum.},
  author       = {Feliciangeli, Dario and Seiringer, Robert},
  issn         = {1095-7154},
  journal      = {SIAM Journal on Mathematical Analysis},
  keywords     = {Applied Mathematics, Computational Mathematics, Analysis},
  number       = {1},
  pages        = {605--622},
  publisher    = {Society for Industrial & Applied Mathematics },
  title        = {{Uniqueness and nondegeneracy of minimizers of the Pekar functional on a ball}},
  doi          = {10.1137/19m126284x},
  volume       = {52},
  year         = {2020},
}

@misc{9798,
  abstract     = {Fitness interactions between mutations can influence a population’s evolution in many different ways. While epistatic effects are difficult to measure precisely, important information is captured by the mean and variance of log fitnesses for individuals carrying different numbers of mutations. We derive predictions for these quantities from a class of simple fitness landscapes, based on models of optimizing selection on quantitative traits. We also explore extensions to the models, including modular pleiotropy, variable effect sizes, mutational bias and maladaptation of the wild type. We illustrate our approach by reanalysing a large dataset of mutant effects in a yeast snoRNA. Though characterized by some large epistatic effects, these data give a good overall fit to the non-epistatic null model, suggesting that epistasis might have limited influence on the evolutionary dynamics in this system. We also show how the amount of epistasis depends on both the underlying fitness landscape and the distribution of mutations, and so is expected to vary in consistent ways between new mutations, standing variation and fixed mutations.},
  author       = {Fraisse, Christelle and Welch, John J.},
  publisher    = {Royal Society of London},
  title        = {{Simulation code for Fig S2 from the distribution of epistasis on simple fitness landscapes}},
  doi          = {10.6084/m9.figshare.7957472.v1},
  year         = {2020},
}

@misc{9799,
  abstract     = {Fitness interactions between mutations can influence a population’s evolution in many different ways. While epistatic effects are difficult to measure precisely, important information is captured by the mean and variance of log fitnesses for individuals carrying different numbers of mutations. We derive predictions for these quantities from a class of simple fitness landscapes, based on models of optimizing selection on quantitative traits. We also explore extensions to the models, including modular pleiotropy, variable effect sizes, mutational bias and maladaptation of the wild type. We illustrate our approach by reanalysing a large dataset of mutant effects in a yeast snoRNA. Though characterized by some large epistatic effects, these data give a good overall fit to the non-epistatic null model, suggesting that epistasis might have limited influence on the evolutionary dynamics in this system. We also show how the amount of epistasis depends on both the underlying fitness landscape and the distribution of mutations, and so is expected to vary in consistent ways between new mutations, standing variation and fixed mutations.},
  author       = {Fraisse, Christelle and Welch, John J.},
  publisher    = {Royal Society of London},
  title        = {{Simulation code for Fig S1 from the distribution of epistasis on simple fitness landscapes}},
  doi          = {10.6084/m9.figshare.7957469.v1},
  year         = {2020},
}

@misc{9814,
  abstract     = {Data and mathematica notebooks for plotting figures from Language learning with communication between learners},
  author       = {Ibsen-Jensen, Rasmus and Tkadlec, Josef and Chatterjee, Krishnendu and Nowak, Martin},
  publisher    = {Royal Society},
  title        = {{Data and mathematica notebooks for plotting figures from language learning with communication between learners from language acquisition with communication between learners}},
  doi          = {10.6084/m9.figshare.5973013.v1},
  year         = {2020},
}

@misc{9878,
  author       = {Gupta, Chitrak and Khaniya, Umesh and Chan, Chun Kit and Dehez, Francois and Shekhar, Mrinal and Gunner, M.R. and Sazanov, Leonid A and Chipot, Christophe and Singharoy, Abhishek},
  publisher    = {American Chemical Society},
  title        = {{Movies}},
  doi          = {10.1021/jacs.9b13450.s002},
  year         = {2020},
}