@inproceedings{9632,
  abstract     = {Second-order information, in the form of Hessian- or Inverse-Hessian-vector products, is a fundamental tool for solving optimization problems. Recently, there has been significant interest in utilizing this information in the context of deep
neural networks; however, relatively little is known about the quality of existing approximations in this context. Our work examines this question, identifies issues with existing approaches, and proposes a method called WoodFisher to compute a faithful and efficient estimate of the inverse Hessian. Our main application is to neural network compression, where we build on the classic Optimal Brain Damage/Surgeon framework. We demonstrate that WoodFisher significantly outperforms popular state-of-the-art methods for oneshot pruning. Further, even when iterative, gradual pruning is allowed, our method results in a gain in test accuracy over the state-of-the-art approaches, for standard image classification datasets such as ImageNet ILSVRC. We examine how our method can be extended to take into account first-order information, as well as
illustrate its ability to automatically set layer-wise pruning thresholds and perform compression in the limited-data regime. The code is available at the following link, https://github.com/IST-DASLab/WoodFisher.},
  author       = {Singh, Sidak Pal and Alistarh, Dan-Adrian},
  isbn         = {9781713829546},
  issn         = {1049-5258},
  location     = {Vancouver, Canada},
  pages        = {18098--18109},
  publisher    = {Neural Information Processing Systems Foundation},
  title        = {{WoodFisher: Efficient second-order approximation for neural network compression}},
  volume       = {33},
  year         = {2020},
}

@misc{9708,
  abstract     = {This research data supports 'Hard antinodal gap revealed by quantum oscillations in the pseudogap regime of underdoped high-Tc superconductors'. A Readme file for plotting each figure is provided.},
  author       = {Hartstein, Mate and Hsu, Yu-Te and Modic, Kimberly A and Porras, Juan and Loew, Toshinao and Le Tacon, Matthieu and Zuo, Huakun and Wang, Jinhua and Zhu, Zengwei and Chan, Mun and McDonald, Ross and Lonzarich, Gilbert and Keimer, Bernhard and Sebastian, Suchitra and Harrison, Neil},
  publisher    = {Apollo - University of Cambridge},
  title        = {{Accompanying dataset for 'Hard antinodal gap revealed by quantum oscillations in the pseudogap regime of underdoped high-Tc superconductors'}},
  doi          = {10.17863/cam.50169},
  year         = {2020},
}

@misc{9713,
  abstract     = {Additional analyses of the trajectories},
  author       = {Gupta, Chitrak and Khaniya, Umesh and Chan, Chun Kit and Dehez, Francois and Shekhar, Mrinal and Gunner, M.R. and Sazanov, Leonid A and Chipot, Christophe and Singharoy, Abhishek},
  publisher    = {American Chemical Society },
  title        = {{Supporting information}},
  doi          = {10.1021/jacs.9b13450.s001},
  year         = {2020},
}

@misc{9776,
  author       = {Grah, Rok and Friedlander, Tamar},
  publisher    = {Public Library of Science},
  title        = {{Supporting information}},
  doi          = {10.1371/journal.pcbi.1007642.s001},
  year         = {2020},
}

@misc{9777,
  author       = {Grah, Rok and Friedlander, Tamar},
  publisher    = {Public Library of Science},
  title        = {{Maximizing crosstalk}},
  doi          = {10.1371/journal.pcbi.1007642.s002},
  year         = {2020},
}

@misc{9779,
  author       = {Grah, Rok and Friedlander, Tamar},
  publisher    = {Public Library of Science},
  title        = {{Distribution of crosstalk values}},
  doi          = {10.1371/journal.pcbi.1007642.s003},
  year         = {2020},
}

@misc{9780,
  abstract     = {PADREV : 4,4'-dimethoxy[1,1'-biphenyl]-2,2',5,5'-tetrol
Space Group: C 2 (5), Cell: a 24.488(16)Å b 5.981(4)Å c 3.911(3)Å, α 90° β 91.47(3)° γ 90°},
  author       = {Schlemmer, Werner and Nothdurft, Philipp and Petzold, Alina and Riess, Gisbert and Frühwirt, Philipp and Schmallegger, Max and Gescheidt-Demner, Georg and Fischer, Roland and Freunberger, Stefan Alexander and Kern, Wolfgang and Spirk, Stefan},
  publisher    = {CCDC},
  title        = {{CCDC 1991959: Experimental Crystal Structure Determination}},
  doi          = {10.5517/ccdc.csd.cc24vsrk},
  year         = {2020},
}

@misc{9798,
  abstract     = {Fitness interactions between mutations can influence a population’s evolution in many different ways. While epistatic effects are difficult to measure precisely, important information is captured by the mean and variance of log fitnesses for individuals carrying different numbers of mutations. We derive predictions for these quantities from a class of simple fitness landscapes, based on models of optimizing selection on quantitative traits. We also explore extensions to the models, including modular pleiotropy, variable effect sizes, mutational bias and maladaptation of the wild type. We illustrate our approach by reanalysing a large dataset of mutant effects in a yeast snoRNA. Though characterized by some large epistatic effects, these data give a good overall fit to the non-epistatic null model, suggesting that epistasis might have limited influence on the evolutionary dynamics in this system. We also show how the amount of epistasis depends on both the underlying fitness landscape and the distribution of mutations, and so is expected to vary in consistent ways between new mutations, standing variation and fixed mutations.},
  author       = {Fraisse, Christelle and Welch, John J.},
  publisher    = {Royal Society of London},
  title        = {{Simulation code for Fig S2 from the distribution of epistasis on simple fitness landscapes}},
  doi          = {10.6084/m9.figshare.7957472.v1},
  year         = {2020},
}

@misc{9799,
  abstract     = {Fitness interactions between mutations can influence a population’s evolution in many different ways. While epistatic effects are difficult to measure precisely, important information is captured by the mean and variance of log fitnesses for individuals carrying different numbers of mutations. We derive predictions for these quantities from a class of simple fitness landscapes, based on models of optimizing selection on quantitative traits. We also explore extensions to the models, including modular pleiotropy, variable effect sizes, mutational bias and maladaptation of the wild type. We illustrate our approach by reanalysing a large dataset of mutant effects in a yeast snoRNA. Though characterized by some large epistatic effects, these data give a good overall fit to the non-epistatic null model, suggesting that epistasis might have limited influence on the evolutionary dynamics in this system. We also show how the amount of epistasis depends on both the underlying fitness landscape and the distribution of mutations, and so is expected to vary in consistent ways between new mutations, standing variation and fixed mutations.},
  author       = {Fraisse, Christelle and Welch, John J.},
  publisher    = {Royal Society of London},
  title        = {{Simulation code for Fig S1 from the distribution of epistasis on simple fitness landscapes}},
  doi          = {10.6084/m9.figshare.7957469.v1},
  year         = {2020},
}

@misc{9814,
  abstract     = {Data and mathematica notebooks for plotting figures from Language learning with communication between learners},
  author       = {Ibsen-Jensen, Rasmus and Tkadlec, Josef and Chatterjee, Krishnendu and Nowak, Martin},
  publisher    = {Royal Society},
  title        = {{Data and mathematica notebooks for plotting figures from language learning with communication between learners from language acquisition with communication between learners}},
  doi          = {10.6084/m9.figshare.5973013.v1},
  year         = {2020},
}

@article{5681,
  abstract     = {We introduce dynamically warping grids for adaptive liquid simulation. Our primary contributions are a strategy for dynamically deforming regular grids over the course of a simulation and a method for efficiently utilizing these deforming grids for liquid simulation. Prior work has shown that unstructured grids are very effective for adaptive fluid simulations. However, unstructured grids often lead to complicated implementations and a poor cache hit rate due to inconsistent memory access. Regular grids, on the other hand, provide a fast, fixed memory access pattern and straightforward implementation. Our method combines the advantages of both: we leverage the simplicity of regular grids while still achieving practical and controllable spatial adaptivity. We demonstrate that our method enables adaptive simulations that are fast, flexible, and robust to null-space issues. At the same time, our method is simple to implement and takes advantage of existing highly-tuned algorithms.},
  author       = {Hikaru, Ibayashi and Wojtan, Christopher J and Thuerey, Nils and Igarashi, Takeo and Ando, Ryoichi},
  issn         = {1941-0506},
  journal      = {IEEE Transactions on Visualization and Computer Graphics},
  number       = {6},
  pages        = {2288--2302},
  publisher    = {IEEE},
  title        = {{Simulating liquids on dynamically warping grids}},
  doi          = {10.1109/TVCG.2018.2883628},
  volume       = {26},
  year         = {2020},
}

@article{6358,
  abstract     = {We study dynamical optimal transport metrics between density matricesassociated to symmetric Dirichlet forms on finite-dimensional C∗-algebras.  Our settingcovers  arbitrary  skew-derivations  and  it  provides  a  unified  framework  that  simultaneously  generalizes  recently  constructed  transport  metrics  for  Markov  chains,  Lindblad  equations,  and  the  Fermi  Ornstein–Uhlenbeck  semigroup.   We  develop  a  non-nommutative differential calculus that allows us to obtain non-commutative Ricci curvature  bounds,  logarithmic  Sobolev  inequalities,  transport-entropy  inequalities,  andspectral gap estimates.},
  author       = {Carlen, Eric A. and Maas, Jan},
  issn         = {1572-9613},
  journal      = {Journal of Statistical Physics},
  number       = {2},
  pages        = {319--378},
  publisher    = {Springer Nature},
  title        = {{Non-commutative calculus, optimal transport and functional inequalities  in dissipative quantum systems}},
  doi          = {10.1007/s10955-019-02434-w},
  volume       = {178},
  year         = {2020},
}

@article{6359,
  abstract     = {The strong rate of convergence of the Euler-Maruyama scheme for nondegenerate SDEs with irregular drift coefficients is considered. In the case of α-Hölder drift in the recent literature the rate α/2 was proved in many related situations. By exploiting the regularising effect of the noise more efficiently, we show that the rate is in fact arbitrarily close to 1/2 for all α>0. The result extends to Dini continuous coefficients, while in d=1 also to all bounded measurable coefficients.},
  author       = {Dareiotis, Konstantinos and Gerencser, Mate},
  issn         = {1083-6489},
  journal      = {Electronic Journal of Probability},
  publisher    = {Institute of Mathematical Statistics},
  title        = {{On the regularisation of the noise for the Euler-Maruyama scheme with irregular drift}},
  doi          = {10.1214/20-EJP479},
  volume       = {25},
  year         = {2020},
}

@article{6488,
  abstract     = {We prove a central limit theorem for the difference of linear eigenvalue statistics of a sample covariance matrix W˜ and its minor W. We find that the fluctuation of this difference is much smaller than those of the individual linear statistics, as a consequence of the strong correlation between the eigenvalues of W˜ and W. Our result identifies the fluctuation of the spatial derivative of the approximate Gaussian field in the recent paper by Dumitru and Paquette. Unlike in a similar result for Wigner matrices, for sample covariance matrices, the fluctuation may entirely vanish.},
  author       = {Cipolloni, Giorgio and Erdös, László},
  issn         = {2010-3271},
  journal      = {Random Matrices: Theory and Application},
  number       = {3},
  publisher    = {World Scientific Publishing},
  title        = {{Fluctuations for differences of linear eigenvalue statistics for sample covariance matrices}},
  doi          = {10.1142/S2010326320500069},
  volume       = {9},
  year         = {2020},
}

@article{6563,
  abstract     = {This paper presents two algorithms. The first decides the existence of a pointed homotopy between given simplicial maps 𝑓,𝑔:𝑋→𝑌, and the second computes the group [𝛴𝑋,𝑌]∗ of pointed homotopy classes of maps from a suspension; in both cases, the target Y is assumed simply connected. More generally, these algorithms work relative to 𝐴⊆𝑋.},
  author       = {Filakovský, Marek and Vokřínek, Lukas},
  issn         = {1615-3383},
  journal      = {Foundations of Computational Mathematics},
  pages        = {311--330},
  publisher    = {Springer Nature},
  title        = {{Are two given maps homotopic? An algorithmic viewpoint}},
  doi          = {10.1007/s10208-019-09419-x},
  volume       = {20},
  year         = {2020},
}

@article{6593,
  abstract     = {We consider the monotone variational inequality problem in a Hilbert space and describe a projection-type method with inertial terms under the following properties: (a) The method generates a strongly convergent iteration sequence; (b) The method requires, at each iteration, only one projection onto the feasible set and two evaluations of the operator; (c) The method is designed for variational inequality for which the underline operator is monotone and uniformly continuous; (d) The method includes an inertial term. The latter is also shown to speed up the convergence in our numerical results. A comparison with some related methods is given and indicates that the new method is promising.},
  author       = {Shehu, Yekini and Li, Xiao-Huan and Dong, Qiao-Li},
  issn         = {1572-9265},
  journal      = {Numerical Algorithms},
  pages        = {365--388},
  publisher    = {Springer Nature},
  title        = {{An efficient projection-type method for monotone variational inequalities in Hilbert spaces}},
  doi          = {10.1007/s11075-019-00758-y},
  volume       = {84},
  year         = {2020},
}

@article{6748,
  abstract     = {Fitting a function by using linear combinations of a large number N of `simple' components is one of the most fruitful ideas in statistical learning. This idea lies at the core of a variety of methods, from two-layer neural networks to kernel regression, to boosting. In general, the resulting risk minimization problem is non-convex and is solved by gradient descent or its variants. Unfortunately, little is known about global convergence properties of these approaches.
Here we consider the problem of learning a concave function f on a compact convex domain Ω⊆ℝd, using linear combinations of `bump-like' components (neurons). The parameters to be fitted are the centers of N bumps, and the resulting empirical risk minimization problem is highly non-convex. We prove that, in the limit in which the number of neurons diverges, the evolution of gradient descent converges to a Wasserstein gradient flow in the space of probability distributions over Ω. Further, when the bump width δ tends to 0, this gradient flow has a limit which is a viscous porous medium equation. Remarkably, the cost function optimized by this gradient flow exhibits a special property known as displacement convexity, which implies exponential convergence rates for N→∞, δ→0. Surprisingly, this asymptotic theory appears to capture well the behavior for moderate values of δ,N. Explaining this phenomenon, and understanding the dependence on δ,N in a quantitative manner remains an outstanding challenge.},
  author       = {Javanmard, Adel and Mondelli, Marco and Montanari, Andrea},
  issn         = {1941-7330},
  journal      = {Annals of Statistics},
  number       = {6},
  pages        = {3619--3642},
  publisher    = {Institute of Mathematical Statistics},
  title        = {{Analysis of a two-layer neural network via displacement convexity}},
  doi          = {10.1214/20-AOS1945},
  volume       = {48},
  year         = {2020},
}

@article{6796,
  abstract     = {Nearby grid cells have been observed to express a remarkable degree of long-rangeorder, which is often idealized as extending potentially to infinity. Yet their strict peri-odic firing and ensemble coherence are theoretically possible only in flat environments, much unlike the burrows which rodents usually live in. Are the symmetrical, coherent grid maps inferred in the lab relevant to chart their way in their natural habitat? We consider spheres as simple models of curved environments and waiting for the appropriate experiments to be performed, we use our adaptation model to predict what grid maps would emerge in a network with the same type of recurrent connections, which on the plane produce coherence among the units. We find that on the sphere such connections distort the maps that single grid units would express on their own, and aggregate them into clusters. When remapping to a different spherical environment, units in each cluster maintain only partial coherence, similar to what is observed in disordered materials, such as spin glasses.},
  author       = {Stella, Federico and Urdapilleta, Eugenio and Luo, Yifan and Treves, Alessandro},
  issn         = {1098-1063},
  journal      = {Hippocampus},
  number       = {4},
  pages        = {302--313},
  publisher    = {Wiley},
  title        = {{Partial coherence and frustration in self-organizing spherical grids}},
  doi          = {10.1002/hipo.23144},
  volume       = {30},
  year         = {2020},
}

@article{6808,
  abstract     = {Super-resolution fluorescence microscopy has become an important catalyst for discovery in the life sciences. In STimulated Emission Depletion (STED) microscopy, a pattern of light drives fluorophores from a signal-emitting on-state to a non-signalling off-state. Only emitters residing in a sub-diffraction volume around an intensity minimum are allowed to fluoresce, rendering them distinguishable from the nearby, but dark fluorophores. STED routinely achieves resolution in the few tens of nanometers range in biological samples and is suitable for live imaging. Here, we review the working principle of STED and provide general guidelines for successful STED imaging. The strive for ever higher resolution comes at the cost of increased light burden. We discuss techniques to reduce light exposure and mitigate its detrimental effects on the specimen. These include specialized illumination strategies as well as protecting fluorophores from photobleaching mediated by high-intensity STED light. This opens up the prospect of volumetric imaging in living cells and tissues with diffraction-unlimited resolution in all three spatial dimensions.},
  author       = {Jahr, Wiebke and Velicky, Philipp and Danzl, Johann G},
  issn         = {1046-2023},
  journal      = {Methods},
  number       = {3},
  pages        = {27--41},
  publisher    = {Elsevier},
  title        = {{Strategies to maximize performance in STimulated Emission Depletion (STED) nanoscopy of biological specimens}},
  doi          = {10.1016/j.ymeth.2019.07.019},
  volume       = {174},
  year         = {2020},
}

@article{6906,
  abstract     = {We consider systems of bosons trapped in a box, in the Gross–Pitaevskii regime. We show that low-energy states exhibit complete Bose–Einstein condensation with an optimal bound on the number of orthogonal excitations. This extends recent results obtained in Boccato et al. (Commun Math Phys 359(3):975–1026, 2018), removing the assumption of small interaction potential.},
  author       = {Boccato, Chiara and Brennecke, Christian and Cenatiempo, Serena and Schlein, Benjamin},
  issn         = {1432-0916},
  journal      = {Communications in Mathematical Physics},
  pages        = {1311--1395},
  publisher    = {Springer},
  title        = {{Optimal rate for Bose-Einstein condensation in the Gross-Pitaevskii regime}},
  doi          = {10.1007/s00220-019-03555-9},
  volume       = {376},
  year         = {2020},
}

