@misc{2007, abstract = {Maximum likelihood estimation under relational models, with or without the overall effect. For more information see the reference manual}, author = {Klimova, Anna and Rudas, Tamás}, publisher = {The Comprehensive R Archive Network}, title = {{gIPFrm: Generalized iterative proportional fitting for relational models}}, year = {2014}, } @article{2013, abstract = {An asymptotic theory is developed for computing volumes of regions in the parameter space of a directed Gaussian graphical model that are obtained by bounding partial correlations. We study these volumes using the method of real log canonical thresholds from algebraic geometry. Our analysis involves the computation of the singular loci of correlation hypersurfaces. Statistical applications include the strong-faithfulness assumption for the PC algorithm and the quantification of confounder bias in causal inference. A detailed analysis is presented for trees, bow ties, tripartite graphs, and complete graphs. }, author = {Lin, Shaowei and Uhler, Caroline and Sturmfels, Bernd and Bühlmann, Peter}, journal = {Foundations of Computational Mathematics}, number = {5}, pages = {1079 -- 1116}, publisher = {Springer}, title = {{Hypersurfaces and their singularities in partial correlation testing}}, doi = {10.1007/s10208-014-9205-0}, volume = {14}, year = {2014}, } @inproceedings{2047, abstract = {Following the publication of an attack on genome-wide association studies (GWAS) data proposed by Homer et al., considerable attention has been given to developing methods for releasing GWAS data in a privacy-preserving way. Here, we develop an end-to-end differentially private method for solving regression problems with convex penalty functions and selecting the penalty parameters by cross-validation. In particular, we focus on penalized logistic regression with elastic-net regularization, a method widely used to in GWAS analyses to identify disease-causing genes. We show how a differentially private procedure for penalized logistic regression with elastic-net regularization can be applied to the analysis of GWAS data and evaluate our method’s performance.}, author = {Yu, Fei and Rybar, Michal and Uhler, Caroline and Fienberg, Stephen}, booktitle = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)}, editor = {Domingo Ferrer, Josep}, location = {Ibiza, Spain}, pages = {170 -- 184}, publisher = {Springer}, title = {{Differentially-private logistic regression for detecting multiple-SNP association in GWAS databases}}, doi = {10.1007/978-3-319-11257-2_14}, volume = {8744}, year = {2014}, } @article{2178, abstract = {We consider the three-state toric homogeneous Markov chain model (THMC) without loops and initial parameters. At time T, the size of the design matrix is 6 × 3 · 2T-1 and the convex hull of its columns is the model polytope. We study the behavior of this polytope for T ≥ 3 and we show that it is defined by 24 facets for all T ≥ 5. Moreover, we give a complete description of these facets. From this, we deduce that the toric ideal associated with the design matrix is generated by binomials of degree at most 6. Our proof is based on a result due to Sturmfels, who gave a bound on the degree of the generators of a toric ideal, provided the normality of the corresponding toric variety. In our setting, we established the normality of the toric variety associated to the THMC model by studying the geometric properties of the model polytope.}, author = {Haws, David and Martin Del Campo Sanchez, Abraham and Takemura, Akimichi and Yoshida, Ruriko}, journal = {Beitrage zur Algebra und Geometrie}, number = {1}, pages = {161 -- 188}, publisher = {Springer}, title = {{Markov degree of the three-state toric homogeneous Markov chain model}}, doi = {10.1007/s13366-013-0178-y}, volume = {55}, year = {2014}, } @unpublished{2012, abstract = {The classical sphere packing problem asks for the best (infinite) arrangement of non-overlapping unit balls which cover as much space as possible. We define a generalized version of the problem, where we allow each ball a limited amount of overlap with other balls. We study two natural choices of overlap measures and obtain the optimal lattice packings in a parameterized family of lattices which contains the FCC, BCC, and integer lattice.}, author = {Iglesias Ham, Mabel and Kerber, Michael and Uhler, Caroline}, booktitle = {arXiv}, title = {{Sphere packing with limited overlap}}, doi = {10.48550/arXiv.1401.0468}, year = {2014}, } @article{2010, abstract = {Many algorithms for inferring causality rely heavily on the faithfulness assumption. The main justification for imposing this assumption is that the set of unfaithful distributions has Lebesgue measure zero, since it can be seen as a collection of hypersurfaces in a hypercube. However, due to sampling error the faithfulness condition alone is not sufficient for statistical estimation, and strong-faithfulness has been proposed and assumed to achieve uniform or high-dimensional consistency. In contrast to the plain faithfulness assumption, the set of distributions that is not strong-faithful has nonzero Lebesgue measure and in fact, can be surprisingly large as we show in this paper. We study the strong-faithfulness condition from a geometric and combinatorial point of view and give upper and lower bounds on the Lebesgue measure of strong-faithful distributions for various classes of directed acyclic graphs. Our results imply fundamental limitations for the PC-algorithm and potentially also for other algorithms based on partial correlation testing in the Gaussian case.}, author = {Uhler, Caroline and Raskutti, Garvesh and Bühlmann, Peter and Yu, Bin}, journal = {The Annals of Statistics}, number = {2}, pages = {436 -- 463}, publisher = {Institute of Mathematical Statistics}, title = {{Geometry of the faithfulness assumption in causal inference}}, doi = {10.1214/12-AOS1080}, volume = {41}, year = {2013}, } @article{2009, abstract = {Traditional statistical methods for confidentiality protection of statistical databases do not scale well to deal with GWAS databases especially in terms of guarantees regarding protection from linkage to external information. The more recent concept of differential privacy, introduced by the cryptographic community, is an approach which provides a rigorous definition of privacy with meaningful privacy guarantees in the presence of arbitrary external information, although the guarantees may come at a serious price in terms of data utility. Building on such notions, we propose new methods to release aggregate GWAS data without compromising an individual’s privacy. We present methods for releasing differentially private minor allele frequencies, chi-square statistics and p-values. We compare these approaches on simulated data and on a GWAS study of canine hair length involving 685 dogs. We also propose a privacy-preserving method for finding genome-wide associations based on a differentially-private approach to penalized logistic regression.}, author = {Uhler, Caroline and Slavkovic, Aleksandra and Fienberg, Stephen}, journal = {Journal of Privacy and Confidentiality }, number = {1}, pages = {137 -- 166}, publisher = {Carnegie Mellon University}, title = {{Privacy-preserving data sharing for genome-wide association studies}}, doi = {10.29012/jpc.v5i1.629}, volume = {5}, year = {2013}, } @article{2280, abstract = {The problem of packing ellipsoids of different sizes and shapes into an ellipsoidal container so as to minimize a measure of overlap between ellipsoids is considered. A bilevel optimization formulation is given, together with an algorithm for the general case and a simpler algorithm for the special case in which all ellipsoids are in fact spheres. Convergence results are proved and computational experience is described and illustrated. The motivating application-chromosome organization in the human cell nucleus-is discussed briefly, and some illustrative results are presented.}, author = {Uhler, Caroline and Wright, Stephen}, journal = {SIAM Review}, number = {4}, pages = {671 -- 706}, publisher = {Society for Industrial and Applied Mathematics }, title = {{Packing ellipsoids with overlap}}, doi = {10.1137/120872309}, volume = {55}, year = {2013}, } @article{2959, abstract = {We study maximum likelihood estimation in Gaussian graphical models from a geometric point of view. An algebraic elimination criterion allows us to find exact lower bounds on the number of observations needed to ensure that the maximum likelihood estimator (MLE) exists with probability one. This is applied to bipartite graphs, grids and colored graphs. We also study the ML degree, and we present the first instance of a graph for which the MLE exists with probability one, even when the number of observations equals the treewidth.}, author = {Uhler, Caroline}, journal = {Annals of Statistics}, number = {1}, pages = {238 -- 261}, publisher = {Institute of Mathematical Statistics}, title = {{Geometry of maximum likelihood estimation in Gaussian graphical models}}, doi = {10.1214/11-AOS957}, volume = {40}, year = {2012}, }