@comment{
  Review notes for entry a6006cfd24674571a9d9b34a8d6cfde9 (exported record, cleaned by hand):
  - title: subtitle separator and title casing restored; the abstract refers to the
    companion book as Statistics is Easy, which fixes where the main title ends.
  - author: all names are given in the unambiguous Last, First form.
  - booktitle repeats the series name verbatim; TODO confirm whether a distinct
    container title was intended.
  - number and edition are both 3; TODO confirm that edition really is the third
    edition and not a copy of the series issue number.
  - The copyright holder named in the note differs from the publisher field;
    TODO verify against the publisher record.
}
@inbook{a6006cfd24674571a9d9b34a8d6cfde9,
  author    = {Katari, Manpreet Singh and Tyagi, Sudarshini and Shasha, Dennis},
  title     = {Statistics is Easy: Case Studies on Real Scientific Datasets},
  booktitle = {Synthesis Lectures on Mathematics and Statistics},
  series    = {Synthesis Lectures on Mathematics and Statistics},
  number    = {3},
  edition   = {3},
  pages     = {1--73},
  publisher = {Morgan and Claypool Publishers},
  address   = {United States},
  year      = {2021},
  month     = apr,
  day       = {7},
  language  = {English (US)},
  keywords  = {Case studies, Data cleaning, Machine learning, Nonparametric statistics, Null value imputation, Scientific data},
  abstract  = {Computational analysis of natural science experiments often confronts noisy data due to natural variability in environment or measurement. Drawing conclusions in the face of such noise entails a statistical analysis. Parametric statistical methods assume that the data is a sample from a population that can be characterized by a specific distribution (e.g., a normal distribution). When the assumption is true, parametric approaches can lead to high confidence predictions. However, in many cases particular distribution assumptions do not hold. In that case, assuming a distribution may yield false conclusions. The companion book Statistics is Easy, gave a (nearly) equation-free introduction to nonparametric (i.e., no distribution assumption) statistical methods. The present book applies data preparation, machine learning, and nonparametric statistics to three quite different life science datasets. We provide the code as applied to each dataset in both R and Python 3. We also include exercises for self-study or classroom use.},
  note      = {Funding Information: Shasha has been partially supported by NIH 1R01GM121753-01A1 the U.S. National Science Foundation under grants MCB-1412232 and IOS-1339362 and MCB-0929339. Katari has been partially supported by NIH-NIGMS: 1 R01 GM121753-01 and DOE-BER: DE-SC0014377. This support is greatly appreciated. Publisher Copyright: {\textcopyright} 2020 Lippincott Williams and Wilkins. All rights reserved.},
}