1a:[[["$","script",null,{"type":"application/ld+json","dangerouslySetInnerHTML":{"__html":"{\"@context\":\"https://schema.org\",\"@type\":\"BreadcrumbList\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"All Study Guides\",\"item\":\"https://library.fiveable.me\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"Experimental Design\",\"item\":\"https://library.fiveable.me/experimental-design\"},{\"@type\":\"ListItem\",\"position\":3,\"name\":\"Unit 6 – Analysis Of Variance (ANOVA) Study Guides\",\"item\":\"https://library.fiveable.me/experimental-design/unit-6?q=study-guides\"},{\"@type\":\"ListItem\",\"position\":4,\"name\":\"Topic: 6.4\"}]}"}}]],["$","$L1b",null,{"initialReduxState":{"initialToc":{"units":[{"id":"iA2uesFTUGLgpseU","name":"Unit 1 – Introduction to Experimental Design","emoji":"📚","slug":"unit-1","hasResources":true,"resources":[{"id":"t8JQRQ0jW41TO6Vv","title":"1.1 Fundamentals of scientific method and experimentation","slug":"fundamentals-scientific-method-experimentation","type":"STUDY_GUIDE","date":null},{"id":"QZCSdDgVjjWs74Ct","title":"1.2 Historical perspective on experimental design","slug":"historical-perspective-experimental-design","type":"STUDY_GUIDE","date":null},{"id":"iKNy4skfmjBmXBOe","title":"1.3 Types of variables and their roles in experiments","slug":"types-variables-roles-experiments","type":"STUDY_GUIDE","date":null},{"id":"YINngz7x7lMt9Blf","title":"1.4 Importance of experimental design in research","slug":"importance-experimental-design-research","type":"STUDY_GUIDE","date":null}]},{"id":"3mVDpiHue9jAQ253","name":"Unit 2 – Principles of Experimental Design","emoji":"📚","slug":"unit-2","hasResources":true,"resources":[{"id":"4urivQ0hyvEgbaFT","title":"2.3 Bias and confounding variables","slug":"bias-confounding-variables","type":"STUDY_GUIDE","date":null},{"id":"iflBTr5TWimgzSob","title":"2.4 Experimental validity (internal and external)","slug":"experimental-validity-internal-external","type":"STUDY_GUIDE","date":null},{"id":"dj7Qxpc6NNlabYBv","title":"2.2 Experimental units and sampling techniques","slug":"experimental-units-sampling-techniques","type":"STUDY_GUIDE","date":null},{"id":"vIxW7WpYfRK9vDp0","title":"2.1 Replication, randomization, and local control","slug":"replication-randomization-local-control","type":"STUDY_GUIDE","date":null}]},{"id":"A1vH8NwymBXRHEvV","name":"Unit 3 – Randomization Techniques","emoji":"📚","slug":"unit-3","hasResources":true,"resources":[{"id":"gGnaMfZwHvcklVOt","title":"3.2 Stratified random sampling","slug":"stratified-random-sampling","type":"STUDY_GUIDE","date":null},{"id":"xWqmWA9kFg6QRIck","title":"3.3 Cluster sampling and systematic sampling","slug":"cluster-sampling-systematic-sampling","type":"STUDY_GUIDE","date":null},{"id":"Y6SDZWIfEEV2fdds","title":"3.4 Randomization in practice: methods and tools","slug":"randomization-practice-methods-tools","type":"STUDY_GUIDE","date":null},{"id":"ZYeHKub1RiyaLwY8","title":"3.1 Simple random sampling","slug":"simple-random-sampling","type":"STUDY_GUIDE","date":null}]},{"id":"U3RtoNW3k3bZREZj","name":"Unit 4 – Factorial Designs","emoji":"📚","slug":"unit-4","hasResources":true,"resources":[{"id":"WE0dGBdwZMo8dAsh","title":"4.1 Two-factor factorial designs","slug":"two-factor-factorial-designs","type":"STUDY_GUIDE","date":null},{"id":"Xz41WLyV6eIkDOtE","title":"4.2 Higher-order factorial designs","slug":"higher-order-factorial-designs","type":"STUDY_GUIDE","date":null},{"id":"9Hilbjc4aEiYbhKF","title":"4.3 Main effects and interactions","slug":"main-effects-interactions","type":"STUDY_GUIDE","date":null},{"id":"mBXAcVPXmJBqz2UX","title":"4.4 Fractional factorial designs","slug":"fractional-factorial-designs","type":"STUDY_GUIDE","date":null}]},{"id":"cZ8wtKJBydlRlTFK","name":"Unit 5 – Blocking and Confounding","emoji":"📚","slug":"unit-5","hasResources":true,"resources":[{"id":"9bxFr3Roj88rAoJB","title":"5.1 Principles of blocking","slug":"principles-blocking","type":"STUDY_GUIDE","date":null},{"id":"1x0ymRVIqTaJUmYf","title":"5.2 Randomized complete block designs","slug":"randomized-complete-block-designs","type":"STUDY_GUIDE","date":null},{"id":"reR6bieGMRfYfuiE","title":"5.3 Latin square and Graeco-Latin square designs","slug":"latin-square-graeco-latin-square-designs","type":"STUDY_GUIDE","date":null},{"id":"9k7XZWXBClXuM3vG","title":"5.4 Confounding in factorial experiments","slug":"confounding-factorial-experiments","type":"STUDY_GUIDE","date":null}]},{"id":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","emoji":"📚","slug":"unit-6","hasResources":true,"resources":[{"id":"oO5NfvSqmH4AsbKN","title":"6.1 One-way ANOVA","slug":"one-way-anova","type":"STUDY_GUIDE","date":null},{"id":"0Lqbg6Q47lnTmiko","title":"6.2 Two-way ANOVA","slug":"two-way-anova","type":"STUDY_GUIDE","date":null},{"id":"L18Aw9UHrYsn4J29","title":"6.4 Assumptions and diagnostics for ANOVA","slug":"assumptions-diagnostics-anova","type":"STUDY_GUIDE","date":null},{"id":"mwehq4wy26ycGdG2","title":"6.3 Multifactor ANOVA","slug":"multifactor-anova","type":"STUDY_GUIDE","date":null}]},{"id":"A9bCi8OdM9i0ayuU","name":"Unit 7 – Statistical Power and Sample Size","emoji":"📚","slug":"unit-7","hasResources":true,"resources":[{"id":"HCLYvhOpM8wGXnQI","title":"7.1 Concepts of statistical power and effect size","slug":"concepts-statistical-power-effect-size","type":"STUDY_GUIDE","date":null},{"id":"W18kaCqTU0CM05ZZ","title":"7.2 Power analysis for different experimental designs","slug":"power-analysis-experimental-designs","type":"STUDY_GUIDE","date":null},{"id":"WzzDYAj1emuk4A9h","title":"7.3 Sample size calculation techniques","slug":"sample-size-calculation-techniques","type":"STUDY_GUIDE","date":null},{"id":"h4ukRDZpb3AEBIJn","title":"7.4 Trade-offs between power, sample size, and effect size","slug":"trade-offs-power-sample-size-effect-size","type":"STUDY_GUIDE","date":null}]},{"id":"1cvyYYPw1igkv41P","name":"Unit 8 – Split–Plot Designs","emoji":"📚","slug":"unit-8","hasResources":true,"resources":[{"id":"oIYOEnHj9hcGTfs5","title":"8.1 Principles of split-plot designs","slug":"principles-split-plot-designs","type":"STUDY_GUIDE","date":null},{"id":"P02eGA1IEX2WtTrv","title":"8.2 Analysis of split-plot experiments","slug":"analysis-split-plot-experiments","type":"STUDY_GUIDE","date":null},{"id":"cbgDMBbS9A27x3Yv","title":"8.4 Applications and limitations of split-plot designs","slug":"applications-limitations-split-plot-designs","type":"STUDY_GUIDE","date":null},{"id":"XwYcBW4wbIHs0zc0","title":"8.3 Split-split plot designs","slug":"split-split-plot-designs","type":"STUDY_GUIDE","date":null}]},{"id":"YZAcKIK3gA9QzbP3","name":"Unit 9 – Repeated Measures Designs","emoji":"📚","slug":"unit-9","hasResources":true,"resources":[{"id":"0rgNjiLL0grXjYHZ","title":"9.2 Between-subjects and within-subjects factors","slug":"between-subjects-within-subjects-factors","type":"STUDY_GUIDE","date":null},{"id":"qQU75Emt0wrKHm3h","title":"9.3 Analysis of repeated measures data","slug":"analysis-repeated-measures-data","type":"STUDY_GUIDE","date":null},{"id":"szM39nC3JyBaJFUc","title":"9.1 Fundamentals of repeated measures experiments","slug":"fundamentals-repeated-measures-experiments","type":"STUDY_GUIDE","date":null},{"id":"q0KhaZ92DrEtICET","title":"9.4 Handling missing data in repeated measures designs","slug":"handling-missing-data-repeated-measures-designs","type":"STUDY_GUIDE","date":null}]},{"id":"y2VEHrae1DqTze66","name":"Unit 10 – Response Surface Methodology","emoji":"📚","slug":"unit-10","hasResources":true,"resources":[{"id":"fiJBI8xrag8MxiNq","title":"10.2 First-order and second-order models","slug":"first-order-second-order-models","type":"STUDY_GUIDE","date":null},{"id":"q9IiCikLenSFfGN3","title":"10.1 Introduction to response surface designs","slug":"introduction-response-surface-designs","type":"STUDY_GUIDE","date":null},{"id":"1Pp7AJO4IRhGv2Ix","title":"10.4 Optimization techniques in response surface methodology","slug":"optimization-techniques-response-surface-methodology","type":"STUDY_GUIDE","date":null},{"id":"8yDKaI6k7DhHiR0L","title":"10.3 Central composite and Box-Behnken designs","slug":"central-composite-box-behnken-designs","type":"STUDY_GUIDE","date":null}]},{"id":"xaHDl0vzqzQytXXM","name":"Unit 11 – Designing Experiments for Analysis","emoji":"📚","slug":"unit-11","hasResources":true,"resources":[{"id":"9nvXsFlhY7MdoiSe","title":"11.2 Experimental design for regression analysis","slug":"experimental-design-regression-analysis","type":"STUDY_GUIDE","date":null},{"id":"yitbOl6RjXATqmGJ","title":"11.4 Bayesian approaches to experimental design","slug":"bayesian-approaches-experimental-design","type":"STUDY_GUIDE","date":null},{"id":"7kWNKi0GYQyGkEwo","title":"11.3 Designing experiments for non-parametric tests","slug":"designing-experiments-non-parametric-tests","type":"STUDY_GUIDE","date":null},{"id":"y7KKUeScH22364X1","title":"11.1 Choosing appropriate statistical tests","slug":"choosing-statistical-tests","type":"STUDY_GUIDE","date":null}]},{"id":"a6CutZV1R8FHiyXu","name":"Unit 12 – Interpreting Results & Drawing Conclusions","emoji":"📚","slug":"unit-12","hasResources":true,"resources":[{"id":"B1YTuE2olszq67i6","title":"12.3 Effect size interpretation and practical significance","slug":"effect-size-interpretation-practical-significance","type":"STUDY_GUIDE","date":null},{"id":"4wh5p53AlfHxJsqO","title":"12.4 Limitations and generalizability of experimental results","slug":"limitations-generalizability-experimental-results","type":"STUDY_GUIDE","date":null},{"id":"VsVZV4OfoTSssNIK","title":"12.1 Statistical inference and hypothesis testing","slug":"statistical-inference-hypothesis-testing","type":"STUDY_GUIDE","date":null},{"id":"ejQHVwPTrz04MHvZ","title":"12.2 Multiple comparisons and post-hoc tests","slug":"multiple-comparisons-post-hoc-tests","type":"STUDY_GUIDE","date":null}]},{"id":"roABkStwkw6YnHlS","name":"Unit 13 – Contemporary Issues in Experimental Design","emoji":"📚","slug":"unit-13","hasResources":true,"resources":[{"id":"UmSC1z6DtdRXKnN5","title":"13.4 Machine learning approaches in experimental design","slug":"machine-learning-approaches-experimental-design","type":"STUDY_GUIDE","date":null},{"id":"nKglpmUvpusG3h9i","title":"13.2 Reproducibility crisis and solutions","slug":"reproducibility-crisis-solutions","type":"STUDY_GUIDE","date":null},{"id":"zLLywsRZ8YtwnMC2","title":"13.3 Big data and high-dimensional experiments","slug":"big-data-high-dimensional-experiments","type":"STUDY_GUIDE","date":null},{"id":"rSGfFiBNg5pNgmug","title":"13.1 Ethical considerations in experimental research","slug":"ethical-considerations-experimental-research","type":"STUDY_GUIDE","date":null}]},{"id":"ihOO4Amp468JnBaj","name":"Unit 14 – Adaptive Designs","emoji":"📚","slug":"unit-14","hasResources":true,"resources":[{"id":"wyKcszFQtBXh1d6A","title":"14.1 Principles of adaptive experimental designs","slug":"principles-adaptive-experimental-designs","type":"STUDY_GUIDE","date":null},{"id":"KEyU7X82K60kEOH8","title":"14.2 Sequential and group sequential designs","slug":"sequential-group-sequential-designs","type":"STUDY_GUIDE","date":null},{"id":"9c08Y4coKXj0GOjO","title":"14.3 Sample size re-estimation methods","slug":"sample-size-re-estimation-methods","type":"STUDY_GUIDE","date":null},{"id":"1Vdv8UchzucUYSRi","title":"14.4 Applications of adaptive designs in clinical trials","slug":"applications-adaptive-designs-clinical-trials","type":"STUDY_GUIDE","date":null}]},{"id":"zhhlIIekmTz76GaB","name":"Unit 15 – Optimal Design Theory","emoji":"📚","slug":"unit-15","hasResources":true,"resources":[{"id":"AvvUCe8w6phXKuyA","title":"15.2 Alphabetic optimality criteria (A, D, E, G-optimality)","slug":"alphabetic-optimality-criteria-a-d-e-g-optimality","type":"STUDY_GUIDE","date":null},{"id":"mnHHCcSOhQaf2jU8","title":"15.1 Fundamentals of optimal design theory","slug":"fundamentals-optimal-design-theory","type":"STUDY_GUIDE","date":null},{"id":"yHLFIKBMsNCa1S1w","title":"15.3 Computer-aided optimal design generation","slug":"computer-aided-optimal-design-generation","type":"STUDY_GUIDE","date":null},{"id":"mJrxlf8sDYA6X1TO","title":"15.4 Robust optimal designs","slug":"robust-optimal-designs","type":"STUDY_GUIDE","date":null}]}],"activeUnit":{"id":"OGPAb8FIJ0ehgGEY","publicId":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","order":6,"slug":"unit-6","description":"Unit 6 – Analysis of Variance (ANOVA)","h1":null,"active":true,"emoji":"📚","hasResources":true}},"keyTerms":{"keyTerms":[{"_id":"66c15dec31bf7f01700a5315","slug":"r","subjectSlug":"experimental-design","term":"r","definition":"In statistical analysis, 'r' typically represents the correlation coefficient, a measure that describes the strength and direction of a relationship between two variables. Understanding 'r' is crucial for assessing relationships in various designs, including experimental and observational studies, influencing how data is interpreted across multiple contexts.","shortDefinition":null,"relatedTerms":[{"term":"Correlation","definition":"A statistical technique used to determine the degree to which two variables move in relation to each other.","keyTermSlug":null},{"term":"Regression Analysis","definition":"A statistical method used to model and analyze the relationships between a dependent variable and one or more independent variables.","keyTermSlug":null},{"term":"Effect Size","definition":"A quantitative measure of the magnitude of a phenomenon or the strength of an effect in a statistical analysis.","keyTermSlug":null}],"parents":[{"id":"q0KhaZ92DrEtICET","type":"content"},{"id":"qQU75Emt0wrKHm3h","type":"content"},{"id":"mBXAcVPXmJBqz2UX","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"zLLywsRZ8YtwnMC2","type":"content"},{"id":"oO5NfvSqmH4AsbKN","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15dec0c3319858544d736","slug":"p-value","subjectSlug":"experimental-design","term":"p-value","definition":"A p-value is a statistical measure that helps determine the significance of results obtained in hypothesis testing. It indicates the probability of observing data at least as extreme as the sample data, assuming the null hypothesis is true. Understanding p-values is crucial as they help researchers make decisions about rejecting or failing to reject the null hypothesis, and they are foundational to various statistical methods and analyses.","shortDefinition":null,"relatedTerms":[{"term":"Null Hypothesis","definition":"A statement asserting that there is no effect or no difference, which researchers aim to test against in hypothesis testing.","keyTermSlug":null},{"term":"Type I Error","definition":"The error that occurs when a true null hypothesis is incorrectly rejected, leading to a false positive result.","keyTermSlug":null},{"term":"Statistical Significance","definition":"A determination that an observed effect or relationship in data is unlikely to have occurred by random chance alone, often indicated by a low p-value.","keyTermSlug":null}],"parents":[{"id":"t8JQRQ0jW41TO6Vv","type":"content"},{"id":"B1YTuE2olszq67i6","type":"content"},{"id":"VsVZV4OfoTSssNIK","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"oO5NfvSqmH4AsbKN","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15eb30c3319858544dcbc","slug":"eta-squared","subjectSlug":"experimental-design","term":"eta squared","definition":"Eta squared is a measure of effect size that indicates the proportion of total variance in a dependent variable that can be attributed to a particular independent variable or factor. This statistic helps researchers understand the strength of relationships and the impact of different variables in analyses, especially within the context of ANOVA, power calculations, and assessing practical significance.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"ANOVA stands for Analysis of Variance, a statistical method used to test differences between two or more group means.","keyTermSlug":null},{"term":"Effect Size","definition":"Effect size is a quantitative measure of the magnitude of a phenomenon or the strength of a relationship between variables.","keyTermSlug":null},{"term":"Statistical Power","definition":"Statistical power is the probability that a statistical test will correctly reject a false null hypothesis, often influenced by sample size and effect size.","keyTermSlug":null}],"parents":[{"id":"HCLYvhOpM8wGXnQI","type":"content"},{"id":"B1YTuE2olszq67i6","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15eb0a66f65e044c64943","slug":"effect-size","subjectSlug":"experimental-design","term":"Effect Size","definition":"Effect size is a quantitative measure that reflects the magnitude of a treatment effect or the strength of a relationship between variables in a study. It helps in understanding the practical significance of research findings beyond just statistical significance, offering insights into the size of differences or relationships observed.","shortDefinition":null,"relatedTerms":[{"term":"Cohen's d","definition":"A commonly used measure of effect size that calculates the difference between two means divided by the pooled standard deviation, indicating how far apart the two groups are in standard deviation units.","keyTermSlug":null},{"term":"Eta-squared","definition":"A measure of effect size used in the context of ANOVA, representing the proportion of total variance in the dependent variable that is attributed to a factor.","keyTermSlug":null},{"term":"Statistical Power","definition":"The probability that a statistical test will correctly reject a null hypothesis when it is false, which is influenced by sample size, effect size, and significance level.","keyTermSlug":null}],"parents":[{"id":"W18kaCqTU0CM05ZZ","type":"content"},{"id":"HCLYvhOpM8wGXnQI","type":"content"},{"id":"7kWNKi0GYQyGkEwo","type":"content"},{"id":"9c08Y4coKXj0GOjO","type":"content"},{"id":"WzzDYAj1emuk4A9h","type":"content"},{"id":"VsVZV4OfoTSssNIK","type":"content"},{"id":"iflBTr5TWimgzSob","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"h4ukRDZpb3AEBIJn","type":"content"},{"id":"vIxW7WpYfRK9vDp0","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"9Hilbjc4aEiYbhKF","type":"content"},{"id":"oO5NfvSqmH4AsbKN","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"},{"id":"0rgNjiLL0grXjYHZ","type":"content"}]},{"_id":"66c15eb90946f59b838b65c2","slug":"cohens-d","subjectSlug":"experimental-design","term":"Cohen's d","definition":"Cohen's d is a measure of effect size that quantifies the difference between two group means in standard deviation units. It provides insight into the magnitude of an effect, allowing researchers to understand how meaningful their findings are beyond just statistical significance. This measure connects deeply with concepts like statistical power, sample size, and practical significance, making it vital for analyzing research outcomes effectively.","shortDefinition":null,"relatedTerms":[{"term":"Effect Size","definition":"A quantitative measure that describes the strength of a relationship or the magnitude of an effect in research, helping to determine practical significance.","keyTermSlug":null},{"term":"Statistical Power","definition":"The probability that a statistical test will correctly reject a false null hypothesis, often influenced by sample size and effect size.","keyTermSlug":null},{"term":"ANOVA","definition":"Analysis of Variance, a statistical method used to compare means among three or more groups to determine if at least one group mean is significantly different.","keyTermSlug":null}],"parents":[{"id":"HCLYvhOpM8wGXnQI","type":"content"},{"id":"B1YTuE2olszq67i6","type":"content"},{"id":"WzzDYAj1emuk4A9h","type":"content"},{"id":"VsVZV4OfoTSssNIK","type":"content"},{"id":"h4ukRDZpb3AEBIJn","type":"content"},{"id":"nKglpmUvpusG3h9i","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ebd2965e1696c1ef646","slug":"sas","subjectSlug":"experimental-design","term":"SAS","definition":"SAS stands for Statistical Analysis System, a software suite used for advanced analytics, business intelligence, and data management. It is commonly employed to perform various statistical analyses, including ANOVA and repeated measures designs, allowing researchers to evaluate data integrity and handle complex datasets effectively.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"Analysis of Variance, a statistical method used to test differences between two or more group means.","keyTermSlug":null},{"term":"Imputation","definition":"A statistical technique used to replace missing data with substituted values to maintain the integrity of analysis.","keyTermSlug":null},{"term":"Data Diagnostics","definition":"Procedures and methods used to assess the quality and validity of data before conducting statistical analyses.","keyTermSlug":null}],"parents":[{"id":"q0KhaZ92DrEtICET","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec04a470781133306dc","slug":"durbin-watson-statistic","subjectSlug":"experimental-design","term":"Durbin-Watson Statistic","definition":"The Durbin-Watson statistic is a test statistic used to detect the presence of autocorrelation in the residuals from a regression analysis. Specifically, it helps to assess whether the residuals are correlated across time or space, which can violate key assumptions in statistical modeling, such as independence. This statistic ranges from 0 to 4, with values around 2 indicating no autocorrelation, values less than 2 suggesting positive autocorrelation, and values greater than 2 suggesting negative autocorrelation.","shortDefinition":null,"relatedTerms":[{"term":"Autocorrelation","definition":"A statistical phenomenon where residuals from a regression model are correlated with each other over time or space.","keyTermSlug":null},{"term":"Residuals","definition":"The differences between observed values and the values predicted by a regression model.","keyTermSlug":null},{"term":"Assumptions of Regression","definition":"Key conditions that must be met for the results of regression analysis to be valid, including linearity, independence, homoscedasticity, and normality of residuals.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec04a470781133306d5","slug":"levenes-test","subjectSlug":"experimental-design","term":"Levene's Test","definition":"Levene's Test is a statistical procedure used to assess the equality of variances across groups. It plays a crucial role in validating one of the key assumptions of ANOVA, which is that the variances among different groups being compared are approximately equal. By checking this assumption, researchers can ensure that their results are more reliable and that the conclusions drawn from an ANOVA analysis are valid.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"Analysis of Variance (ANOVA) is a statistical method used to compare means among three or more groups to determine if at least one group mean is significantly different from the others.","keyTermSlug":null},{"term":"Homogeneity of Variance","definition":"The assumption that different samples have the same variance, which is essential for the validity of ANOVA results.","keyTermSlug":null},{"term":"F-test","definition":"A statistical test used to compare the variances of two or more groups to determine if they are significantly different from each other.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec02965e1696c1ef656","slug":"square-root-transformation","subjectSlug":"experimental-design","term":"square root transformation","definition":"A square root transformation is a statistical technique used to stabilize variance and make data more normally distributed by applying the square root function to each data point. This method is particularly useful when dealing with count data or datasets exhibiting heteroscedasticity, as it helps meet the assumptions required for analysis of variance (ANOVA). By reducing the influence of larger values, this transformation improves the reliability of statistical tests and enhances interpretability.","shortDefinition":null,"relatedTerms":[{"term":"Heteroscedasticity","definition":"A condition in which the variance of errors varies across observations, often violating the assumptions of linear regression models.","keyTermSlug":null},{"term":"Normality","definition":"The assumption that the residuals of a model are normally distributed, which is crucial for the validity of many statistical tests.","keyTermSlug":null},{"term":"Variance Stabilization","definition":"The process of transforming data to achieve constant variance across levels of an independent variable, enhancing the robustness of statistical analyses.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec10946f59b838b6611","slug":"repeated-measures-anova","subjectSlug":"experimental-design","term":"repeated measures ANOVA","definition":"Repeated measures ANOVA is a statistical method used to compare means across multiple groups when the same subjects are measured under different conditions or over time. This approach is particularly useful for analyzing data where the same participants are involved in all treatments, allowing researchers to account for individual differences and reduce the error variance associated with those differences.","shortDefinition":null,"relatedTerms":[{"term":"Within-Subject Design","definition":"A research design where the same subjects are exposed to all levels of the independent variable, allowing for direct comparisons within individuals.","keyTermSlug":null},{"term":"Sphericity","definition":"An assumption of repeated measures ANOVA that states the variances of the differences between all combinations of related groups should be equal.","keyTermSlug":null},{"term":"Post Hoc Tests","definition":"Statistical tests conducted after an ANOVA to determine which specific group means are significantly different from each other.","keyTermSlug":null}],"parents":[{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec031bf7f01700a589c","slug":"log-transformation","subjectSlug":"experimental-design","term":"log transformation","definition":"Log transformation is a mathematical operation that replaces each value in a dataset with its logarithm, typically using base 10 or the natural logarithm (base e). This technique is particularly useful in statistical analysis to stabilize variance, make data more normally distributed, and meet the assumptions required for various statistical tests like ANOVA.","shortDefinition":null,"relatedTerms":[{"term":"Variance Stabilization","definition":"A process used in statistics to make the variability of a dataset more consistent across different levels of an independent variable.","keyTermSlug":null},{"term":"Normal Distribution","definition":"A probability distribution that is symmetric about the mean, showing that data near the mean are more frequent in occurrence than data far from the mean.","keyTermSlug":null},{"term":"ANOVA (Analysis of Variance)","definition":"A statistical method used to compare means among three or more groups to determine if at least one group mean is significantly different from the others.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec00c3319858544dce1","slug":"f-statistic","subjectSlug":"experimental-design","term":"f-statistic","definition":"The f-statistic is a ratio that compares the variance between group means to the variance within groups in ANOVA (Analysis of Variance). It helps determine if there are statistically significant differences between the means of three or more groups. A higher f-statistic indicates a greater disparity among group means relative to the variability within each group, suggesting that at least one group mean is different from the others.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"ANOVA stands for Analysis of Variance, a statistical method used to compare means among three or more groups to see if at least one differs significantly.","keyTermSlug":null},{"term":"Mean Square","definition":"Mean Square is a measure of variance calculated by dividing the sum of squares by the degrees of freedom, used in the computation of the f-statistic.","keyTermSlug":null},{"term":"Null Hypothesis","definition":"The null hypothesis states that there is no effect or difference; in ANOVA, it asserts that all group means are equal.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec831bf7f01700a58cd","slug":"independence-of-observations","subjectSlug":"experimental-design","term":"independence of observations","definition":"Independence of observations means that the data collected from different subjects or experimental units are not influenced by each other. This concept is critical for ensuring the validity of statistical analyses, as violations can lead to biased results and incorrect conclusions. In statistical methods like ANOVA and multifactor ANOVA, this assumption must hold true to accurately assess group differences and interactions among factors.","shortDefinition":null,"relatedTerms":[{"term":"Random Sampling","definition":"The process of selecting a sample from a population in such a way that every individual has an equal chance of being chosen, helping to ensure independence among observations.","keyTermSlug":null},{"term":"Homogeneity of Variance","definition":"The assumption that different groups have similar variances, which works in conjunction with independence of observations in statistical analyses.","keyTermSlug":null},{"term":"Repeated Measures","definition":"A design where the same subjects are used for multiple measurements, which can introduce dependence among observations if not properly accounted for.","keyTermSlug":null}],"parents":[{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec5a66f65e044c649ca","slug":"shapiro-wilk-test","subjectSlug":"experimental-design","term":"Shapiro-Wilk Test","definition":"The Shapiro-Wilk Test is a statistical test used to determine whether a given dataset is normally distributed. It's particularly useful in the context of ANOVA, as one of the key assumptions for ANOVA is that the data should be normally distributed within each group being compared. This test helps assess whether this assumption holds, allowing researchers to make valid inferences based on their data.","shortDefinition":null,"relatedTerms":[{"term":"Normal Distribution","definition":"A probability distribution that is symmetric about the mean, showing that data near the mean are more frequent in occurrence than data far from the mean.","keyTermSlug":null},{"term":"ANOVA Assumptions","definition":"Conditions that must be satisfied for ANOVA to produce valid results, including normality, homogeneity of variances, and independence of observations.","keyTermSlug":null},{"term":"P-Value","definition":"The probability of obtaining test results at least as extreme as the observed results, assuming that the null hypothesis is true.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec931bf7f01700a58db","slug":"one-way-anova","subjectSlug":"experimental-design","term":"one-way anova","definition":"One-way ANOVA (Analysis of Variance) is a statistical technique used to compare the means of three or more independent groups to determine if at least one group mean is statistically different from the others. This method is essential for analyzing experimental data and helps in understanding the impact of a single independent variable on a dependent variable while checking assumptions and diagnostics, calculating sample size, and selecting appropriate tests.","shortDefinition":null,"relatedTerms":[{"term":"Independent Variable","definition":"A variable that is manipulated or categorized in an experiment to observe its effect on a dependent variable.","keyTermSlug":null},{"term":"Post-hoc Tests","definition":"Statistical tests performed after an ANOVA to determine which specific group means are different when the ANOVA indicates significant differences.","keyTermSlug":null},{"term":"F-test","definition":"A statistical test used to compare the variances of two or more groups, which is the basis for conducting an ANOVA.","keyTermSlug":null}],"parents":[{"id":"WzzDYAj1emuk4A9h","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ed50c3319858544dd63","slug":"type-i-error","subjectSlug":"experimental-design","term":"Type I Error","definition":"A Type I error occurs when a null hypothesis is incorrectly rejected, leading to the conclusion that there is an effect or difference when none actually exists. This mistake can have serious implications in various statistical contexts, affecting the reliability of results and decision-making processes.","shortDefinition":null,"relatedTerms":[{"term":"Null Hypothesis","definition":"A statement that there is no effect or no difference, serving as the starting point for statistical testing.","keyTermSlug":null},{"term":"Significance Level","definition":"The probability of making a Type I error, commonly denoted as alpha (α), typically set at 0.05 or 0.01 in hypothesis testing.","keyTermSlug":null},{"term":"Type II Error","definition":"A Type II error occurs when a null hypothesis is not rejected when it is false, leading to the failure to detect an effect that is present.","keyTermSlug":null}],"parents":[{"id":"W18kaCqTU0CM05ZZ","type":"content"},{"id":"HCLYvhOpM8wGXnQI","type":"content"},{"id":"9c08Y4coKXj0GOjO","type":"content"},{"id":"VsVZV4OfoTSssNIK","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"h4ukRDZpb3AEBIJn","type":"content"},{"id":"ejQHVwPTrz04MHvZ","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"},{"id":"9k7XZWXBClXuM3vG","type":"content"}]},{"_id":"66c15ed6a66f65e044c64a3e","slug":"type-ii-error","subjectSlug":"experimental-design","term":"Type II Error","definition":"A Type II error occurs when a statistical test fails to reject a false null hypothesis, leading to the incorrect conclusion that there is no effect or difference when one actually exists. This concept is crucial as it relates to the sensitivity of tests, impacting the reliability of experimental results and interpretations.","shortDefinition":null,"relatedTerms":[{"term":"Null Hypothesis","definition":"The hypothesis stating that there is no effect or no difference, which researchers aim to test against.","keyTermSlug":null},{"term":"Statistical Power","definition":"The probability that a test correctly rejects a false null hypothesis, indicating its ability to detect an effect when one truly exists.","keyTermSlug":null},{"term":"Type I Error","definition":"The error that occurs when a true null hypothesis is incorrectly rejected, leading to a false positive result.","keyTermSlug":null}],"parents":[{"id":"W18kaCqTU0CM05ZZ","type":"content"},{"id":"HCLYvhOpM8wGXnQI","type":"content"},{"id":"9c08Y4coKXj0GOjO","type":"content"},{"id":"VsVZV4OfoTSssNIK","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"h4ukRDZpb3AEBIJn","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"},{"id":"9k7XZWXBClXuM3vG","type":"content"}]},{"_id":"66c15f0de7ad9f341d8d2b41","slug":"homogeneity-of-variance","subjectSlug":"experimental-design","term":"homogeneity of variance","definition":"Homogeneity of variance refers to the assumption that different groups in a statistical test have the same variance or spread in their data. This concept is crucial when performing analyses like ANOVA, as violating this assumption can lead to incorrect conclusions about the differences between groups. Ensuring homogeneity of variance helps validate the results and interpretations derived from statistical tests, making it a fundamental consideration when comparing multiple groups.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"Analysis of Variance, a statistical method used to compare means among three or more groups and determine if at least one group mean is statistically different from the others.","keyTermSlug":null},{"term":"Levene's Test","definition":"A statistical test used to assess the equality of variances across different groups, often employed before conducting ANOVA.","keyTermSlug":null},{"term":"Post-hoc tests","definition":"Statistical tests conducted after ANOVA to determine which specific group means are significantly different from one another.","keyTermSlug":null}],"parents":[{"id":"0Lqbg6Q47lnTmiko","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"ejQHVwPTrz04MHvZ","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15f0d2965e1696c1ef853","slug":"bonferroni-correction","subjectSlug":"experimental-design","term":"Bonferroni correction","definition":"The Bonferroni correction is a statistical method used to counteract the problem of multiple comparisons by adjusting the significance level when conducting multiple tests. By dividing the desired alpha level (e.g., 0.05) by the number of comparisons being made, it helps to reduce the likelihood of Type I errors, which occur when a true null hypothesis is incorrectly rejected. This adjustment is particularly relevant in analyses involving multiple groups or factors, ensuring that findings remain statistically valid.","shortDefinition":null,"relatedTerms":[{"term":"Type I error","definition":"The error that occurs when a true null hypothesis is incorrectly rejected, leading to a false positive result.","keyTermSlug":null},{"term":"ANOVA","definition":"Analysis of variance, a statistical method used to compare means among three or more groups to determine if at least one group mean is significantly different.","keyTermSlug":null},{"term":"Post-hoc tests","definition":"Statistical tests conducted after an ANOVA to determine which specific group means are different when the overall test indicates significance.","keyTermSlug":null}],"parents":[{"id":"0Lqbg6Q47lnTmiko","type":"content"},{"id":"ejQHVwPTrz04MHvZ","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15f100946f59b838b6843","slug":"tukeys-hsd","subjectSlug":"experimental-design","term":"Tukey's HSD","definition":"Tukey's HSD (Honestly Significant Difference) is a post-hoc test used to determine which specific group means are different after conducting an ANOVA. It helps in comparing all possible pairs of means while controlling the overall error rate, making it particularly useful in situations with multiple comparisons. This test provides a straightforward way to identify significant differences between groups when the initial analysis indicates that at least one group mean is significantly different from others.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"Analysis of Variance, a statistical method used to compare the means of three or more groups to see if at least one differs significantly.","keyTermSlug":null},{"term":"Post-hoc tests","definition":"Statistical tests conducted after an initial analysis to identify specific group differences when an overall effect is detected.","keyTermSlug":null},{"term":"Type I Error","definition":"The incorrect rejection of a true null hypothesis, which can occur more frequently when conducting multiple comparisons without proper adjustments.","keyTermSlug":null}],"parents":[{"id":"0Lqbg6Q47lnTmiko","type":"content"},{"id":"ejQHVwPTrz04MHvZ","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15f1db5d70b6a27b76dbb","slug":"spss","subjectSlug":"experimental-design","term":"SPSS","definition":"SPSS, which stands for Statistical Package for the Social Sciences, is a software program widely used for statistical analysis and data management. It provides tools for performing complex statistical analyses, including various types of ANOVA, handling repeated measures data, and addressing issues like missing data, making it essential for researchers and students in fields that require robust data analysis.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"Analysis of Variance (ANOVA) is a statistical method used to test differences between two or more group means.","keyTermSlug":null},{"term":"Data Management","definition":"The process of collecting, organizing, and maintaining data to ensure its accuracy and accessibility for analysis.","keyTermSlug":null},{"term":"Missing Data","definition":"Refers to the absence of data points in a dataset, which can occur for various reasons and needs to be managed appropriately during analysis.","keyTermSlug":null}],"parents":[{"id":"q0KhaZ92DrEtICET","type":"content"},{"id":"qQU75Emt0wrKHm3h","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"oO5NfvSqmH4AsbKN","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15f1ee7ad9f341d8d2ba5","slug":"two-way-anova","subjectSlug":"experimental-design","term":"two-way ANOVA","definition":"Two-way ANOVA is a statistical test used to determine the effect of two independent variables on a dependent variable while also examining the interaction between the two independent variables. This method is particularly useful when researchers want to understand how different groups or conditions affect outcomes and whether these effects vary based on the levels of another factor. The analysis helps in understanding complex relationships and interactions that one-way ANOVA might miss.","shortDefinition":null,"relatedTerms":[{"term":"Interaction Effect","definition":"The effect that occurs when the influence of one independent variable on the dependent variable changes at different levels of another independent variable.","keyTermSlug":null},{"term":"Main Effect","definition":"The direct effect of an independent variable on the dependent variable, ignoring other independent variables.","keyTermSlug":null},{"term":"Post Hoc Tests","definition":"Statistical tests conducted after ANOVA to determine which specific group means are significantly different from each other.","keyTermSlug":null}],"parents":[{"id":"0Lqbg6Q47lnTmiko","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15f2b0c3319858544df4d","slug":"normality","subjectSlug":"experimental-design","term":"Normality","definition":"Normality refers to the assumption that the data being analyzed follows a normal distribution, which is a bell-shaped curve where most of the observations cluster around the central peak and probabilities for values further away from the mean taper off equally in both directions. This concept is crucial in many statistical methods, as violations of this assumption can lead to misleading results, especially when comparing means across groups or examining relationships between variables.","shortDefinition":null,"relatedTerms":[{"term":"Normal Distribution","definition":"A probability distribution that is symmetric about the mean, showing that data near the mean are more frequent in occurrence than data far from the mean.","keyTermSlug":null},{"term":"Central Limit Theorem","definition":"A statistical theory that states that the distribution of sample means approaches a normal distribution as the sample size increases, regardless of the shape of the population distribution.","keyTermSlug":null},{"term":"Skewness","definition":"A measure of the asymmetry of the probability distribution of a real-valued random variable, which indicates whether data points tend to be more spread out on one side of the mean.","keyTermSlug":null}],"parents":[{"id":"0Lqbg6Q47lnTmiko","type":"content"},{"id":"qQU75Emt0wrKHm3h","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"ejQHVwPTrz04MHvZ","type":"content"},{"id":"oO5NfvSqmH4AsbKN","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]}]},"pageData":{"subject":{"id":"experimental-design","name":"Experimental Design","keyTermsActive":null,"generationMetadata":{"group":"Group 7 – unit, topics, key terms","level":"college undergraduate","branch":"Math","duration":"one semester","subBranch":"Statistics","lengthVariant":"less text","model":"opus"}},"unit":{"id":"OGPAb8FIJ0ehgGEY","publicId":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","order":6,"slug":"unit-6","description":"Unit 6 – Analysis of Variance (ANOVA)","h1":null,"active":true,"emoji":"📚","hasResources":true},"topic":{"id":"vUSJY4IzncXPoDnf","name":"6.4 Assumptions and diagnostics for ANOVA","fullNumber":"6.4"},"content":{"id":"L18Aw9UHrYsn4J29","topics":[{"id":"vUSJY4IzncXPoDnf","name":"6.4 Assumptions and diagnostics for ANOVA","fullNumber":"6.4"}],"title":"6.4 Assumptions and diagnostics for ANOVA","desc":null,"summary":null,"type":"STUDY_GUIDE","slug":"assumptions-diagnostics-anova","date":null,"vimeoLiveLink":null,"url":null,"markdown":"ANOVA assumptions are crucial for valid results. Normality, homogeneity of variance, and independence must be checked. Violations can lead to incorrect conclusions, so it's important to assess these assumptions using visual and formal methods.\n\nDiagnostic tests help evaluate ANOVA assumptions. Residual plots and formal tests like Levene's and Shapiro-Wilk are used. If violations occur, data transformations or robust methods can address issues, ensuring reliable analysis and interpretation of results.\n\n## Assumptions\n### Normality and Its Assessment\n\n ###### ![fiveable_image_carousel](https://fiveable.me)\n\n- Normality assumes the residuals (differences between observed and predicted values) are normally distributed\n- Violations of normality can lead to inaccurate p-values and confidence intervals\n- Assess normality visually using Q-Q plots or histograms of residuals\n - Q-Q plots compare the distribution of residuals to a theoretical normal distribution\n - Histograms should show a bell-shaped curve for normally distributed residuals\n- Formally test normality using the Shapiro-Wilk test\n - Null hypothesis: residuals are normally distributed\n - P-value < 0.05 suggests a significant departure from normality\n\n### Homogeneity of Variance and Independence\n- Homogeneity of variance (homoscedasticity) assumes equal variances across groups\n - Violations (heteroscedasticity) can affect the validity of F-tests and lead to incorrect conclusions\n - Assess homogeneity visually using residual plots (residuals vs. fitted values)\n - Patterns or increasing/decreasing spread indicate heteroscedasticity\n - Formally test homogeneity using Levene's test\n - Null hypothesis: variances are equal across groups\n - P-value < 0.05 suggests significant differences in variances\n- Independence of observations assumes that observations within and between groups are not related\n - Violations can occur due to repeated measures, clustering, or spatial/temporal correlation\n - Assess independence by examining the study design and data collection process\n - Violations may require alternative models (repeated measures ANOVA, mixed models)\n\n## Diagnostic Tests\n### Residual Plots for Assessing Assumptions\n- Residual plots are graphical tools for assessing ANOVA assumptions\n- Residuals vs. Fitted plot\n - Assess homogeneity of variance\n - Look for patterns, increasing/decreasing spread, or outliers\n- Normal Q-Q plot\n - Assess normality of residuals\n - Compare residuals to a theoretical normal distribution\n - Deviations from a straight line indicate non-normality\n- Scale-Location plot\n - Assess homogeneity of variance\n - Look for patterns or increasing/decreasing spread\n- Residuals vs. Leverage plot\n - Identify influential observations\n - Points with high leverage and large residuals may have a strong influence on the model\n\n### Formal Tests for Assumptions\n- Levene's test for homogeneity of variance\n - Null hypothesis: variances are equal across groups\n - P-value < 0.05 suggests significant differences in variances\n - Robust to non-normality, but sensitive to large sample sizes\n- Shapiro-Wilk test for normality\n - Null hypothesis: residuals are normally distributed\n - P-value < 0.05 suggests a significant departure from normality\n - More powerful than visual assessment, but sensitive to large sample sizes\n - Alternative: Anderson-Darling test\n\n## Addressing Violations\n### Data Transformations\n- Transformations can help stabilize variances and improve normality\n- Common transformations: logarithmic, square root, reciprocal\n - Logarithmic: $log(x)$ or $log(x+1)$ for data with zero values\n - Square root: $\\sqrt{x}$ for data with a Poisson distribution\n - Reciprocal: $\\frac{1}{x}$ for data with a strong right skew\n- Choose a transformation based on the nature of the data and the severity of the violation\n- Interpret results on the transformed scale or back-transform for interpretation\n\n### Robust ANOVA Methods and Non-Parametric Alternatives\n- Robust ANOVA methods are less sensitive to violations of assumptions\n - Welch's ANOVA: does not assume equal variances\n - Trimmed means ANOVA: robust to non-normality and outliers\n - Bootstrapping: resampling method to obtain robust confidence intervals and p-values\n- Non-parametric alternatives do not rely on distributional assumptions\n - Kruskal-Wallis test: rank-based test for comparing medians across groups\n - Friedman test: rank-based test for repeated measures designs\n - Permutation tests: resampling method to obtain exact p-values\n- Consider the trade-offs between robustness and power when selecting an alternative method","cheatsheet":null,"publishDate":null,"updatedAt":"2024-08-07T06:24:41.137Z","status":"PUBLISHED","images":[{"url":"https://storage.googleapis.com/static.prod.fiveable.me/search-images%2F%22Normality_assessment_in_ANOVA%3A_Q-Q_plots_histograms_Shapiro-Wilk_test_residuals_distribution_visualizations%22-normality-1.png","description":"Chapter 16 Regression | Untitled","sourceUrl":"https://psyteachr.github.io/msc-conv/16-regression_files/figure-html/normality-1.png","hostUrl":"https://psyteachr.github.io/msc-conv/regression.html","altText":null,"sectionTitle":"Normality and Its Assessment","rank":2,"height":960,"width":1344,"displayWidth":672,"displayHeight":480,"contentId":"66b31329d9be6c5c04e0aa8c","subjectId":"experimental-design"},{"url":"https://storage.googleapis.com/static.prod.fiveable.me/search-images%2F%22Normality_assessment_in_ANOVA%3A_Q-Q_plots_histograms_Shapiro-Wilk_test_residuals_distribution_visualizations%22-ZXRkL.png","description":"r - How to interpret a QQ plot - Cross Validated","sourceUrl":"http://i.stack.imgur.com/ZXRkL.png","hostUrl":"http://stats.stackexchange.com/questions/101274/how-to-interpret-a-qq-plot","altText":null,"sectionTitle":"Normality and Its Assessment","rank":3,"height":537,"width":468,"displayWidth":234,"displayHeight":268,"contentId":"66b31329d9be6c5c04e0aa8c","subjectId":"experimental-design"}],"tableOfContents":null,"meta":{"description":"Review 6.4 Assumptions and diagnostics for ANOVA for your test on Unit 6 – Analysis of Variance (ANOVA). For students taking Experimental Design","title":"6.4 Assumptions and diagnostics for ANOVA | Experimental Design Class Notes"},"subject":{"id":"experimental-design","name":"Experimental Design","emoji":"📊","order":null,"active":true,"slug":"experimental-design","branchSlug":"math","keyTermsActive":null,"generationMetadata":{"group":"Group 7 – unit, topics, key terms","level":"college undergraduate","branch":"Math","duration":"one semester","subBranch":"Statistics","lengthVariant":"less text","model":"opus"},"units":[{"id":"iA2uesFTUGLgpseU","publicId":"iA2uesFTUGLgpseU","name":"Unit 1 – Introduction to Experimental Design","order":1,"slug":"unit-1","description":"Unit 1 – Introduction to Experimental Design","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"3mVDpiHue9jAQ253","publicId":"3mVDpiHue9jAQ253","name":"Unit 2 – Principles of Experimental Design","order":2,"slug":"unit-2","description":"Unit 2 – Principles of Experimental Design","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"A1vH8NwymBXRHEvV","publicId":"A1vH8NwymBXRHEvV","name":"Unit 3 – Randomization Techniques","order":3,"slug":"unit-3","description":"Unit 3 – Randomization Techniques","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"U3RtoNW3k3bZREZj","publicId":"U3RtoNW3k3bZREZj","name":"Unit 4 – Factorial Designs","order":4,"slug":"unit-4","description":"Unit 4 – Factorial Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"cZ8wtKJBydlRlTFK","publicId":"cZ8wtKJBydlRlTFK","name":"Unit 5 – Blocking and Confounding","order":5,"slug":"unit-5","description":"Unit 5 – Blocking and Confounding","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"OGPAb8FIJ0ehgGEY","publicId":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","order":6,"slug":"unit-6","description":"Unit 6 – Analysis of Variance (ANOVA)","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"A9bCi8OdM9i0ayuU","publicId":"A9bCi8OdM9i0ayuU","name":"Unit 7 – Statistical Power and Sample Size","order":7,"slug":"unit-7","description":"Unit 7 – Statistical Power and Sample Size Determination","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"1cvyYYPw1igkv41P","publicId":"1cvyYYPw1igkv41P","name":"Unit 8 – Split–Plot Designs","order":8,"slug":"unit-8","description":"Unit 8 – Split-Plot Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"YZAcKIK3gA9QzbP3","publicId":"YZAcKIK3gA9QzbP3","name":"Unit 9 – Repeated Measures Designs","order":9,"slug":"unit-9","description":"Unit 9 – Repeated Measures Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"y2VEHrae1DqTze66","publicId":"y2VEHrae1DqTze66","name":"Unit 10 – Response Surface Methodology","order":10,"slug":"unit-10","description":"Unit 10 – Response Surface Methodology","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"xaHDl0vzqzQytXXM","publicId":"xaHDl0vzqzQytXXM","name":"Unit 11 – Designing Experiments for Analysis","order":11,"slug":"unit-11","description":"Unit 11 – Designing Experiments for Statistical Analysis","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"a6CutZV1R8FHiyXu","publicId":"a6CutZV1R8FHiyXu","name":"Unit 12 – Interpreting Results & Drawing Conclusions","order":12,"slug":"unit-12","description":"Unit 12 – Interpreting Results and Drawing Valid Conclusions","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"roABkStwkw6YnHlS","publicId":"roABkStwkw6YnHlS","name":"Unit 13 – Contemporary Issues in Experimental Design","order":13,"slug":"unit-13","description":"Unit 13 – Contemporary Issues in Experimental Design","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"ihOO4Amp468JnBaj","publicId":"ihOO4Amp468JnBaj","name":"Unit 14 – Adaptive Designs","order":14,"slug":"unit-14","description":"Unit 14 – Adaptive Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"zhhlIIekmTz76GaB","publicId":"zhhlIIekmTz76GaB","name":"Unit 15 – Optimal Design Theory","order":15,"slug":"unit-15","description":"Unit 15 – Optimal Design Theory","h1":null,"active":true,"emoji":"📚","hasResources":true}]},"unit":{"id":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","slug":"unit-6","active":true},"replayVideoLocations":[],"resources":[],"streamers":[],"duration":3,"creators":[],"editors":[]},"apQuestionData":[]},"contentQueryData":{"content":{"id":"L18Aw9UHrYsn4J29","topics":[{"id":"vUSJY4IzncXPoDnf","name":"6.4 Assumptions and diagnostics for ANOVA","fullNumber":"6.4"}],"title":"6.4 Assumptions and diagnostics for ANOVA","desc":null,"summary":null,"type":"STUDY_GUIDE","slug":"assumptions-diagnostics-anova","date":null,"vimeoLiveLink":null,"url":null,"markdown":"ANOVA assumptions are crucial for valid results. Normality, homogeneity of variance, and independence must be checked. Violations can lead to incorrect conclusions, so it's important to assess these assumptions using visual and formal methods.\n\nDiagnostic tests help evaluate ANOVA assumptions. Residual plots and formal tests like Levene's and Shapiro-Wilk are used. If violations occur, data transformations or robust methods can address issues, ensuring reliable analysis and interpretation of results.\n\n## Assumptions\n### Normality and Its Assessment\n\n ###### ![fiveable_image_carousel](https://fiveable.me)\n\n- Normality assumes the residuals (differences between observed and predicted values) are normally distributed\n- Violations of normality can lead to inaccurate p-values and confidence intervals\n- Assess normality visually using Q-Q plots or histograms of residuals\n - Q-Q plots compare the distribution of residuals to a theoretical normal distribution\n - Histograms should show a bell-shaped curve for normally distributed residuals\n- Formally test normality using the Shapiro-Wilk test\n - Null hypothesis: residuals are normally distributed\n - P-value < 0.05 suggests a significant departure from normality\n\n### Homogeneity of Variance and Independence\n- Homogeneity of variance (homoscedasticity) assumes equal variances across groups\n - Violations (heteroscedasticity) can affect the validity of F-tests and lead to incorrect conclusions\n - Assess homogeneity visually using residual plots (residuals vs. fitted values)\n - Patterns or increasing/decreasing spread indicate heteroscedasticity\n - Formally test homogeneity using Levene's test\n - Null hypothesis: variances are equal across groups\n - P-value < 0.05 suggests significant differences in variances\n- Independence of observations assumes that observations within and between groups are not related\n - Violations can occur due to repeated measures, clustering, or spatial/temporal correlation\n - Assess independence by examining the study design and data collection process\n - Violations may require alternative models (repeated measures ANOVA, mixed models)\n\n## Diagnostic Tests\n### Residual Plots for Assessing Assumptions\n- Residual plots are graphical tools for assessing ANOVA assumptions\n- Residuals vs. Fitted plot\n - Assess homogeneity of variance\n - Look for patterns, increasing/decreasing spread, or outliers\n- Normal Q-Q plot\n - Assess normality of residuals\n - Compare residuals to a theoretical normal distribution\n - Deviations from a straight line indicate non-normality\n- Scale-Location plot\n - Assess homogeneity of variance\n - Look for patterns or increasing/decreasing spread\n- Residuals vs. Leverage plot\n - Identify influential observations\n - Points with high leverage and large residuals may have a strong influence on the model\n\n### Formal Tests for Assumptions\n- Levene's test for homogeneity of variance\n - Null hypothesis: variances are equal across groups\n - P-value < 0.05 suggests significant differences in variances\n - Robust to non-normality, but sensitive to large sample sizes\n- Shapiro-Wilk test for normality\n - Null hypothesis: residuals are normally distributed\n - P-value < 0.05 suggests a significant departure from normality\n - More powerful than visual assessment, but sensitive to large sample sizes\n - Alternative: Anderson-Darling test\n\n## Addressing Violations\n### Data Transformations\n- Transformations can help stabilize variances and improve normality\n- Common transformations: logarithmic, square root, reciprocal\n - Logarithmic: $log(x)$ or $log(x+1)$ for data with zero values\n - Square root: $\\sqrt{x}$ for data with a Poisson distribution\n - Reciprocal: $\\frac{1}{x}$ for data with a strong right skew\n- Choose a transformation based on the nature of the data and the severity of the violation\n- Interpret results on the transformed scale or back-transform for interpretation\n\n### Robust ANOVA Methods and Non-Parametric Alternatives\n- Robust ANOVA methods are less sensitive to violations of assumptions\n - Welch's ANOVA: does not assume equal variances\n - Trimmed means ANOVA: robust to non-normality and outliers\n - Bootstrapping: resampling method to obtain robust confidence intervals and p-values\n- Non-parametric alternatives do not rely on distributional assumptions\n - Kruskal-Wallis test: rank-based test for comparing medians across groups\n - Friedman test: rank-based test for repeated measures designs\n - Permutation tests: resampling method to obtain exact p-values\n- Consider the trade-offs between robustness and power when selecting an alternative method","cheatsheet":null,"publishDate":null,"updatedAt":"2024-08-07T06:24:41.137Z","status":"PUBLISHED","images":[{"url":"https://storage.googleapis.com/static.prod.fiveable.me/search-images%2F%22Normality_assessment_in_ANOVA%3A_Q-Q_plots_histograms_Shapiro-Wilk_test_residuals_distribution_visualizations%22-normality-1.png","description":"Chapter 16 Regression | Untitled","sourceUrl":"https://psyteachr.github.io/msc-conv/16-regression_files/figure-html/normality-1.png","hostUrl":"https://psyteachr.github.io/msc-conv/regression.html","altText":null,"sectionTitle":"Normality and Its Assessment","rank":2,"height":960,"width":1344,"displayWidth":672,"displayHeight":480,"contentId":"66b31329d9be6c5c04e0aa8c","subjectId":"experimental-design"},{"url":"https://storage.googleapis.com/static.prod.fiveable.me/search-images%2F%22Normality_assessment_in_ANOVA%3A_Q-Q_plots_histograms_Shapiro-Wilk_test_residuals_distribution_visualizations%22-ZXRkL.png","description":"r - How to interpret a QQ plot - Cross Validated","sourceUrl":"http://i.stack.imgur.com/ZXRkL.png","hostUrl":"http://stats.stackexchange.com/questions/101274/how-to-interpret-a-qq-plot","altText":null,"sectionTitle":"Normality and Its Assessment","rank":3,"height":537,"width":468,"displayWidth":234,"displayHeight":268,"contentId":"66b31329d9be6c5c04e0aa8c","subjectId":"experimental-design"}],"tableOfContents":null,"meta":{"description":"Review 6.4 Assumptions and diagnostics for ANOVA for your test on Unit 6 – Analysis of Variance (ANOVA). For students taking Experimental Design","title":"6.4 Assumptions and diagnostics for ANOVA | Experimental Design Class Notes"},"subject":{"id":"experimental-design","name":"Experimental Design","emoji":"📊","order":null,"active":true,"slug":"experimental-design","branchSlug":"math","keyTermsActive":null,"generationMetadata":{"group":"Group 7 – unit, topics, key terms","level":"college undergraduate","branch":"Math","duration":"one semester","subBranch":"Statistics","lengthVariant":"less text","model":"opus"},"units":[{"id":"iA2uesFTUGLgpseU","publicId":"iA2uesFTUGLgpseU","name":"Unit 1 – Introduction to Experimental Design","order":1,"slug":"unit-1","description":"Unit 1 – Introduction to Experimental Design","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"3mVDpiHue9jAQ253","publicId":"3mVDpiHue9jAQ253","name":"Unit 2 – Principles of Experimental Design","order":2,"slug":"unit-2","description":"Unit 2 – Principles of Experimental Design","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"A1vH8NwymBXRHEvV","publicId":"A1vH8NwymBXRHEvV","name":"Unit 3 – Randomization Techniques","order":3,"slug":"unit-3","description":"Unit 3 – Randomization Techniques","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"U3RtoNW3k3bZREZj","publicId":"U3RtoNW3k3bZREZj","name":"Unit 4 – Factorial Designs","order":4,"slug":"unit-4","description":"Unit 4 – Factorial Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"cZ8wtKJBydlRlTFK","publicId":"cZ8wtKJBydlRlTFK","name":"Unit 5 – Blocking and Confounding","order":5,"slug":"unit-5","description":"Unit 5 – Blocking and Confounding","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"OGPAb8FIJ0ehgGEY","publicId":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","order":6,"slug":"unit-6","description":"Unit 6 – Analysis of Variance (ANOVA)","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"A9bCi8OdM9i0ayuU","publicId":"A9bCi8OdM9i0ayuU","name":"Unit 7 – Statistical Power and Sample Size","order":7,"slug":"unit-7","description":"Unit 7 – Statistical Power and Sample Size Determination","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"1cvyYYPw1igkv41P","publicId":"1cvyYYPw1igkv41P","name":"Unit 8 – Split–Plot Designs","order":8,"slug":"unit-8","description":"Unit 8 – Split-Plot Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"YZAcKIK3gA9QzbP3","publicId":"YZAcKIK3gA9QzbP3","name":"Unit 9 – Repeated Measures Designs","order":9,"slug":"unit-9","description":"Unit 9 – Repeated Measures Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"y2VEHrae1DqTze66","publicId":"y2VEHrae1DqTze66","name":"Unit 10 – Response Surface Methodology","order":10,"slug":"unit-10","description":"Unit 10 – Response Surface Methodology","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"xaHDl0vzqzQytXXM","publicId":"xaHDl0vzqzQytXXM","name":"Unit 11 – Designing Experiments for Analysis","order":11,"slug":"unit-11","description":"Unit 11 – Designing Experiments for Statistical Analysis","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"a6CutZV1R8FHiyXu","publicId":"a6CutZV1R8FHiyXu","name":"Unit 12 – Interpreting Results & Drawing Conclusions","order":12,"slug":"unit-12","description":"Unit 12 – Interpreting Results and Drawing Valid Conclusions","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"roABkStwkw6YnHlS","publicId":"roABkStwkw6YnHlS","name":"Unit 13 – Contemporary Issues in Experimental Design","order":13,"slug":"unit-13","description":"Unit 13 – Contemporary Issues in Experimental Design","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"ihOO4Amp468JnBaj","publicId":"ihOO4Amp468JnBaj","name":"Unit 14 – Adaptive Designs","order":14,"slug":"unit-14","description":"Unit 14 – Adaptive Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"zhhlIIekmTz76GaB","publicId":"zhhlIIekmTz76GaB","name":"Unit 15 – Optimal Design Theory","order":15,"slug":"unit-15","description":"Unit 15 – Optimal Design Theory","h1":null,"active":true,"emoji":"📚","hasResources":true}]},"unit":{"id":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","slug":"unit-6","active":true},"replayVideoLocations":[],"resources":[],"streamers":[],"duration":3,"creators":[],"editors":[]},"keyTermsByParentId":[{"_id":"66c15dec31bf7f01700a5315","slug":"r","subjectSlug":"experimental-design","term":"r","definition":"In statistical analysis, 'r' typically represents the correlation coefficient, a measure that describes the strength and direction of a relationship between two variables. Understanding 'r' is crucial for assessing relationships in various designs, including experimental and observational studies, influencing how data is interpreted across multiple contexts.","shortDefinition":null,"relatedTerms":[{"term":"Correlation","definition":"A statistical technique used to determine the degree to which two variables move in relation to each other.","keyTermSlug":null},{"term":"Regression Analysis","definition":"A statistical method used to model and analyze the relationships between a dependent variable and one or more independent variables.","keyTermSlug":null},{"term":"Effect Size","definition":"A quantitative measure of the magnitude of a phenomenon or the strength of an effect in a statistical analysis.","keyTermSlug":null}],"parents":[{"id":"q0KhaZ92DrEtICET","type":"content"},{"id":"qQU75Emt0wrKHm3h","type":"content"},{"id":"mBXAcVPXmJBqz2UX","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"zLLywsRZ8YtwnMC2","type":"content"},{"id":"oO5NfvSqmH4AsbKN","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15dec0c3319858544d736","slug":"p-value","subjectSlug":"experimental-design","term":"p-value","definition":"A p-value is a statistical measure that helps determine the significance of results obtained in hypothesis testing. It indicates the probability of observing data at least as extreme as the sample data, assuming the null hypothesis is true. Understanding p-values is crucial as they help researchers make decisions about rejecting or failing to reject the null hypothesis, and they are foundational to various statistical methods and analyses.","shortDefinition":null,"relatedTerms":[{"term":"Null Hypothesis","definition":"A statement asserting that there is no effect or no difference, which researchers aim to test against in hypothesis testing.","keyTermSlug":null},{"term":"Type I Error","definition":"The error that occurs when a true null hypothesis is incorrectly rejected, leading to a false positive result.","keyTermSlug":null},{"term":"Statistical Significance","definition":"A determination that an observed effect or relationship in data is unlikely to have occurred by random chance alone, often indicated by a low p-value.","keyTermSlug":null}],"parents":[{"id":"t8JQRQ0jW41TO6Vv","type":"content"},{"id":"B1YTuE2olszq67i6","type":"content"},{"id":"VsVZV4OfoTSssNIK","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"oO5NfvSqmH4AsbKN","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15eb30c3319858544dcbc","slug":"eta-squared","subjectSlug":"experimental-design","term":"eta squared","definition":"Eta squared is a measure of effect size that indicates the proportion of total variance in a dependent variable that can be attributed to a particular independent variable or factor. This statistic helps researchers understand the strength of relationships and the impact of different variables in analyses, especially within the context of ANOVA, power calculations, and assessing practical significance.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"ANOVA stands for Analysis of Variance, a statistical method used to test differences between two or more group means.","keyTermSlug":null},{"term":"Effect Size","definition":"Effect size is a quantitative measure of the magnitude of a phenomenon or the strength of a relationship between variables.","keyTermSlug":null},{"term":"Statistical Power","definition":"Statistical power is the probability that a statistical test will correctly reject a false null hypothesis, often influenced by sample size and effect size.","keyTermSlug":null}],"parents":[{"id":"HCLYvhOpM8wGXnQI","type":"content"},{"id":"B1YTuE2olszq67i6","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15eb0a66f65e044c64943","slug":"effect-size","subjectSlug":"experimental-design","term":"Effect Size","definition":"Effect size is a quantitative measure that reflects the magnitude of a treatment effect or the strength of a relationship between variables in a study. It helps in understanding the practical significance of research findings beyond just statistical significance, offering insights into the size of differences or relationships observed.","shortDefinition":null,"relatedTerms":[{"term":"Cohen's d","definition":"A commonly used measure of effect size that calculates the difference between two means divided by the pooled standard deviation, indicating how far apart the two groups are in standard deviation units.","keyTermSlug":null},{"term":"Eta-squared","definition":"A measure of effect size used in the context of ANOVA, representing the proportion of total variance in the dependent variable that is attributed to a factor.","keyTermSlug":null},{"term":"Statistical Power","definition":"The probability that a statistical test will correctly reject a null hypothesis when it is false, which is influenced by sample size, effect size, and significance level.","keyTermSlug":null}],"parents":[{"id":"W18kaCqTU0CM05ZZ","type":"content"},{"id":"HCLYvhOpM8wGXnQI","type":"content"},{"id":"7kWNKi0GYQyGkEwo","type":"content"},{"id":"9c08Y4coKXj0GOjO","type":"content"},{"id":"WzzDYAj1emuk4A9h","type":"content"},{"id":"VsVZV4OfoTSssNIK","type":"content"},{"id":"iflBTr5TWimgzSob","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"h4ukRDZpb3AEBIJn","type":"content"},{"id":"vIxW7WpYfRK9vDp0","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"9Hilbjc4aEiYbhKF","type":"content"},{"id":"oO5NfvSqmH4AsbKN","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"},{"id":"0rgNjiLL0grXjYHZ","type":"content"}]},{"_id":"66c15eb90946f59b838b65c2","slug":"cohens-d","subjectSlug":"experimental-design","term":"Cohen's d","definition":"Cohen's d is a measure of effect size that quantifies the difference between two group means in standard deviation units. It provides insight into the magnitude of an effect, allowing researchers to understand how meaningful their findings are beyond just statistical significance. This measure connects deeply with concepts like statistical power, sample size, and practical significance, making it vital for analyzing research outcomes effectively.","shortDefinition":null,"relatedTerms":[{"term":"Effect Size","definition":"A quantitative measure that describes the strength of a relationship or the magnitude of an effect in research, helping to determine practical significance.","keyTermSlug":null},{"term":"Statistical Power","definition":"The probability that a statistical test will correctly reject a false null hypothesis, often influenced by sample size and effect size.","keyTermSlug":null},{"term":"ANOVA","definition":"Analysis of Variance, a statistical method used to compare means among three or more groups to determine if at least one group mean is significantly different.","keyTermSlug":null}],"parents":[{"id":"HCLYvhOpM8wGXnQI","type":"content"},{"id":"B1YTuE2olszq67i6","type":"content"},{"id":"WzzDYAj1emuk4A9h","type":"content"},{"id":"VsVZV4OfoTSssNIK","type":"content"},{"id":"h4ukRDZpb3AEBIJn","type":"content"},{"id":"nKglpmUvpusG3h9i","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ebd2965e1696c1ef646","slug":"sas","subjectSlug":"experimental-design","term":"SAS","definition":"SAS stands for Statistical Analysis System, a software suite used for advanced analytics, business intelligence, and data management. It is commonly employed to perform various statistical analyses, including ANOVA and repeated measures designs, allowing researchers to evaluate data integrity and handle complex datasets effectively.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"Analysis of Variance, a statistical method used to test differences between two or more group means.","keyTermSlug":null},{"term":"Imputation","definition":"A statistical technique used to replace missing data with substituted values to maintain the integrity of analysis.","keyTermSlug":null},{"term":"Data Diagnostics","definition":"Procedures and methods used to assess the quality and validity of data before conducting statistical analyses.","keyTermSlug":null}],"parents":[{"id":"q0KhaZ92DrEtICET","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec04a470781133306dc","slug":"durbin-watson-statistic","subjectSlug":"experimental-design","term":"Durbin-Watson Statistic","definition":"The Durbin-Watson statistic is a test statistic used to detect the presence of autocorrelation in the residuals from a regression analysis. Specifically, it helps to assess whether the residuals are correlated across time or space, which can violate key assumptions in statistical modeling, such as independence. This statistic ranges from 0 to 4, with values around 2 indicating no autocorrelation, values less than 2 suggesting positive autocorrelation, and values greater than 2 suggesting negative autocorrelation.","shortDefinition":null,"relatedTerms":[{"term":"Autocorrelation","definition":"A statistical phenomenon where residuals from a regression model are correlated with each other over time or space.","keyTermSlug":null},{"term":"Residuals","definition":"The differences between observed values and the values predicted by a regression model.","keyTermSlug":null},{"term":"Assumptions of Regression","definition":"Key conditions that must be met for the results of regression analysis to be valid, including linearity, independence, homoscedasticity, and normality of residuals.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec04a470781133306d5","slug":"levenes-test","subjectSlug":"experimental-design","term":"Levene's Test","definition":"Levene's Test is a statistical procedure used to assess the equality of variances across groups. It plays a crucial role in validating one of the key assumptions of ANOVA, which is that the variances among different groups being compared are approximately equal. By checking this assumption, researchers can ensure that their results are more reliable and that the conclusions drawn from an ANOVA analysis are valid.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"Analysis of Variance (ANOVA) is a statistical method used to compare means among three or more groups to determine if at least one group mean is significantly different from the others.","keyTermSlug":null},{"term":"Homogeneity of Variance","definition":"The assumption that different samples have the same variance, which is essential for the validity of ANOVA results.","keyTermSlug":null},{"term":"F-test","definition":"A statistical test used to compare the variances of two or more groups to determine if they are significantly different from each other.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec02965e1696c1ef656","slug":"square-root-transformation","subjectSlug":"experimental-design","term":"square root transformation","definition":"A square root transformation is a statistical technique used to stabilize variance and make data more normally distributed by applying the square root function to each data point. This method is particularly useful when dealing with count data or datasets exhibiting heteroscedasticity, as it helps meet the assumptions required for analysis of variance (ANOVA). By reducing the influence of larger values, this transformation improves the reliability of statistical tests and enhances interpretability.","shortDefinition":null,"relatedTerms":[{"term":"Heteroscedasticity","definition":"A condition in which the variance of errors varies across observations, often violating the assumptions of linear regression models.","keyTermSlug":null},{"term":"Normality","definition":"The assumption that the residuals of a model are normally distributed, which is crucial for the validity of many statistical tests.","keyTermSlug":null},{"term":"Variance Stabilization","definition":"The process of transforming data to achieve constant variance across levels of an independent variable, enhancing the robustness of statistical analyses.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec10946f59b838b6611","slug":"repeated-measures-anova","subjectSlug":"experimental-design","term":"repeated measures ANOVA","definition":"Repeated measures ANOVA is a statistical method used to compare means across multiple groups when the same subjects are measured under different conditions or over time. This approach is particularly useful for analyzing data where the same participants are involved in all treatments, allowing researchers to account for individual differences and reduce the error variance associated with those differences.","shortDefinition":null,"relatedTerms":[{"term":"Within-Subject Design","definition":"A research design where the same subjects are exposed to all levels of the independent variable, allowing for direct comparisons within individuals.","keyTermSlug":null},{"term":"Sphericity","definition":"An assumption of repeated measures ANOVA that states the variances of the differences between all combinations of related groups should be equal.","keyTermSlug":null},{"term":"Post Hoc Tests","definition":"Statistical tests conducted after an ANOVA to determine which specific group means are significantly different from each other.","keyTermSlug":null}],"parents":[{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec031bf7f01700a589c","slug":"log-transformation","subjectSlug":"experimental-design","term":"log transformation","definition":"Log transformation is a mathematical operation that replaces each value in a dataset with its logarithm, typically using base 10 or the natural logarithm (base e). This technique is particularly useful in statistical analysis to stabilize variance, make data more normally distributed, and meet the assumptions required for various statistical tests like ANOVA.","shortDefinition":null,"relatedTerms":[{"term":"Variance Stabilization","definition":"A process used in statistics to make the variability of a dataset more consistent across different levels of an independent variable.","keyTermSlug":null},{"term":"Normal Distribution","definition":"A probability distribution that is symmetric about the mean, showing that data near the mean are more frequent in occurrence than data far from the mean.","keyTermSlug":null},{"term":"ANOVA (Analysis of Variance)","definition":"A statistical method used to compare means among three or more groups to determine if at least one group mean is significantly different from the others.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec00c3319858544dce1","slug":"f-statistic","subjectSlug":"experimental-design","term":"f-statistic","definition":"The f-statistic is a ratio that compares the variance between group means to the variance within groups in ANOVA (Analysis of Variance). It helps determine if there are statistically significant differences between the means of three or more groups. A higher f-statistic indicates a greater disparity among group means relative to the variability within each group, suggesting that at least one group mean is different from the others.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"ANOVA stands for Analysis of Variance, a statistical method used to compare means among three or more groups to see if at least one differs significantly.","keyTermSlug":null},{"term":"Mean Square","definition":"Mean Square is a measure of variance calculated by dividing the sum of squares by the degrees of freedom, used in the computation of the f-statistic.","keyTermSlug":null},{"term":"Null Hypothesis","definition":"The null hypothesis states that there is no effect or difference; in ANOVA, it asserts that all group means are equal.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec831bf7f01700a58cd","slug":"independence-of-observations","subjectSlug":"experimental-design","term":"independence of observations","definition":"Independence of observations means that the data collected from different subjects or experimental units are not influenced by each other. This concept is critical for ensuring the validity of statistical analyses, as violations can lead to biased results and incorrect conclusions. In statistical methods like ANOVA and multifactor ANOVA, this assumption must hold true to accurately assess group differences and interactions among factors.","shortDefinition":null,"relatedTerms":[{"term":"Random Sampling","definition":"The process of selecting a sample from a population in such a way that every individual has an equal chance of being chosen, helping to ensure independence among observations.","keyTermSlug":null},{"term":"Homogeneity of Variance","definition":"The assumption that different groups have similar variances, which works in conjunction with independence of observations in statistical analyses.","keyTermSlug":null},{"term":"Repeated Measures","definition":"A design where the same subjects are used for multiple measurements, which can introduce dependence among observations if not properly accounted for.","keyTermSlug":null}],"parents":[{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec5a66f65e044c649ca","slug":"shapiro-wilk-test","subjectSlug":"experimental-design","term":"Shapiro-Wilk Test","definition":"The Shapiro-Wilk Test is a statistical test used to determine whether a given dataset is normally distributed. It's particularly useful in the context of ANOVA, as one of the key assumptions for ANOVA is that the data should be normally distributed within each group being compared. This test helps assess whether this assumption holds, allowing researchers to make valid inferences based on their data.","shortDefinition":null,"relatedTerms":[{"term":"Normal Distribution","definition":"A probability distribution that is symmetric about the mean, showing that data near the mean are more frequent in occurrence than data far from the mean.","keyTermSlug":null},{"term":"ANOVA Assumptions","definition":"Conditions that must be satisfied for ANOVA to produce valid results, including normality, homogeneity of variances, and independence of observations.","keyTermSlug":null},{"term":"P-Value","definition":"The probability of obtaining test results at least as extreme as the observed results, assuming that the null hypothesis is true.","keyTermSlug":null}],"parents":[{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ec931bf7f01700a58db","slug":"one-way-anova","subjectSlug":"experimental-design","term":"one-way anova","definition":"One-way ANOVA (Analysis of Variance) is a statistical technique used to compare the means of three or more independent groups to determine if at least one group mean is statistically different from the others. This method is essential for analyzing experimental data and helps in understanding the impact of a single independent variable on a dependent variable while checking assumptions and diagnostics, calculating sample size, and selecting appropriate tests.","shortDefinition":null,"relatedTerms":[{"term":"Independent Variable","definition":"A variable that is manipulated or categorized in an experiment to observe its effect on a dependent variable.","keyTermSlug":null},{"term":"Post-hoc Tests","definition":"Statistical tests performed after an ANOVA to determine which specific group means are different when the ANOVA indicates significant differences.","keyTermSlug":null},{"term":"F-test","definition":"A statistical test used to compare the variances of two or more groups, which is the basis for conducting an ANOVA.","keyTermSlug":null}],"parents":[{"id":"WzzDYAj1emuk4A9h","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15ed50c3319858544dd63","slug":"type-i-error","subjectSlug":"experimental-design","term":"Type I Error","definition":"A Type I error occurs when a null hypothesis is incorrectly rejected, leading to the conclusion that there is an effect or difference when none actually exists. This mistake can have serious implications in various statistical contexts, affecting the reliability of results and decision-making processes.","shortDefinition":null,"relatedTerms":[{"term":"Null Hypothesis","definition":"A statement that there is no effect or no difference, serving as the starting point for statistical testing.","keyTermSlug":null},{"term":"Significance Level","definition":"The probability of making a Type I error, commonly denoted as alpha (α), typically set at 0.05 or 0.01 in hypothesis testing.","keyTermSlug":null},{"term":"Type II Error","definition":"A Type II error occurs when a null hypothesis is not rejected when it is false, leading to the failure to detect an effect that is present.","keyTermSlug":null}],"parents":[{"id":"W18kaCqTU0CM05ZZ","type":"content"},{"id":"HCLYvhOpM8wGXnQI","type":"content"},{"id":"9c08Y4coKXj0GOjO","type":"content"},{"id":"VsVZV4OfoTSssNIK","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"h4ukRDZpb3AEBIJn","type":"content"},{"id":"ejQHVwPTrz04MHvZ","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"},{"id":"9k7XZWXBClXuM3vG","type":"content"}]},{"_id":"66c15ed6a66f65e044c64a3e","slug":"type-ii-error","subjectSlug":"experimental-design","term":"Type II Error","definition":"A Type II error occurs when a statistical test fails to reject a false null hypothesis, leading to the incorrect conclusion that there is no effect or difference when one actually exists. This concept is crucial as it relates to the sensitivity of tests, impacting the reliability of experimental results and interpretations.","shortDefinition":null,"relatedTerms":[{"term":"Null Hypothesis","definition":"The hypothesis stating that there is no effect or no difference, which researchers aim to test against.","keyTermSlug":null},{"term":"Statistical Power","definition":"The probability that a test correctly rejects a false null hypothesis, indicating its ability to detect an effect when one truly exists.","keyTermSlug":null},{"term":"Type I Error","definition":"The error that occurs when a true null hypothesis is incorrectly rejected, leading to a false positive result.","keyTermSlug":null}],"parents":[{"id":"W18kaCqTU0CM05ZZ","type":"content"},{"id":"HCLYvhOpM8wGXnQI","type":"content"},{"id":"9c08Y4coKXj0GOjO","type":"content"},{"id":"VsVZV4OfoTSssNIK","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"h4ukRDZpb3AEBIJn","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"},{"id":"9k7XZWXBClXuM3vG","type":"content"}]},{"_id":"66c15f0de7ad9f341d8d2b41","slug":"homogeneity-of-variance","subjectSlug":"experimental-design","term":"homogeneity of variance","definition":"Homogeneity of variance refers to the assumption that different groups in a statistical test have the same variance or spread in their data. This concept is crucial when performing analyses like ANOVA, as violating this assumption can lead to incorrect conclusions about the differences between groups. Ensuring homogeneity of variance helps validate the results and interpretations derived from statistical tests, making it a fundamental consideration when comparing multiple groups.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"Analysis of Variance, a statistical method used to compare means among three or more groups and determine if at least one group mean is statistically different from the others.","keyTermSlug":null},{"term":"Levene's Test","definition":"A statistical test used to assess the equality of variances across different groups, often employed before conducting ANOVA.","keyTermSlug":null},{"term":"Post-hoc tests","definition":"Statistical tests conducted after ANOVA to determine which specific group means are significantly different from one another.","keyTermSlug":null}],"parents":[{"id":"0Lqbg6Q47lnTmiko","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"ejQHVwPTrz04MHvZ","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15f0d2965e1696c1ef853","slug":"bonferroni-correction","subjectSlug":"experimental-design","term":"Bonferroni correction","definition":"The Bonferroni correction is a statistical method used to counteract the problem of multiple comparisons by adjusting the significance level when conducting multiple tests. By dividing the desired alpha level (e.g., 0.05) by the number of comparisons being made, it helps to reduce the likelihood of Type I errors, which occur when a true null hypothesis is incorrectly rejected. This adjustment is particularly relevant in analyses involving multiple groups or factors, ensuring that findings remain statistically valid.","shortDefinition":null,"relatedTerms":[{"term":"Type I error","definition":"The error that occurs when a true null hypothesis is incorrectly rejected, leading to a false positive result.","keyTermSlug":null},{"term":"ANOVA","definition":"Analysis of variance, a statistical method used to compare means among three or more groups to determine if at least one group mean is significantly different.","keyTermSlug":null},{"term":"Post-hoc tests","definition":"Statistical tests conducted after an ANOVA to determine which specific group means are different when the overall test indicates significance.","keyTermSlug":null}],"parents":[{"id":"0Lqbg6Q47lnTmiko","type":"content"},{"id":"ejQHVwPTrz04MHvZ","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15f100946f59b838b6843","slug":"tukeys-hsd","subjectSlug":"experimental-design","term":"Tukey's HSD","definition":"Tukey's HSD (Honestly Significant Difference) is a post-hoc test used to determine which specific group means are different after conducting an ANOVA. It helps in comparing all possible pairs of means while controlling the overall error rate, making it particularly useful in situations with multiple comparisons. This test provides a straightforward way to identify significant differences between groups when the initial analysis indicates that at least one group mean is significantly different from others.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"Analysis of Variance, a statistical method used to compare the means of three or more groups to see if at least one differs significantly.","keyTermSlug":null},{"term":"Post-hoc tests","definition":"Statistical tests conducted after an initial analysis to identify specific group differences when an overall effect is detected.","keyTermSlug":null},{"term":"Type I Error","definition":"The incorrect rejection of a true null hypothesis, which can occur more frequently when conducting multiple comparisons without proper adjustments.","keyTermSlug":null}],"parents":[{"id":"0Lqbg6Q47lnTmiko","type":"content"},{"id":"ejQHVwPTrz04MHvZ","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15f1db5d70b6a27b76dbb","slug":"spss","subjectSlug":"experimental-design","term":"SPSS","definition":"SPSS, which stands for Statistical Package for the Social Sciences, is a software program widely used for statistical analysis and data management. It provides tools for performing complex statistical analyses, including various types of ANOVA, handling repeated measures data, and addressing issues like missing data, making it essential for researchers and students in fields that require robust data analysis.","shortDefinition":null,"relatedTerms":[{"term":"ANOVA","definition":"Analysis of Variance (ANOVA) is a statistical method used to test differences between two or more group means.","keyTermSlug":null},{"term":"Data Management","definition":"The process of collecting, organizing, and maintaining data to ensure its accuracy and accessibility for analysis.","keyTermSlug":null},{"term":"Missing Data","definition":"Refers to the absence of data points in a dataset, which can occur for various reasons and needs to be managed appropriately during analysis.","keyTermSlug":null}],"parents":[{"id":"q0KhaZ92DrEtICET","type":"content"},{"id":"qQU75Emt0wrKHm3h","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"oO5NfvSqmH4AsbKN","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15f1ee7ad9f341d8d2ba5","slug":"two-way-anova","subjectSlug":"experimental-design","term":"two-way ANOVA","definition":"Two-way ANOVA is a statistical test used to determine the effect of two independent variables on a dependent variable while also examining the interaction between the two independent variables. This method is particularly useful when researchers want to understand how different groups or conditions affect outcomes and whether these effects vary based on the levels of another factor. The analysis helps in understanding complex relationships and interactions that one-way ANOVA might miss.","shortDefinition":null,"relatedTerms":[{"term":"Interaction Effect","definition":"The effect that occurs when the influence of one independent variable on the dependent variable changes at different levels of another independent variable.","keyTermSlug":null},{"term":"Main Effect","definition":"The direct effect of an independent variable on the dependent variable, ignoring other independent variables.","keyTermSlug":null},{"term":"Post Hoc Tests","definition":"Statistical tests conducted after ANOVA to determine which specific group means are significantly different from each other.","keyTermSlug":null}],"parents":[{"id":"0Lqbg6Q47lnTmiko","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]},{"_id":"66c15f2b0c3319858544df4d","slug":"normality","subjectSlug":"experimental-design","term":"Normality","definition":"Normality refers to the assumption that the data being analyzed follows a normal distribution, which is a bell-shaped curve where most of the observations cluster around the central peak and probabilities for values further away from the mean taper off equally in both directions. This concept is crucial in many statistical methods, as violations of this assumption can lead to misleading results, especially when comparing means across groups or examining relationships between variables.","shortDefinition":null,"relatedTerms":[{"term":"Normal Distribution","definition":"A probability distribution that is symmetric about the mean, showing that data near the mean are more frequent in occurrence than data far from the mean.","keyTermSlug":null},{"term":"Central Limit Theorem","definition":"A statistical theory that states that the distribution of sample means approaches a normal distribution as the sample size increases, regardless of the shape of the population distribution.","keyTermSlug":null},{"term":"Skewness","definition":"A measure of the asymmetry of the probability distribution of a real-valued random variable, which indicates whether data points tend to be more spread out on one side of the mean.","keyTermSlug":null}],"parents":[{"id":"0Lqbg6Q47lnTmiko","type":"content"},{"id":"qQU75Emt0wrKHm3h","type":"content"},{"id":"y7KKUeScH22364X1","type":"content"},{"id":"mwehq4wy26ycGdG2","type":"content"},{"id":"ejQHVwPTrz04MHvZ","type":"content"},{"id":"oO5NfvSqmH4AsbKN","type":"content"},{"id":"L18Aw9UHrYsn4J29","type":"content"}]}],"apQuestionDataBySubjectSlug":[]}},"initialToc":{"units":[{"id":"iA2uesFTUGLgpseU","name":"Unit 1 – Introduction to Experimental Design","emoji":"📚","slug":"unit-1","hasResources":true,"resources":[{"id":"t8JQRQ0jW41TO6Vv","title":"1.1 Fundamentals of scientific method and experimentation","slug":"fundamentals-scientific-method-experimentation","type":"STUDY_GUIDE","date":null},{"id":"QZCSdDgVjjWs74Ct","title":"1.2 Historical perspective on experimental design","slug":"historical-perspective-experimental-design","type":"STUDY_GUIDE","date":null},{"id":"iKNy4skfmjBmXBOe","title":"1.3 Types of variables and their roles in experiments","slug":"types-variables-roles-experiments","type":"STUDY_GUIDE","date":null},{"id":"YINngz7x7lMt9Blf","title":"1.4 Importance of experimental design in research","slug":"importance-experimental-design-research","type":"STUDY_GUIDE","date":null}]},{"id":"3mVDpiHue9jAQ253","name":"Unit 2 – Principles of Experimental Design","emoji":"📚","slug":"unit-2","hasResources":true,"resources":[{"id":"4urivQ0hyvEgbaFT","title":"2.3 Bias and confounding variables","slug":"bias-confounding-variables","type":"STUDY_GUIDE","date":null},{"id":"iflBTr5TWimgzSob","title":"2.4 Experimental validity (internal and external)","slug":"experimental-validity-internal-external","type":"STUDY_GUIDE","date":null},{"id":"dj7Qxpc6NNlabYBv","title":"2.2 Experimental units and sampling techniques","slug":"experimental-units-sampling-techniques","type":"STUDY_GUIDE","date":null},{"id":"vIxW7WpYfRK9vDp0","title":"2.1 Replication, randomization, and local control","slug":"replication-randomization-local-control","type":"STUDY_GUIDE","date":null}]},{"id":"A1vH8NwymBXRHEvV","name":"Unit 3 – Randomization Techniques","emoji":"📚","slug":"unit-3","hasResources":true,"resources":[{"id":"gGnaMfZwHvcklVOt","title":"3.2 Stratified random sampling","slug":"stratified-random-sampling","type":"STUDY_GUIDE","date":null},{"id":"xWqmWA9kFg6QRIck","title":"3.3 Cluster sampling and systematic sampling","slug":"cluster-sampling-systematic-sampling","type":"STUDY_GUIDE","date":null},{"id":"Y6SDZWIfEEV2fdds","title":"3.4 Randomization in practice: methods and tools","slug":"randomization-practice-methods-tools","type":"STUDY_GUIDE","date":null},{"id":"ZYeHKub1RiyaLwY8","title":"3.1 Simple random sampling","slug":"simple-random-sampling","type":"STUDY_GUIDE","date":null}]},{"id":"U3RtoNW3k3bZREZj","name":"Unit 4 – Factorial Designs","emoji":"📚","slug":"unit-4","hasResources":true,"resources":[{"id":"WE0dGBdwZMo8dAsh","title":"4.1 Two-factor factorial designs","slug":"two-factor-factorial-designs","type":"STUDY_GUIDE","date":null},{"id":"Xz41WLyV6eIkDOtE","title":"4.2 Higher-order factorial designs","slug":"higher-order-factorial-designs","type":"STUDY_GUIDE","date":null},{"id":"9Hilbjc4aEiYbhKF","title":"4.3 Main effects and interactions","slug":"main-effects-interactions","type":"STUDY_GUIDE","date":null},{"id":"mBXAcVPXmJBqz2UX","title":"4.4 Fractional factorial designs","slug":"fractional-factorial-designs","type":"STUDY_GUIDE","date":null}]},{"id":"cZ8wtKJBydlRlTFK","name":"Unit 5 – Blocking and Confounding","emoji":"📚","slug":"unit-5","hasResources":true,"resources":[{"id":"9bxFr3Roj88rAoJB","title":"5.1 Principles of blocking","slug":"principles-blocking","type":"STUDY_GUIDE","date":null},{"id":"1x0ymRVIqTaJUmYf","title":"5.2 Randomized complete block designs","slug":"randomized-complete-block-designs","type":"STUDY_GUIDE","date":null},{"id":"reR6bieGMRfYfuiE","title":"5.3 Latin square and Graeco-Latin square designs","slug":"latin-square-graeco-latin-square-designs","type":"STUDY_GUIDE","date":null},{"id":"9k7XZWXBClXuM3vG","title":"5.4 Confounding in factorial experiments","slug":"confounding-factorial-experiments","type":"STUDY_GUIDE","date":null}]},{"id":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","emoji":"📚","slug":"unit-6","hasResources":true,"resources":[{"id":"oO5NfvSqmH4AsbKN","title":"6.1 One-way ANOVA","slug":"one-way-anova","type":"STUDY_GUIDE","date":null},{"id":"0Lqbg6Q47lnTmiko","title":"6.2 Two-way ANOVA","slug":"two-way-anova","type":"STUDY_GUIDE","date":null},{"id":"L18Aw9UHrYsn4J29","title":"6.4 Assumptions and diagnostics for ANOVA","slug":"assumptions-diagnostics-anova","type":"STUDY_GUIDE","date":null},{"id":"mwehq4wy26ycGdG2","title":"6.3 Multifactor ANOVA","slug":"multifactor-anova","type":"STUDY_GUIDE","date":null}]},{"id":"A9bCi8OdM9i0ayuU","name":"Unit 7 – Statistical Power and Sample Size","emoji":"📚","slug":"unit-7","hasResources":true,"resources":[{"id":"HCLYvhOpM8wGXnQI","title":"7.1 Concepts of statistical power and effect size","slug":"concepts-statistical-power-effect-size","type":"STUDY_GUIDE","date":null},{"id":"W18kaCqTU0CM05ZZ","title":"7.2 Power analysis for different experimental designs","slug":"power-analysis-experimental-designs","type":"STUDY_GUIDE","date":null},{"id":"WzzDYAj1emuk4A9h","title":"7.3 Sample size calculation techniques","slug":"sample-size-calculation-techniques","type":"STUDY_GUIDE","date":null},{"id":"h4ukRDZpb3AEBIJn","title":"7.4 Trade-offs between power, sample size, and effect size","slug":"trade-offs-power-sample-size-effect-size","type":"STUDY_GUIDE","date":null}]},{"id":"1cvyYYPw1igkv41P","name":"Unit 8 – Split–Plot Designs","emoji":"📚","slug":"unit-8","hasResources":true,"resources":[{"id":"oIYOEnHj9hcGTfs5","title":"8.1 Principles of split-plot designs","slug":"principles-split-plot-designs","type":"STUDY_GUIDE","date":null},{"id":"P02eGA1IEX2WtTrv","title":"8.2 Analysis of split-plot experiments","slug":"analysis-split-plot-experiments","type":"STUDY_GUIDE","date":null},{"id":"cbgDMBbS9A27x3Yv","title":"8.4 Applications and limitations of split-plot designs","slug":"applications-limitations-split-plot-designs","type":"STUDY_GUIDE","date":null},{"id":"XwYcBW4wbIHs0zc0","title":"8.3 Split-split plot designs","slug":"split-split-plot-designs","type":"STUDY_GUIDE","date":null}]},{"id":"YZAcKIK3gA9QzbP3","name":"Unit 9 – Repeated Measures Designs","emoji":"📚","slug":"unit-9","hasResources":true,"resources":[{"id":"0rgNjiLL0grXjYHZ","title":"9.2 Between-subjects and within-subjects factors","slug":"between-subjects-within-subjects-factors","type":"STUDY_GUIDE","date":null},{"id":"qQU75Emt0wrKHm3h","title":"9.3 Analysis of repeated measures data","slug":"analysis-repeated-measures-data","type":"STUDY_GUIDE","date":null},{"id":"szM39nC3JyBaJFUc","title":"9.1 Fundamentals of repeated measures experiments","slug":"fundamentals-repeated-measures-experiments","type":"STUDY_GUIDE","date":null},{"id":"q0KhaZ92DrEtICET","title":"9.4 Handling missing data in repeated measures designs","slug":"handling-missing-data-repeated-measures-designs","type":"STUDY_GUIDE","date":null}]},{"id":"y2VEHrae1DqTze66","name":"Unit 10 – Response Surface Methodology","emoji":"📚","slug":"unit-10","hasResources":true,"resources":[{"id":"fiJBI8xrag8MxiNq","title":"10.2 First-order and second-order models","slug":"first-order-second-order-models","type":"STUDY_GUIDE","date":null},{"id":"q9IiCikLenSFfGN3","title":"10.1 Introduction to response surface designs","slug":"introduction-response-surface-designs","type":"STUDY_GUIDE","date":null},{"id":"1Pp7AJO4IRhGv2Ix","title":"10.4 Optimization techniques in response surface methodology","slug":"optimization-techniques-response-surface-methodology","type":"STUDY_GUIDE","date":null},{"id":"8yDKaI6k7DhHiR0L","title":"10.3 Central composite and Box-Behnken designs","slug":"central-composite-box-behnken-designs","type":"STUDY_GUIDE","date":null}]},{"id":"xaHDl0vzqzQytXXM","name":"Unit 11 – Designing Experiments for Analysis","emoji":"📚","slug":"unit-11","hasResources":true,"resources":[{"id":"9nvXsFlhY7MdoiSe","title":"11.2 Experimental design for regression analysis","slug":"experimental-design-regression-analysis","type":"STUDY_GUIDE","date":null},{"id":"yitbOl6RjXATqmGJ","title":"11.4 Bayesian approaches to experimental design","slug":"bayesian-approaches-experimental-design","type":"STUDY_GUIDE","date":null},{"id":"7kWNKi0GYQyGkEwo","title":"11.3 Designing experiments for non-parametric tests","slug":"designing-experiments-non-parametric-tests","type":"STUDY_GUIDE","date":null},{"id":"y7KKUeScH22364X1","title":"11.1 Choosing appropriate statistical tests","slug":"choosing-statistical-tests","type":"STUDY_GUIDE","date":null}]},{"id":"a6CutZV1R8FHiyXu","name":"Unit 12 – Interpreting Results & Drawing Conclusions","emoji":"📚","slug":"unit-12","hasResources":true,"resources":[{"id":"B1YTuE2olszq67i6","title":"12.3 Effect size interpretation and practical significance","slug":"effect-size-interpretation-practical-significance","type":"STUDY_GUIDE","date":null},{"id":"4wh5p53AlfHxJsqO","title":"12.4 Limitations and generalizability of experimental results","slug":"limitations-generalizability-experimental-results","type":"STUDY_GUIDE","date":null},{"id":"VsVZV4OfoTSssNIK","title":"12.1 Statistical inference and hypothesis testing","slug":"statistical-inference-hypothesis-testing","type":"STUDY_GUIDE","date":null},{"id":"ejQHVwPTrz04MHvZ","title":"12.2 Multiple comparisons and post-hoc tests","slug":"multiple-comparisons-post-hoc-tests","type":"STUDY_GUIDE","date":null}]},{"id":"roABkStwkw6YnHlS","name":"Unit 13 – Contemporary Issues in Experimental Design","emoji":"📚","slug":"unit-13","hasResources":true,"resources":[{"id":"UmSC1z6DtdRXKnN5","title":"13.4 Machine learning approaches in experimental design","slug":"machine-learning-approaches-experimental-design","type":"STUDY_GUIDE","date":null},{"id":"nKglpmUvpusG3h9i","title":"13.2 Reproducibility crisis and solutions","slug":"reproducibility-crisis-solutions","type":"STUDY_GUIDE","date":null},{"id":"zLLywsRZ8YtwnMC2","title":"13.3 Big data and high-dimensional experiments","slug":"big-data-high-dimensional-experiments","type":"STUDY_GUIDE","date":null},{"id":"rSGfFiBNg5pNgmug","title":"13.1 Ethical considerations in experimental research","slug":"ethical-considerations-experimental-research","type":"STUDY_GUIDE","date":null}]},{"id":"ihOO4Amp468JnBaj","name":"Unit 14 – Adaptive Designs","emoji":"📚","slug":"unit-14","hasResources":true,"resources":[{"id":"wyKcszFQtBXh1d6A","title":"14.1 Principles of adaptive experimental designs","slug":"principles-adaptive-experimental-designs","type":"STUDY_GUIDE","date":null},{"id":"KEyU7X82K60kEOH8","title":"14.2 Sequential and group sequential designs","slug":"sequential-group-sequential-designs","type":"STUDY_GUIDE","date":null},{"id":"9c08Y4coKXj0GOjO","title":"14.3 Sample size re-estimation methods","slug":"sample-size-re-estimation-methods","type":"STUDY_GUIDE","date":null},{"id":"1Vdv8UchzucUYSRi","title":"14.4 Applications of adaptive designs in clinical trials","slug":"applications-adaptive-designs-clinical-trials","type":"STUDY_GUIDE","date":null}]},{"id":"zhhlIIekmTz76GaB","name":"Unit 15 – Optimal Design Theory","emoji":"📚","slug":"unit-15","hasResources":true,"resources":[{"id":"AvvUCe8w6phXKuyA","title":"15.2 Alphabetic optimality criteria (A, D, E, G-optimality)","slug":"alphabetic-optimality-criteria-a-d-e-g-optimality","type":"STUDY_GUIDE","date":null},{"id":"mnHHCcSOhQaf2jU8","title":"15.1 Fundamentals of optimal design theory","slug":"fundamentals-optimal-design-theory","type":"STUDY_GUIDE","date":null},{"id":"yHLFIKBMsNCa1S1w","title":"15.3 Computer-aided optimal design generation","slug":"computer-aided-optimal-design-generation","type":"STUDY_GUIDE","date":null},{"id":"mJrxlf8sDYA6X1TO","title":"15.4 Robust optimal designs","slug":"robust-optimal-designs","type":"STUDY_GUIDE","date":null}]}],"activeUnit":{"id":"OGPAb8FIJ0ehgGEY","publicId":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","order":6,"slug":"unit-6","description":"Unit 6 – Analysis of Variance (ANOVA)","h1":null,"active":true,"emoji":"📚","hasResources":true},"activeSubject":{"id":"experimental-design","name":"Experimental Design","emoji":"📊","slug":"experimental-design","active":true,"keyTermsActive":null,"category":"Math & Computer Science","hasCalculators":false,"hasKeyTerms":true,"hasPracticeQuestions":false,"units":[{"id":"iA2uesFTUGLgpseU","name":"Unit 1 – Introduction to Experimental Design","emoji":"📚","slug":"unit-1","hasResources":true,"resources":[{"id":"t8JQRQ0jW41TO6Vv","title":"1.1 Fundamentals of scientific method and experimentation","slug":"fundamentals-scientific-method-experimentation","type":"STUDY_GUIDE","date":null},{"id":"QZCSdDgVjjWs74Ct","title":"1.2 Historical perspective on experimental design","slug":"historical-perspective-experimental-design","type":"STUDY_GUIDE","date":null},{"id":"iKNy4skfmjBmXBOe","title":"1.3 Types of variables and their roles in experiments","slug":"types-variables-roles-experiments","type":"STUDY_GUIDE","date":null},{"id":"YINngz7x7lMt9Blf","title":"1.4 Importance of experimental design in research","slug":"importance-experimental-design-research","type":"STUDY_GUIDE","date":null}]},{"id":"3mVDpiHue9jAQ253","name":"Unit 2 – Principles of Experimental Design","emoji":"📚","slug":"unit-2","hasResources":true,"resources":[{"id":"4urivQ0hyvEgbaFT","title":"2.3 Bias and confounding variables","slug":"bias-confounding-variables","type":"STUDY_GUIDE","date":null},{"id":"iflBTr5TWimgzSob","title":"2.4 Experimental validity (internal and external)","slug":"experimental-validity-internal-external","type":"STUDY_GUIDE","date":null},{"id":"dj7Qxpc6NNlabYBv","title":"2.2 Experimental units and sampling techniques","slug":"experimental-units-sampling-techniques","type":"STUDY_GUIDE","date":null},{"id":"vIxW7WpYfRK9vDp0","title":"2.1 Replication, randomization, and local control","slug":"replication-randomization-local-control","type":"STUDY_GUIDE","date":null}]},{"id":"A1vH8NwymBXRHEvV","name":"Unit 3 – Randomization Techniques","emoji":"📚","slug":"unit-3","hasResources":true,"resources":[{"id":"gGnaMfZwHvcklVOt","title":"3.2 Stratified random sampling","slug":"stratified-random-sampling","type":"STUDY_GUIDE","date":null},{"id":"xWqmWA9kFg6QRIck","title":"3.3 Cluster sampling and systematic sampling","slug":"cluster-sampling-systematic-sampling","type":"STUDY_GUIDE","date":null},{"id":"Y6SDZWIfEEV2fdds","title":"3.4 Randomization in practice: methods and tools","slug":"randomization-practice-methods-tools","type":"STUDY_GUIDE","date":null},{"id":"ZYeHKub1RiyaLwY8","title":"3.1 Simple random sampling","slug":"simple-random-sampling","type":"STUDY_GUIDE","date":null}]},{"id":"U3RtoNW3k3bZREZj","name":"Unit 4 – Factorial Designs","emoji":"📚","slug":"unit-4","hasResources":true,"resources":[{"id":"WE0dGBdwZMo8dAsh","title":"4.1 Two-factor factorial designs","slug":"two-factor-factorial-designs","type":"STUDY_GUIDE","date":null},{"id":"Xz41WLyV6eIkDOtE","title":"4.2 Higher-order factorial designs","slug":"higher-order-factorial-designs","type":"STUDY_GUIDE","date":null},{"id":"9Hilbjc4aEiYbhKF","title":"4.3 Main effects and interactions","slug":"main-effects-interactions","type":"STUDY_GUIDE","date":null},{"id":"mBXAcVPXmJBqz2UX","title":"4.4 Fractional factorial designs","slug":"fractional-factorial-designs","type":"STUDY_GUIDE","date":null}]},{"id":"cZ8wtKJBydlRlTFK","name":"Unit 5 – Blocking and Confounding","emoji":"📚","slug":"unit-5","hasResources":true,"resources":[{"id":"9bxFr3Roj88rAoJB","title":"5.1 Principles of blocking","slug":"principles-blocking","type":"STUDY_GUIDE","date":null},{"id":"1x0ymRVIqTaJUmYf","title":"5.2 Randomized complete block designs","slug":"randomized-complete-block-designs","type":"STUDY_GUIDE","date":null},{"id":"reR6bieGMRfYfuiE","title":"5.3 Latin square and Graeco-Latin square designs","slug":"latin-square-graeco-latin-square-designs","type":"STUDY_GUIDE","date":null},{"id":"9k7XZWXBClXuM3vG","title":"5.4 Confounding in factorial experiments","slug":"confounding-factorial-experiments","type":"STUDY_GUIDE","date":null}]},{"id":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","emoji":"📚","slug":"unit-6","hasResources":true,"resources":[{"id":"oO5NfvSqmH4AsbKN","title":"6.1 One-way ANOVA","slug":"one-way-anova","type":"STUDY_GUIDE","date":null},{"id":"0Lqbg6Q47lnTmiko","title":"6.2 Two-way ANOVA","slug":"two-way-anova","type":"STUDY_GUIDE","date":null},{"id":"L18Aw9UHrYsn4J29","title":"6.4 Assumptions and diagnostics for ANOVA","slug":"assumptions-diagnostics-anova","type":"STUDY_GUIDE","date":null},{"id":"mwehq4wy26ycGdG2","title":"6.3 Multifactor ANOVA","slug":"multifactor-anova","type":"STUDY_GUIDE","date":null}]},{"id":"A9bCi8OdM9i0ayuU","name":"Unit 7 – Statistical Power and Sample Size","emoji":"📚","slug":"unit-7","hasResources":true,"resources":[{"id":"HCLYvhOpM8wGXnQI","title":"7.1 Concepts of statistical power and effect size","slug":"concepts-statistical-power-effect-size","type":"STUDY_GUIDE","date":null},{"id":"W18kaCqTU0CM05ZZ","title":"7.2 Power analysis for different experimental designs","slug":"power-analysis-experimental-designs","type":"STUDY_GUIDE","date":null},{"id":"WzzDYAj1emuk4A9h","title":"7.3 Sample size calculation techniques","slug":"sample-size-calculation-techniques","type":"STUDY_GUIDE","date":null},{"id":"h4ukRDZpb3AEBIJn","title":"7.4 Trade-offs between power, sample size, and effect size","slug":"trade-offs-power-sample-size-effect-size","type":"STUDY_GUIDE","date":null}]},{"id":"1cvyYYPw1igkv41P","name":"Unit 8 – Split–Plot Designs","emoji":"📚","slug":"unit-8","hasResources":true,"resources":[{"id":"oIYOEnHj9hcGTfs5","title":"8.1 Principles of split-plot designs","slug":"principles-split-plot-designs","type":"STUDY_GUIDE","date":null},{"id":"P02eGA1IEX2WtTrv","title":"8.2 Analysis of split-plot experiments","slug":"analysis-split-plot-experiments","type":"STUDY_GUIDE","date":null},{"id":"cbgDMBbS9A27x3Yv","title":"8.4 Applications and limitations of split-plot designs","slug":"applications-limitations-split-plot-designs","type":"STUDY_GUIDE","date":null},{"id":"XwYcBW4wbIHs0zc0","title":"8.3 Split-split plot designs","slug":"split-split-plot-designs","type":"STUDY_GUIDE","date":null}]},{"id":"YZAcKIK3gA9QzbP3","name":"Unit 9 – Repeated Measures Designs","emoji":"📚","slug":"unit-9","hasResources":true,"resources":[{"id":"0rgNjiLL0grXjYHZ","title":"9.2 Between-subjects and within-subjects factors","slug":"between-subjects-within-subjects-factors","type":"STUDY_GUIDE","date":null},{"id":"qQU75Emt0wrKHm3h","title":"9.3 Analysis of repeated measures data","slug":"analysis-repeated-measures-data","type":"STUDY_GUIDE","date":null},{"id":"szM39nC3JyBaJFUc","title":"9.1 Fundamentals of repeated measures experiments","slug":"fundamentals-repeated-measures-experiments","type":"STUDY_GUIDE","date":null},{"id":"q0KhaZ92DrEtICET","title":"9.4 Handling missing data in repeated measures designs","slug":"handling-missing-data-repeated-measures-designs","type":"STUDY_GUIDE","date":null}]},{"id":"y2VEHrae1DqTze66","name":"Unit 10 – Response Surface Methodology","emoji":"📚","slug":"unit-10","hasResources":true,"resources":[{"id":"fiJBI8xrag8MxiNq","title":"10.2 First-order and second-order models","slug":"first-order-second-order-models","type":"STUDY_GUIDE","date":null},{"id":"q9IiCikLenSFfGN3","title":"10.1 Introduction to response surface designs","slug":"introduction-response-surface-designs","type":"STUDY_GUIDE","date":null},{"id":"1Pp7AJO4IRhGv2Ix","title":"10.4 Optimization techniques in response surface methodology","slug":"optimization-techniques-response-surface-methodology","type":"STUDY_GUIDE","date":null},{"id":"8yDKaI6k7DhHiR0L","title":"10.3 Central composite and Box-Behnken designs","slug":"central-composite-box-behnken-designs","type":"STUDY_GUIDE","date":null}]},{"id":"xaHDl0vzqzQytXXM","name":"Unit 11 – Designing Experiments for Analysis","emoji":"📚","slug":"unit-11","hasResources":true,"resources":[{"id":"9nvXsFlhY7MdoiSe","title":"11.2 Experimental design for regression analysis","slug":"experimental-design-regression-analysis","type":"STUDY_GUIDE","date":null},{"id":"yitbOl6RjXATqmGJ","title":"11.4 Bayesian approaches to experimental design","slug":"bayesian-approaches-experimental-design","type":"STUDY_GUIDE","date":null},{"id":"7kWNKi0GYQyGkEwo","title":"11.3 Designing experiments for non-parametric tests","slug":"designing-experiments-non-parametric-tests","type":"STUDY_GUIDE","date":null},{"id":"y7KKUeScH22364X1","title":"11.1 Choosing appropriate statistical tests","slug":"choosing-statistical-tests","type":"STUDY_GUIDE","date":null}]},{"id":"a6CutZV1R8FHiyXu","name":"Unit 12 – Interpreting Results & Drawing Conclusions","emoji":"📚","slug":"unit-12","hasResources":true,"resources":[{"id":"B1YTuE2olszq67i6","title":"12.3 Effect size interpretation and practical significance","slug":"effect-size-interpretation-practical-significance","type":"STUDY_GUIDE","date":null},{"id":"4wh5p53AlfHxJsqO","title":"12.4 Limitations and generalizability of experimental results","slug":"limitations-generalizability-experimental-results","type":"STUDY_GUIDE","date":null},{"id":"VsVZV4OfoTSssNIK","title":"12.1 Statistical inference and hypothesis testing","slug":"statistical-inference-hypothesis-testing","type":"STUDY_GUIDE","date":null},{"id":"ejQHVwPTrz04MHvZ","title":"12.2 Multiple comparisons and post-hoc tests","slug":"multiple-comparisons-post-hoc-tests","type":"STUDY_GUIDE","date":null}]},{"id":"roABkStwkw6YnHlS","name":"Unit 13 – Contemporary Issues in Experimental Design","emoji":"📚","slug":"unit-13","hasResources":true,"resources":[{"id":"UmSC1z6DtdRXKnN5","title":"13.4 Machine learning approaches in experimental design","slug":"machine-learning-approaches-experimental-design","type":"STUDY_GUIDE","date":null},{"id":"nKglpmUvpusG3h9i","title":"13.2 Reproducibility crisis and solutions","slug":"reproducibility-crisis-solutions","type":"STUDY_GUIDE","date":null},{"id":"zLLywsRZ8YtwnMC2","title":"13.3 Big data and high-dimensional experiments","slug":"big-data-high-dimensional-experiments","type":"STUDY_GUIDE","date":null},{"id":"rSGfFiBNg5pNgmug","title":"13.1 Ethical considerations in experimental research","slug":"ethical-considerations-experimental-research","type":"STUDY_GUIDE","date":null}]},{"id":"ihOO4Amp468JnBaj","name":"Unit 14 – Adaptive Designs","emoji":"📚","slug":"unit-14","hasResources":true,"resources":[{"id":"wyKcszFQtBXh1d6A","title":"14.1 Principles of adaptive experimental designs","slug":"principles-adaptive-experimental-designs","type":"STUDY_GUIDE","date":null},{"id":"KEyU7X82K60kEOH8","title":"14.2 Sequential and group sequential designs","slug":"sequential-group-sequential-designs","type":"STUDY_GUIDE","date":null},{"id":"9c08Y4coKXj0GOjO","title":"14.3 Sample size re-estimation methods","slug":"sample-size-re-estimation-methods","type":"STUDY_GUIDE","date":null},{"id":"1Vdv8UchzucUYSRi","title":"14.4 Applications of adaptive designs in clinical trials","slug":"applications-adaptive-designs-clinical-trials","type":"STUDY_GUIDE","date":null}]},{"id":"zhhlIIekmTz76GaB","name":"Unit 15 – Optimal Design Theory","emoji":"📚","slug":"unit-15","hasResources":true,"resources":[{"id":"AvvUCe8w6phXKuyA","title":"15.2 Alphabetic optimality criteria (A, D, E, G-optimality)","slug":"alphabetic-optimality-criteria-a-d-e-g-optimality","type":"STUDY_GUIDE","date":null},{"id":"mnHHCcSOhQaf2jU8","title":"15.1 Fundamentals of optimal design theory","slug":"fundamentals-optimal-design-theory","type":"STUDY_GUIDE","date":null},{"id":"yHLFIKBMsNCa1S1w","title":"15.3 Computer-aided optimal design generation","slug":"computer-aided-optimal-design-generation","type":"STUDY_GUIDE","date":null},{"id":"mJrxlf8sDYA6X1TO","title":"15.4 Robust optimal designs","slug":"robust-optimal-designs","type":"STUDY_GUIDE","date":null}]}]}},"subjectBySlug":{"id":"experimental-design","name":"Experimental Design","branch":"Math","keyTermsActive":null,"subBranches":[{"name":"Statistics"}],"description":"## What do you learn in Experimental Design\n\nExperimental Design covers the principles of planning and conducting experiments to draw valid conclusions. You'll learn about randomization, replication, blocking, factorial designs, and analysis of variance (ANOVA). The course dives into sample size determination, power analysis, and how to handle confounding variables. You'll also explore split-plot designs and repeated measures experiments.\n\n## Is Experimental Design hard?\n\nExperimental Design can be challenging, but it's not impossible. The concepts can get pretty abstract, and there's a fair amount of statistical theory to wrap your head around. The math isn't too intense, but you'll need to be comfortable with basic stats. The trickiest part is often applying the concepts to real-world scenarios. It's definitely not a blow-off class, but with some effort, you can totally handle it.\n\n## Tips for taking Experimental Design in college\n\n1. Use [Fiveable Study Guides](https://fiveable.me/cram-mode) to help you cram 🌶️\n2. Practice designing experiments for everyday situations to make concepts more relatable\n3. Create visual flowcharts for different design types (completely randomized, randomized block, etc.)\n4. Form a study group to discuss and debate the pros and cons of various designs\n5. Use statistical software like R or SAS to analyze data from example experiments\n6. Watch \"Mythbusters\" episodes to see experimental design in action\n7. Read \"The Design of Experiments\" by R.A. Fisher for a historical perspective\n\n## Common pre-requisites for Experimental Design\n\n1. Introduction to Statistics: This course covers basic statistical concepts, probability theory, and hypothesis testing. It lays the foundation for more advanced statistical methods.\n\n2. Probability Theory: This class delves into the mathematical foundations of probability. It explores concepts like random variables, probability distributions, and expected values.\n\n3. Linear Algebra: This course focuses on vector spaces, linear transformations, and matrices. It provides the mathematical tools needed for more advanced statistical analysis.\n\n## Classes similar to Experimental Design\n\n1. Design and Analysis of Clinical Trials: This course applies experimental design principles to medical research. It covers randomization techniques, blinding, and ethical considerations in human studies.\n\n2. Survey Sampling: This class focuses on designing and analyzing surveys. It covers sampling techniques, questionnaire design, and methods for handling non-response bias.\n\n3. Multivariate Analysis: This course explores techniques for analyzing data with multiple variables. It covers topics like principal component analysis, factor analysis, and discriminant analysis.\n\n4. Bayesian Statistics: This class introduces Bayesian inference and its applications. It covers prior and posterior distributions, Markov Chain Monte Carlo methods, and Bayesian experimental design.\n\n## Majors related to Experimental Design\n\n1. Statistics: Focuses on collecting, analyzing, and interpreting data. Statistics majors learn various statistical methods and their applications in research and industry.\n\n2. Data Science: Combines statistics, computer science, and domain expertise. Data science majors learn to extract insights from large and complex datasets.\n\n3. Psychology: Studies human behavior and mental processes. Psychology majors often use experimental design in their research to understand cognitive processes and social interactions.\n\n4. Biostatistics: Applies statistical methods to biological and medical research. Biostatistics majors learn to design and analyze clinical trials and epidemiological studies.\n\n## What can you do with a degree in Experimental Design?\n\n1. Clinical Research Scientist: Designs and conducts clinical trials for new drugs or medical treatments. They work closely with medical professionals and analyze trial data to determine the safety and efficacy of new interventions.\n\n2. Market Research Analyst: Designs experiments to test consumer preferences and behaviors. They use statistical techniques to analyze market trends and help companies make data-driven decisions.\n\n3. Quality Control Engineer: Develops and implements experiments to improve product quality in manufacturing. They use statistical process control methods to identify and reduce sources of variation in production processes.\n\n4. Environmental Scientist: Designs experiments to study ecosystems and environmental impacts. They collect and analyze data on pollution, climate change, and biodiversity to inform environmental policy and conservation efforts.\n\n## Experimental Design FAQs\n\n1. How is Experimental Design different from Observational Studies? Experimental Design involves actively manipulating variables to study their effects, while Observational Studies analyze existing data without intervention. Experiments allow for stronger causal inferences but may be less feasible in some situations.\n\n2. What software is commonly used in Experimental Design? Popular software includes R, SAS, and Minitab. These tools help with both designing experiments and analyzing the resulting data.\n\n3. How does Experimental Design relate to Machine Learning? Experimental Design principles are crucial in machine learning for tasks like model selection and hyperparameter tuning. Proper experimental design helps ensure that machine learning models are robust and generalizable.","emoji":"📊","order":null,"numResources":null,"active":true,"slug":"experimental-design","generationMetadata":{"group":"Group 7 – unit, topics, key terms","level":"college undergraduate","branch":"Math","duration":"one semester","subBranch":"Statistics","lengthVariant":"less text","model":"opus"}},"pageParams":{"communitySlug":"experimental-design","unitSlug":"unit-6","contentSlug":"assumptions-diagnostics-anova","docId":"L18Aw9UHrYsn4J29"},"children":["$","$L1c",null,{"content":{"id":"L18Aw9UHrYsn4J29","topics":[{"id":"vUSJY4IzncXPoDnf","name":"6.4 Assumptions and diagnostics for ANOVA","fullNumber":"6.4"}],"title":"6.4 Assumptions and diagnostics for ANOVA","desc":null,"summary":null,"type":"STUDY_GUIDE","slug":"assumptions-diagnostics-anova","date":null,"vimeoLiveLink":null,"url":null,"markdown":"ANOVA assumptions are crucial for valid results. Normality, homogeneity of variance, and independence must be checked. Violations can lead to incorrect conclusions, so it's important to assess these assumptions using visual and formal methods.\n\nDiagnostic tests help evaluate ANOVA assumptions. Residual plots and formal tests like Levene's and Shapiro-Wilk are used. If violations occur, data transformations or robust methods can address issues, ensuring reliable analysis and interpretation of results.\n\n## Assumptions\n### Normality and Its Assessment\n\n ###### ![fiveable_image_carousel](https://fiveable.me)\n\n- Normality assumes the residuals (differences between observed and predicted values) are normally distributed\n- Violations of normality can lead to inaccurate p-values and confidence intervals\n- Assess normality visually using Q-Q plots or histograms of residuals\n - Q-Q plots compare the distribution of residuals to a theoretical normal distribution\n - Histograms should show a bell-shaped curve for normally distributed residuals\n- Formally test normality using the Shapiro-Wilk test\n - Null hypothesis: residuals are normally distributed\n - P-value < 0.05 suggests a significant departure from normality\n### Homogeneity of Variance and Independence\n- Homogeneity of variance (homoscedasticity) assumes equal variances across groups\n - Violations (heteroscedasticity) can affect the validity of F-tests and lead to incorrect conclusions\n - Assess homogeneity visually using residual plots (residuals vs. fitted values)\n - Patterns or increasing/decreasing spread indicate heteroscedasticity\n - Formally test homogeneity using Levene's test\n - Null hypothesis: variances are equal across groups\n - P-value < 0.05 suggests significant differences in variances\n- Independence of observations assumes that observations within and between groups are not related\n - Violations can occur due to repeated measures, clustering, or spatial/temporal correlation\n - Assess independence by examining the study design and data collection process\n - Violations may require alternative models (repeated measures ANOVA, mixed models)\n## Diagnostic Tests\n### Residual Plots for Assessing Assumptions\n- Residual plots are graphical tools for assessing ANOVA assumptions\n- Residuals vs. Fitted plot\n - Assess homogeneity of variance\n - Look for patterns, increasing/decreasing spread, or outliers\n- Normal Q-Q plot\n - Assess normality of residuals\n - Compare residuals to a theoretical normal distribution\n - Deviations from a straight line indicate non-normality\n- Scale-Location plot\n - Assess homogeneity of variance\n - Look for patterns or increasing/decreasing spread\n- Residuals vs. Leverage plot\n - Identify influential observations\n - Points with high leverage and large residuals may have a strong influence on the model\n### Formal Tests for Assumptions\n- Levene's test for homogeneity of variance\n - Null hypothesis: variances are equal across groups\n - P-value < 0.05 suggests significant differences in variances\n - Robust to non-normality, but sensitive to large sample sizes\n- Shapiro-Wilk test for normality\n - Null hypothesis: residuals are normally distributed\n - P-value < 0.05 suggests a significant departure from normality\n - More powerful than visual assessment, but sensitive to large sample sizes\n - Alternative: Anderson-Darling test\n## Addressing Violations\n### Data Transformations\n- Transformations can help stabilize variances and improve normality\n- Common transformations: logarithmic, square root, reciprocal\n - Logarithmic: $log(x)$ or $log(x+1)$ for data with zero values\n - Square root: $\\sqrt{x}$ for data with a Poisson distribution\n - Reciprocal: $\\frac{1}{x}$ for data with a strong right skew\n- Choose a transformation based on the nature of the data and the severity of the violation\n- Interpret results on the transformed scale or back-transform for interpretation\n### Robust ANOVA Methods and Non-Parametric Alternatives\n- Robust ANOVA methods are less sensitive to violations of assumptions\n - Welch's ANOVA: does not assume equal variances\n - Trimmed means ANOVA: robust to non-normality and outliers\n - Bootstrapping: resampling method to obtain robust confidence intervals and p-values\n- Non-parametric alternatives do not rely on distributional assumptions\n - Kruskal-Wallis test: rank-based test for comparing medians across groups\n - Friedman test: rank-based test for repeated measures designs\n - Permutation tests: resampling method to obtain exact p-values\n- Consider the trade-offs between robustness and power when selecting an alternative method","cheatsheet":null,"publishDate":null,"updatedAt":"2024-08-07T06:24:41.137Z","status":"PUBLISHED","images":[{"url":"https://storage.googleapis.com/static.prod.fiveable.me/search-images%2F%22Normality_assessment_in_ANOVA%3A_Q-Q_plots_histograms_Shapiro-Wilk_test_residuals_distribution_visualizations%22-normality-1.png","description":"Chapter 16 Regression | Untitled","sourceUrl":"https://psyteachr.github.io/msc-conv/16-regression_files/figure-html/normality-1.png","hostUrl":"https://psyteachr.github.io/msc-conv/regression.html","altText":null,"sectionTitle":"Normality and Its Assessment","rank":2,"height":960,"width":1344,"displayWidth":672,"displayHeight":480,"contentId":"66b31329d9be6c5c04e0aa8c","subjectId":"experimental-design"},{"url":"https://storage.googleapis.com/static.prod.fiveable.me/search-images%2F%22Normality_assessment_in_ANOVA%3A_Q-Q_plots_histograms_Shapiro-Wilk_test_residuals_distribution_visualizations%22-ZXRkL.png","description":"r - How to interpret a QQ plot - Cross Validated","sourceUrl":"http://i.stack.imgur.com/ZXRkL.png","hostUrl":"http://stats.stackexchange.com/questions/101274/how-to-interpret-a-qq-plot","altText":null,"sectionTitle":"Normality and Its Assessment","rank":3,"height":537,"width":468,"displayWidth":234,"displayHeight":268,"contentId":"66b31329d9be6c5c04e0aa8c","subjectId":"experimental-design"}],"tableOfContents":null,"meta":{"description":"Review 6.4 Assumptions and diagnostics for ANOVA for your test on Unit 6 – Analysis of Variance (ANOVA). For students taking Experimental Design","title":"6.4 Assumptions and diagnostics for ANOVA | Experimental Design Class Notes"},"subject":{"id":"experimental-design","name":"Experimental Design","emoji":"📊","order":null,"active":true,"slug":"experimental-design","branchSlug":"math","keyTermsActive":null,"generationMetadata":{"group":"Group 7 – unit, topics, key terms","level":"college undergraduate","branch":"Math","duration":"one semester","subBranch":"Statistics","lengthVariant":"less text","model":"opus"},"units":[{"id":"iA2uesFTUGLgpseU","publicId":"iA2uesFTUGLgpseU","name":"Unit 1 – Introduction to Experimental Design","order":1,"slug":"unit-1","description":"Unit 1 – Introduction to Experimental Design","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"3mVDpiHue9jAQ253","publicId":"3mVDpiHue9jAQ253","name":"Unit 2 – Principles of Experimental Design","order":2,"slug":"unit-2","description":"Unit 2 – Principles of Experimental Design","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"A1vH8NwymBXRHEvV","publicId":"A1vH8NwymBXRHEvV","name":"Unit 3 – Randomization Techniques","order":3,"slug":"unit-3","description":"Unit 3 – Randomization Techniques","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"U3RtoNW3k3bZREZj","publicId":"U3RtoNW3k3bZREZj","name":"Unit 4 – Factorial Designs","order":4,"slug":"unit-4","description":"Unit 4 – Factorial Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"cZ8wtKJBydlRlTFK","publicId":"cZ8wtKJBydlRlTFK","name":"Unit 5 – Blocking and Confounding","order":5,"slug":"unit-5","description":"Unit 5 – Blocking and Confounding","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"OGPAb8FIJ0ehgGEY","publicId":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","order":6,"slug":"unit-6","description":"Unit 6 – Analysis of Variance (ANOVA)","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"A9bCi8OdM9i0ayuU","publicId":"A9bCi8OdM9i0ayuU","name":"Unit 7 – Statistical Power and Sample Size","order":7,"slug":"unit-7","description":"Unit 7 – Statistical Power and Sample Size Determination","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"1cvyYYPw1igkv41P","publicId":"1cvyYYPw1igkv41P","name":"Unit 8 – Split–Plot Designs","order":8,"slug":"unit-8","description":"Unit 8 – Split-Plot Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"YZAcKIK3gA9QzbP3","publicId":"YZAcKIK3gA9QzbP3","name":"Unit 9 – Repeated Measures Designs","order":9,"slug":"unit-9","description":"Unit 9 – Repeated Measures Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"y2VEHrae1DqTze66","publicId":"y2VEHrae1DqTze66","name":"Unit 10 – Response Surface Methodology","order":10,"slug":"unit-10","description":"Unit 10 – Response Surface Methodology","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"xaHDl0vzqzQytXXM","publicId":"xaHDl0vzqzQytXXM","name":"Unit 11 – Designing Experiments for Analysis","order":11,"slug":"unit-11","description":"Unit 11 – Designing Experiments for Statistical Analysis","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"a6CutZV1R8FHiyXu","publicId":"a6CutZV1R8FHiyXu","name":"Unit 12 – Interpreting Results & Drawing Conclusions","order":12,"slug":"unit-12","description":"Unit 12 – Interpreting Results and Drawing Valid Conclusions","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"roABkStwkw6YnHlS","publicId":"roABkStwkw6YnHlS","name":"Unit 13 – Contemporary Issues in Experimental Design","order":13,"slug":"unit-13","description":"Unit 13 – Contemporary Issues in Experimental Design","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"ihOO4Amp468JnBaj","publicId":"ihOO4Amp468JnBaj","name":"Unit 14 – Adaptive Designs","order":14,"slug":"unit-14","description":"Unit 14 – Adaptive Designs","h1":null,"active":true,"emoji":"📚","hasResources":true},{"id":"zhhlIIekmTz76GaB","publicId":"zhhlIIekmTz76GaB","name":"Unit 15 – Optimal Design Theory","order":15,"slug":"unit-15","description":"Unit 15 – Optimal Design Theory","h1":null,"active":true,"emoji":"📚","hasResources":true}]},"unit":{"id":"OGPAb8FIJ0ehgGEY","name":"Unit 6 – Analysis of Variance (ANOVA)","slug":"unit-6","active":true},"replayVideoLocations":[],"resources":[],"streamers":[],"duration":3,"creators":[],"editors":[],"blocks":[]},"tableOfContentsItems":[{"id":"notes","title":"Notes","items":[{"id":"assumptions","title":"Assumptions","items":[]},{"id":"diagnostic-tests","title":"Diagnostic Tests","items":[]},{"id":"addressing-violations","title":"Addressing Violations","items":[]}]}],"pepQuizQuestions":[],"pepQuizStatus":true,"keyTerms":"$undefined"}]}]]