scipy-yli/tests/test_chi2.py

#   scipy-yli: Helpful SciPy utilities and recipes
#   Copyright © 2022  Lee Yingtong Li (RunasSudo)
#
#   This program is free software: you can redistribute it and/or modify
#   it under the terms of the GNU Affero General Public License as published by
#   the Free Software Foundation, either version 3 of the License, or
#   (at your option) any later version.
#
#   This program is distributed in the hope that it will be useful,
#   but WITHOUT ANY WARRANTY; without even the implied warranty of
#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
#   GNU Affero General Public License for more details.
#
#   You should have received a copy of the GNU Affero General Public License
#   along with this program.  If not, see <https://www.gnu.org/licenses/>.

from pytest import approx

import numpy as np
import pandas as pd

import yli

def test_chi2_ol10_15():
	"""Check yli.chi2 against Ott & Longnecker (2016) example 10.15"""
	
	# Contingency table cells, one tuple per cell: (age category, severity, count)
	cells = [
		(1, 'Moderate', 15),
		(2, 'Moderate', 32),
		(3, 'Moderate', 18),
		(4, 'Moderate', 5),
		(1, 'Mildly Severe', 8),
		(2, 'Mildly Severe', 29),
		(3, 'Mildly Severe', 23),
		(4, 'Mildly Severe', 18),
		(1, 'Severe', 1),
		(2, 'Severe', 20),
		(3, 'Severe', 25),
		(4, 'Severe', 22)
	]
	
	# Transpose the cells into parallel columns, then repeat each cell's
	# labels "count" times so the frame holds one row per observation
	age_categories, severities, counts = zip(*cells)
	df = pd.DataFrame({
		'AgeCategory': np.repeat(age_categories, counts),
		'Severity': np.repeat(severities, counts)
	})
	
	result = yli.chi2(df, 'Severity', 'AgeCategory')
	
	# Absolute tolerances match the number of decimals in the reference values
	assert result.statistic == approx(27.13, abs=0.01)
	assert result.pvalue == approx(0.00014, abs=0.00001)

def test_chi2_ol10_18():
	"""Check the yli.chi2 odds ratio against Ott & Longnecker (2016) example 10.18"""
	
	# 2x2 table cells, one tuple per cell: (response, stress, count)
	cells = [
		(False, False, 250),
		(True, False, 750),
		(False, True, 400),
		(True, True, 1600)
	]
	
	# Transpose the cells into parallel columns, then repeat each cell's
	# flags "count" times so the frame holds one row per observation
	responses, stresses, counts = zip(*cells)
	df = pd.DataFrame({
		'Response': np.repeat(responses, counts),
		'Stress': np.repeat(stresses, counts)
	})
	
	odds_ratio = yli.chi2(df, 'Stress', 'Response').oddsratio
	
	# Point estimate and both confidence limits are checked to 3 decimal places
	assert odds_ratio.point == approx(1.333, abs=0.001)
	assert odds_ratio.ci_lower == approx(1.113, abs=0.001)
	assert odds_ratio.ci_upper == approx(1.596, abs=0.001)
Implement chi2 2022-10-13 13:25:24 +11:00			`# scipy-yli: Helpful SciPy utilities and recipes`
			`# Copyright © 2022 Lee Yingtong Li (RunasSudo)`
			`#`
			`# This program is free software: you can redistribute it and/or modify`
			`# it under the terms of the GNU Affero General Public License as published by`
			`# the Free Software Foundation, either version 3 of the License, or`
			`# (at your option) any later version.`
			`#`
			`# This program is distributed in the hope that it will be useful,`
			`# but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`# GNU Affero General Public License for more details.`
			`#`
			`# You should have received a copy of the GNU Affero General Public License`
			`# along with this program. If not, see <https://www.gnu.org/licenses/>.`

			`from pytest import approx`

			`import numpy as np`
			`import pandas as pd`

			`import yli`

			`def test_chi2_ol10_15():`
			`"""Compare yli.chi2 for Ott & Longnecker (2016) example 10.15"""`

			`data = [`
			`(1, 'Moderate', 15),`
			`(2, 'Moderate', 32),`
			`(3, 'Moderate', 18),`
			`(4, 'Moderate', 5),`
			`(1, 'Mildly Severe', 8),`
			`(2, 'Mildly Severe', 29),`
			`(3, 'Mildly Severe', 23),`
			`(4, 'Mildly Severe', 18),`
			`(1, 'Severe', 1),`
			`(2, 'Severe', 20),`
			`(3, 'Severe', 25),`
			`(4, 'Severe', 22)`
			`]`

			`df = pd.DataFrame({`
			`'AgeCategory': np.repeat([d[0] for d in data], [d[2] for d in data]),`
			`'Severity': np.repeat([d[1] for d in data], [d[2] for d in data])`
			`})`

			`result = yli.chi2(df, 'Severity', 'AgeCategory')`
			`assert result.statistic == approx(27.13, abs=0.01)`
			`assert result.pvalue == approx(0.00014, abs=0.00001)`

			`def test_chi2_ol10_18():`
			`"""Compare yli.chi2 for Ott & Longnecker (2016) example 10.18"""`

			`data = [`
			`(False, False, 250),`
			`(True, False, 750),`
			`(False, True, 400),`
			`(True, True, 1600)`
			`]`

			`df = pd.DataFrame({`
			`'Response': np.repeat([d[0] for d in data], [d[2] for d in data]),`
			`'Stress': np.repeat([d[1] for d in data], [d[2] for d in data])`
			`})`

			`result = yli.chi2(df, 'Stress', 'Response')`
			`assert result.oddsratio.point == approx(1.333, abs=0.001)`
			`assert result.oddsratio.ci_lower == approx(1.113, abs=0.001)`
			`assert result.oddsratio.ci_upper == approx(1.596, abs=0.001)`