# scipy-yli/tests/test_chi2.py

#   scipy-yli: Helpful SciPy utilities and recipes
#   Copyright © 2022  Lee Yingtong Li (RunasSudo)
#
#   This program is free software: you can redistribute it and/or modify
#   it under the terms of the GNU Affero General Public License as published by
#   the Free Software Foundation, either version 3 of the License, or
#   (at your option) any later version.
#
#   This program is distributed in the hope that it will be useful,
#   but WITHOUT ANY WARRANTY; without even the implied warranty of
#   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
#   GNU Affero General Public License for more details.
#
#   You should have received a copy of the GNU Affero General Public License
#   along with this program.  If not, see <https://www.gnu.org/licenses/>.

from pytest import approx

import numpy as np
import pandas as pd

import yli

def test_chi2_ol10_15():
	"""Check yli.chi2 against the worked example 10.15 of Ott & Longnecker (2016)"""

	# Contingency table cells as (age category, severity, frequency)
	cells = [
		(1, 'Moderate', 15),
		(2, 'Moderate', 32),
		(3, 'Moderate', 18),
		(4, 'Moderate', 5),
		(1, 'Mildly Severe', 8),
		(2, 'Mildly Severe', 29),
		(3, 'Mildly Severe', 23),
		(4, 'Mildly Severe', 18),
		(1, 'Severe', 1),
		(2, 'Severe', 20),
		(3, 'Severe', 25),
		(4, 'Severe', 22)
	]

	# Split the cells into parallel sequences, one per field
	age_categories, severities, frequencies = zip(*cells)

	# Expand the table so each cell contributes `frequency` identical rows
	df = pd.DataFrame({
		'AgeCategory': np.repeat(age_categories, frequencies),
		'Severity': np.repeat(severities, frequencies)
	})

	result = yli.chi2(df, 'Severity', 'AgeCategory')

	# Reference values for the test statistic and p value
	assert result.statistic == approx(27.13, abs=0.01)
	assert result.pvalue == approx(0.00014, abs=0.00001)

def test_chi2_ol10_18():
	"""Check yli.chi2 against the worked example 10.18 of Ott & Longnecker (2016)"""

	# 2x2 table cells as (response, stress, frequency)
	cells = [
		(False, False, 250),
		(True, False, 750),
		(False, True, 400),
		(True, True, 1600)
	]

	# Split the cells into parallel sequences, one per field
	responses, stresses, frequencies = zip(*cells)

	# Expand the table so each cell contributes `frequency` identical rows
	df = pd.DataFrame({
		'Response': np.repeat(responses, frequencies),
		'Stress': np.repeat(stresses, frequencies)
	})

	result = yli.chi2(df, 'Stress', 'Response')

	# Odds ratio point estimate and confidence limits
	odds_ratio = result.oddsratio
	assert odds_ratio.point == approx(1.333, abs=0.001)
	assert odds_ratio.ci_lower == approx(1.113, abs=0.001)
	assert odds_ratio.ci_upper == approx(1.596, abs=0.001)

	# The textual summary must match exactly, including the table layout
	expected_summary = '''Stress    False  True
Response
False       250   400
True        750  1600

χ²(1) = 9.82; p = 0.002*
OR (95% CI) = 1.33 (1.11–1.60)
RR (95% CI) = 1.11 (1.03–1.18)'''

	assert result.summary() == expected_summary