# Reproduction script: summarise the primary biliary cirrhosis (PBC) CSV
# with TableOne, grouped by sex and with p-values requested.
url = "https://raw.githubusercontent.com/tompollard/data/master/primary-biliary-cirrhosis/pbc.csv"
data_pbc = pd.read_csv(url)

# Variables shown in the table; only 'age_group' is declared categorical.
categorical = ['age_group']
columns = ['age_group', 'age', 'sex', 'albumin', 'ast']

# Derive a decade bucket from age: age / 10, truncated to an integer.
data_pbc['age_group'] = data_pbc['age'].map(lambda age: int(age / 10))

table = TableOne(
    data_pbc,
    columns=columns,
    categorical=categorical,
    groupby='sex',
    pval=True,
)
# Bare expression so an interactive session / notebook displays the table.
table
This gives the following warning:
tableone.py:463: UserWarning: No p-value was computed for age_group due to the low number of observations.
warnings.warn('No p-value was computed for {} due to the low number of observations.'.format(v))
gives:
However, despite the warning, the p-value for `age_group` still appears in the output table.