Source code for pyhealth.datasets.support2
import logging
from pathlib import Path
from typing import List, Optional
from .base_dataset import BaseDataset
logger = logging.getLogger(__name__)
[docs]class Support2Dataset(BaseDataset):
"""
A dataset class for handling SUPPORT2 (Study to Understand Prognoses and Preferences
for Outcomes and Risks of Treatments) data.
The SUPPORT2 dataset contains data on 9,105 seriously ill hospitalized adults from
five U.S. medical centers (1989-1994), including patient demographics, diagnoses,
clinical measurements, and outcomes.
Dataset is available for download from:
- UCI Machine Learning Repository: https://archive.ics.uci.edu/dataset/880/support2
- Vanderbilt Biostatistics: https://hbiostat.org/data/repo/supportdesc
- Hugging Face: https://huggingface.co/datasets/jarrydmartinx/support2
- R packages: "rms" and "Hmisc"
Citation:
Knaus WA, Harrell FE, Lynn J, et al. The SUPPORT prognostic model:
Objective estimates of survival for seriously ill hospitalized adults.
Ann Intern Med. 1995;122(3):191-203.
Args:
root (str): The root directory where the dataset CSV file is stored.
tables (List[str]): A list of tables to be included (typically ["support2"]).
dataset_name (Optional[str]): The name of the dataset. Defaults to "support2".
config_path (Optional[str]): The path to the configuration file. If not provided,
uses the default config.
**kwargs: Additional arguments passed to BaseDataset.
Examples:
>>> from pyhealth.datasets import Support2Dataset
>>> dataset = Support2Dataset(
... root="/path/to/support2/data",
... tables=["support2"]
... )
>>> dataset.stats()
Attributes:
root (str): The root directory where the dataset is stored.
tables (List[str]): A list of tables to be included in the dataset.
dataset_name (str): The name of the dataset.
config_path (str): The path to the configuration file.
"""
def __init__(
self,
root: str,
tables: List[str],
dataset_name: Optional[str] = None,
config_path: Optional[str] = None,
**kwargs
) -> None:
if config_path is None:
logger.info("No config path provided, using default config")
config_path = Path(__file__).parent / "configs" / "support2.yaml"
super().__init__(
root=root,
tables=tables,
dataset_name=dataset_name or "support2",
config_path=config_path,
**kwargs
)
return