Add support for Series, list and ndarray inputs -> return float or dict

staskh · staskh · commit c2645cbd77ac · 2025-06-16T23:30:24.000+03:00
diff --git a/README.md b/README.md
@@ -45,12 +45,11 @@ Unless noted, IGLU-R test compatability is considered successful if it achieves
 | gvp |Glucose Variability Percentage| ✅ | ✅ only Series(DatetimeIndex) returns float
 | hbgi |High Blood Glucose Index| ✅ | ✅ returns float |
 | hyper_index |Hyperglycemia Index| ✅ |✅ returns float |
-| hyper_index |Hyperglycemia Index| ✅ |✅ returns float |
-| hypo_index |Hypoglycemia Index| ✅ |
-| igc |Index of Glycemic Control| ✅ |
+| hypo_index |Hypoglycemia Index| ✅ |✅ returns float |
+| igc |Index of Glycemic Control| ✅ |✅ returns float |
 | in_range_percent |percentage of values within target ranges| ✅ | ✅ returns dict
-| iqr_glu |glucose level interquartile range|✅ |
-| j_index |J-Index score for glucose measurements| ✅ |
+| iqr_glu |glucose level interquartile range|✅ |✅ returns float |
+| j_index |J-Index score for glucose measurements| ✅ |✅ returns float |
 | lbgi | Low Blood Glucose Index| ✅ |
 | m_value | M-value of Schlichtkrull et al | ✅ |
 | mad_glu | Median Absolute Deviation | ✅ |
diff --git a/iglu_python/igc.py b/iglu_python/igc.py
@@ -9,14 +9,14 @@
 
 
 def igc(
-    data: Union[pd.DataFrame, pd.Series],
+    data: Union[pd.DataFrame, pd.Series, np.ndarray, list],
     LLTR: int = 80,
     ULTR: int = 140,
     a: float = 1.1,
     b: float = 2,
     c: int = 30,
     d: int = 30,
-) -> pd.DataFrame:
+) -> pd.DataFrame|float:
     """
     Calculate Index of Glycemic Control (IGC).
 
@@ -25,8 +25,8 @@ def igc(
 
     Parameters
     ----------
-    data : Union[pd.DataFrame, pd.Series]
-        DataFrame with columns 'id', 'time', and 'gl', or a Series of glucose values
+    data : Union[pd.DataFrame, pd.Series, np.ndarray, list]
+        DataFrame with columns 'id', 'time', and 'gl', or a Series of glucose values, or a numpy array or list of glucose values
     LLTR : int, default=80
         Lower Limit of Target Range, in mg/dL
     ULTR : int, default=140
@@ -42,10 +42,9 @@ def igc(
 
     Returns
     -------
-    pd.DataFrame
+    pd.DataFrame|float
         DataFrame with 1 row for each subject, a column for subject id and a column
-        for the IGC value. If a Series of glucose values is passed, then a DataFrame
-        without the subject id is returned.
+        for the IGC value. If a Series, list, or numpy array of glucose values is passed, then a float is returned.
 
     References
     ----------
@@ -73,40 +72,34 @@ def igc(
     0  0.106
     """
     # Handle Series input
-    is_vector = False
-    if isinstance(data, (list, np.ndarray)):
-        data = pd.Series(data)
-    if isinstance(data, pd.Series):
-        is_vector = True
-        data = data.dropna()
-        if len(data) == 0:
-            return pd.DataFrame({"GVP": [np.nan]})
-
-        # Convert to DataFrame format for processing
-        data = pd.DataFrame(
-            {
-                "id": ["subject1"] * len(data),
-                "time": pd.date_range(
-                    start="2020-01-01", periods=len(data), freq="5min"
-                ),
-                "gl": data.values,
-            }
-        )
+    if isinstance(data, (pd.Series,list, np.ndarray)):
+        if isinstance(data, (np.ndarray, list)):
+            data = pd.Series(data)
+        return igc_single(data, LLTR, ULTR, a, b, c, d)
 
     # Check and prepare data
     data = check_data_columns(data)
 
-    # Calculate hyper_index and hypo_index
-    out_hyper = hyper_index(data, ULTR=ULTR, a=a, c=c)
-    out_hypo = hypo_index(data, LLTR=LLTR, b=b, d=d)
-
-    # Combine the indices
-    out = pd.merge(out_hyper, out_hypo, on="id")
-    out["IGC"] = out["hyper_index"] + out["hypo_index"]
-    out = out[["id", "IGC"]]
+    out = data.groupby('id').agg(
+        IGC = ("gl", lambda x: igc_single(x, LLTR, ULTR, a, b, c, d))
+    ).reset_index()
+    return out
 
-    # Remove id column if input was a Series
-    if is_vector:
-        out = out.drop("id", axis=1)
+def igc_single(
+    gl: pd.Series, 
+    LLTR: int = 80, 
+    ULTR: int = 140, 
+    a: float = 1.1, 
+    b: float = 2, 
+    c: int = 30, 
+    d: int = 30
+) -> float:
+    """
+    Calculate Index of Glycemic Control for a single subject.
+    """
+    # Calculate hyper_index and hypo_index
+    out_hyper = hyper_index(gl, ULTR=ULTR, a=a, c=c)
+    out_hypo = hypo_index(gl, LLTR=LLTR, b=b, d=d)
 
-    return out
+    out = out_hyper + out_hypo
+    return out
diff --git a/iglu_python/iqr_glu.py b/iglu_python/iqr_glu.py
@@ -6,7 +6,7 @@
 from .utils import check_data_columns
 
 
-def iqr_glu(data: Union[pd.DataFrame, pd.Series]) -> pd.DataFrame:
+def iqr_glu(data: Union[pd.DataFrame, pd.Series, np.ndarray, list]) -> pd.DataFrame|float:
     """
     Calculate glucose level interquartile range (IQR).
 
@@ -15,15 +15,14 @@ def iqr_glu(data: Union[pd.DataFrame, pd.Series]) -> pd.DataFrame:
 
     Parameters
     ----------
-    data : Union[pd.DataFrame, pd.Series]
-        DataFrame with columns 'id', 'time', and 'gl', or a Series of glucose values
+    data : Union[pd.DataFrame, pd.Series, np.ndarray, list]
+        DataFrame with columns 'id', 'time', and 'gl', or a Series of glucose values, or a numpy array or list of glucose values
 
     Returns
     -------
-    pd.DataFrame
-        DataFrame with columns:
-        - id: subject identifier (if DataFrame input)
-        - IQR: interquartile range of glucose values (75th percentile - 25th percentile)
+    pd.DataFrame|float
+        DataFrame with 1 row for each subject, a column for subject id and a column
+        for the IQR value. If a Series, list, or numpy array of glucose values is passed, then a float is returned.
 
     Examples
     --------
@@ -44,10 +43,15 @@ def iqr_glu(data: Union[pd.DataFrame, pd.Series]) -> pd.DataFrame:
     0   70.0
     """
     # Handle Series input
-    if isinstance(data, pd.Series):
+    if isinstance(data, (pd.Series,list, np.ndarray)):
+        if isinstance(data, (np.ndarray, list)):
+            data = pd.Series(data)
+        data = data.dropna()
+        if len(data) == 0:
+            return np.nan
         # Calculate IQR for Series
-        iqr_val = np.percentile(data, 75) - np.percentile(data, 25)
-        return pd.DataFrame({"IQR": [iqr_val]})
+        iqr_val = iqr_glu_single(data)
+        return iqr_val   
 
     # Handle DataFrame input
     data = check_data_columns(data)
@@ -57,8 +61,28 @@ def iqr_glu(data: Union[pd.DataFrame, pd.Series]) -> pd.DataFrame:
     data = data.dropna()
     result = (
         data.groupby("id")
-        .agg(IQR=("gl", lambda x: np.percentile(x, 75) - np.percentile(x, 25)))
+        .agg(IQR=("gl", lambda x: iqr_glu_single(x)))
         .reset_index()
     )
 
     return result
+
+def iqr_glu_single(
+    gl: pd.Series,
+) -> float:
+    """
+    Calculate glucose level interquartile range (IQR) for a single subject.
+
+    Parameters
+    ----------
+    gl : pd.Series
+        Series of glucose values
+
+    Returns
+    """
+    gl = gl.dropna()
+    if len(gl) == 0:
+        return np.nan
+    # Calculate IQR for Series
+    iqr_val = np.percentile(gl, 75) - np.percentile(gl, 25)
+    return iqr_val 
diff --git a/iglu_python/j_index.py b/iglu_python/j_index.py
@@ -1,11 +1,12 @@
 from typing import Union
 
+import numpy as np
 import pandas as pd
 
 from .utils import check_data_columns
 
 
-def j_index(data: Union[pd.DataFrame, pd.Series]) -> pd.DataFrame:
+def j_index(data: Union[pd.DataFrame, pd.Series, np.ndarray, list]) -> pd.DataFrame|float:
     """
     Calculate J-Index score for glucose measurements.
 
@@ -15,15 +16,15 @@ def j_index(data: Union[pd.DataFrame, pd.Series]) -> pd.DataFrame:
 
     Parameters
     ----------
-    data : Union[pd.DataFrame, pd.Series]
-        DataFrame with columns 'id', 'time', and 'gl', or a Series of glucose values
+    data : Union[pd.DataFrame, pd.Series, np.ndarray, list]
+        DataFrame with columns 'id', 'time', and 'gl', or a Series of glucose values, 
+        or a numpy array or list of glucose values
 
     Returns
     -------
-    pd.DataFrame
+    pd.DataFrame|float
         DataFrame with 1 row for each subject, a column for subject id and a column
-        for J-Index value. If a Series of glucose values is passed, then a DataFrame
-        without the subject id is returned.
+        for J-Index value. If a Series, list, or numpy array of glucose values is passed, then a float is returned.
 
     References
     ----------
@@ -51,34 +52,30 @@ def j_index(data: Union[pd.DataFrame, pd.Series]) -> pd.DataFrame:
     0  1.5000
     """
     # Handle Series input
-    if isinstance(data, pd.Series):
-        # Calculate mean and standard deviation
-        mean_gl = data.mean()
-        sd_gl = data.std()
-
-        # Calculate J-index
-        j_index = 0.001 * (mean_gl + sd_gl) ** 2
-
-        return pd.DataFrame({"J_index": [j_index]})
+    if isinstance(data, (pd.Series,list, np.ndarray)):
+        if isinstance(data, (np.ndarray, list)):
+            data = pd.Series(data)
+        return j_index_single(data)
 
     # Handle DataFrame input
     data = check_data_columns(data)
 
-    # Initialize result list
-    result = []
-
-    # Process each subject
-    for subject in data["id"].unique():
-        subject_data = data[data["id"] == subject]
-
-        # Calculate mean and standard deviation
-        mean_gl = subject_data["gl"].mean()
-        sd_gl = subject_data["gl"].std()
+    out = data.groupby('id').agg(
+        J_index = ("gl", lambda x: j_index_single(x))
+    ).reset_index()
+    return out
 
-        # Calculate J-index
-        j_index = 0.001 * (mean_gl + sd_gl) ** 2
-
-        result.append({"id": subject, "J_index": j_index})
-
-    # Convert to DataFrame
-    return pd.DataFrame(result)
+def j_index_single(gl:  pd.Series) -> float:
+    """
+    Calculate J-Index score for a single subject.
+    """
+    gl = gl.dropna()
+    if len(gl) == 0:
+        return np.nan
+    # Calculate mean and standard deviation
+    mean_gl = gl.mean()
+    sd_gl = gl.std()
+
+    # Calculate J-index
+    j_index = 0.001 * (mean_gl + sd_gl) ** 2
+    return j_index
diff --git a/tests/test_igc.py b/tests/test_igc.py
@@ -106,15 +106,28 @@ def test_igc_series_input():
 
     # Calculate IGC
     result = iglu.igc(data)
+    expected = 1.453976
 
     # Check output format
-    assert isinstance(result, pd.DataFrame)
-    assert "IGC" in result.columns
-    assert "id" not in result.columns
-    assert len(result) == 1
+    assert isinstance(result, float)
+    np.testing.assert_allclose(result, expected, rtol=1e-3)
+
+def test_igc_list_input():
+    """Test IGC calculation with list input."""
+    data = [150, 200, 180, 130, 190, 160]
+    result = iglu.igc(data)
+    expected = 1.453976
+    assert isinstance(result, float)
+    np.testing.assert_allclose(result, expected, rtol=1e-3)
+
+def test_igc_numpy_array_input():
+    """Test IGC calculation with numpy array input."""
+    data = np.array([150, 200, 180, 130, 190, 160])
+    result = iglu.igc(data)
+    expected = 1.453976
+    assert isinstance(result, float)
+    np.testing.assert_allclose(result, expected, rtol=1e-3)
 
-    # Check that IGC value is non-negative
-    assert result["IGC"].iloc[0] >= 0
 
 
 def test_igc_custom_parameters():
diff --git a/tests/test_in_range_percent.py b/tests/test_in_range_percent.py
@@ -119,10 +119,35 @@ def test_in_range_percent_series_input():
     assert len(result) == 2
 
     # Check that percentages are between 0 and 100
-    assert (result["in_range_70_180"] >= 0) and (result["in_range_70_180"] <= 100)
-    assert (result["in_range_63_140"] >= 0) and (result["in_range_63_140"] <= 100)
+    np.testing.assert_allclose(result["in_range_70_180"], 83.33, rtol=1e-3)
+    np.testing.assert_allclose(result["in_range_63_140"], 66.66, rtol=1e-3)
 
+def test_in_range_percent_list_input():
+    """Test in_range_percent calculation with list input."""
+    data = [80, 90, 100, 130, 190, 160]
+    result = iglu.in_range_percent(data)
+    assert isinstance(result, dict)
+    assert "in_range_70_180" in result
+    assert "in_range_63_140" in result
+    assert len(result) == 2
+
+    # Check that percentages match the expected values
+    np.testing.assert_allclose(result["in_range_70_180"], 83.33, rtol=1e-3)
+    np.testing.assert_allclose(result["in_range_63_140"], 66.66, rtol=1e-3)
 
+def test_in_range_percent_numpy_array_input():
+    """Test in_range_percent calculation with numpy array input."""
+    data = np.array([80, 90, 100, 130, 190, 160])
+    result = iglu.in_range_percent(data)
+    assert isinstance(result, dict)
+    assert "in_range_70_180" in result
+    assert "in_range_63_140" in result
+    assert len(result) == 2
+
+    # Check that percentages match the expected values
+    np.testing.assert_allclose(result["in_range_70_180"], 83.33, rtol=1e-3)
+    np.testing.assert_allclose(result["in_range_63_140"], 66.66, rtol=1e-3)
+    
 def test_in_range_percent_custom_targets():
     """Test in_range_percent calculation with custom targets."""
     data = pd.DataFrame(
diff --git a/tests/test_iqr_glu.py b/tests/test_iqr_glu.py
@@ -111,13 +111,19 @@ def test_iqr_glu_output_format():
     # Test with Series input
     series_data = pd.Series([150, 155, 160, 165, 140, 145])
     result_series = iglu.iqr_glu(series_data)
-    assert isinstance(result_series, pd.DataFrame)
-    assert "IQR" in result_series.columns
-    assert len(result_series) == 1
-    assert (
-        result_series["IQR"].iloc[0] == 12.5
-    )  # 75th percentile (160) - 25th percentile (145)
-
+    assert isinstance(result_series, float)
+    np.testing.assert_allclose(result_series, 12.5, rtol=1e-3)
+
+    list_data = [150, 155, 160, 165, 140, 145]
+    result_list = iglu.iqr_glu(list_data)
+    assert isinstance(result_list, float)
+    np.testing.assert_allclose(result_list, 12.5, rtol=1e-3)
+
+    array_data = np.array([150, 155, 160, 165, 140, 145])
+    result_array = iglu.iqr_glu(array_data)
+    assert isinstance(result_array, float)
+    np.testing.assert_allclose(result_array, 12.5, rtol=1e-3)
+    
     # Test with empty data
     empty_data = pd.DataFrame(columns=["id", "time", "gl"])
     with pytest.raises(ValueError):
diff --git a/tests/test_j_index.py b/tests/test_j_index.py