support for Series, list and ndarray -> return float or dict

staskh · staskh · commit 9c0ddc9aaa15 · 2025-06-16T23:09:27.000+03:00
diff --git a/README.md b/README.md
@@ -44,7 +44,7 @@ Unless noted, IGLU-R test compatability is considered successful if it achieves
 | gri |Glycemia Risk Index | ✅ | ✅ returns float |
 | gvp |Glucose Variability Percentage| ✅ | ✅ only Series(DatetimeIndex) returns float
 | hbgi |High Blood Glucose Index| ✅ | ✅ returns float |
-| hyper_index |Hyperglycemia Index| ✅ |
+| hyper_index |Hyperglycemia Index| ✅ |✅ returns float |
-| hypo_index |Hypoglycemia Index| ✅ |
+| hypo_index |Hypoglycemia Index| ✅ |✅ returns float |
 | igc |Index of Glycemic Control| ✅ |
 | in_range_percent |percentage of values within target ranges| ✅ | ✅ returns dict
diff --git a/iglu_python/hyper_index.py b/iglu_python/hyper_index.py
@@ -7,8 +7,8 @@
 
 
 def hyper_index(
-    data: Union[pd.DataFrame, pd.Series], ULTR: int = 140, a: float = 1.1, c: int = 30
-) -> pd.DataFrame:
+    data: Union[pd.DataFrame, pd.Series, np.ndarray, list], ULTR: int = 140, a: float = 1.1, c: int = 30
+) -> pd.DataFrame|float:
     """
     Calculate Hyperglycemia Index.
 
@@ -19,8 +19,8 @@ def hyper_index(
 
     Parameters
     ----------
-    data : Union[pd.DataFrame, pd.Series]
-        DataFrame with columns 'id', 'time', and 'gl', or a Series of glucose values
+    data : Union[pd.DataFrame, pd.Series, np.ndarray, list]
+        DataFrame with columns 'id', 'time', and 'gl', or a Series of glucose values, or a numpy array or list of glucose values
     ULTR : int, default=140
         Upper Limit of Target Range, in mg/dL
     a : float, default=1.1
@@ -31,10 +31,10 @@ def hyper_index(
 
     Returns
     -------
-    pd.DataFrame
+    pd.DataFrame|float
         DataFrame with 1 row for each subject, a column for subject id and a column
         for the Hyperglycemia Index value. If a Series of glucose values is passed,
-        then a DataFrame without the subject id is returned.
+        then a float is returned; a list or numpy array is handled the same way.
 
     References
     ----------
@@ -62,50 +62,32 @@ def hyper_index(
     0  0.106
     """
     # Handle Series input
-    is_vector = False
-    if isinstance(data, (list, np.ndarray)):
-        data = pd.Series(data)
-    if isinstance(data, pd.Series):
-        is_vector = True
-        data = data.dropna()
-        if len(data) == 0:
-            return pd.DataFrame({"GVP": [np.nan]})
-
-        # Convert to DataFrame format for processing
-        data = pd.DataFrame(
-            {
-                "id": ["subject1"] * len(data),
-                "time": pd.date_range(
-                    start="2020-01-01", periods=len(data), freq="5min"
-                ),
-                "gl": data.values,
-            }
-        )
+    if isinstance(data, (pd.Series,list, np.ndarray)):
+        if isinstance(data, (np.ndarray, list)):
+            data = pd.Series(data)
+        return hyper_index_single(data, ULTR, a, c)
 
     # Check and prepare data
     data = check_data_columns(data)
 
     # Calculate hyper_index for each subject
-    result = []
-    for subject in data["id"].unique():
-        subject_data = data[data["id"] == subject]
-        # Remove NA values
-        subject_data = subject_data.dropna(subset=["gl"])
-
-        if len(subject_data) == 0:
-            continue
-
-        # Calculate hyper_index
-        hyper_values = subject_data[subject_data["gl"] > ULTR]["gl"] - ULTR
-        hyper_index = np.sum(hyper_values**a) / (len(subject_data) * c)
-
-        result.append({"id": subject, "hyper_index": hyper_index})
-
-    # Convert to DataFrame
-    out = pd.DataFrame(result)
-
-    # Remove id column if input was a Series
-    if is_vector and not out.empty:
-        out = out.drop("id", axis=1)
+    out = data.groupby('id').agg(
+        hyper_index = ("gl", lambda x: hyper_index_single(x, ULTR, a, c))
+    ).reset_index()
 
     return out
+
+def hyper_index_single(
+    gl: pd.Series, ULTR: int = 140, a: float = 1.1, c: int = 30
+) -> float:
+    """
+    Calculate Hyperglycemia Index for a single subject.
+    """
+    gl = gl.dropna()
+    if len(gl) == 0:
+        return np.nan
+    # Calculate hyper_index
+    hyper_values = gl[gl > ULTR] - ULTR
+    hyper_index = np.sum(hyper_values**a) / (len(gl) * c)
+
+    return hyper_index   
diff --git a/iglu_python/hypo_index.py b/iglu_python/hypo_index.py
@@ -7,8 +7,8 @@
 
 
 def hypo_index(
-    data: Union[pd.DataFrame, pd.Series], LLTR: int = 80, b: float = 2, d: int = 30
-) -> pd.DataFrame:
+    data: Union[pd.DataFrame, pd.Series, np.ndarray, list], LLTR: int = 80, b: float = 2, d: int = 30
+) -> pd.DataFrame|float:
     """
     Calculate Hypoglycemia Index.
 
@@ -19,8 +19,9 @@ def hypo_index(
 
     Parameters
     ----------
-    data : Union[pd.DataFrame, pd.Series]
-        DataFrame with columns 'id', 'time', and 'gl', or a Series of glucose values
+    data : Union[pd.DataFrame, pd.Series, np.ndarray, list]
+        DataFrame with columns 'id', 'time', and 'gl', or a Series of glucose values, 
+        or a numpy array or list of glucose values
     LLTR : int, default=80
         Lower Limit of Target Range, in mg/dL
     b : float, default=2
@@ -31,10 +32,10 @@ def hypo_index(
 
     Returns
     -------
-    pd.DataFrame
+    pd.DataFrame|float
         DataFrame with 1 row for each subject, a column for subject id and a column
         for the Hypoglycemia Index value. If a Series of glucose values is passed,
-        then a DataFrame without the subject id is returned.
+        then a float is returned; a list or numpy array is handled the same way.
 
     References
     ----------
@@ -62,50 +63,27 @@ def hypo_index(
     0  0.106
     """
     # Handle Series input
-    is_vector = False
-    if isinstance(data, (list, np.ndarray)):
-        data = pd.Series(data)
-    if isinstance(data, pd.Series):
-        is_vector = True
-        data = data.dropna()
-        if len(data) == 0:
-            return pd.DataFrame({"GVP": [np.nan]})
-
-        # Convert to DataFrame format for processing
-        data = pd.DataFrame(
-            {
-                "id": ["subject1"] * len(data),
-                "time": pd.date_range(
-                    start="2020-01-01", periods=len(data), freq="5min"
-                ),
-                "gl": data.values,
-            }
-        )
-
-    # Check and prepare data
+    if isinstance(data, (pd.Series,list, np.ndarray)):
+        if isinstance(data, (np.ndarray, list)):
+            data = pd.Series(data)
+        return hypo_index_single(data, LLTR, b, d)
+    
     data = check_data_columns(data)
-
-    # Calculate hypo_index for each subject
-    result = []
-    for subject in data["id"].unique():
-        subject_data = data[data["id"] == subject]
-        # Remove NA values
-        subject_data = subject_data.dropna(subset=["gl"])
-
-        if len(subject_data) == 0:
-            continue
-
-        # Calculate hypo_index
-        hypo_values = LLTR - subject_data[subject_data["gl"] < LLTR]["gl"]
-        hypo_index = np.sum(hypo_values**b) / (len(subject_data) * d)
-
-        result.append({"id": subject, "hypo_index": hypo_index})
-
-    # Convert to DataFrame
-    out = pd.DataFrame(result)
-
-    # Remove id column if input was a Series
-    if is_vector and not out.empty:
-        out = out.drop("id", axis=1)
-
+    out = data.groupby('id').agg(
+        hypo_index = ("gl", lambda x: hypo_index_single(x, LLTR, b, d))
+    ).reset_index()
     return out
+
+def hypo_index_single(
+    gl: pd.Series, LLTR: int = 80, b: float = 2, d: int = 30
+) -> float:
+    """
+    Calculate Hypoglycemia Index for a single subject.
+    """
+    gl = gl.dropna()
+    if len(gl) == 0:
+        return np.nan
+    # Calculate hypo_index
+    hypo_values = LLTR - gl[gl < LLTR]
+    hypo_index = np.sum(hypo_values**b) / (len(gl) * d)
+    return hypo_index
diff --git a/tests/test_hyper_index.py b/tests/test_hyper_index.py
@@ -101,6 +101,29 @@ def test_hyper_index_basic():
     subject2_index = result[result["id"] == "subject2"]["hyper_index"].iloc[0]
     assert subject1_index > subject2_index
 
+def test_hyper_index_list_input():
+
+    # Create test data as a list
+    data = [150, 200, 180, 130, 190, 160]
+
+    # Calculate hyper_index
+    result = iglu.hyper_index(data)
+    expected = 1.453976 
+    # Check output format
+    assert isinstance(result, float)
+    np.testing.assert_allclose(result, expected, rtol=1e-3)
+
+def test_hyper_index_numpy_array_input():
+
+    # Create test data as a numpy array
+    data = np.array([150, 200, 180, 130, 190, 160])
+
+    # Calculate hyper_index
+    result = iglu.hyper_index(data)
+    expected = 1.453976 
+    # Check output format
+    assert isinstance(result, float)
+    np.testing.assert_allclose(result, expected, rtol=1e-3)
 
 def test_hyper_index_series_input():
     """Test hyper_index calculation with Series input."""
@@ -109,15 +132,11 @@ def test_hyper_index_series_input():
 
     # Calculate hyper_index
     result = iglu.hyper_index(data)
-
+    expected = 1.453976 
     # Check output format
-    assert isinstance(result, pd.DataFrame)
-    assert "hyper_index" in result.columns
-    assert "id" not in result.columns
-    assert len(result) == 1
+    assert isinstance(result, float)
+    np.testing.assert_allclose(result, expected, rtol=1e-3)
 
-    # Check that hyper_index value is non-negative
-    assert result["hyper_index"].iloc[0] >= 0
 
 
 def test_hyper_index_custom_parameters():
diff --git a/tests/test_hypo_index.py b/tests/test_hypo_index.py
@@ -110,15 +110,27 @@ def test_hypo_index_series_input():
 
     # Calculate hypo_index
     result = iglu.hypo_index(data)
+    expected = 7.638889
 
     # Check output format
-    assert isinstance(result, pd.DataFrame)
-    assert "hypo_index" in result.columns
-    assert "id" not in result.columns
-    assert len(result) == 1
+    assert isinstance(result, float)
+    np.testing.assert_allclose(result, expected, rtol=1e-3)
 
-    # Check that hypo_index value is non-negative
-    assert result["hypo_index"].iloc[0] >= 0
+def test_hypo_index_list_input():
+    """Test hypo_index calculation with list input."""
+    data = [70, 60, 75, 65, 85, 55]
+    result = iglu.hypo_index(data)
+    expected = 7.638889
+    assert isinstance(result, float)
+    np.testing.assert_allclose(result, expected, rtol=1e-3)
+
+def test_hypo_index_numpy_array_input():
+    """Test hypo_index calculation with numpy array input."""
+    data = np.array([70, 60, 75, 65, 85, 55])
+    result = iglu.hypo_index(data)
+    expected = 7.638889
+    assert isinstance(result, float)
+    np.testing.assert_allclose(result, expected, rtol=1e-3)
 
 
 def test_hypo_index_custom_parameters():