Spaces:

GlucoseDao
/

glucosedao

Sleeping

App Files Community

Livia_Zaharia committed on Oct 29, 2024

Commit

64e42c0

1 Parent(s): 7935ff0

it works locally and with user input of preprocessed csv

Browse files

Files changed (12) hide show

__pycache__/plot_predictions.cpython-311.pyc +0 -0
__pycache__/routes.cpython-311.pyc +0 -0
__pycache__/tools.cpython-311.pyc +0 -0
app.py +3 -3
data_formatter/__pycache__/base.cpython-311.pyc +0 -0
data_formatter/base.py +2 -0
environment.yaml +8 -2
gluformer/__pycache__/model.cpython-311.pyc +0 -0
requirements.txt +5 -1
tools.py +70 -59
utils/__pycache__/darts_processing.cpython-311.pyc +0 -0
utils/darts_processing.py +0 -1

__pycache__/plot_predictions.cpython-311.pyc DELETED Viewed

Binary file (9.5 kB)

__pycache__/routes.cpython-311.pyc DELETED Viewed

Binary file (2.33 kB)

__pycache__/tools.cpython-311.pyc DELETED Viewed

Binary file (13.3 kB)

app.py CHANGED Viewed

@@ -2,7 +2,7 @@ import gradio as gr
 from tools import *
-def gradio_output():
-    return (predict_glucose_tool())
-gr.Interface(fn=gradio_output,inputs=None,outputs="image").launch()

 from tools import *
+def gradio_output(file):
+    return (predict_glucose_tool(file))
+gr.Interface(fn=gradio_output,inputs=gr.File(label="Upload CSV File"),outputs="plot").launch()

data_formatter/__pycache__/base.cpython-311.pyc DELETED Viewed

Binary file (16.4 kB)

data_formatter/base.py CHANGED Viewed

@@ -7,6 +7,7 @@ import sklearn.preprocessing
 import data_formatter.types as types
 import data_formatter.utils as utils
 DataTypes = types.DataTypes
 InputTypes = types.InputTypes
@@ -44,6 +45,7 @@ class DataFormatter:
     print('Loading data...')
     self.params['index_col'] = False if self.params['index_col'] == -1 else self.params['index_col']
     # read data table
     self.data = pd.read_csv(self.params['data_csv_path'], index_col=self.params['index_col'])
     # drop columns / rows

 import data_formatter.types as types
 import data_formatter.utils as utils
 DataTypes = types.DataTypes
 InputTypes = types.InputTypes
     print('Loading data...')
     self.params['index_col'] = False if self.params['index_col'] == -1 else self.params['index_col']
     # read data table
     self.data = pd.read_csv(self.params['data_csv_path'], index_col=self.params['index_col'])
     # drop columns / rows

environment.yaml CHANGED Viewed

@@ -1,11 +1,10 @@
-name: glucose_genie
 channels:
   - conda-forge
   - defaults
 dependencies:
   - python=3.11
   - gradio
-  - seaborn
   - pytorch
   - optuna
   - tensorboard
@@ -17,3 +16,10 @@ dependencies:
     - pmdarima==2.0.4
     - numpy==1.26.4
     - peft

+name: glucose_hf
 channels:
   - conda-forge
   - defaults
 dependencies:
   - python=3.11
   - gradio
   - pytorch
   - optuna
   - tensorboard
     - pmdarima==2.0.4
     - numpy==1.26.4
     - peft
+    - transformers
+    - datasets
+    - python-multipart
+    - plotly
+    - kaleido

gluformer/__pycache__/model.cpython-311.pyc DELETED Viewed

Binary file (15.9 kB)

requirements.txt CHANGED Viewed

@@ -1,5 +1,4 @@
 gradio
-seaborn
 torch
 optuna
 numpy==1.26.4
@@ -10,3 +9,8 @@ typer
 darts==0.29.0
 pmdarima==2.0.4
 peft

 gradio
 torch
 optuna
 numpy==1.26.4
 darts==0.29.0
 pmdarima==2.0.4
 peft
+transformers
+datasets
+python-multipart
+plotly
+kaleido

tools.py CHANGED Viewed

@@ -3,25 +3,16 @@ import os
 import pickle
 import gzip
 from pathlib import Path
-import seaborn as sns
 import numpy as np
-import matplotlib.pyplot as plt
-import matplotlib.colors as mcolors
-from matplotlib.figure import Figure
 import torch
 from scipy import stats
 from gluformer.model import Gluformer
 from utils.darts_processing import *
 from utils.darts_dataset import *
 import hashlib
 from urllib.parse import urlparse
-import numpy as np
-import typer
 glucose = Path(os.path.abspath(__file__)).parent.resolve()
@@ -29,7 +20,7 @@ file_directory = glucose / "files"
 def plot_forecast(forecasts: np.ndarray, scalers: Any, dataset_test_glufo: Any, filename: str):
-    filename=filename
     forecasts = (forecasts - scalers['target'].min_) / scalers['target'].scale_
     trues = [dataset_test_glufo.evalsample(i) for i in range(len(dataset_test_glufo))]
@@ -41,25 +32,18 @@ def plot_forecast(forecasts: np.ndarray, scalers: Any, dataset_test_glufo: Any,
     inputs = [dataset_test_glufo[i][0] for i in range(len(dataset_test_glufo))]
     inputs = (np.array(inputs) - scalers['target'].min_) / scalers['target'].scale_
-    # Plot settings
-    colors = ['#00264c', '#0a2c62', '#14437f', '#1f5a9d', '#2973bb', '#358ad9', '#4d9af4', '#7bb7ff', '#add5ff', '#e6f3ff']
-    cmap = mcolors.LinearSegmentedColormap.from_list('my_colormap', colors)
-    sns.set_theme(style="whitegrid")
-    # Generate the plot
-    fig, ax = plt.subplots(figsize=(10, 6))
     # Select a specific sample to plot
-    ind = 30  # Example index
     samples = np.random.normal(
         loc=forecasts[ind, :],  # Mean (center) of the distribution
         scale=0.1,  # Standard deviation (spread) of the distribution
         size=(forecasts.shape[1], forecasts.shape[2])
     )
-    #samples = samples.reshape(samples.shape[0], samples.shape[1], -1)
-    #print ("samples",samples.shape)
     # Plot predictive distribution
     for point in range(samples.shape[0]):
@@ -67,38 +51,64 @@ def plot_forecast(forecasts: np.ndarray, scalers: Any, dataset_test_glufo: Any,
         maxi, mini = 1.2 * np.max(samples[point, :]), 0.8 * np.min(samples[point, :])
         y_grid = np.linspace(mini, maxi, 200)
         x = kde(y_grid)
-        ax.fill_betweenx(y_grid, x1=point, x2=point - x * 15,
-                         alpha=0.7,
-                         edgecolor='black',
-                         color=cmap(point / samples.shape[0]))
     # Plot median
     forecast = samples[:, :]
     median = np.quantile(forecast, 0.5, axis=-1)
-    ax.plot(np.arange(12), median, color='red', marker='o')
-    # Plot true values
-    ax.plot(np.arange(-12, 12), np.concatenate([inputs[ind, -12:], trues[ind, :]]), color='blue')
-    # Add labels and title
-    ax.set_xlabel('Time (in 5 minute intervals)')
-    ax.set_ylabel('Glucose (mg/dL)')
-    ax.set_title(f'Gluformer Prediction with Gradient for dateset')
-    # Adjust font sizes
-    ax.xaxis.label.set_fontsize(16)
-    ax.yaxis.label.set_fontsize(16)
-    ax.title.set_fontsize(18)
-    for item in ax.get_xticklabels() + ax.get_yticklabels():
-        item.set_fontsize(14)
     # Save figure
-    plt.tight_layout()
-    where = file_directory /filename
-    plt.savefig(str(where), dpi=300, bbox_inches='tight')
-    return where,ax
 def generate_filename_from_url(url: str, extension: str = "png") -> str:
@@ -120,18 +130,21 @@ def generate_filename_from_url(url: str, extension: str = "png") -> str:
-def predict_glucose_tool(url: str= 'https://huggingface.co/datasets/Livia-Zaharia/glucose_processed/blob/main/livia_mini.csv',
-                        model: str = 'https://huggingface.co/Livia-Zaharia/gluformer_models/blob/main/gluformer_1samples_10000epochs_10heads_32batch_geluactivation_livia_mini_weights.pth'
-                    ) -> Figure:
     """
     Function to predict future glucose of user. It receives URL with users csv. It will run an ML and will return URL with predictions that user can open on her own..
-    :param url: of the csv file with glucose values
-    :param model: model that is used to predict the glucose
     :param explain if it should give both url and explanation
     :param if the person is diabetic when doing prediction and explanation
     :return:
     """
     formatter, series, scalers = load_data(url=str(url), config_path=file_directory / "config.yaml", use_covs=True,
                                            cov_type='dual',
                                            use_static_covs=True)
@@ -141,7 +154,7 @@ def predict_glucose_tool(url: str= 'https://huggingface.co/datasets/Livia-Zahari
     formatter.params['gluformer'] = {
         'in_len': 96,  # example input length, adjust as necessary
         'd_model': 512,  # model dimension
-        'n_heads': 10,  # number of attention heads##############################################################################
         'd_fcn': 1024,  # fully connected layer dimension
         'num_enc_layers': 2,  # number of encoder layers
         'num_dec_layers': 2,  # number of decoder layers
@@ -166,11 +179,9 @@ def predict_glucose_tool(url: str= 'https://huggingface.co/datasets/Livia-Zahari
         num_dynamic_features=num_dynamic_features,
         num_static_features=num_static_features
     )
-    weights = gr.Interface.load(model)
-    assert f"weights for {model} should exist", weights.exists()
     device = "cuda" if torch.cuda.is_available() else "cpu"
-    glufo.load_state_dict(torch.load(str(weights), map_location=torch.device(device), weights_only=False))
     # Define dataset for inference
     dataset_test_glufo = SamplingDatasetInferenceDual(
@@ -184,9 +195,9 @@ def predict_glucose_tool(url: str= 'https://huggingface.co/datasets/Livia-Zahari
     forecasts, _ = glufo.predict(
         dataset_test_glufo,
-        batch_size=16,####################################################
         num_samples=10,
-        device='cpu'
     )
     figure_path, result = plot_forecast(forecasts, scalers, dataset_test_glufo,filename)

 import pickle
 import gzip
 from pathlib import Path
 import numpy as np
 import torch
 from scipy import stats
 from gluformer.model import Gluformer
 from utils.darts_processing import *
 from utils.darts_dataset import *
 import hashlib
 from urllib.parse import urlparse
+from huggingface_hub import hf_hub_download
+import plotly.graph_objects as go
 glucose = Path(os.path.abspath(__file__)).parent.resolve()
 def plot_forecast(forecasts: np.ndarray, scalers: Any, dataset_test_glufo: Any, filename: str):
     forecasts = (forecasts - scalers['target'].min_) / scalers['target'].scale_
     trues = [dataset_test_glufo.evalsample(i) for i in range(len(dataset_test_glufo))]
     inputs = [dataset_test_glufo[i][0] for i in range(len(dataset_test_glufo))]
     inputs = (np.array(inputs) - scalers['target'].min_) / scalers['target'].scale_
     # Select a specific sample to plot
+    ind = 10  # Example index
     samples = np.random.normal(
         loc=forecasts[ind, :],  # Mean (center) of the distribution
         scale=0.1,  # Standard deviation (spread) of the distribution
         size=(forecasts.shape[1], forecasts.shape[2])
     )
+    # Create figure
+    fig = go.Figure()
     # Plot predictive distribution
     for point in range(samples.shape[0]):
         maxi, mini = 1.2 * np.max(samples[point, :]), 0.8 * np.min(samples[point, :])
         y_grid = np.linspace(mini, maxi, 200)
         x = kde(y_grid)
+        # Create gradient color
+        color = f'rgba(53, 138, 217, {(point + 1) / samples.shape[0]})'
+        # Add filled area
+        fig.add_trace(go.Scatter(
+            x=np.concatenate([np.full_like(y_grid, point), np.full_like(y_grid, point - x * 15)[::-1]]),
+            y=np.concatenate([y_grid, y_grid[::-1]]),
+            fill='tonexty',
+            fillcolor=color,
+            line=dict(color='rgba(0,0,0,0)'),
+            showlegend=False
+        ))
+    true_values = np.concatenate([inputs[ind, -12:], trues[ind, :]])
+    true_values_flat=true_values.flatten()
+    fig.add_trace(go.Scatter(
+        x=list(range(-12, 12)),
+        y=true_values_flat.tolist(),  # Convert to list explicitly
+        mode='lines+markers',
+        line=dict(color='blue', width=2),
+        marker=dict(size=6),
+        name='True Values'
+    ))
     # Plot median
     forecast = samples[:, :]
     median = np.quantile(forecast, 0.5, axis=-1)
+    fig.add_trace(go.Scatter(
+        x=list(range(12)),
+        y=median.tolist(),  # Convert to list explicitly
+        mode='lines+markers',
+        line=dict(color='red', width=2),
+        marker=dict(size=8),
+        name='Median Forecast'
+    ))
+    # Update layout
+    fig.update_layout(
+        title='Gluformer Prediction with Gradient for dataset',
+        xaxis_title='Time (in 5 minute intervals)',
+        yaxis_title='Glucose (mg/dL)',
+        font=dict(size=14),
+        showlegend=True,
+        width=1000,
+        height=600
+    )
     # Save figure
+    where = file_directory / filename
+    fig.write_html(str(where.with_suffix('.html')))
+    fig.write_image(str(where))
+    return where, fig
 def generate_filename_from_url(url: str, extension: str = "png") -> str:
+def predict_glucose_tool(file) -> go.Figure:
     """
     Function to predict future glucose of user. It receives URL with users csv. It will run an ML and will return URL with predictions that user can open on her own..
+    :param file: it is the csv file imported as a string path to the temporary location gradio allows
+    :param model: model that is used to predict the glucose- was hardcoded
     :param explain if it should give both url and explanation
     :param if the person is diabetic when doing prediction and explanation
     :return:
     """
+    url = file
+    model="Livia-Zaharia/gluformer_models"
+    model_path = hf_hub_download(repo_id= model, filename="gluformer_1samples_10000epochs_10heads_32batch_geluactivation_livia_mini_weights.pth")
     formatter, series, scalers = load_data(url=str(url), config_path=file_directory / "config.yaml", use_covs=True,
                                            cov_type='dual',
                                            use_static_covs=True)
     formatter.params['gluformer'] = {
         'in_len': 96,  # example input length, adjust as necessary
         'd_model': 512,  # model dimension
+        'n_heads': 10,  # number of attention heads########################
         'd_fcn': 1024,  # fully connected layer dimension
         'num_enc_layers': 2,  # number of encoder layers
         'num_dec_layers': 2,  # number of decoder layers
         num_dynamic_features=num_dynamic_features,
         num_static_features=num_static_features
     )
     device = "cuda" if torch.cuda.is_available() else "cpu"
+    glufo.load_state_dict(torch.load(str(model_path), map_location=torch.device(device), weights_only=True))
     # Define dataset for inference
     dataset_test_glufo = SamplingDatasetInferenceDual(
     forecasts, _ = glufo.predict(
         dataset_test_glufo,
+        batch_size=16,#######
         num_samples=10,
+        device=device
     )
     figure_path, result = plot_forecast(forecasts, scalers, dataset_test_glufo,filename)

utils/__pycache__/darts_processing.cpython-311.pyc DELETED Viewed

Binary file (17.2 kB)

utils/darts_processing.py CHANGED Viewed

@@ -165,7 +165,6 @@ def load_data(url: str,
     config["data_csv_path"] = url
     formatter = DataFormatter(config)
-    #assert dataset is not None, 'dataset must be specified in the load_data call'
     assert use_covs is not None, 'use_covs must be specified in the load_data call'
     # convert to series

     config["data_csv_path"] = url
     formatter = DataFormatter(config)
     assert use_covs is not None, 'use_covs must be specified in the load_data call'
     # convert to series