Update app.py
app.py CHANGED
@@ -1,3 +1,4 @@
+
# # %%writefile app.py

# import streamlit as st
@@ -11,8 +12,15 @@
# import random
# from collections import OrderedDict
# import flwr as fl
+# from logging import INFO, DEBUG
+# from flwr.common.logger import log
+# import logging
+# import streamlit
+
+# # If you're curious of all the loggers

-# DEVICE = torch.device("cpu")
+# DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+# fl.common.logger.configure(identifier="myFlowerExperiment", filename="./log.txt")

# def load_data(dataset_name, train_size=20, test_size=20, num_clients=2):
# raw_datasets = load_dataset(dataset_name)
@@ -39,10 +47,8 @@

# data_collator = DataCollatorWithPadding(tokenizer=tokenizer)

-# return train_datasets, test_datasets, data_collator
-
-# with open("./log.txt", "r") as file:
-# return file.read()
+# return train_datasets, test_datasets, data_collator, raw_datasets
+
# def train(net, trainloader, epochs):
# optimizer = AdamW(net.parameters(), lr=5e-5)
# net.train()
@@ -55,6 +61,38 @@
# optimizer.step()
# optimizer.zero_grad()

+
+
+
+# # class SaveModelStrategy(fl.server.strategy.FedAvg):
+# # def aggregate_fit(
+# # self,
+# # server_round: int,
+# # results: List[Tuple[fl.server.client_proxy.ClientProxy, fl.common.FitRes]],
+# # failures: List[Union[Tuple[ClientProxy, FitRes], BaseException]],
+# # ) -> Tuple[Optional[Parameters], Dict[str, Scalar]]:
+# # """Aggregate model weights using weighted average and store checkpoint"""
+
+# # # Call aggregate_fit from base class (FedAvg) to aggregate parameters and metrics
+# # aggregated_parameters, aggregated_metrics = super().aggregate_fit(server_round, results, failures)
+
+# # if aggregated_parameters is not None:
+# # print(f"Saving round {server_round} aggregated_parameters...")
+
+# # # Convert `Parameters` to `List[np.ndarray]`
+# # aggregated_ndarrays: List[np.ndarray] = fl.common.parameters_to_ndarrays(aggregated_parameters)
+
+# # # Convert `List[np.ndarray]` to PyTorch`state_dict`
+# # params_dict = zip(net.state_dict().keys(), aggregated_ndarrays)
+# # state_dict = OrderedDict({k: torch.tensor(v) for k, v in params_dict})
+# # net.load_state_dict(state_dict, strict=True)
+
+# # # Save the model
+# # torch.save(net.state_dict(), f"model_round_{server_round}.pth")
+
+# # return aggregated_parameters, aggregated_metrics
+
+
# def test(net, testloader):
# metric = load_metric("accuracy")
# net.eval()
@@ -89,17 +127,21 @@
# self.net.load_state_dict(state_dict, strict=True)

# def fit(self, parameters, config):
+# log(INFO, f"Client {self.client_id} is starting fit()")
# self.set_parameters(parameters)
# train(self.net, self.trainloader, epochs=1)
# loss, accuracy = test(self.net, self.testloader)
# self.losses.append(loss)
# self.accuracies.append(accuracy)
-#
+# log(INFO, f"Client {self.client_id} finished fit() with loss: {loss:.4f} and accuracy: {accuracy:.4f}")
+# return self.get_parameters(config={}), len(self.trainloader.dataset), {"loss": loss, "accuracy": accuracy}

# def evaluate(self, parameters, config):
+# log(INFO, f"Client {self.client_id} is starting evaluate()")
# self.set_parameters(parameters)
# loss, accuracy = test(self.net, self.testloader)
-#
+# log(INFO, f"Client {self.client_id} finished evaluate() with loss: {loss:.4f} and accuracy: {accuracy:.4f}")
+# return float(loss), len(self.testloader.dataset), {"accuracy": float(accuracy), "loss": float(loss)}

# def plot_metrics(self, round_num, plot_placeholder):
# if self.losses and self.accuracies:
@@ -123,16 +165,107 @@

# fig.tight_layout()
# plot_placeholder.pyplot(fig)
+# import matplotlib.pyplot as plt
+# import re
+
+# def read_log_file(log_path='./log.txt'):
+# with open(log_path, 'r') as file:
+# log_lines = file.readlines()
+# return log_lines

+# def parse_log(log_lines):
+# rounds = []
+# clients = {}
+# memory_usage = []
+
+# round_pattern = re.compile(r'ROUND(\d+)ROUND (\d+)')
+# client_pattern = re.compile(r'Client (\d+) \| (INFO|DEBUG) \| (.*)')
+# memory_pattern = re.compile(r'memory used=(\d+\.\d+)GB')
+
+# current_round = None
+
+# for line in log_lines:
+# round_match = round_pattern.search(line)
+# client_match = client_pattern.search(line)
+# memory_match = memory_pattern.search(line)
+
+# if round_match:
+# current_round = int(round_match.group(1))
+# rounds.append(current_round)
+# elif client_match:
+# client_id = int(client_match.group(1))
+# log_level = client_match.group(2)
+# message = client_match.group(3)
+
+# if client_id not in clients:
+# clients[client_id] = {'rounds': [], 'messages': []}
+
+# clients[client_id]['rounds'].append(current_round)
+# clients[client_id]['messages'].append((log_level, message))
+# elif memory_match:
+# memory_usage.append(float(memory_match.group(1)))
+
+# return rounds, clients, memory_usage
+
+# def plot_metrics(rounds, clients, memory_usage):
+# st.write("## Metrics Overview")
+
+# st.write("### Memory Usage")
+# plt.figure()
+# plt.plot(range(len(memory_usage)), memory_usage, label='Memory Usage (GB)')
+# plt.xlabel('Step')
+# plt.ylabel('Memory Usage (GB)')
+# plt.legend()
+# st.pyplot(plt)
+
+# for client_id, data in clients.items():
+# st.write(f"### Client {client_id} Metrics")
+
+# info_messages = [msg for level, msg in data['messages'] if level == 'INFO']
+# debug_messages = [msg for level, msg in data['messages'] if level == 'DEBUG']
+
+# st.write("#### INFO Messages")
+# for msg in info_messages:
+# st.write(msg)
+
+# st.write("#### DEBUG Messages")
+# for msg in debug_messages:
+# st.write(msg)
+
+# # Placeholder for actual loss and accuracy values, assuming they're included in the messages
+# losses = [float(re.search(r'loss=([\d\.]+)', msg).group(1)) for msg in debug_messages if 'loss=' in msg]
+# accuracies = [float(re.search(r'accuracy=([\d\.]+)', msg).group(1)) for msg in debug_messages if 'accuracy=' in msg]
+
+# if losses:
+# plt.figure()
+# plt.plot(data['rounds'], losses, label='Loss')
+# plt.xlabel('Round')
+# plt.ylabel('Loss')
+# plt.legend()
+# st.pyplot(plt)
+
+# if accuracies:
+# plt.figure()
+# plt.plot(data['rounds'], accuracies, label='Accuracy')
+# plt.xlabel('Round')
+# plt.ylabel('Accuracy')
+# plt.legend()
+# st.pyplot(plt)
+
+
+# def read_log_file2():
+# with open("./log.txt", "r") as file:
+# return file.read()
# def main():
+
# st.write("## Federated Learning with Dynamic Models and Datasets for Mobile Devices")
# dataset_name = st.selectbox("Dataset", ["imdb", "amazon_polarity", "ag_news"])
-# model_name = st.selectbox("Model", ["bert-base-uncased","facebook/hubert-base-ls960", "distilbert-base-uncased"])
+# model_name = st.selectbox("Model", ["bert-base-uncased", "facebook/hubert-base-ls960", "distilbert-base-uncased"])

# NUM_CLIENTS = st.slider("Number of Clients", min_value=1, max_value=10, value=2)
# NUM_ROUNDS = st.slider("Number of Rounds", min_value=1, max_value=10, value=3)

-# train_datasets, test_datasets, data_collator = load_data(dataset_name, num_clients=NUM_CLIENTS)
+# train_datasets, test_datasets, data_collator, raw_datasets = load_data(dataset_name, num_clients=NUM_CLIENTS)

# trainloaders = []
# testloaders = []
@@ -144,9 +277,14 @@
# train_df = pd.DataFrame(train_datasets[i])
# test_df = pd.DataFrame(test_datasets[i])

-# st.write("#### Train Dataset")
+# st.write("#### Train Dataset (Words)")
+# st.dataframe(raw_datasets["train"].select(random.sample(range(len(raw_datasets["train"])), 20)))
+# st.write("#### Train Dataset (Tokens)")
# edited_train_df = st.data_editor(train_df, key=f"train_{i}")
-
+
+# st.write("#### Test Dataset (Words)")
+# st.dataframe(raw_datasets["test"].select(random.sample(range(len(raw_datasets["test"])), 20)))
+# st.write("#### Test Dataset (Tokens)")
# edited_test_df = st.data_editor(test_df, key=f"test_{i}")

# edited_train_dataset = Dataset.from_pandas(edited_train_df)
@@ -179,21 +317,73 @@
# )

# for round_num in range(NUM_ROUNDS):
-# st.write(f"### Round {round_num + 1}")
-
-#
+# st.write(f"### Round {round_num + 1} ✅")
+
+# st.markdown(print(st.logger._loggers))
+# st.markdown(read_log_file2())
+# logs = read_log_file2()
+# import re
+# import plotly.graph_objects as go
+# import streamlit as st
+# import pandas as pd
+
+# # Log data
+# log_data = logs
+
+# # Extract relevant data
+# accuracy_pattern = re.compile(r"'accuracy': \((\d+),([\d.]+)\)\((\d+), ([\d.]+)\)")
+# loss_pattern = re.compile(r"'loss': \((\d+),([\d.]+)\)\((\d+), ([\d.]+)\)")
+
+# accuracy_matches = accuracy_pattern.findall(log_data)
+# loss_matches = loss_pattern.findall(log_data)
+
+# rounds = [int(match[0]) for match in accuracy_matches]
+# accuracies = [float(match[1]) for match in accuracy_matches]
+# losses = [float(match[1]) for match in loss_matches]

+# # Create accuracy plot
+# accuracy_fig = go.Figure()
+# accuracy_fig.add_trace(go.Scatter(x=rounds, y=accuracies, mode='lines+markers', name='Accuracy'))
+# accuracy_fig.update_layout(title='Accuracy over Rounds', xaxis_title='Round', yaxis_title='Accuracy')
+
+# # Create loss plot
+# loss_fig = go.Figure()
+# loss_fig.add_trace(go.Scatter(x=rounds, y=losses, mode='lines+markers', name='Loss'))
+# loss_fig.update_layout(title='Loss over Rounds', xaxis_title='Round', yaxis_title='Loss')
+
+# # Display plots in Streamlit
+# st.plotly_chart(accuracy_fig)
+# st.plotly_chart(loss_fig)
+
+# # Display data table
+# data = {
+# 'Round': rounds,
+# 'Accuracy': accuracies,
+# 'Loss': losses
+# }
+
+# df = pd.DataFrame(data)
+# st.write("## Training Metrics")
+# st.table(df)
+
+
+
+
+
+
+
+# plot_placeholders = [st.empty() for _ in range(NUM_CLIENTS)]
+
# fl.simulation.start_simulation(
# client_fn=client_fn,
# num_clients=NUM_CLIENTS,
# config=fl.server.ServerConfig(num_rounds=1),
# strategy=strategy,
-# client_resources={"num_cpus": 1, "num_gpus": 0},
-# ray_init_args={"log_to_driver":
+# client_resources={"num_cpus": 1, "num_gpus": (1 if torch.cuda.is_available() else 0)},
+# ray_init_args={"log_to_driver": True, "num_cpus": 1, "num_gpus": (1 if torch.cuda.is_available() else 0)}
# )

# for i, client in enumerate(clients):
-# st.markdown("LOGS : "+ read_log_file())
# client.plot_metrics(round_num + 1, plot_placeholders[i])
# st.write(" ")

@@ -203,18 +393,36 @@
# st.write("## Final Client Metrics")
# for client in clients:
# st.write(f"### Client {client.client_id}")
-#
-#
-#
+# if client.losses and client.accuracies:
+# st.write(f"Final Loss: {client.losses[-1]:.4f}")
+# st.write(f"Final Accuracy: {client.accuracies[-1]:.4f}")
+# client.plot_metrics(NUM_ROUNDS, st.empty())
+# else:
+# st.write("No metrics available.")
+
# st.write(" ")

+# # Display log.txt content
+# st.write("## Training Log")
+# # st.text(read_log_file())
+# st.write("## Training Log Analysis")
+
+# log_lines = read_log_file()
+# rounds, clients, memory_usage = parse_log(log_lines)
+
+# plot_metrics(rounds, clients, memory_usage)
+
# else:
# st.write("Click the 'Start Training' button to start the training process.")

# if __name__ == "__main__":
# main()

-
+
+
+
+
+##############NEW

import streamlit as st
import matplotlib.pyplot as plt
@@ -230,7 +438,8 @@ import flwr as fl
from logging import INFO, DEBUG
from flwr.common.logger import log
import logging
-import
+import re
+import plotly.graph_objects as go

# If you're curious of all the loggers

@@ -276,38 +485,6 @@ def train(net, trainloader, epochs):
optimizer.step()
optimizer.zero_grad()

-
-
-
-# class SaveModelStrategy(fl.server.strategy.FedAvg):
-# def aggregate_fit(
-# self,
-# server_round: int,
-# results: List[Tuple[fl.server.client_proxy.ClientProxy, fl.common.FitRes]],
-# failures: List[Union[Tuple[ClientProxy, FitRes], BaseException]],
-# ) -> Tuple[Optional[Parameters], Dict[str, Scalar]]:
-# """Aggregate model weights using weighted average and store checkpoint"""
-
-# # Call aggregate_fit from base class (FedAvg) to aggregate parameters and metrics
-# aggregated_parameters, aggregated_metrics = super().aggregate_fit(server_round, results, failures)
-
-# if aggregated_parameters is not None:
-# print(f"Saving round {server_round} aggregated_parameters...")
-
-# # Convert `Parameters` to `List[np.ndarray]`
-# aggregated_ndarrays: List[np.ndarray] = fl.common.parameters_to_ndarrays(aggregated_parameters)
-
-# # Convert `List[np.ndarray]` to PyTorch`state_dict`
-# params_dict = zip(net.state_dict().keys(), aggregated_ndarrays)
-# state_dict = OrderedDict({k: torch.tensor(v) for k, v in params_dict})
-# net.load_state_dict(state_dict, strict=True)
-
-# # Save the model
-# torch.save(net.state_dict(), f"model_round_{server_round}.pth")
-
-# return aggregated_parameters, aggregated_metrics
-
-
def test(net, testloader):
metric = load_metric("accuracy")
net.eval()
@@ -380,8 +557,6 @@ class CustomClient(fl.client.NumPyClient):

fig.tight_layout()
plot_placeholder.pyplot(fig)
-import matplotlib.pyplot as plt
-import re

def read_log_file(log_path='./log.txt'):
with open(log_path, 'r') as file:
@@ -392,18 +567,18 @@ def parse_log(log_lines):
rounds = []
clients = {}
memory_usage = []
-
-round_pattern = re.compile(r'
+
+round_pattern = re.compile(r'\[ROUND (\d+)\]')
client_pattern = re.compile(r'Client (\d+) \| (INFO|DEBUG) \| (.*)')
memory_pattern = re.compile(r'memory used=(\d+\.\d+)GB')
-
+
current_round = None
-
+
for line in log_lines:
round_match = round_pattern.search(line)
client_match = client_pattern.search(line)
memory_match = memory_pattern.search(line)
-
+
if round_match:
current_round = int(round_match.group(1))
rounds.append(current_round)
@@ -411,20 +586,20 @@ def parse_log(log_lines):
client_id = int(client_match.group(1))
log_level = client_match.group(2)
message = client_match.group(3)
-
+
if client_id not in clients:
clients[client_id] = {'rounds': [], 'messages': []}
-
+
clients[client_id]['rounds'].append(current_round)
clients[client_id]['messages'].append((log_level, message))
elif memory_match:
memory_usage.append(float(memory_match.group(1)))
-
+
return rounds, clients, memory_usage

def plot_metrics(rounds, clients, memory_usage):
st.write("## Metrics Overview")
-
+
st.write("### Memory Usage")
plt.figure()
plt.plot(range(len(memory_usage)), memory_usage, label='Memory Usage (GB)')
@@ -432,25 +607,25 @@ def plot_metrics(rounds, clients, memory_usage):
plt.ylabel('Memory Usage (GB)')
plt.legend()
st.pyplot(plt)
-
+
for client_id, data in clients.items():
st.write(f"### Client {client_id} Metrics")
-
+
info_messages = [msg for level, msg in data['messages'] if level == 'INFO']
debug_messages = [msg for level, msg in data['messages'] if level == 'DEBUG']
-
+
st.write("#### INFO Messages")
for msg in info_messages:
st.write(msg)
-
+
st.write("#### DEBUG Messages")
for msg in debug_messages:
st.write(msg)
-
+
# Placeholder for actual loss and accuracy values, assuming they're included in the messages
losses = [float(re.search(r'loss=([\d\.]+)', msg).group(1)) for msg in debug_messages if 'loss=' in msg]
accuracies = [float(re.search(r'accuracy=([\d\.]+)', msg).group(1)) for msg in debug_messages if 'accuracy=' in msg]
-
+
if losses:
plt.figure()
plt.plot(data['rounds'], losses, label='Loss')
@@ -458,7 +633,7 @@ def plot_metrics(rounds, clients, memory_usage):
plt.ylabel('Loss')
plt.legend()
st.pyplot(plt)
-
+
if accuracies:
plt.figure()
plt.plot(data['rounds'], accuracies, label='Accuracy')
@@ -467,12 +642,11 @@ def plot_metrics(rounds, clients, memory_usage):
plt.legend()
st.pyplot(plt)

-
def read_log_file2():
with open("./log.txt", "r") as file:
return file.read()
-def main():

+def main():
st.write("## Federated Learning with Dynamic Models and Datasets for Mobile Devices")
dataset_name = st.selectbox("Dataset", ["imdb", "amazon_polarity", "ag_news"])
model_name = st.selectbox("Model", ["bert-base-uncased", "facebook/hubert-base-ls960", "distilbert-base-uncased"])
@@ -534,59 +708,44 @@ def main():
for round_num in range(NUM_ROUNDS):
st.write(f"### Round {round_num + 1} ✅")

-st.markdown(print(st.logger._loggers))
-st.markdown(read_log_file2())
logs = read_log_file2()
-
-import plotly.graph_objects as go
-import streamlit as st
-import pandas as pd
-
-# Log data
-log_data = logs
-
+
# Extract relevant data
-accuracy_pattern = re.compile(r"'accuracy': \(
-loss_pattern = re.compile(r"'loss': \(
-
-accuracy_matches = accuracy_pattern.findall(
-loss_matches = loss_pattern.findall(
-
+accuracy_pattern = re.compile(r"'accuracy': \{(\d+), ([\d.]+)\}")
+loss_pattern = re.compile(r"'loss': \{(\d+), ([\d.]+)\}")
+
+accuracy_matches = accuracy_pattern.findall(logs)
+loss_matches = loss_pattern.findall(logs)
+
rounds = [int(match[0]) for match in accuracy_matches]
accuracies = [float(match[1]) for match in accuracy_matches]
losses = [float(match[1]) for match in loss_matches]
-
+
# Create accuracy plot
accuracy_fig = go.Figure()
accuracy_fig.add_trace(go.Scatter(x=rounds, y=accuracies, mode='lines+markers', name='Accuracy'))
accuracy_fig.update_layout(title='Accuracy over Rounds', xaxis_title='Round', yaxis_title='Accuracy')
-
+
# Create loss plot
loss_fig = go.Figure()
loss_fig.add_trace(go.Scatter(x=rounds, y=losses, mode='lines+markers', name='Loss'))
loss_fig.update_layout(title='Loss over Rounds', xaxis_title='Round', yaxis_title='Loss')
-
+
# Display plots in Streamlit
st.plotly_chart(accuracy_fig)
st.plotly_chart(loss_fig)
-
+
# Display data table
data = {
'Round': rounds,
'Accuracy': accuracies,
'Loss': losses
}
-
+
df = pd.DataFrame(data)
st.write("## Training Metrics")
st.table(df)

-
-
-
-
-
-
plot_placeholders = [st.empty() for _ in range(NUM_CLIENTS)]

fl.simulation.start_simulation(
@@ -619,12 +778,12 @@ def main():

# Display log.txt content
st.write("## Training Log")
-
+st.write(read_log_file2())
+
st.write("## Training Log Analysis")
-
log_lines = read_log_file()
rounds, clients, memory_usage = parse_log(log_lines)
-
+
plot_metrics(rounds, clients, memory_usage)

else:
@@ -634,3 +793,6 @@ if __name__ == "__main__":
main()


+
+#################
+