Handle NaN values in TensorBoard scalar extraction

- Updated `extract_scalar_data` to handle NaN values in TensorBoard logs.
- If a scalar value is NaN, the function now falls back to the previous value recorded for the same tag.
- If no previous value is available, a default of 0.0 is used.
- This ensures continuity and robustness in the extracted scalar data.
2025-04-27 23:18:59 +08:00 · 2024-08-09 13:11:15 +02:00 · 2024-08-09 13:11:15 +02:00 · 254faa1b91
commit 254faa1b91
parent 1b7add90ea
1 changed files with 13 additions and 2 deletions
--- a/infer/lib/train/graph_generation.py
+++ b/infer/lib/train/graph_generation.py
@@ -1,6 +1,7 @@
 import os
 from typing import List
 import matplotlib.pyplot as plt
 import numpy as np
 import logging
 # Suppress TensorBoard event processing logs
@@ -58,11 +59,21 @@ def extract_scalar_data(log_dir):
        if tag in ea.Tags()['scalars']:
            scalar_events = ea.Scalars(tag)
            scalar_data[tag] = {}
            previous_value = 0.0  # Initialize fallback value
            for event in scalar_events:
                value = event.value
                # Check if value is NaN, use previous value or fallback to 0.0
                if np.isnan(value):
                    value = previous_value
                if event.step not in scalar_data[tag]:
-                    scalar_data[tag][event.step] = [event.value]
+                    scalar_data[tag][event.step] = [value]
                else:
-                    scalar_data[tag][event.step].append(event.value)
+                    scalar_data[tag][event.step].append(value)
                previous_value = value  # Update previous value for the next iteration
            # Calculate the average for each step. Restarting training can cause multiple events for the same step.
            scalar_data[tag] = {step: sum(values) / len(values) for step, values in scalar_data[tag].items()}
        else: