Spaces:

nanotron
/

predict_memory

Running

App Files Community

nouamanetazi HF Staff committed on Feb 4, 2025

Commit

2fa84c8

1 Parent(s): 9d879a4

qol updated

Browse files

Files changed (1) hide show

app.py +112 -59

app.py CHANGED Viewed

@@ -1,45 +1,68 @@
 import gradio as gr
 import matplotlib.pyplot as plt
 import yaml
 from pathlib import Path
 import io
 from utils import calculate_memory_components, plot_memory_breakdown
-def load_config_from_yaml_content(yaml_content):
     try:
-        config = yaml.safe_load(yaml_content)
-        # Extract relevant parameters from config
-        model_config = config['model']['model_config']
-        parallelism = config['parallelism']
-        tokens = config['tokens']
-        optimizer = config['optimizer']
-        return {
-            'hidden_size': model_config['hidden_size'],
-            'num_layers': model_config['num_hidden_layers'],
-            'vocab_size': model_config['vocab_size'],
-            'intermediate_size': model_config['intermediate_size'],
-            'seq_len': tokens['sequence_length'],
-            'mbs': tokens['micro_batch_size'],
-            'batch_accum': tokens['batch_accumulation_per_replica'],
-            'tp': parallelism['tp'],
-            'pp': parallelism['pp'],
-            'dp': parallelism['dp'],
-            'zero_stage': optimizer['zero_stage'],
-            'tie_word_embeddings': model_config['tie_word_embeddings'],
-            'num_attention_heads': model_config['num_attention_heads'],
-            'num_key_value_heads': model_config.get('num_key_value_heads', model_config['num_attention_heads'])
-        }
     except Exception as e:
-        raise gr.Error(f"Error parsing YAML: {str(e)}")
 def load_config_from_yaml_file(yaml_path):
     if not yaml_path:
         return None
     with open(yaml_path.name, 'r') as f:
-        return load_config_from_yaml_content(f.read())
 def format_config_display(config):
     if not config:
@@ -75,38 +98,41 @@ def process_yaml_and_plot(config):
     fig1, fig2, memory_usage_peak_tbi = plot_memory_breakdown(**config)
     oom_prediction = "OOM" if memory_usage_peak_tbi > 75000 else "No OOM"
     return fig1, fig2, format_config_display(config), oom_prediction
 with gr.Blocks() as demo:
     with gr.Row():
         with gr.Column(scale=1):
-            with gr.Accordion("YAML Configuration", open=True):
-                yaml_file = gr.File(label="Upload YAML Config", file_types=[".yaml", ".yml"])
-                yaml_text = gr.Textbox(
-                    label="Or paste YAML content here",
-                    placeholder="Paste your YAML configuration here...",
                     lines=10
                 )
-                yaml_submit = gr.Button("Calculate Memory from YAML")
-            with gr.Accordion("Manual Configuration", open=False):
                 with gr.Accordion("Model Architecture", open=True):
-                    hidden_size = gr.Number(4096, label="Hidden Size")
-                    num_layers = gr.Number(32, label="Number of Layers")
-                    vocab_size = gr.Number(50432, label="Vocabulary Size")
-                    intermediate_size = gr.Number(11008, label="Intermediate Size")
                     tie_word_embeddings = gr.Checkbox(True, label="Tie Word Embeddings")
-                    num_attention_heads = gr.Number(32, label="Number of Attention Heads")
-                    num_key_value_heads = gr.Number(32, label="Number of Key Value Heads")
                 with gr.Accordion("Training Configuration", open=True):
-                    seq_len = gr.Number(2048, label="Sequence Length")
-                    mbs = gr.Number(1, label="Micro Batch Size")
-                    batch_accum = gr.Number(1, label="Gradient Accumulation Steps")
                 with gr.Accordion("Parallelism", open=True):
-                    tp = gr.Number(1, label="Tensor Parallelism")
-                    pp = gr.Number(1, label="Pipeline Parallelism")
-                    dp = gr.Number(1, label="Data Parallelism")
                     zero_stage = gr.Radio([0, 1, 2, 3], value=0, label="ZeRO Stage")
                 manual_submit = gr.Button("Calculate Memory (Manual Input)")
@@ -116,19 +142,46 @@ with gr.Blocks() as demo:
             plot1 = gr.Plot(label="Memory Component Breakdown")
             plot2 = gr.Plot(label="Aggregate Memory Metrics")
-    # Handle YAML file upload
-    yaml_file.change(
-        lambda x: process_yaml_and_plot(load_config_from_yaml_file(x) if x else None),
-        inputs=[yaml_file],
-        outputs=[plot1, plot2, config_display, oom_display]
     )
-    # Handle YAML text input
-    yaml_submit.click(
-        lambda x: process_yaml_and_plot(load_config_from_yaml_content(x) if x else None),
-        inputs=[yaml_text],
-        outputs=[plot1, plot2, config_display, oom_display]
-    )
     # Handle manual input
     def manual_input_to_config(*args):
@@ -148,7 +201,7 @@ with gr.Blocks() as demo:
             'num_attention_heads': args[1],
             'num_key_value_heads': args[2]
         }
-        return process_yaml_and_plot(config)
     manual_submit.click(
         manual_input_to_config,

 import gradio as gr
 import matplotlib.pyplot as plt
 import yaml
+import json
 from pathlib import Path
 import io
 from utils import calculate_memory_components, plot_memory_breakdown
+def load_config_from_content(content):
     try:
+        # Try parsing as JSON first
+        try:
+            config = json.loads(content)
+            # Convert JSON HF config format to our format
+            return {
+                'hidden_size': config['hidden_size'],
+                'num_layers': config['num_hidden_layers'],
+                'vocab_size': config['vocab_size'],
+                'intermediate_size': config['intermediate_size'],
+                'seq_len': 2048,  # Default value since not in config
+                'mbs': 1,        # Default value
+                'batch_accum': 1, # Default value
+                'tp': 1,         # Default value
+                'pp': 1,         # Default value
+                'dp': 1,         # Default value
+                'zero_stage': 0,  # Default value
+                'tie_word_embeddings': config.get('tie_word_embeddings', True),
+                'num_attention_heads': config['num_attention_heads'],
+                'num_key_value_heads': config.get('num_key_value_heads', config['num_attention_heads'])
+            }
+        except json.JSONDecodeError:
+            # If not JSON, try YAML
+            config = yaml.safe_load(content)
+            # Extract relevant parameters from YAML config
+            model_config = config['model']['model_config']
+            parallelism = config['parallelism']
+            tokens = config['tokens']
+            optimizer = config['optimizer']
+            return {
+                'hidden_size': model_config['hidden_size'],
+                'num_layers': model_config['num_hidden_layers'],
+                'vocab_size': model_config['vocab_size'],
+                'intermediate_size': model_config['intermediate_size'],
+                'seq_len': tokens['sequence_length'],
+                'mbs': tokens['micro_batch_size'],
+                'batch_accum': tokens['batch_accumulation_per_replica'],
+                'tp': parallelism['tp'],
+                'pp': parallelism['pp'],
+                'dp': parallelism['dp'],
+                'zero_stage': optimizer['zero_stage'],
+                'tie_word_embeddings': model_config['tie_word_embeddings'],
+                'num_attention_heads': model_config['num_attention_heads'],
+                'num_key_value_heads': model_config.get('num_key_value_heads', model_config['num_attention_heads'])
+            }
     except Exception as e:
+        raise gr.Error(f"Error parsing configuration: {str(e)}")
 def load_config_from_yaml_file(yaml_path):
     if not yaml_path:
         return None
     with open(yaml_path.name, 'r') as f:
+        return load_config_from_content(f.read())
 def format_config_display(config):
     if not config:
     fig1, fig2, memory_usage_peak_tbi = plot_memory_breakdown(**config)
     oom_prediction = "OOM" if memory_usage_peak_tbi > 75000 else "No OOM"
     return fig1, fig2, format_config_display(config), oom_prediction
 with gr.Blocks() as demo:
     with gr.Row():
         with gr.Column(scale=1):
+            with gr.Accordion("Configuration Input", open=True):
+                config_text = gr.Textbox(
+                    label="Paste YAML or JSON configuration",
+                    placeholder="Paste your YAML or JSON configuration here...",
                     lines=10
                 )
+                config_submit = gr.Button("Calculate Memory from Config")
+            with gr.Accordion("Manual Configuration", open=True):
                 with gr.Accordion("Model Architecture", open=True):
+                    with gr.Row():
+                        hidden_size = gr.Number(4096, label="Hidden Size")
+                        num_layers = gr.Number(32, label="Number of Layers")
+                    with gr.Row():
+                        vocab_size = gr.Number(50432, label="Vocabulary Size")
+                        intermediate_size = gr.Number(11008, label="Intermediate Size")
+                    with gr.Row():
+                        num_attention_heads = gr.Number(32, label="Number of Attention Heads")
+                        num_key_value_heads = gr.Number(32, label="Number of Key Value Heads")
                     tie_word_embeddings = gr.Checkbox(True, label="Tie Word Embeddings")
                 with gr.Accordion("Training Configuration", open=True):
+                    with gr.Row():
+                        seq_len = gr.Number(2048, label="Sequence Length")
+                        mbs = gr.Number(1, label="Micro Batch Size")
+                        batch_accum = gr.Number(1, label="Gradient Accumulation Steps")
                 with gr.Accordion("Parallelism", open=True):
+                    with gr.Row():
+                        tp = gr.Number(1, label="Tensor Parallelism")
+                        pp = gr.Number(1, label="Pipeline Parallelism")
+                        dp = gr.Number(1, label="Data Parallelism")
                     zero_stage = gr.Radio([0, 1, 2, 3], value=0, label="ZeRO Stage")
                 manual_submit = gr.Button("Calculate Memory (Manual Input)")
             plot1 = gr.Plot(label="Memory Component Breakdown")
             plot2 = gr.Plot(label="Aggregate Memory Metrics")
+    # Handle config text input
+    config_submit.click(
+        lambda x: process_yaml_and_update_ui(load_config_from_content(x) if x else None),
+        inputs=[config_text],
+        outputs=[
+            plot1, plot2, config_display, oom_display,
+            hidden_size, num_attention_heads, num_key_value_heads, num_layers,
+            vocab_size, intermediate_size, seq_len, mbs, batch_accum,
+            tp, pp, dp, zero_stage, tie_word_embeddings
+        ]
     )
+    def process_yaml_and_update_ui(config):
+        if not config:
+            return [None, None, "No configuration loaded", None] + [gr.update() for _ in range(14)]
+        fig1, fig2, memory_usage_peak_tbi = plot_memory_breakdown(**config)
+        oom_prediction = "OOM" if memory_usage_peak_tbi > 75000 else "No OOM"
+        # Return values for all outputs including UI updates
+        return [
+            fig1, fig2,
+            format_config_display(config),
+            oom_prediction,
+            # UI component updates
+            config['hidden_size'],
+            config['num_attention_heads'],
+            config['num_key_value_heads'],
+            config['num_layers'],
+            config['vocab_size'],
+            config['intermediate_size'],
+            config['seq_len'],
+            config['mbs'],
+            config['batch_accum'],
+            config['tp'],
+            config['pp'],
+            config['dp'],
+            config['zero_stage'],
+            config['tie_word_embeddings']
+        ]
     # Handle manual input
     def manual_input_to_config(*args):
             'num_attention_heads': args[1],
             'num_key_value_heads': args[2]
         }
+        return process_yaml_and_update_ui(config)
     manual_submit.click(
         manual_input_to_config,