InflectionLM

Paused

cafierom committed 20 days ago

Commit

360bdcd

verified ·

1 Parent(s): c928ab8

Upload 2 files

Files changed (2) hide show

app.py CHANGED Viewed

@@ -69,7 +69,7 @@ def generate_beam_html(index, all_beams_data, dark_mode):
 @spaces.GPU
 def predict(prompt, dark_mode, temperature):
     """
-    Generates responses for 5 beams and returns the first beam's visualization and visibility for controls.
     """
     # Generate beams
     generated_dicts, transcription = make_beams(model, processor, prompt, temperature=temperature)
@@ -112,7 +112,7 @@ def switch_beam(current_index, all_beams_data, dark_mode):
     if all_beams_data is None:
         return None, None, 0
-    new_index = (current_index + 1) % 5
     main_html, detail_html = generate_beam_html(new_index, all_beams_data, dark_mode)
     return main_html, detail_html, new_index

 @spaces.GPU
 def predict(prompt, dark_mode, temperature):
     """
+    Generates responses for 3 beams and returns the first beam's visualization and visibility for controls.
     """
     # Generate beams
     generated_dicts, transcription = make_beams(model, processor, prompt, temperature=temperature)
     if all_beams_data is None:
         return None, None, 0
+    new_index = (current_index + 1) % 3
     main_html, detail_html = generate_beam_html(new_index, all_beams_data, dark_mode)
     return main_html, detail_html, new_index

inflections_funcs.py CHANGED Viewed

@@ -19,7 +19,7 @@ def start_model(model_id: str = "google/gemma-4-31B-it"):
 def make_beams(model: AutoModelForCausalLM, processor: AutoProcessor, initial_prompt: str, temperature: float = 1.0) -> Tuple[Any, List[str]]:
     '''
-    Generates 5 diverse beams in response to a prompt.
     '''
     messages = [
         {"role": "system", "content": "You are a helpful assistant."},
@@ -39,7 +39,7 @@ def make_beams(model: AutoModelForCausalLM, processor: AutoProcessor, initial_pr
     generated_dicts = model.generate(**inputs,
                                     max_new_tokens=1024,
                                     num_beams=1,          # Disable beam search for pure sampling
-                                    num_return_sequences=5, # Generate 5 independent diverse samples
                                     return_dict_in_generate=True,
                                     output_scores=True,
                                     temperature=temperature if temperature > 0 else 0.1, # Ensure T > 0 for sampling

 def make_beams(model: AutoModelForCausalLM, processor: AutoProcessor, initial_prompt: str, temperature: float = 1.0) -> Tuple[Any, List[str]]:
     '''
+    Generates 3 diverse responses in response to a prompt.
     '''
     messages = [
         {"role": "system", "content": "You are a helpful assistant."},
     generated_dicts = model.generate(**inputs,
                                     max_new_tokens=1024,
                                     num_beams=1,          # Disable beam search for pure sampling
+                                    num_return_sequences=3, # Generate 3 independent diverse samples
                                     return_dict_in_generate=True,
                                     output_scores=True,
                                     temperature=temperature if temperature > 0 else 0.1, # Ensure T > 0 for sampling