Spaces:

gsarti
/

pecore

Running on Zero

gsarti committed on Apr 24, 2024

Commit

cd7e21b

1 Parent(s): 7c57fe0

Minor fixes to presets

Files changed (2) hide show

app.py CHANGED Viewed

@@ -673,6 +673,7 @@ with gr.Blocks(css=custom_css) as demo:
         outputs=[
             model_name_or_path,
             input_template,
             contextless_input_template,
             special_tokens_to_keep,
             generation_kwargs,

         outputs=[
             model_name_or_path,
             input_template,
+            decoder_input_output_separator,
             contextless_input_template,
             special_tokens_to_keep,
             generation_kwargs,

presets.py CHANGED Viewed

@@ -77,17 +77,18 @@ def set_towerinstruct_preset():
 def set_gemma_preset():
     return (
         "google/gemma-2b-it", # model_name_or_path
-        "<start_of_turn>user\n{context}\n{current}<end_of_turn>\n<start_of_turn>model\n", # input_template
-        "<start_of_turn>user\n{current}<end_of_turn>\n<start_of_turn>model\n", # input_current_text_template
         ["<start_of_turn>", "<end_of_turn>"], # special_tokens_to_keep
         '{\n\t"max_new_tokens": 50\n}',  # generation_kwargs
     )
 def set_mistral_instruct_preset():
     return (
-        "mistralai/Mistral-7B-Instruct-v0.2" # model_name_or_path
-        "[INST]{context}\n{current}[/INST]" # input_template
-        "[INST]{current}[/INST]" # input_current_text_template
         '{\n\t"max_new_tokens": 50\n}',  # generation_kwargs
     )

 def set_gemma_preset():
     return (
         "google/gemma-2b-it", # model_name_or_path
+        "<start_of_turn>user\n{context}\n{current}<end_of_turn>\n<start_of_turn>model", # input_template
+        "\n",  # decoder_input_output_separator
+        "<start_of_turn>user\n{current}<end_of_turn>\n<start_of_turn>model", # input_current_text_template
         ["<start_of_turn>", "<end_of_turn>"], # special_tokens_to_keep
         '{\n\t"max_new_tokens": 50\n}',  # generation_kwargs
     )
 def set_mistral_instruct_preset():
     return (
+        "mistralai/Mistral-7B-Instruct-v0.2", # model_name_or_path
+        "[INST]{context}\n{current}[/INST]", # input_template
+        "[INST]{current}[/INST]", # input_current_text_template
         '{\n\t"max_new_tokens": 50\n}',  # generation_kwargs
     )