Spaces: Running on Zero

Commit: improve interface
app.py (CHANGED)

```diff
@@ -97,24 +97,24 @@ with gr.Blocks() as demo:
             value="You are a helpful AI assistant.",
             lines=2,
             placeholder="Set the AI's behavior and context..."
-        )
-        context = gr.Textbox(
-            label="Context",
-            lines=2,
-            placeholder="Enter additional context information..."
-        )
-        max_tokens = gr.Slider(minimum=1, maximum=1024, value=256, step=1, label="Max Tokens")
-        temperature = gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature")
-        top_p = gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p")
-        use_pipeline = gr.Checkbox(label="Use Pipeline", value=False)
-        use_tool = gr.Checkbox(label="Use Function Calling", value=False)
-        with gr.Column(visible=False) as tool_options:
-            tool_definition = gr.Code(
-                label="Tool Definition (JSON)",
-                value=customtool,
-                lines=15,
-                language="json"
         )
+        context = gr.Textbox(
+            label="Context",
+            lines=2,
+            placeholder="Enter additional context information..."
+        )
+        max_tokens = gr.Slider(minimum=1, maximum=1024, value=256, step=1, label="Max Tokens")
+        temperature = gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature")
+        top_p = gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p")
+        use_pipeline = gr.Checkbox(label="Use Pipeline", value=False)
+        use_tool = gr.Checkbox(label="Use Function Calling", value=False)
+        with gr.Column(visible=False) as tool_options:
+            tool_definition = gr.Code(
+                label="Tool Definition (JSON)",
+                value=customtool,
+                lines=15,
+                language="json"
+            )
 
     def user(user_message, history):
         return "", history + [[user_message, None]]
```
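The `tool_options` column is created with `visible=False`, so the "Use Function Calling" checkbox presumably toggles it. Below is a minimal runnable sketch of that wiring, assuming a standard `Checkbox.change` handler and a hypothetical `customtool` value; neither appears in this commit, only the component definitions do.

```python
import gradio as gr

# Hypothetical tool schema; the Space defines its own `customtool` elsewhere.
customtool = """{
  "name": "get_weather",
  "description": "Example function-calling schema (illustrative only)",
  "parameters": {"type": "object", "properties": {"city": {"type": "string"}}}
}"""

with gr.Blocks() as demo:
    use_tool = gr.Checkbox(label="Use Function Calling", value=False)
    # Hidden until the checkbox above is ticked.
    with gr.Column(visible=False) as tool_options:
        tool_definition = gr.Code(
            label="Tool Definition (JSON)",
            value=customtool,
            lines=15,
            language="json",
        )

    # Assumed wiring: reveal or hide the column on checkbox change.
    use_tool.change(
        fn=lambda checked: gr.update(visible=checked),
        inputs=use_tool,
        outputs=tool_options,
    )

demo.launch()
```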
globe.py (CHANGED)

```diff
@@ -14,14 +14,14 @@ presentation1 = """Try this model on [build.nvidia.com](https://build.nvidia.com
 
 **Model Dates:** 🤖Nemotron-Mini-4B-Instruct was trained between February 2024 and Aug 2024.
 
-
+### License
 
 [NVIDIA Community Model License](https://huggingface.co/nvidia/Nemotron-Mini-4B-Instruct/blob/main/nvidia-community-model-license-aug2024.pdf)"""
 
 presentation2 = """
-
+### Model Architecture
 
-Nemotron-Mini-4B-Instruct uses a model embedding size of 3072, 32 attention heads, and an MLP intermediate dimension of 9216. It also uses Grouped-Query Attention (GQA) and Rotary Position Embeddings (RoPE).
+🤖Nemotron-Mini-4B-Instruct uses a model embedding size of 3072, 32 attention heads, and an MLP intermediate dimension of 9216. It also uses Grouped-Query Attention (GQA) and Rotary Position Embeddings (RoPE).
 
 **Architecture Type:** Transformer Decoder (auto-regressive language model)
 
```
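Since these strings are raw Markdown (the commit adds `### License` and `### Model Architecture` headings), they are presumably rendered through `gr.Markdown` somewhere in `app.py`. A short sketch of that assumed usage; the import path and layout are guesses, not the Space's actual code:

```python
import gradio as gr

from globe import presentation1, presentation2  # assumed import in app.py

with gr.Blocks() as demo:
    with gr.Row():
        gr.Markdown(presentation1)  # model dates + License section
        gr.Markdown(presentation2)  # Model Architecture section

demo.launch()
```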