myr1-2

Sleeping

App Files Community

wuhp committed on Feb 1

Commit

6d30b44

verified ·

1 Parent(s): 066a25e

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -27

app.py CHANGED Viewed

@@ -424,41 +424,32 @@ def chat_rag(
     return history, history
 with gr.Blocks() as demo:
     gr.Markdown("# QLoRA Fine-tuning & RAG-based Chat Demo using Custom R1 Model")
     gr.Markdown("---")
-    with gr.TabbedInterface(
         [
             gr.Interface(
                 fn=finetune_small_subset,
                 inputs=None,
                 outputs=gr.Textbox(label="Fine-tuning Status", interactive=False),
                 title="⚙️ Fine-tuning (Optional)",
-                description="""
-                    ### Optional Fine-tuning
-                    This section allows you to fine-tune the custom R1 model on a small subset of the ServiceNow dataset.
-                    This step is **optional** but can potentially improve the model's performance on ServiceNow-related tasks.
-                    **Note:** This process may take up to 5 minutes. Click the button below to start fine-tuning.
-                """
             ),
             gr.Interface(
                 fn=predict,
                 inputs=[
                     gr.Textbox(lines=3, label="Input Prompt", placeholder="Enter your prompt here..."),
-                    gr.Slider(0.0, 1.5, step=0.1, value=0.7, label="Temperature (Creativity)", info="Adjust the randomness of the output. Higher values mean more creative but potentially less coherent text."),
-                    gr.Slider(0.0, 1.0, step=0.05, value=0.9, label="Top-p (Sampling Nucleus)", info="Controls the sampling pool. Lower values make the output more focused."),
-                    gr.Slider(1, 2500, value=50, step=10, label="Min New Tokens", info="Minimum number of tokens to generate."),
-                    gr.Slider(1, 2500, value=200, step=50, label="Max New Tokens", info="Maximum number of tokens to generate.")
                 ],
                 outputs=gr.Textbox(label="Custom R1 Output", lines=8, interactive=False),
                 title="✍️ Direct Generation",
-                description="""
-                    ### Direct Text Generation
-                    Enter a prompt to generate text directly using the custom R1 model.
-                    This is standard text generation without retrieval augmentation.
-                """
             ),
             gr.Interface(
                 fn=compare_models,
@@ -474,22 +465,14 @@ with gr.Blocks() as demo:
                     gr.Textbox(label="Official R1 Output", lines=6, interactive=False)
                 ],
                 title="🆚 Model Comparison",
-                description="""
-                    ### Model Output Comparison
-                    Enter a prompt to compare the text generation of your fine-tuned custom R1 model with the official DeepSeek-R1-Distill-Llama-8B model.
-                    This allows you to see the differences in output between the two models.
-                """
             ),
             gr.ChatInterface(
                 fn=chat_rag,
                 chatbot=gr.Chatbot(label="RAG Chatbot"),
                 textbox=gr.Textbox(placeholder="Ask a question to the RAG Chatbot...", lines=2, show_label=False),
                 title="💬 RAG Chat",
-                description="""
-                    ### RAG-Enhanced Chat with Custom R1
-                    Chat with the custom R1 model, enhanced with retrieval-augmented generation (RAG).
-                    The model retrieves relevant information to provide more informed and context-aware responses.
-                """
             )
         ]
     )

     return history, history
+# Build the Gradio interface with tabs.
 with gr.Blocks() as demo:
     gr.Markdown("# QLoRA Fine-tuning & RAG-based Chat Demo using Custom R1 Model")
     gr.Markdown("---")
+    gr.TabbedInterface(
         [
             gr.Interface(
                 fn=finetune_small_subset,
                 inputs=None,
                 outputs=gr.Textbox(label="Fine-tuning Status", interactive=False),
                 title="⚙️ Fine-tuning (Optional)",
+                description="This section allows you to fine-tune the custom R1 model on a small subset of the ServiceNow dataset. This step is optional but can potentially improve the model's performance on ServiceNow-related tasks. **Note:** This process may take up to 5 minutes."
             ),
             gr.Interface(
                 fn=predict,
                 inputs=[
                     gr.Textbox(lines=3, label="Input Prompt", placeholder="Enter your prompt here..."),
+                    gr.Slider(0.0, 1.5, step=0.1, value=0.7, label="Temperature (Creativity)"),
+                    gr.Slider(0.0, 1.0, step=0.05, value=0.9, label="Top-p (Sampling Nucleus)"),
+                    gr.Slider(1, 2500, value=50, step=10, label="Min New Tokens"),
+                    gr.Slider(1, 2500, value=200, step=50, label="Max New Tokens")
                 ],
                 outputs=gr.Textbox(label="Custom R1 Output", lines=8, interactive=False),
                 title="✍️ Direct Generation",
+                description="Enter a prompt to generate text directly using the custom R1 model. This is standard text generation without retrieval augmentation."
             ),
             gr.Interface(
                 fn=compare_models,
                     gr.Textbox(label="Official R1 Output", lines=6, interactive=False)
                 ],
                 title="🆚 Model Comparison",
+                description="Enter a prompt to compare the text generation of your fine-tuned custom R1 model with the official DeepSeek-R1-Distill-Llama-8B model."
             ),
             gr.ChatInterface(
                 fn=chat_rag,
                 chatbot=gr.Chatbot(label="RAG Chatbot"),
                 textbox=gr.Textbox(placeholder="Ask a question to the RAG Chatbot...", lines=2, show_label=False),
                 title="💬 RAG Chat",
+                description="Chat with the custom R1 model, enhanced with retrieval-augmented memory. The model retrieves relevant info for informed responses."
             )
         ]
     )