George-API committed on
Commit b4b3dd2 · verified · 1 Parent(s): 4dfe8a5

Upload app.py with huggingface_hub

Files changed (1)
  1. app.py +115 -76
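
The commit message says app.py was pushed with huggingface_hub. For reference, a minimal sketch of such an upload using `HfApi.upload_file`; the `repo_id` below is a placeholder assumption, not taken from the commit:

```python
# Hypothetical sketch of the upload step described by the commit message.
# The repo_id is a placeholder assumption; substitute the actual Space id.
from huggingface_hub import HfApi

api = HfApi()  # authenticates via a cached login or the HF_TOKEN environment variable
api.upload_file(
    path_or_fileobj="app.py",            # local file to push
    path_in_repo="app.py",               # destination path inside the Space repo
    repo_id="George-API/phi4training",   # placeholder Space id (assumption)
    repo_type="space",
    commit_message="Upload app.py with huggingface_hub",
)
```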
app.py CHANGED
@@ -1,76 +1,115 @@
- import gradio as gr
- import os
- from dotenv import load_dotenv
-
- # Load environment variables
- load_dotenv()
-
- # Model details
- MODEL_NAME = "unsloth/DeepSeek-R1-Distill-Qwen-14B-bnb-4bit"
- SPACE_NAME = os.getenv("HF_SPACE_NAME", "qwen4bit")
-
- def generate_response(prompt, max_new_tokens=256):
-     """
-     This is a placeholder function that will be replaced with actual model inference
-     after fine-tuning is complete.
-     """
-     # Currently returns a placeholder message
-     return f"""[Placeholder Response]
- This is a demo of the {MODEL_NAME} model.
- Once fine-tuning is complete, this will respond to:
- "{prompt}"
-
- This space will be updated with the fine-tuned model."""
-
- # Create the Gradio interface
- with gr.Blocks(title=f"Fine-tuned {MODEL_NAME}") as demo:
-     gr.Markdown(f"""
- # Fine-tuned DeepSeek-R1-Distill-Qwen-14B Model
-
- This space will host the fine-tuned version of `{MODEL_NAME}` once training is complete.
-
- **Model Details**:
- - Base model: `{MODEL_NAME}`
- - Fine-tuned on: `phi4-cognitive-dataset`
- - 4-bit quantized (already, not further quantized)
-
- **Current Status**: Preparing for fine-tuning
- """)
-
-     with gr.Row():
-         with gr.Column():
-             input_text = gr.Textbox(
-                 label="Enter your prompt",
-                 placeholder="Type your prompt here...",
-                 lines=4
-             )
-             max_tokens = gr.Slider(
-                 minimum=32,
-                 maximum=1024,
-                 value=256,
-                 step=32,
-                 label="Max new tokens"
-             )
-             submit_btn = gr.Button("Generate Response")
-
-         with gr.Column():
-             output_text = gr.Textbox(
-                 label="Model Response",
-                 lines=10
-             )
-
-     submit_btn.click(
-         fn=generate_response,
-         inputs=[input_text, max_tokens],
-         outputs=output_text
-     )
-
-     gr.Markdown("""
- ### Note
- This is a placeholder application. The actual fine-tuned model will be deployed
- to this space once training is complete.
- """)
-
- # Launch the app
- if __name__ == "__main__":
-     demo.launch()
+ import gradio as gr
+ import os
+ import json
+ import torch
+ from dotenv import load_dotenv
+ import logging
+
+ # Configure logging
+ logging.basicConfig(
+     level=logging.INFO,
+     format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
+     handlers=[
+         logging.StreamHandler(),
+         logging.FileHandler("app.log")
+     ]
+ )
+ logger = logging.getLogger(__name__)
+
+ # Load environment variables
+ load_dotenv()
+
+ # Load config file
+ def load_config(config_path="transformers_config.json"):
+     try:
+         with open(config_path, 'r') as f:
+             config = json.load(f)
+         return config
+     except Exception as e:
+         logger.error(f"Error loading config: {str(e)}")
+         return {}
+
+ # Load configuration
+ config = load_config()
+ model_config = config.get("model_config", {})
+
+ # Model details from config
+ MODEL_NAME = model_config.get("model_name_or_path", "unsloth/DeepSeek-R1-Distill-Qwen-14B-bnb-4bit")
+ SPACE_NAME = os.getenv("HF_SPACE_NAME", "phi4training")
+ TRAINING_ACTIVE = os.path.exists("TRAINING_ACTIVE")
+
+ # Create Gradio interface - training status only, no model outputs
+ with gr.Blocks(css="footer {visibility: hidden}") as demo:
+     gr.Markdown(f"# {SPACE_NAME}: Training Status Dashboard")
+
+     with gr.Row():
+         with gr.Column():
+             status = gr.Markdown(
+                 f"""
+ ## Research Training Phase Active
+
+ **Model**: {MODEL_NAME}
+ **Dataset**: phi4-cognitive-dataset
+
+ This is a multidisciplinary research training phase. The model is not available for interactive use.
+
+ ### Training Configuration:
+ - **Epochs**: {config.get("training_config", {}).get("num_train_epochs", 3)}
+ - **Batch Size**: {config.get("training_config", {}).get("per_device_train_batch_size", 2)}
+ - **Gradient Accumulation Steps**: {config.get("training_config", {}).get("gradient_accumulation_steps", 4)}
+ - **Learning Rate**: {config.get("training_config", {}).get("learning_rate", 2e-5)}
+ - **Max Sequence Length**: {config.get("training_config", {}).get("max_seq_length", 2048)}
+
+ ### Training Status:
+ {"🟢 Training in progress" if TRAINING_ACTIVE else "⚪ Training not currently active"}
+
+ ⚠️ **NOTE**: This space does not provide model outputs during the research training phase.
+ """
+             )
+
+     # Add a refresh button to check status
+     refresh_btn = gr.Button("Refresh Status")
+
+     def refresh_status():
+         # Re-check if training is active
+         training_active = os.path.exists("TRAINING_ACTIVE")
+         return f"""
+ ## Research Training Phase Active
+
+ **Model**: {MODEL_NAME}
+ **Dataset**: phi4-cognitive-dataset
+
+ This is a multidisciplinary research training phase. The model is not available for interactive use.
+
+ ### Training Configuration:
+ - **Epochs**: {config.get("training_config", {}).get("num_train_epochs", 3)}
+ - **Batch Size**: {config.get("training_config", {}).get("per_device_train_batch_size", 2)}
+ - **Gradient Accumulation Steps**: {config.get("training_config", {}).get("gradient_accumulation_steps", 4)}
+ - **Learning Rate**: {config.get("training_config", {}).get("learning_rate", 2e-5)}
+ - **Max Sequence Length**: {config.get("training_config", {}).get("max_seq_length", 2048)}
+
+ ### Training Status:
+ {"🟢 Training in progress" if training_active else "⚪ Training not currently active"}
+
+ ⚠️ **NOTE**: This space does not provide model outputs during the research training phase.
+ """
+
+     refresh_btn.click(refresh_status, outputs=status)
+
+     gr.Markdown("""
+ ### Research Training Information
+ This model is being fine-tuned on research-focused datasets and is not available for interactive querying.
+ Training logs are available to authorized researchers only.
+ """)
+
+ # Launch the interface
+ if __name__ == "__main__":
+     # Create an empty TRAINING_ACTIVE file to indicate training is in progress
+     # This would be managed by the actual training script
+     if not os.path.exists("TRAINING_ACTIVE"):
+         with open("TRAINING_ACTIVE", "w") as f:
+             f.write("Training in progress")
+
+     # Start Gradio with minimal features
+     logger.info("Starting training status dashboard")
+     demo.launch(share=False, enable_queue=False)
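
The updated app.py reads its settings from transformers_config.json, which is not part of this commit. A minimal sketch of a config matching the keys the dashboard reads, using the fallback defaults from the code (the actual training values may differ), could be generated like this:

```python
# Hypothetical sketch: write a transformers_config.json with the keys app.py reads.
# Values shown are the fallback defaults from app.py, not the real training settings.
import json

config = {
    "model_config": {
        "model_name_or_path": "unsloth/DeepSeek-R1-Distill-Qwen-14B-bnb-4bit",
    },
    "training_config": {
        "num_train_epochs": 3,
        "per_device_train_batch_size": 2,
        "gradient_accumulation_steps": 4,
        "learning_rate": 2e-5,
        "max_seq_length": 2048,
    },
}

with open("transformers_config.json", "w") as f:
    json.dump(config, f, indent=2)
```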