Update app.py
app.py
CHANGED
@@ -36,24 +36,19 @@ if HF_TOKEN:
 # ========== DEEPSEEK MODEL LOADING ==========
 def load_deepseek_model():
     """Load the DeepSeek model with progress tracking"""
-    progress = gr.Progress()
-    progress(0, desc="Loading DeepSeek model...")
-
     try:
         start_time = time.time()
         tokenizer = AutoTokenizer.from_pretrained(
             "deepseek-ai/DeepSeek-V3",
             trust_remote_code=True
         )
-        progress(0.3, desc="Loading tokenizer...")

         model = AutoModelForCausalLM.from_pretrained(
             "deepseek-ai/DeepSeek-V3",
             trust_remote_code=True,
             torch_dtype=torch.float16,
-            device_map="auto"
+            device_map="auto" if torch.cuda.is_available() else None
         )
-        progress(0.9, desc="Loading model weights...")

         load_time = time.time() - start_time
         print(f"DeepSeek model loaded in {load_time:.2f} seconds")
@@ -1459,13 +1454,17 @@ def create_interface():
         outputs=[tabs, nav_message, quiz_alert]
     )

-    # Check model loading status
+    # Check model loading status
     def check_model_status():
         if model is not None and tokenizer is not None:
             return gr.update(visible=False)
         return gr.update(visible=True)

-    app.load(
+    app.load(
+        fn=check_model_status,
+        inputs=None,
+        outputs=model_status
+    )

     return app

@@ -1475,4 +1474,4 @@ app = create_interface()
 # For Hugging Face Spaces deployment
 if __name__ == "__main__":
     app.launch()
-
+
|
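For review, a condensed, self-contained sketch of what the two changes amount to: the GPU check keeps device_map="auto" on CUDA machines and falls back to plain CPU loading otherwise, and the new app.load(...) call re-runs check_model_status whenever the page is opened so the status banner hides once the model is ready. The dropped gr.Progress() calls were presumably removed because gr.Progress only reports to the UI when injected into an event handler, not when called during module-level loading. The global model/tokenizer handling, the exception handling, and the model_status Markdown banner below are assumptions about the parts of app.py this diff does not show.

# Condensed sketch of the patterns introduced above: not the full app.py.
# The globals and the `model_status` banner are stand-ins for code outside this diff.
import time

import gradio as gr
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

model = None
tokenizer = None


def load_deepseek_model():
    """Load the DeepSeek model, falling back to CPU when no GPU is available."""
    global model, tokenizer
    try:
        start_time = time.time()
        tokenizer = AutoTokenizer.from_pretrained(
            "deepseek-ai/DeepSeek-V3", trust_remote_code=True
        )
        model = AutoModelForCausalLM.from_pretrained(
            "deepseek-ai/DeepSeek-V3",
            trust_remote_code=True,
            torch_dtype=torch.float16,
            # device_map="auto" requires accelerate and a GPU to shard onto;
            # None keeps the weights on CPU so the call still works without CUDA.
            device_map="auto" if torch.cuda.is_available() else None,
        )
        print(f"DeepSeek model loaded in {time.time() - start_time:.2f} seconds")
    except Exception as exc:  # assumed error handling; the diff does not show it
        print(f"Model loading failed: {exc}")


def check_model_status():
    """Hide the status banner once both the model and tokenizer are ready."""
    if model is not None and tokenizer is not None:
        return gr.update(visible=False)
    return gr.update(visible=True)


with gr.Blocks() as app:
    # Hypothetical banner standing in for the Space's real `model_status` component.
    model_status = gr.Markdown("Loading DeepSeek model, please wait...", visible=True)
    # Blocks.load fires on every page load, so each visitor sees the current status.
    app.load(fn=check_model_status, inputs=None, outputs=model_status)

# In the real Space, load_deepseek_model() is presumably called at startup
# before app.launch(); it is left uncalled here to keep the sketch lightweight.
if __name__ == "__main__":
    app.launch()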