Spaces:
Running
on
Zero
Running
on
Zero
update
Browse files
- app.py +5 -5
- eagle_vl/serve/inference.py +5 -5
app.py
CHANGED
@@ -29,8 +29,8 @@ from eagle_vl.serve.chat_utils import (
|
|
29 |
from eagle_vl.serve.inference import eagle_vl_generate, load_model
|
30 |
from eagle_vl.serve.examples import get_examples
|
31 |
|
32 |
-
TITLE = """<h1 align="left" style="min-width:200px; margin-top:0;">Chat with Eagle2
|
33 |
-
DESCRIPTION_TOP = """<a href="https://github.com/NVlabs/EAGLE" target="_blank">Eagle2
|
34 |
DESCRIPTION = """"""
|
35 |
ROOT_DIR = os.path.dirname(os.path.abspath(__file__))
|
36 |
DEPLOY_MODELS = dict()
|
@@ -39,7 +39,7 @@ logger = configure_logger()
|
|
39 |
|
40 |
def parse_args():
|
41 |
parser = argparse.ArgumentParser()
|
42 |
-
parser.add_argument("--model", type=str, default="Eagle2
|
43 |
parser.add_argument(
|
44 |
"--local-path",
|
45 |
type=str,
|
@@ -256,7 +256,7 @@ def build_demo(args: argparse.Namespace) -> gr.Blocks:
|
|
256 |
with gr.Column(scale=4):
|
257 |
with gr.Row():
|
258 |
chatbot = gr.Chatbot(
|
259 |
-
elem_id="Eagle2
|
260 |
show_share_button=True,
|
261 |
bubble_full_width=False,
|
262 |
height=600,
|
@@ -338,7 +338,7 @@ def build_demo(args: argparse.Namespace) -> gr.Blocks:
|
|
338 |
del_last_btn.click(delete_last_conversation, [chatbot, history], output_widgets, show_progress=True)
|
339 |
cancel_btn.click(cancel_outputing, [], [status_display], cancels=predict_events)
|
340 |
|
341 |
-
demo.title = "Eagle2
|
342 |
return demo
|
343 |
|
344 |
|
|
|
29 |
from eagle_vl.serve.inference import eagle_vl_generate, load_model
|
30 |
from eagle_vl.serve.examples import get_examples
|
31 |
|
32 |
+
TITLE = """<h1 align="left" style="min-width:200px; margin-top:0;">Chat with Eagle2-VL </h1>"""
|
33 |
+
DESCRIPTION_TOP = """<a href="https://github.com/NVlabs/EAGLE" target="_blank">Eagle2-VL</a> is a multi-modal LLM that can understand text, images and videos, and generate text"""
|
34 |
DESCRIPTION = """"""
|
35 |
ROOT_DIR = os.path.dirname(os.path.abspath(__file__))
|
36 |
DEPLOY_MODELS = dict()
|
|
|
39 |
|
40 |
def parse_args():
|
41 |
parser = argparse.ArgumentParser()
|
42 |
+
parser.add_argument("--model", type=str, default="Eagle2-8B")
|
43 |
parser.add_argument(
|
44 |
"--local-path",
|
45 |
type=str,
|
|
|
256 |
with gr.Column(scale=4):
|
257 |
with gr.Row():
|
258 |
chatbot = gr.Chatbot(
|
259 |
+
elem_id="Eagle2-VL-8B-chatbot",
|
260 |
show_share_button=True,
|
261 |
bubble_full_width=False,
|
262 |
height=600,
|
|
|
338 |
del_last_btn.click(delete_last_conversation, [chatbot, history], output_widgets, show_progress=True)
|
339 |
cancel_btn.click(cancel_outputing, [], [status_display], cancels=predict_events)
|
340 |
|
341 |
+
demo.title = "Eagle2-VL-8B Chatbot"
|
342 |
return demo
|
343 |
|
344 |
|
eagle_vl/serve/inference.py
CHANGED
@@ -18,7 +18,7 @@ from .chat_utils import Conversation, get_conv_template
|
|
18 |
logger = logging.getLogger(__name__)
|
19 |
|
20 |
|
21 |
-
def load_model_from_nv(model_path: str = "nvidia/Eagle-2.5-8B"):
|
22 |
|
23 |
token = os.environ.get("HF_TOKEN")
|
24 |
# hotfix the model to use flash attention 2
|
@@ -41,7 +41,7 @@ def load_model_from_nv(model_path: str = "nvidia/Eagle-2.5-8B"):
|
|
41 |
|
42 |
return model, processor
|
43 |
|
44 |
-
def load_model_from_eagle(model_path: str = "NVEagle/Eagle2.5-VL-8B-Preview"):
|
45 |
|
46 |
token = os.environ.get("HF_TOKEN")
|
47 |
logger.info(f"token = {token[:4]}***{token[-2:]}")
|
@@ -65,7 +65,7 @@ def load_model_from_eagle(model_path: str = "NVEagle/Eagle2.5-VL-8B-Preview"):
|
|
65 |
|
66 |
return model, processor
|
67 |
|
68 |
-
def load_model(model_path: str = "nvidia/
|
69 |
try:
|
70 |
model, processor = load_model_from_nv(model_path)
|
71 |
except Exception as e:
|
@@ -100,10 +100,10 @@ def preprocess(
|
|
100 |
results = [
|
101 |
{
|
102 |
"role": "system",
|
103 |
-
"content": """You are Eagle 2
|
104 |
Always be concise, accurate, and helpful. You respond like a reliable co-pilot to researchers, developers, and engineers, offering deep technical insight, step-by-step reasoning, and practical suggestions.
|
105 |
You can interpret long contexts, follow nuanced instructions, and dynamically adjust your tone to match the user's intent. If the user does not specify a tone, default to a professional, technical, yet friendly style.
|
106 |
-
You understand you are Eagle 2
|
107 |
]
|
108 |
# get texts from conversations
|
109 |
# converstion = get_conv_template(sft_format)
|
|
|
18 |
logger = logging.getLogger(__name__)
|
19 |
|
20 |
|
21 |
+
def load_model_from_nv(model_path: str = "nvidia/Eagle-2-8B"):
|
22 |
|
23 |
token = os.environ.get("HF_TOKEN")
|
24 |
# hotfix the model to use flash attention 2
|
|
|
41 |
|
42 |
return model, processor
|
43 |
|
44 |
+
def load_model_from_eagle(model_path: str = "NVEagle/Eagle2-8B"):
|
45 |
|
46 |
token = os.environ.get("HF_TOKEN")
|
47 |
logger.info(f"token = {token[:4]}***{token[-2:]}")
|
|
|
65 |
|
66 |
return model, processor
|
67 |
|
68 |
+
def load_model(model_path: str = "nvidia/Eagle2-8B"):
|
69 |
try:
|
70 |
model, processor = load_model_from_nv(model_path)
|
71 |
except Exception as e:
|
|
|
100 |
results = [
|
101 |
{
|
102 |
"role": "system",
|
103 |
+
"content": """You are Eagle 2, a cutting-edge large language model developed by NVIDIA. You are highly capable, efficient, and aligned, specialized in understanding complex multimodal inputs and providing expert-level responses across domains.
|
104 |
Always be concise, accurate, and helpful. You respond like a reliable co-pilot to researchers, developers, and engineers, offering deep technical insight, step-by-step reasoning, and practical suggestions.
|
105 |
You can interpret long contexts, follow nuanced instructions, and dynamically adjust your tone to match the user's intent. If the user does not specify a tone, default to a professional, technical, yet friendly style.
|
106 |
+
You understand you are Eagle 2, and may refer to yourself as such when asked."""}
|
107 |
]
|
108 |
# get texts from conversations
|
109 |
# converstion = get_conv_template(sft_format)
|