metastable-void
committed on
update
app.py CHANGED
@@ -22,11 +22,10 @@ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "32768"))
 if torch.cuda.is_available():
     model_id = "vericava/llm-jp-3-1.8b-instruct-lora-vericava7-llama"
     base_model_id = "llm-jp/llm-jp-3-1.8b-instruct"
-    tokenizer = AutoTokenizer.from_pretrained(base_model_id)
-    model = AutoModelForCausalLM.from_pretrained(model_id)
     my_pipeline=pipeline(
         model=model_id,
         tokenizer=base_model_id,
+        use_safetensors=True,
     )
     my_pipeline.tokenizer.chat_template = "{{bos_token}}{% for message in messages %}{% if message['role'] == 'user' %}{{ '\\n\\n### 前の投稿:\\n' + message['content'] + '' }}{% elif message['role'] == 'system' %}{{ '以下は、SNS上の投稿です。あなたはSNSの投稿生成botとして、次に続く投稿を考えなさい。説明はせず、投稿の内容のみを鉤括弧をつけずに答えよ。' }}{% elif message['role'] == 'assistant' %}{{ '\\n\\n### 次の投稿:\\n' + message['content'] + eos_token }}{% endif %}{% if loop.last and add_generation_prompt %}{{ '\\n\\n### 次の投稿:\\n' }}{% endif %}{% endfor %}"

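For reference, a minimal sketch (not part of the commit) of how the patched pipeline might be driven end to end. The explicit "text-generation" task string, the sampling parameters, and the example post are illustrative assumptions; passing chat-format messages straight to the pipeline assumes a recent transformers release.

from transformers import pipeline

model_id = "vericava/llm-jp-3-1.8b-instruct-lora-vericava7-llama"
base_model_id = "llm-jp/llm-jp-3-1.8b-instruct"

# Same construction as in the diff; the task string is spelled out here for
# clarity, and use_safetensors=True is forwarded to the model load.
my_pipeline = pipeline(
    "text-generation",
    model=model_id,
    tokenizer=base_model_id,
    use_safetensors=True,
)
# The custom template from app.py: 'system' becomes the fixed instruction
# block, 'user' becomes the "### 前の投稿:" (previous post) section, and
# "### 次の投稿:" (next post) is appended as the generation prompt.
my_pipeline.tokenizer.chat_template = "{{bos_token}}{% for message in messages %}{% if message['role'] == 'user' %}{{ '\\n\\n### 前の投稿:\\n' + message['content'] + '' }}{% elif message['role'] == 'system' %}{{ '以下は、SNS上の投稿です。あなたはSNSの投稿生成botとして、次に続く投稿を考えなさい。説明はせず、投稿の内容のみを鉤括弧をつけずに答えよ。' }}{% elif message['role'] == 'assistant' %}{{ '\\n\\n### 次の投稿:\\n' + message['content'] + eos_token }}{% endif %}{% if loop.last and add_generation_prompt %}{{ '\\n\\n### 次の投稿:\\n' }}{% endif %}{% endfor %}"

messages = [
    {"role": "system", "content": ""},  # content unused; template emits fixed text
    {"role": "user", "content": "今日はいい天気ですね。"},  # hypothetical example post
]

# Chat-format input is rendered with tokenizer.chat_template and
# add_generation_prompt=True; the reply is the final assistant turn.
out = my_pipeline(messages, max_new_tokens=64, do_sample=True)
print(out[0]["generated_text"][-1]["content"])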