Spaces:
Sleeping
Sleeping
user
committed on
Commit
·
cc19159
1
Parent(s):
576b273
Fix UnhashableParamError and improve caching in create_embeddings
Browse files
app.py
CHANGED
@@ -27,12 +27,12 @@ def load_and_process_text(file_path):
|
|
27 |
return []
|
28 |
|
29 |
@st.cache_data
|
30 |
-
def create_embeddings(chunks,
|
31 |
embeddings = []
|
32 |
for chunk in chunks:
|
33 |
inputs = tokenizer(chunk, return_tensors="pt", padding=True, truncation=True, max_length=512)
|
34 |
with torch.no_grad():
|
35 |
-
outputs =
|
36 |
embeddings.append(outputs.last_hidden_state.mean(dim=1).squeeze().numpy())
|
37 |
return np.array(embeddings)
|
38 |
|
@@ -80,7 +80,7 @@ st.markdown('<p class="big-font">Chat with the Muse of A.R. Ammons. Ask question
|
|
80 |
with st.spinner("Loading models and data..."):
|
81 |
tokenizer, embedding_model, generation_model = load_models()
|
82 |
chunks = load_and_process_text('ammons_muse.txt')
|
83 |
-
embeddings = create_embeddings(chunks,
|
84 |
index = create_faiss_index(embeddings)
|
85 |
|
86 |
if tokenizer is None or embedding_model is None or generation_model is None or not chunks:
|
|
|
27 |
return []
|
28 |
|
29 |
@st.cache_data
|
30 |
+
def create_embeddings(chunks, _embedding_model):
|
31 |
embeddings = []
|
32 |
for chunk in chunks:
|
33 |
inputs = tokenizer(chunk, return_tensors="pt", padding=True, truncation=True, max_length=512)
|
34 |
with torch.no_grad():
|
35 |
+
outputs = _embedding_model(**inputs)
|
36 |
embeddings.append(outputs.last_hidden_state.mean(dim=1).squeeze().numpy())
|
37 |
return np.array(embeddings)
|
38 |
|
|
|
80 |
with st.spinner("Loading models and data..."):
|
81 |
tokenizer, embedding_model, generation_model = load_models()
|
82 |
chunks = load_and_process_text('ammons_muse.txt')
|
83 |
+
embeddings = create_embeddings(chunks, embedding_model)
|
84 |
index = create_faiss_index(embeddings)
|
85 |
|
86 |
if tokenizer is None or embedding_model is None or generation_model is None or not chunks:
|