M17idd committed on
Commit
febfa21
·
verified ·
1 Parent(s): 538588e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -137,13 +137,13 @@ def get_pdf_index():
137
  small_chunks.append(text)
138
 
139
  final_chunks = []
140
- max_tokens = 2000
141
 
142
  for chunk in small_chunks:
143
  token_count = count_tokens(chunk, model_name="gpt-3.5-turbo")
144
  if token_count > max_tokens:
145
  splitter_token_safe = RecursiveCharacterTextSplitter(
146
- chunk_size=1000,
147
  chunk_overlap=100
148
  )
149
  smaller_chunks = splitter_token_safe.split_text(chunk)
 
137
  small_chunks.append(text)
138
 
139
  final_chunks = []
140
+ max_tokens = 512
141
 
142
  for chunk in small_chunks:
143
  token_count = count_tokens(chunk, model_name="gpt-3.5-turbo")
144
  if token_count > max_tokens:
145
  splitter_token_safe = RecursiveCharacterTextSplitter(
146
+ chunk_size=512,
147
  chunk_overlap=100
148
  )
149
  smaller_chunks = splitter_token_safe.split_text(chunk)