Spaces:

Daoneeee
/

task_Chatbot

Sleeping

App Files Files Community

Daoneeee committed on Nov 21, 2023

Commit

15e44b9

1 Parent(s): 3a75faa

Update app.py

Browse files

Files changed (1) hide show

app.py +52 -0

app.py CHANGED Viewed

@@ -14,6 +14,51 @@ from langchain.document_loaders import PyPDFLoader, TextLoader, JSONLoader, CSVL
 import tempfile  # 임시 파일을 생성하기 위한 라이브러리입니다.
 import os
 # PDF 문서로부터 텍스트를 추출하는 함수입니다.
 def get_pdf_text(pdf_docs):
@@ -52,11 +97,18 @@ def get_json_file(json_docs):
     temp_filepath = os.path.join(temp_dir.name, json_docs.name)
     with open(temp_filepath, "wb") as f:
         f.write(json_docs.getvalue())
     json_loader = JSONLoader(temp_filepath)
     json_doc = json_loader.load()
     return json_doc
 # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.
 def get_text_chunks(documents):
     text_splitter = RecursiveCharacterTextSplitter(

 import tempfile  # 임시 파일을 생성하기 위한 라이브러리입니다.
 import os
+{'image': {'creation_timestamp': 1675549016, 'uri': 'image_of_the_chat.jpg'},
+ 'is_still_participant': True,
+ 'joinable_mode': {'link': '', 'mode': 1},
+ 'magic_words': [],
+ 'messages': [{'content': 'Bye!',
+               'sender_name': 'User 2',
+               'timestamp_ms': 1675597571851},
+              {'content': 'Oh no worries! Bye',
+               'sender_name': 'User 1',
+               'timestamp_ms': 1675597435669},
+              {'content': 'No Im sorry it was my mistake, the blue one is not '
+                          'for sale',
+               'sender_name': 'User 2',
+               'timestamp_ms': 1675596277579},
+              {'content': 'I thought you were selling the blue one!',
+               'sender_name': 'User 1',
+               'timestamp_ms': 1675595140251},
+              {'content': 'Im not interested in this bag. Im interested in the '
+                          'blue one!',
+               'sender_name': 'User 1',
+               'timestamp_ms': 1675595109305},
+              {'content': 'Here is $129',
+               'sender_name': 'User 2',
+               'timestamp_ms': 1675595068468},
+              {'photos': [{'creation_timestamp': 1675595059,
+                           'uri': 'url_of_some_picture.jpg'}],
+               'sender_name': 'User 2',
+               'timestamp_ms': 1675595060730},
+              {'content': 'Online is at least $100',
+               'sender_name': 'User 2',
+               'timestamp_ms': 1675595045152},
+              {'content': 'How much do you want?',
+               'sender_name': 'User 1',
+               'timestamp_ms': 1675594799696},
+              {'content': 'Goodmorning! $50 is too low.',
+               'sender_name': 'User 2',
+               'timestamp_ms': 1675577876645},
+              {'content': 'Hi! Im interested in your bag. Im offering $50. Let '
+                          'me know if you are interested. Thanks!',
+               'sender_name': 'User 1',
+               'timestamp_ms': 1675549022673}],
+ 'participants': [{'name': 'User 1'}, {'name': 'User 2'}],
+ 'thread_path': 'inbox/User 1 and User 2 chat',
+ 'title': 'User 1 and User 2 chat'}
 # PDF 문서로부터 텍스트를 추출하는 함수입니다.
 def get_pdf_text(pdf_docs):
     temp_filepath = os.path.join(temp_dir.name, json_docs.name)
     with open(temp_filepath, "wb") as f:
         f.write(json_docs.getvalue())
+        loader = JSONLoader(
+            file_path='./example_data/facebook_chat.json',
+            jq_schema='.messages[].content',
+            text_content=False)
+        data = loader.load()
     json_loader = JSONLoader(temp_filepath)
     json_doc = json_loader.load()
     return json_doc
 # 문서들을 처리하여 텍스트 청크로 나누는 함수입니다.
 def get_text_chunks(documents):
     text_splitter = RecursiveCharacterTextSplitter(