M17idd committed on
Commit
76f6398
·
1 Parent(s): 7fb2b42

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -8
app.py CHANGED
@@ -15,6 +15,8 @@ from sentence_transformers import SentenceTransformer
15
  import faiss
16
  from langchain.indexes import VectorstoreIndexCreator
17
  from langchain.vectorstores import FAISS
 
 
18
 
19
  # ----------------- تنظیمات صفحه -----------------
20
  st.set_page_config(page_title="چت‌ بات توانا", page_icon="🪖", layout="wide")
@@ -99,24 +101,20 @@ st.markdown("""
99
 
100
  # ----------------- لود PDF و ساخت ایندکس -----------------
101
 
 
102
  @st.cache_resource
103
  def get_pdf_index():
104
  with st.spinner('📄 در حال پردازش فایل PDF...'):
105
  loader = PyPDFLoader('test1.pdf')
106
- # documents = loader.load()
107
 
108
  splitter = RecursiveCharacterTextSplitter(chunk_size=2000, chunk_overlap=128)
109
- # texts = []
110
- # for doc in documents:
111
- # texts.extend(splitter.split_text(doc.page_content))
112
-
113
 
114
  embedding_function = SentenceTransformer("togethercomputer/m2-bert-80M-8k-retrieval", trust_remote_code=True)
115
-
116
- # ctorstore_index_creator.from_documents([Document(page_content=text) for text in texts])
117
 
118
  return VectorstoreIndexCreator(
119
- embedding=embedding_function,
120
  text_splitter=splitter
121
  ).from_loaders(loader)
122
 
 
15
  import faiss
16
  from langchain.indexes import VectorstoreIndexCreator
17
  from langchain.vectorstores import FAISS
18
+ from langchain.embeddings import SentenceTransformerEmbeddings
19
+
20
 
21
  # ----------------- تنظیمات صفحه -----------------
22
  st.set_page_config(page_title="چت‌ بات توانا", page_icon="🪖", layout="wide")
 
101
 
102
  # ----------------- لود PDF و ساخت ایندکس -----------------
103
 
104
+ # ----------------- لود PDF و ساخت ایندکس -----------------
105
  @st.cache_resource
106
  def get_pdf_index():
107
  with st.spinner('📄 در حال پردازش فایل PDF...'):
108
  loader = PyPDFLoader('test1.pdf')
 
109
 
110
  splitter = RecursiveCharacterTextSplitter(chunk_size=2000, chunk_overlap=128)
 
 
 
 
111
 
112
  embedding_function = SentenceTransformer("togethercomputer/m2-bert-80M-8k-retrieval", trust_remote_code=True)
113
+
114
+ embedding = SentenceTransformerEmbeddings(model=embedding_function)
115
 
116
  return VectorstoreIndexCreator(
117
+ embedding=embedding,
118
  text_splitter=splitter
119
  ).from_loaders(loader)
120