Update app.py
Browse files
app.py
CHANGED
|
@@ -20,7 +20,7 @@ from threading import Thread
|
|
| 20 |
dataset = load_dataset("not-lain/wikipedia",revision = "embedded")
|
| 21 |
|
| 22 |
# Returns a list of dictionaries, each representing a row in the dataset.
|
| 23 |
-
print(dataset[1])
|
| 24 |
#splitter = RecursiveCharacterTextSplitter(chunk_size=150, chunk_overlap=25,separators=["\n\n"]) # ["\n\n", "\n", " ", ""])
|
| 25 |
|
| 26 |
|
|
@@ -41,7 +41,7 @@ data = dataset["train"]
|
|
| 41 |
|
| 42 |
print(data)
|
| 43 |
data = data.add_faiss_index("embeddings")
|
| 44 |
-
# adds
|
| 45 |
|
| 46 |
|
| 47 |
print("check1")
|
|
|
|
| 20 |
dataset = load_dataset("not-lain/wikipedia",revision = "embedded")
|
| 21 |
|
| 22 |
# Returns a list of dictionaries, each representing a row in the dataset.
|
| 23 |
+
#print(dataset[1])
|
| 24 |
#splitter = RecursiveCharacterTextSplitter(chunk_size=150, chunk_overlap=25,separators=["\n\n"]) # ["\n\n", "\n", " ", ""])
|
| 25 |
|
| 26 |
|
|
|
|
| 41 |
|
| 42 |
print(data)
|
| 43 |
data = data.add_faiss_index("embeddings")
|
| 44 |
+
# adds a FAISS index over the "embeddings" column
|
| 45 |
|
| 46 |
|
| 47 |
print("check1")
|