import { expect, test } from "@jest/globals"; import chroma from "./initClient"; import { IncludeEnum } from "../src/types"; import { EMBEDDINGS, IDS, METADATAS, DOCUMENTS } from "./data"; import { IEmbeddingFunction } from "../src/embeddings/IEmbeddingFunction"; export class TestEmbeddingFunction implements IEmbeddingFunction { constructor() { } public async generate(texts: string[]): Promise { let embeddings: number[][] = []; for (let i = 0; i < texts.length; i += 1) { embeddings.push([1, 2, 3, 4, 5, 6, 7, 8, 9, 10]); } return embeddings; } } test("it should query a collection", async () => { await chroma.reset(); const collection = await chroma.createCollection({ name: "test" }); await collection.add({ ids: IDS, embeddings: EMBEDDINGS }); const results = await collection.query({ queryEmbeddings: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10], nResults: 2 }); expect(results).toBeDefined(); expect(results).toBeInstanceOf(Object); expect(["test1", "test2"]).toEqual(expect.arrayContaining(results.ids[0])); expect(["test3"]).not.toEqual(expect.arrayContaining(results.ids[0])); }); // test where_document test("it should get embedding with matching documents", async () => { await chroma.reset(); const collection = await chroma.createCollection({ name: "test" }); await collection.add({ ids: IDS, embeddings: EMBEDDINGS, metadatas: METADATAS, documents: DOCUMENTS }); const results = await collection.query({ queryEmbeddings: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10], nResults: 3, whereDocument: { $contains: "This is a test" } }); // it should only return doc1 expect(results).toBeDefined(); expect(results).toBeInstanceOf(Object); expect(results.ids.length).toBe(1); expect(["test1"]).toEqual(expect.arrayContaining(results.ids[0])); expect(["test2"]).not.toEqual(expect.arrayContaining(results.ids[0])); expect(["This is a test"]).toEqual( expect.arrayContaining(results.documents[0]) ); const results2 = await collection.query({ queryEmbeddings: [1, 2, 3, 4, 5, 6, 7, 8, 9, 10], nResults: 3, whereDocument: { $contains: "This is a test" }, include: [IncludeEnum.Embeddings] }); // expect(results2.embeddings[0][0]).toBeInstanceOf(Array); expect(results2.embeddings![0].length).toBe(1); expect(results2.embeddings![0][0]).toEqual([1, 2, 3, 4, 5, 6, 7, 8, 9, 10]); }); // test queryTexts test("it should query a collection with text", async () => { await chroma.reset(); let embeddingFunction = new TestEmbeddingFunction(); const collection = await chroma.createCollection({ name: "test", embeddingFunction: embeddingFunction }); await collection.add({ ids: IDS, embeddings: EMBEDDINGS, metadatas: METADATAS, documents: DOCUMENTS }); const results = await collection.query({ queryTexts: ["test"], nResults: 3, whereDocument: { $contains: "This is a test" } }); expect(results).toBeDefined(); expect(results).toBeInstanceOf(Object); expect(results.ids.length).toBe(1); expect(["test1"]).toEqual(expect.arrayContaining(results.ids[0])); expect(["test2"]).not.toEqual(expect.arrayContaining(results.ids[0])); expect(["This is a test"]).toEqual( expect.arrayContaining(results.documents[0]) ); }) test("it should query a collection with text and where", async () => { await chroma.reset(); let embeddingFunction = new TestEmbeddingFunction(); const collection = await chroma.createCollection({ name: "test", embeddingFunction: embeddingFunction }); await collection.add({ ids: IDS, embeddings: EMBEDDINGS, metadatas: METADATAS, documents: DOCUMENTS }); const results = await collection.query({ queryTexts: ["test"], nResults: 3, where: { "float_value" : 2 } }); expect(results).toBeDefined(); expect(results).toBeInstanceOf(Object); expect(results.ids.length).toBe(1); expect(["test3"]).toEqual(expect.arrayContaining(results.ids[0])); expect(["test2"]).not.toEqual(expect.arrayContaining(results.ids[0])); expect(["This is a third test"]).toEqual( expect.arrayContaining(results.documents[0]) ); }) test("it should query a collection with text and where in", async () => { await chroma.reset(); let embeddingFunction = new TestEmbeddingFunction(); const collection = await chroma.createCollection({ name: "test", embeddingFunction: embeddingFunction }); await collection.add({ ids: IDS, embeddings: EMBEDDINGS, metadatas: METADATAS, documents: DOCUMENTS }); const results = await collection.query({ queryTexts: ["test"], nResults: 3, where: { "float_value" : { '$in': [2,5,10] }} }); expect(results).toBeDefined(); expect(results).toBeInstanceOf(Object); expect(results.ids.length).toBe(1); expect(["test3"]).toEqual(expect.arrayContaining(results.ids[0])); expect(["test2"]).not.toEqual(expect.arrayContaining(results.ids[0])); expect(["This is a third test"]).toEqual( expect.arrayContaining(results.documents[0]) ); }) test("it should query a collection with text and where nin", async () => { await chroma.reset(); let embeddingFunction = new TestEmbeddingFunction(); const collection = await chroma.createCollection({ name: "test", embeddingFunction: embeddingFunction }); await collection.add({ ids: IDS, embeddings: EMBEDDINGS, metadatas: METADATAS, documents: DOCUMENTS }); const results = await collection.query({ queryTexts: ["test"], nResults: 3, where: { "float_value" : { '$nin': [-2,0] }} }); expect(results).toBeDefined(); expect(results).toBeInstanceOf(Object); expect(results.ids.length).toBe(1); expect(["test3"]).toEqual(expect.arrayContaining(results.ids[0])); expect(["test2"]).not.toEqual(expect.arrayContaining(results.ids[0])); expect(["This is a third test"]).toEqual( expect.arrayContaining(results.documents[0]) ); })