最后活跃于 1730301429

修订 8e0871537a1e8910813aa6e7acb9bb481e3eb5ec

Chroma-2.py 原始文件
"""Minimal Chroma quick-start: create a collection, add two documents, query it."""
import chromadb

# In-memory client, intended for quick prototyping (nothing is persisted here).
client = chromadb.Client()

# Use get_or_create_collection instead of create_collection so that running
# this script again against a client that already holds "all-my-documents"
# (e.g. re-executing a notebook cell) reuses the collection instead of failing.
collection = client.get_or_create_collection("all-my-documents")

# Add two documents. The three lists are parallel: entry i of `metadatas` and
# `ids` belongs to entry i of `documents`. Only raw text is supplied here, so
# embedding and indexing are left to Chroma.
collection.add(
    documents=["This is document1", "This is document2"],
    metadatas=[{"source": "notion"}, {"source": "google-docs"}],  # filterable at query time
    ids=["doc1", "doc2"],  # must be unique per document
)

# Fetch the 2 stored documents most similar to the query text.
# Optional filters can be passed to narrow the search:
#   where={"metadata_field": "is_equal_to_this"}    -> match on metadata
#   where_document={"$contains": "search_string"}   -> match on document text
results = collection.query(
    query_texts=["This is a query document"],
    n_results=2,
)