ic/vsp-chroma.py

## vsp-chroma.py
from pprint import pprint as pp

import chromadb

# Create a default Chroma client and the collection the samples are stored in.
client = chromadb.Client()
collection = client.create_collection(name="all-my-documents")

# Terminology: Chroma calls each stored text a "document"; VectorDB and others
#   call the same thing a "chunk". Query responses are returned in units of
#   documents, so either split texts finely to get good granularity, or do not
#   split them at all to get whole docs back.
documents = [
    "Whatever this is it should at some point include the word document, and nothing else perhaps.",
    "This is document1",
    "This is document2",
    "This is not",
    "Not at all",
    "Not even remotely",
]

# Store every sample text under a positional id: "d0", "d1", ...
collection.add(
    ids=[f"d{position}" for position, _ in enumerate(documents)],
    documents=documents,
)

# Ask for the two best matches for a single query string.
results = collection.query(
    n_results=2,
    query_texts=["This is a query document, and nothing else"],
)

# Pretty-print the raw query response.
pp(results)
	from pprint import pprint as pp

	import chromadb

	# Create a default Chroma client and the collection the samples are stored in.
	client = chromadb.Client()
	collection = client.create_collection(name="all-my-documents")

	# Terminology: Chroma calls each stored text a "document"; VectorDB and others
	# call the same thing a "chunk". Query responses are returned in units of
	# documents, so either split texts finely to get good granularity, or do not
	# split them at all to get whole docs back.
	documents = [
	    "Whatever this is it should at some point include the word document, and nothing else perhaps.",
	    "This is document1",
	    "This is document2",
	    "This is not",
	    "Not at all",
	    "Not even remotely",
	]

	# Store every sample text under a positional id: "d0", "d1", ...
	collection.add(
	    ids=[f"d{position}" for position, _ in enumerate(documents)],
	    documents=documents,
	)

	# Ask for the two best matches for a single query string.
	results = collection.query(
	    n_results=2,
	    query_texts=["This is a query document, and nothing else"],
	)

	# Pretty-print the raw query response.
	pp(results)