Collections are the organizational building blocks of the SDK. They manage all documents and related chunks, embeddings, tsvectors, and pipelines.
content_copy
const collection = korvus.newCollection("test_collection")
content_copy
collection = Collection("test_collection")
content_copy
let mut collection = Collection::new("test_collection", None)?;
content_copy
CollectionC * collection = korvus_collectionc_new("test_collection", NULL);
Create a Collection that reads from a different database than that set by the environment variable KORVUS_DATABASE_URL
.
content_copy
const collection = korvus.newCollection("test_collection", CUSTOM_DATABASE_URL)
content_copy
collection = Collection("test_collection", CUSTOM_DATABASE_URL)
content_copy
let mut collection = Collection::new("test_collection", Some(CUSTOM_DATABASE_URL))?;
content_copy
CollectionC * collection = korvus_collectionc_new("test_collection", CUSTOM_DATABASE_URL);
content_copy
const documents = [
{
id: "document_one",
title: "Document One",
text: "document one contents...",
random_key: "here is some random data",
},
{
id: "document_two",
title: "Document Two",
text: "document two contents...",
random_key: "here is some random data",
},
];
await collection.upsert_documents(documents);
content_copy
documents = [
{
"id": "document_one",
"title": "Document One",
"text": "Here are the contents of Document 1",
"random_key": "here is some random data",
},
{
"id": "document_two",
"title": "Document Two",
"text": "Here are the contents of Document 2",
"random_key": "here is some random data",
},
]
await collection.upsert_documents(documents)
content_copy
let documents: Vec = vec![
serde_json::json!({
"id": "document_one",
"title": "Document One",
"text": "Here are the contents of Document 1",
"random_key": "here is some random data",
})
.into(),
serde_json::json!({
"id": "document_two",
"title": "Document Two",
"text": "Here are the contents of Document 2",
"random_key": "here is some random data",
})
.into(),
];
collection.upsert_documents(documents, None).await?;
content_copy
char * documents[2] = {
"{\"id\": \"document_one\", \"title\": \"Document One\", \"text\": \"Here are the contents of Document 1\", \"random_key\": \"here is some random data\"}",
"{\"id\": \"document_two\", \"title\": \"Document Two\", \"text\": \"Here are the contents of Document 2\", \"random_key\": \"here is some random data\"}"
};
korvus_collectionc_upsert_documents(collection, documents, 2, NULL);
content_copy
const documents = [
{
id: "document_one",
title: "Document One New Title",
text: "Here is some new text for document one",
random_key: "here is some new random data",
},
{
id: "document_two",
title: "Document Two New Title",
text: "Here is some new text for document two",
random_key: "here is some new random data",
},
];
await collection.upsert_documents(documents);
content_copy
documents = [
{
"id": "document_one",
"title": "Document One",
"text": "Here is some new text for document one",
"random_key": "here is some random data",
},
{
"id": "document_two",
"title": "Document Two",
"text": "Here is some new text for document two",
"random_key": "here is some random data",
},
]
await collection.upsert_documents(documents)
content_copy
let documents: Vec = vec![
serde_json::json!({
"id": "document_one",
"title": "Document One",
"text": "Here is some new text for document one",
"random_key": "here is some random data",
})
.into(),
serde_json::json!({
"id": "document_two",
"title": "Document Two",
"text": "Here is some new text for document two",
"random_key": "here is some random data",
})
.into(),
];
collection.upsert_documents(documents, None).await?;
content_copy
char * documents[2] = {
"{\"id\": \"document_one\", \"title\": \"Document One\", \"text\": \"Here is some new text for document one\", \"random_key\": \"here is some random data\"}",
"{\"id\": \"document_two\", \"title\": \"Document Two\", \"text\": \"Here is some new text for document two\", \"random_key\": \"here is some random data\"}"
};
korvus_collectionc_upsert_documents(collection, documents, 2, NULL);
content_copy
const documents = [
{
id: "document_one",
new_key: "this will be a new key in document one",
random_key: "this will replace old random_key"
},
{
id: "document_two",
new_key: "this will bew a new key in document two",
random_key: "this will replace old random_key"
},
];
await collection.upsert_documents(documents, {
merge: true
});
content_copy
documents = [
{
"id": "document_one",
"new_key": "this will be a new key in document one",
"random_key": "this will replace old random_key",
},
{
"id": "document_two",
"new_key": "this will be a new key in document two",
"random_key": "this will replace old random_key",
},
]
await collection.upsert_documents(documents, {"merge": True})
content_copy
let documents: Vec = vec![
serde_json::json!({
"id": "document_one",
"new_key": "this will be a new key in document one",
"random_key": "this will replace old random_key"
})
.into(),
serde_json::json!({
"id": "document_two",
"new_key": "this will be a new key in document two",
"random_key": "this will replace old random_key"
})
.into(),
];
collection
.upsert_documents(documents, Some(serde_json::json!({"merge": true}).into()))
.await?;
content_copy
char * documents[2] = {
"{\"id\": \"document_one\", \"new_key\": \"this will be a new key in document one\", \"random_key\": \"this will replace old random_key\"}",
"{\"id\": \"document_two\", \"new_key\": \"this will be a new key in document two\", \"random_key\": \"this will replace old random_key\"}"
};
korvus_collectionc_upsert_documents(collection, documents, 2, "{\"merge\": true}");
content_copy
const documents = await collection.get_documents({limit: 100 })
content_copy
documents = await collection.get_documents({ "limit": 100 })
content_copy
let documents = collection
.get_documents(Some(serde_json::json!({"limit": 100}).into()))
.await?;
content_copy
unsigned long r_size = 0;
char** documents = korvus_collectionc_get_documents(collection, "{\"limit\": 100}", &r_size);
The SDK supports limit-offset pagination and keyset pagination.
content_copy
const documents = await collection.get_documents({ limit: 100, offset: 10 })
content_copy
documents = await collection.get_documents({ "limit": 100, "offset": 10 })
content_copy
let documents = collection
.get_documents(Some(serde_json::json!({"limit": 100, "offset": 10}).into()))
.await?;
content_copy
unsigned long r_size = 0;
char** documents = korvus_collectionc_get_documents(collection, "{\"limit\": 100, \"offset\": 10}", &r_size);
content_copy
const documents = await collection.get_documents({ limit: 100, last_row_id: 10 })
content_copy
documents = await collection.get_documents({ "limit": 100, "last_row_id": 10 })
content_copy
let documents = collection
.get_documents(Some(serde_json::json!({"limit": 100, "last_row_id": 10}).into()))
.await?;
content_copy
unsigned long r_size = 0;
char** documents = korvus_collectionc_get_documents(collection, "{\"limit\": 100, \"last_row_id\": 10}", &r_size);
content_copy
const documents = await collection.get_documents({
limit: 10,
filter: {
id: {
$eq: "document_one"
}
}
})
content_copy
documents = await collection.get_documents(
{
"limit": 100,
"filter": {
"id": {"$eq": "document_one"},
},
}
)
content_copy
let documents = collection
.get_documents(Some(
serde_json::json!({
"limit": 100,
"filter": {
"id": {"$eq": "document_one"},
}
})
.into(),
))
.await?;
content_copy
unsigned long r_size = 0;
char** documents = korvus_collectionc_get_documents(collection, "{\"limit\": 100, \"filter\": {\"id\": {\"$eq\": \"document_one\"}}}", &r_size);
Documents can be sorted on any key. Note that this does not currently work well with Keyset based pagination. If paginating and sorting, use Limit-Offset based pagination.
content_copy
const documents = await collection.get_documents({
limit: 100,
offset: 10,
order_by: {
id: "desc"
}
})
content_copy
documents = await collection.get_documents({
"limit": 100,
"offset": 10,
"order_by": {
"id": "desc"
}
})
content_copy
let documents = collection
.get_documents(Some(
serde_json::json!({
"limit": 100,
"offset": 10,
"order_by": {
"id": "desc"
}
})
.into(),
))
.await?;
content_copy
unsigned long r_size = 0;
char** documents = korvus_collectionc_get_documents(collection, "{\"limit\": 100, \"offset\": 10, \"order_by\": {\"id\": \"desc\"}}", &r_size);
content_copy
const documents = await collection.delete_documents({
id: {
$eq: 1
}
})
content_copy
documents = await collection.delete_documents(
{
"id": {"$eq": 1},
}
)
content_copy
let documents = collection
.delete_documents(
serde_json::json!({
"id": {
"$eq": 1
}
})
.into(),
)
.await?;
content_copy
korvus_collectionc_delete_documents(collection, "{\"id\": { \"$eq\": 1}}");