cognee.datasets
Static class for managing datasets and their data.
Methods
datasets.list_datasets()
await cognee.datasets.list_datasets(user=None)
Returns a list of all datasets accessible to the user.
datasets.list_data()
await cognee.datasets.list_data(dataset_id, user=None)
Returns all data items in a dataset.
datasets.has_data()
await cognee.datasets.has_data(dataset_id, user=None) -> bool
Check whether a dataset contains any data.
datasets.get_status()
await cognee.datasets.get_status(dataset_ids) -> dict
Get the pipeline processing status for one or more datasets.
datasets.delete_data()
await cognee.datasets.delete_data(
    dataset_id,
    data_id,
    user=None,
    mode="soft",
    delete_dataset_if_empty=False,
)
Delete a specific data item from a dataset.
data_id: UUID of the data item to delete.
mode: Deletion mode. "soft" marks the item as deleted; "hard" removes it permanently.
delete_dataset_if_empty: If True, delete the dataset itself when the last item is removed.
datasets.empty_dataset()
await cognee.datasets.empty_dataset(dataset_id, user=None)
Remove all data from a dataset without deleting the dataset itself.
datasets.delete_all()
await cognee.datasets.delete_all(user=None)
Delete all datasets the user has permission to delete.
datasets.discover_datasets()
cognee.datasets.discover_datasets(directory_path)
Discover datasets from files in a local directory.
Examples
import cognee
# List all datasets
datasets = await cognee.datasets.list_datasets()
for ds in datasets:
    print(ds.name, ds.id)
# Check dataset contents
data = await cognee.datasets.list_data(dataset_id=ds.id)
# Delete a specific item (here the first one returned; assumes the dataset is not empty)
item = data[0]
await cognee.datasets.delete_data(
    dataset_id=ds.id,
    data_id=item.id,
)
# Wipe everything
await cognee.datasets.delete_all()