LICENSE
README.md
pyproject.toml
requirements/requirements.txt
tests/test_deduplication.py
tests/test_sampling.py
tests/test_utils.py
vdc/__init__.py
vdc/py.typed
vdc/utils.py
vdc/version.py
vdc/conf/__init__.py
vdc/conf/config.json
vdc/conf/settings.py
vdc/deduplication/__init__.py
vdc/deduplication/dsu.py
vdc/deduplication/lsh.py
vdc/sampling/__init__.py
vdc/sampling/allocation.py
vdc/sampling/base_sampler.py
vdc/sampling/cluster.py
vdc/sampling/hierarchical_random_sampler.py
vdc/scripts/__init__.py
vdc/scripts/__main__.py
vdc/scripts/_content_filter.py
vdc/scripts/aesthetic_filter.py
vdc/scripts/apply_deduplication.py
vdc/scripts/apply_score_filter.py
vdc/scripts/build_lsh_index.py
vdc/scripts/convert_to_npy.py
vdc/scripts/deduplicate_images.py
vdc/scripts/filter_by_examples.py
vdc/scripts/hierarchical_kmeans_clustering.py
vdc/scripts/nsfw_filter.py
vdc/scripts/prune_missing_samples.py
vdc/scripts/sample_images.py
vdc/scripts/sanitize_images.py
vision_data_curation.egg-info/PKG-INFO
vision_data_curation.egg-info/SOURCES.txt
vision_data_curation.egg-info/dependency_links.txt
vision_data_curation.egg-info/requires.txt
vision_data_curation.egg-info/top_level.txt