LICENSE
README.md
README_PYPI.md
pyproject.toml
soak/__init__.py
soak/agreement.py
soak/agreement_scripts.py
soak/calibration.py
soak/cli.py
soak/document_utils.py
soak/error_handlers.py
soak/export_utils.py
soak/ground_truth_metrics.py
soak/helpers.py
soak/hyde.py
soak/specs.py
soak/template_resolution.py
soak/template_validator.py
soak/visualization.py
soak/analysis/__init__.py
soak/analysis/self_similarity.py
soak/calibration-data/README.md
soak/calibration-data/calibration_comparison.png
soak/calibration-data/distribution-gpt-4.1-mini.png
soak/calibration-data/distribution-gpt-5-mini.png
soak/calibration-data/distribution-gpt-5.2.png
soak/calibration-data/llm_ordinal_separation_summary.csv
soak/calibration-data/llm_paraphrase_comparison.png
soak/calibration-data/llm_paraphrase_metrics.csv
soak/calibration-data/llm_paraphrase_metrics.png
soak/calibration-data/model_comparison.png
soak/calibration-data/models.yaml
soak/calibration-data/paraphrase_models.yaml
soak/calibration-data/paraphrases-gpt-4.1-mini.csv
soak/calibration-data/paraphrases-gpt-5-mini.csv
soak/calibration-data/paraphrases-gpt-5.2.csv
soak/calibration-data/paraphrases.sd
soak/calibration-data/plot_centroid_spacing.png
soak/calibration-data/plot_overlap_heatmap.png
soak/calibration-data/plot_ridge_densities.png
soak/calibration-data/similarities-gpt-4.1-mini-bge-large.csv
soak/calibration-data/similarities-gpt-5-mini-bge-large.csv
soak/calibration-data/similarities-gpt-5.2-bge-large.csv
soak/calibration-data/similarities-gpt-5.2-openai-large.csv
soak/calibration-data/thematic_analysis_papers.csv
soak/calibration-data/models/BAAI-bge-large-en-v1.5/calibration.pkl
soak/calibration-data/models/BAAI-bge-large-en-v1.5/calibration.png
soak/calibration-data/models/BAAI-bge-large-en-v1.5/calibration.yaml
soak/calibration-data/models/BAAI-bge-large-en-v1.5/paraphrases.csv
soak/calibration-data/models/all-MiniLM-L6-v2/calibration.pkl
soak/calibration-data/models/all-MiniLM-L6-v2/calibration.png
soak/calibration-data/models/all-MiniLM-L6-v2/calibration.yaml
soak/calibration-data/models/all-MiniLM-L6-v2/paraphrases.csv
soak/calibration-data/models/all-mpnet-base-v2/calibration.pkl
soak/calibration-data/models/all-mpnet-base-v2/calibration.png
soak/calibration-data/models/all-mpnet-base-v2/calibration.yaml
soak/calibration-data/models/all-mpnet-base-v2/paraphrases.csv
soak/calibration-data/models/intfloat-e5-base-v2/calibration.pkl
soak/calibration-data/models/intfloat-e5-base-v2/calibration.png
soak/calibration-data/models/intfloat-e5-base-v2/calibration.yaml
soak/calibration-data/models/intfloat-e5-base-v2/paraphrases.csv
soak/calibration-data/models/text-embedding-3-large/calibration.pkl
soak/calibration-data/models/text-embedding-3-large/calibration.png
soak/calibration-data/models/text-embedding-3-large/calibration.yaml
soak/calibration-data/models/text-embedding-3-large/paraphrases.csv
soak/calibration-data/models/text-embedding-3-small/calibration.pkl
soak/calibration-data/models/text-embedding-3-small/calibration.png
soak/calibration-data/models/text-embedding-3-small/calibration.yaml
soak/calibration-data/models/text-embedding-3-small/paraphrases.csv
soak/calibration-data/models/thenlper-gte-base/calibration.pkl
soak/calibration-data/models/thenlper-gte-base/calibration.png
soak/calibration-data/models/thenlper-gte-base/calibration.yaml
soak/calibration-data/models/thenlper-gte-base/paraphrases.csv
soak/cli/__init__.py
soak/cli/_common.py
soak/cli/compare.py
soak/cli/coverage_cmd.py
soak/cli/export.py
soak/cli/misc.py
soak/cli/run.py
soak/cli/show.py
soak/comparators/__init__.py
soak/comparators/base.py
soak/comparators/baselines.py
soak/comparators/optimal_transport.py
soak/comparators/paraphrasing.py
soak/comparators/rescaling.py
soak/comparators/similarity_comparator.py
soak/comparators/utils.py
soak/comparators/visualizations.py
soak/coverage/__init__.py
soak/coverage/analyzer.py
soak/coverage/models.py
soak/exports/__init__.py
soak/exports/typst_export.py
soak/exports/visualizations.py
soak/exports/xlsx_export.py
soak/models/__init__.py
soak/models/alignment.py
soak/models/base.py
soak/models/context.py
soak/models/cost_tracker.py
soak/models/dag.py
soak/models/pipeline.py
soak/models/progress.py
soak/models/text_utils.py
soak/models/utils.py
soak/models/nodes/__init__.py
soak/models/nodes/base.py
soak/models/nodes/batch.py
soak/models/nodes/classifier.py
soak/models/nodes/cluster.py
soak/models/nodes/filter.py
soak/models/nodes/groupby.py
soak/models/nodes/map.py
soak/models/nodes/reduce.py
soak/models/nodes/scrub.py
soak/models/nodes/transform.py
soak/models/nodes/ungroup.py
soak/models/nodes/verify.py
soak/pipelines/check_quote_fair_use.sd
soak/pipelines/filter_chunks.sd
soak/pipelines/pre_extract_relevant.sd
soak/soak-data/annomi.csv
soak/soak-data/annomi_with_ctx_train.csv
soak/soak-data/cfsb.zip
soak/soak-data/constitution.txt
soak/soak-data/dream.txt
soak/soak-data/examplethemes.xlsx
soak/soak-data/interview_sample.txt
soak/soak-data/matthew-57.txt
soak/soak-data/pii.txt
soak/soak-data/test_data.csv
soak/soak-data/wheel.txt
soak/soak-data/cfs/README.txt
soak/soak-data/cfs/aGKbypa8fhI.txt
soak/soak-data/cfs/aOUUTEeIiS0.txt
soak/soak-data/cfs/aS8CQtc9DmA.txt
soak/soak-data/cfs/aTvSX_toNL4.txt
soak/soak-data/cfs/acWL9FBKr3o.txt
soak/soak-data/cfs/as7I55hY29k.txt
soak/soak-data/cfs/bRidO1PiZJs.txt
soak/soak-data/cfs/ba2LcetNybI.txt
soak/soak-data/cfsb/bRidO1PiZJs.txt
soak/soak-data/cfsb/ba2LcetNybI.txt
soak/templates/_alpine_components.html
soak/templates/_base_styles.html
soak/templates/_header.html
soak/templates/_offcanvas.html
soak/templates/_tabs.html
soak/templates/comparison.html
soak/templates/coverage.html
soak/templates/does_quote_exist.sd
soak/templates/hyde_quotes.sd
soak/templates/make_labels.sd
soak/templates/narrative.html
soak/templates/paraphrase_quote.sd
soak/templates/paraphrase_theme.sd
soak/templates/pipeline.html
soak/templates/short_label.sd
soak/templates/simple.html
soak/templates/summarise_quote_use.sd
soak/templates/verify_theme_quotes.sd
soak/templates/nodes/batch.html
soak/templates/nodes/classifier.html
soak/templates/nodes/cluster.html
soak/templates/nodes/default.html
soak/templates/nodes/filter.html
soak/templates/nodes/groupby.html
soak/templates/nodes/map.html
soak/templates/nodes/reduce.html
soak/templates/nodes/scrub.html
soak/templates/nodes/split.html
soak/templates/nodes/transform.html
soak/templates/nodes/transformreduce.html
soak/templates/nodes/ungroup.html
soak/templates/nodes/verifyquotes.html
soak/utils/__init__.py
soaking.egg-info/PKG-INFO
soaking.egg-info/SOURCES.txt
soaking.egg-info/dependency_links.txt
soaking.egg-info/entry_points.txt
soaking.egg-info/requires.txt
soaking.egg-info/top_level.txt
tests/test_agreement.py
tests/test_agreement_validation.py
tests/test_error_handling.py
tests/test_ground_truth.py
tests/test_integration_pipelines.py
tests/test_nodes.py
tests/test_overlap_exclusion.py
tests/test_spreadsheet_input.py
tests/test_template_resolution.py
tests/test_verify_comprehensive.py