# file: /Users/mfwolffe/GithubOrgs/tenseleyFlow/DocumentLanguageModel/src/dlm/train/cpt/vocab_gap.py
# hypothesis_version: 6.152.1

[0.0, '  top tokens:', '\\b\\w+\\b', 'input_ids', 'unk_token_id']