1ffc6060e6e974f1c229ddbf5581e0d4 *DESCRIPTION
9c4fad8a3a8ec6d6f2d6b4f1c4eb787b *NAMESPACE
c60e759160729ee9f5d8dbc797eb71a5 *NEWS.md
f296dadd33814fc95efbfaa1a83e76b1 *R/imports.R
22e6f9cc246641b20ac98278632a9373 *R/tokenization.R
b34a0e56a3e0625aabc26224909ff4ae *R/utils.R
7650998252eadd58bb4d4936e133112d *R/vocab.R
fbae0ea57cb1f4bf061f6b7f682cf206 *R/zzz.R
13760bb286f9bc4188bffc0f7a6e8a0e *README.md
5c3145f3e88e5192b7ba83b39bdec8ab *build/vignette.rds
a28bc78066f23f68932a739e90d442b7 *inst/doc/basic_usage.R
19e0e2cf2c893330a0783a40902eae9f *inst/doc/basic_usage.Rmd
e156480a69c4cbd6e43cb59ebae772b4 *inst/doc/basic_usage.html
430fba0e5c551d011e52bb7b0c2e6169 *inst/extdata/tiny_vocab.txt
e462bfed1f0f2ef10d1958fb0ffa604c *inst/extdata/tiny_vocab_cased.txt
0d1625272743a9918b1139dcce5aa4cf *man/dot-get_casedness.Rd
4c7fcc25442880b24e2ff1d27b09fd29 *man/dot-infer_case_from_vocab.Rd
a381b3ef6572cb08697c5648f7196c7f *man/dot-new_wordpiece_vocabulary.Rd
3b2f5300e6ee0a4d9669c485d579f2d8 *man/dot-process_vocab.Rd
e125b6d3ca3c2c624a4719de5e36b58c *man/dot-process_wp_vocab.Rd
1789deca52c38325fa2380c25c722a16 *man/dot-validate_wordpiece_vocabulary.Rd
5755adf723dfa9e84a1350a14a3fd5be *man/dot-wp_tokenize_single_string.Rd
cfae724eb06be4497c25e00433d0c755 *man/dot-wp_tokenize_word.Rd
6c380ae136ca57c191478b85d4f6e421 *man/load_or_retrieve_vocab.Rd
97e09cf31d032370c22bbe981b3da487 *man/load_vocab.Rd
0c3b85f72c305a2939e2a21a98d57ac5 *man/prepare_vocab.Rd
a9b817175255f39299e621ceb86f4cd0 *man/reexports.Rd
e5ddb761edf423c9afe21e414617ada4 *man/set_wordpiece_cache_dir.Rd
3ea58b479bcf09689da4db40c208fa59 *man/wordpiece_cache_dir.Rd
b6619092e936e30ecb2d2b6419884e25 *man/wordpiece_tokenize.Rd
a252975f543a8b8195a0dfdba6e2b654 *tests/testthat.R
57c48340410a21f9da4b019ab6973a55 *tests/testthat/_snaps/vocab.md
d85eef27c5081920c65fa2875bdf76cb *tests/testthat/badvocab_dupes.txt
de32b3f658e3dce3ba6028abb50304fa *tests/testthat/badvocab_spaces.txt
d41d8cd98f00b204e9800998ecf8427e *tests/testthat/empty_vocab.txt
c40f96f3a616dab467b8c859f7b1d683 *tests/testthat/test-tokenization.R
30a9a92f655dd95adf38f4264cbb28d6 *tests/testthat/test-vocab.R
2c4fe769c687a30f59b65e5f5f12a230 *tests/testthat/vocab.txt
19e0e2cf2c893330a0783a40902eae9f *vignettes/basic_usage.Rmd
