Skip to content

Commit 976852e

Browse files
committed
Merge branch 'main' into jz/hf-tokenizer-special-token-handling
2 parents b93cd82 + c11169c commit 976852e

File tree

1 file changed

+0
-4
lines changed

1 file changed

+0
-4
lines changed

include/pytorch/tokenizers/bpe_tokenizer_base.h

-4
Original file line numberDiff line numberDiff line change
@@ -111,17 +111,13 @@ static Result<std::unique_ptr<IRegex>> build_special_token_regex(
   std::string special_pattern;
   const std::size_t count = special_token_map.size();
 
-  std::cout << "iterating" << std::endl;
   for (std::size_t i = 0; i < count; ++i) {
-    std::cout << "i: " << i << "/" << count << std::endl;
     const auto& [token, _] = special_token_map.getElement(i);
-    std::cout << "token: " << token << std::endl;
     if (!special_pattern.empty()) {
       special_pattern += "|";
     }
     special_pattern += re2::RE2::QuoteMeta(std::string(token));
   }
-  std::cout << "special pattern: " << special_pattern << std::endl;
 
   if (special_pattern.empty()) {
     return static_cast<std::unique_ptr<IRegex>>(nullptr);

0 commit comments

Comments
 (0)