#ifdef UNSAFE_BUFFERS_BUILD
#pragma allow_unsafe_buffers
#endif
#include "components/language_detection/core/ngram_hash_ops_utils.h"
#include <cstring>
#include "third_party/utf/src/include/utf.h"
namespace language_detection {
// File-level string constants. Their values are not visible in this view.
// NOTE(review): judging by the names only, kPrefix/kSuffix look like markers
// placed around the tokenized input and kReplacementToken like a stand-in for
// tokens that get filtered out -- confirm against the body of Tokenize().
constexpr char kPrefix[] = …;
constexpr char kSuffix[] = …;
constexpr char kReplacementToken[] = …;
// Out-of-line definitions of TokenizedOutput's default constructor, destructor
// and copy constructor. All three are defaulted, so they perform the
// compiler-generated member-wise behaviour. The class itself is declared
// outside this file (presumably in ngram_hash_ops_utils.h -- confirm).
TokenizedOutput::TokenizedOutput() = default;
TokenizedOutput::~TokenizedOutput() = default;
TokenizedOutput::TokenizedOutput(const TokenizedOutput& rhs) = default;
// Produces a TokenizedOutput from a character buffer.
//
// NOTE(review): the body is not visible in this view; everything below beyond
// the parameter types and the return type is inferred from names and must be
// confirmed against the implementation.
//
// Parameters:
//   input_str - pointer to the input characters (read-only).
//   len       - unsigned size of the input; presumably the number of bytes
//               readable from `input_str` -- TODO confirm.
//   max_tokens - presumably an upper bound on the number of tokens in the
//               result -- TODO confirm whether any prefix/suffix markers
//               count towards it.
//   exclude_nonalphaspace_tokens - presumably, when true, tokens that are
//               neither alphabetic nor whitespace are dropped or replaced
//               -- TODO confirm which.
//
// Returns: a TokenizedOutput by value.
TokenizedOutput Tokenize(const char* input_str,
size_t len,
size_t max_tokens,
bool exclude_nonalphaspace_tokens) { … }
// Writes its result through `output_str`; nothing is returned.
//
// NOTE(review): the body is not visible in this view. From the name, this
// presumably stores a lowercased copy of the input in `*output_str`, treating
// the input as encoded Unicode text (UTF-8 is likely given the utf.h include)
// -- confirm, including whether `*output_str` is cleared first or appended to.
//
// Parameters:
//   input_str  - pointer to the input characters (read-only).
//   len        - size of the input; presumably a byte count -- TODO confirm.
//                NOTE(review): this is a signed `int`, whereas Tokenize()
//                takes its length as `size_t`; callers must take care with
//                negative or very large values.
//   output_str - destination string; presumably must be non-null -- TODO
//                confirm whether the body checks this.
void LowercaseUnicodeStr(const char* input_str,
int len,
std::string* output_str) { … }
}