blob: 4f4574e3f698a16b984c252c0bc8c38fc231804e [file] [log] [blame]
// Copyright 2022 Google LLC
//
// Use of this source code is governed by an MIT-style
// license that can be found in the LICENSE file or at
// https://opensource.org/licenses/MIT.
/* This is a wrapper for the Google range-sse.cc algorithm which checks whether a
* sequence of bytes is a valid UTF-8 sequence and finds the longest valid prefix of
* the UTF-8 sequence.
*
* The key difference is that it checks for as much ASCII symbols as possible
* and then falls back to the range-sse.cc algorithm. The changes to the
* algorithm are cosmetic, mostly to trick the clang compiler to produce optimal
* code.
*
* For API see the utf8_validity.h header.
*/
#include "utf8_validity.h"
#include <cstddef>
#include "absl/strings/string_view.h"
#include "utf8_range.h"
namespace utf8_range {
bool IsStructurallyValid(absl::string_view str) {
return utf8_range_IsValid(str.data(), str.size());
}
size_t SpanStructurallyValid(absl::string_view str) {
return utf8_range_ValidPrefix(str.data(), str.size());
}
} // namespace utf8_range