// Copyright (c) 2011 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #ifndef BASE_UTF_OFFSET_STRING_CONVERSIONS_H_ #define BASE_UTF_OFFSET_STRING_CONVERSIONS_H_ #pragma once #include <string> #include <vector> #include "base/base_api.h" #include "base/string16.h" namespace base { class StringPiece; } // Like the conversions in utf_string_conversions.h, but also takes one or more // offsets (|offset[s]_for_adjustment|) into the source strings, each offset // will be adjusted to point at the same logical place in the result strings. // If this isn't possible because an offset points past the end of the source // strings or into the middle of a multibyte sequence, the offending offset will // be set to std::wstring::npos. |offset[s]_for_adjustment| may be NULL. BASE_API bool UTF8ToWideAndAdjustOffset(const char* src, size_t src_len, std::wstring* output, size_t* offset_for_adjustment); BASE_API bool UTF8ToWideAndAdjustOffsets( const char* src, size_t src_len, std::wstring* output, std::vector<size_t>* offsets_for_adjustment); BASE_API std::wstring UTF8ToWideAndAdjustOffset(const base::StringPiece& utf8, size_t* offset_for_adjustment); BASE_API std::wstring UTF8ToWideAndAdjustOffsets( const base::StringPiece& utf8, std::vector<size_t>* offsets_for_adjustment); BASE_API bool UTF16ToWideAndAdjustOffset(const char16* src, size_t src_len, std::wstring* output, size_t* offset_for_adjustment); BASE_API bool UTF16ToWideAndAdjustOffsets( const char16* src, size_t src_len, std::wstring* output, std::vector<size_t>* offsets_for_adjustment); BASE_API std::wstring UTF16ToWideAndAdjustOffset(const string16& utf16, size_t* offset_for_adjustment); BASE_API std::wstring UTF16ToWideAndAdjustOffsets( const string16& utf16, std::vector<size_t>* offsets_for_adjustment); // Limiting function callable by std::for_each which will replace any value // which is equal to or greater than |limit| with npos. template <typename T> struct LimitOffset { explicit LimitOffset(size_t limit) : limit_(limit) {} void operator()(size_t& offset) { if (offset >= limit_) offset = T::npos; } size_t limit_; }; // Adjustment function called by std::transform which will adjust any offset // that occurs after one or more modified substrings. To use, create any // number of AdjustOffset::Adjustments, drop them into a vector, then call // std::transform with the transform function being something similar to // AdjustOffset(adjustments). Each Adjustment gives the original |location| // of the encoded section and the |old_length| and |new_length| of the section // before and after decoding. struct AdjustOffset { // Helper structure which indicates where an encoded character occurred // and how long that encoding was. struct Adjustment { Adjustment(size_t location, size_t old_length, size_t new_length); size_t location; size_t old_length; size_t new_length; }; typedef std::vector<Adjustment> Adjustments; explicit AdjustOffset(const Adjustments& adjustments); void operator()(size_t& offset); const Adjustments& adjustments_; }; #endif // BASE_UTF_OFFSET_STRING_CONVERSIONS_H_