// Copyright (c) 2011 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#ifndef BASE_UTF_OFFSET_STRING_CONVERSIONS_H_
#define BASE_UTF_OFFSET_STRING_CONVERSIONS_H_
#pragma once
#include <string>
#include <vector>
#include "base/base_api.h"
#include "base/string16.h"
// Forward declaration: this header only names base::StringPiece as a
// const-reference parameter type, so the full class definition is not
// required here.
namespace base {
class StringPiece;
}
// Like the conversions in utf_string_conversions.h, but these functions also
// take one or more offsets (|offset[s]_for_adjustment|) into the source
// string. Each offset is adjusted to point at the same logical place in the
// result string. If that isn't possible, because an offset points past the end
// of the source string or into the middle of a multibyte sequence, the
// offending offset is set to std::wstring::npos. |offset[s]_for_adjustment|
// may be NULL.
// UTF-8 -> wide, pointer-and-length form, single offset.
//   src, src_len           - the UTF-8 source (presumably |src_len| is a count
//                            of chars starting at |src| - confirm).
//   output                 - receives the wide result string.
//   offset_for_adjustment  - in/out offset into the source; may be NULL.
// NOTE(review): the meaning of the bool result is not stated in this header;
// presumably it reports whether the conversion succeeded - confirm against
// the implementation.
BASE_API bool UTF8ToWideAndAdjustOffset(const char* src,
size_t src_len,
std::wstring* output,
size_t* offset_for_adjustment);
// UTF-8 -> wide, pointer-and-length form, multiple offsets.
//   src, src_len            - the UTF-8 source (presumably |src_len| is a
//                             count of chars starting at |src| - confirm).
//   output                  - receives the wide result string.
//   offsets_for_adjustment  - in/out vector of offsets into the source; may be
//                             NULL.
// NOTE(review): the meaning of the bool result is not stated in this header;
// presumably it reports whether the conversion succeeded - confirm against
// the implementation.
BASE_API bool UTF8ToWideAndAdjustOffsets(
const char* src,
size_t src_len,
std::wstring* output,
std::vector<size_t>* offsets_for_adjustment);
// UTF-8 -> wide, StringPiece form, single offset. Returns a std::wstring
// (presumably the converted text - confirm) instead of writing through an
// output pointer. |offset_for_adjustment| is an in/out offset into |utf8| and
// may be NULL.
BASE_API std::wstring UTF8ToWideAndAdjustOffset(const base::StringPiece& utf8,
size_t* offset_for_adjustment);
// UTF-8 -> wide, StringPiece form, multiple offsets. Returns a std::wstring
// (presumably the converted text - confirm) instead of writing through an
// output pointer. |offsets_for_adjustment| is an in/out vector of offsets into
// |utf8| and may be NULL.
BASE_API std::wstring UTF8ToWideAndAdjustOffsets(
const base::StringPiece& utf8,
std::vector<size_t>* offsets_for_adjustment);
// UTF-16 -> wide, pointer-and-length form, single offset.
//   src, src_len           - the UTF-16 source (presumably |src_len| is a
//                            count of char16 units starting at |src| -
//                            confirm).
//   output                 - receives the wide result string.
//   offset_for_adjustment  - in/out offset into the source; may be NULL.
// NOTE(review): the meaning of the bool result is not stated in this header;
// presumably it reports whether the conversion succeeded - confirm against
// the implementation.
BASE_API bool UTF16ToWideAndAdjustOffset(const char16* src,
size_t src_len,
std::wstring* output,
size_t* offset_for_adjustment);
// UTF-16 -> wide, pointer-and-length form, multiple offsets.
//   src, src_len            - the UTF-16 source (presumably |src_len| is a
//                             count of char16 units starting at |src| -
//                             confirm).
//   output                  - receives the wide result string.
//   offsets_for_adjustment  - in/out vector of offsets into the source; may be
//                             NULL.
// NOTE(review): the meaning of the bool result is not stated in this header;
// presumably it reports whether the conversion succeeded - confirm against
// the implementation.
BASE_API bool UTF16ToWideAndAdjustOffsets(
const char16* src,
size_t src_len,
std::wstring* output,
std::vector<size_t>* offsets_for_adjustment);
// UTF-16 -> wide, string16 form, single offset. Returns a std::wstring
// (presumably the converted text - confirm) instead of writing through an
// output pointer. |offset_for_adjustment| is an in/out offset into |utf16| and
// may be NULL.
BASE_API std::wstring UTF16ToWideAndAdjustOffset(const string16& utf16,
size_t* offset_for_adjustment);
// UTF-16 -> wide, string16 form, multiple offsets. Returns a std::wstring
// (presumably the converted text - confirm) instead of writing through an
// output pointer. |offsets_for_adjustment| is an in/out vector of offsets into
// |utf16| and may be NULL.
BASE_API std::wstring UTF16ToWideAndAdjustOffsets(
const string16& utf16,
std::vector<size_t>* offsets_for_adjustment);
// Functor intended for use with std::for_each over a range of offsets. Every
// offset that is not strictly below |limit| is overwritten in place with
// T::npos; smaller offsets are left untouched. |T| is the string type whose
// npos constant serves as the "invalid offset" marker (e.g. std::wstring).
template <typename T>
struct LimitOffset {
  explicit LimitOffset(size_t limit) : limit_(limit) {}

  void operator()(size_t& offset) {
    // In-range offsets pass through unchanged.
    if (offset < limit_)
      return;
    offset = T::npos;
  }

  // Exclusive upper bound: the first offset value that is treated as invalid.
  size_t limit_;
};
// Adjustment function called by std::transform which will adjust any offset
// that occurs after one or more modified substrings. To use, create any
// number of AdjustOffset::Adjustments, drop them into a vector, then call
// std::transform with the transform function being something similar to
// AdjustOffset(adjustments). Each Adjustment gives the original |location|
// of the encoded section and the |old_length| and |new_length| of the section
// before and after decoding.
// NOTE(review): operator() below returns void and takes its offset by
// non-const reference, which fits std::for_each (in-place mutation) rather
// than std::transform - confirm the intended algorithm.
struct AdjustOffset {
// Helper structure which indicates where an encoded character occurred
// and how long that encoding was.
struct Adjustment {
// Constructor is defined out of line; presumably it stores the three
// arguments in the same-named members - confirm.
Adjustment(size_t location, size_t old_length, size_t new_length);
// Position of the encoded section in the original string.
size_t location;
// Length of the section before decoding.
size_t old_length;
// Length of the section after decoding.
size_t new_length;
};
// Collection type callers fill in and hand to the constructor.
typedef std::vector<Adjustment> Adjustments;
// Defined out of line. |adjustments| is taken by const reference.
explicit AdjustOffset(const Adjustments& adjustments);
// Defined out of line. Receives the offset by non-const reference, so the
// adjusted value is written back in place.
void operator()(size_t& offset);
// Held as a reference, not a copy. Presumably bound to the constructor
// argument, in which case that vector must outlive this functor - confirm.
const Adjustments& adjustments_;
};
#endif // BASE_UTF_OFFSET_STRING_CONVERSIONS_H_