11767c5feSopenharmony_ci// Copyright (C) 2011 The Libphonenumber Authors
21767c5feSopenharmony_ci//
31767c5feSopenharmony_ci// Licensed under the Apache License, Version 2.0 (the "License");
41767c5feSopenharmony_ci// you may not use this file except in compliance with the License.
51767c5feSopenharmony_ci// You may obtain a copy of the License at
61767c5feSopenharmony_ci//
71767c5feSopenharmony_ci// http://www.apache.org/licenses/LICENSE-2.0
81767c5feSopenharmony_ci//
91767c5feSopenharmony_ci// Unless required by applicable law or agreed to in writing, software
101767c5feSopenharmony_ci// distributed under the License is distributed on an "AS IS" BASIS,
111767c5feSopenharmony_ci// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
121767c5feSopenharmony_ci// See the License for the specific language governing permissions and
131767c5feSopenharmony_ci// limitations under the License.
141767c5feSopenharmony_ci
151767c5feSopenharmony_ci#include <string>
161767c5feSopenharmony_ci
171767c5feSopenharmony_ci#include "phonenumbers/utf/unicodetext.h"
181767c5feSopenharmony_ci
191767c5feSopenharmony_cinamespace i18n {
201767c5feSopenharmony_cinamespace phonenumbers {
211767c5feSopenharmony_ci
221767c5feSopenharmony_cistruct NormalizeUTF8 {
231767c5feSopenharmony_ci  // Put a UTF-8 string in ASCII digits: All decimal digits (Nd) replaced by
241767c5feSopenharmony_ci  // their ASCII counterparts; all other characters are copied from input to
251767c5feSopenharmony_ci  // output.
261767c5feSopenharmony_ci  static string NormalizeDecimalDigits(const string& number) {
271767c5feSopenharmony_ci    string normalized;
281767c5feSopenharmony_ci    UnicodeText number_as_unicode;
291767c5feSopenharmony_ci    number_as_unicode.PointToUTF8(number.data(), static_cast<int>(number.size()));
301767c5feSopenharmony_ci    if (!number_as_unicode.UTF8WasValid())
311767c5feSopenharmony_ci      return normalized; // Return an empty result to indicate an error
321767c5feSopenharmony_ci    for (UnicodeText::const_iterator it = number_as_unicode.begin();
331767c5feSopenharmony_ci         it != number_as_unicode.end();
341767c5feSopenharmony_ci         ++it) {
351767c5feSopenharmony_ci      int32_t digitValue = u_charDigitValue(*it);
361767c5feSopenharmony_ci      if (digitValue == -1) {
371767c5feSopenharmony_ci        // Not a decimal digit.
381767c5feSopenharmony_ci        char utf8[4];
391767c5feSopenharmony_ci        int len = it.get_utf8(utf8);
401767c5feSopenharmony_ci        normalized.append(utf8, len);
411767c5feSopenharmony_ci      } else {
421767c5feSopenharmony_ci        normalized.push_back('0' + digitValue);
431767c5feSopenharmony_ci      }
441767c5feSopenharmony_ci    }
451767c5feSopenharmony_ci    return normalized;
461767c5feSopenharmony_ci  }
471767c5feSopenharmony_ci};
481767c5feSopenharmony_ci
491767c5feSopenharmony_ci}  // namespace phonenumbers
501767c5feSopenharmony_ci}  // namespace i18n
51