blob: dfde5bc4683cfbb26e4a2589553daced0c2e9983 [file] [log] [blame]
// Copyright 2010-2015, Google Inc.
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
// * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
// * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
// * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
// This module provides utilities similar to those in base/number_util.h.
// However, this module is separated from it because of the dependency on
// rewriter/counter_suffix.h.
#ifndef MOZC_REWRITER_NUMBER_COMPOUND_UTIL_H_
#define MOZC_REWRITER_NUMBER_COMPOUND_UTIL_H_
#include "base/port.h"
#include "base/string_piece.h"
#include "converter/segments.h"
namespace mozc {
class POSMatcher;
struct CounterSuffixEntry;
namespace number_compound_util {
enum NumberScriptType {
NONE = 0,
HALFWIDTH_ARABIC = 1,
FULLWIDTH_ARABIC = 2,
KANJI = 4,
OLD_KANJI = 8,
};
// Splits a string to number and counter suffix if possible. For example, input
// "一階" can be splitted as "一" + "階". At the same time, script type of
// number can be obtained. A sorted array of counter suffix needs to be
// provided, which can be obtained using data manager; see
// data_manager/data_manager_interface.h. Returns false if the input cannot be
// splitted.
bool SplitStringIntoNumberAndCounterSuffix(
const CounterSuffixEntry *suffix_array, size_t suffix_array_size,
StringPiece input, StringPiece *number, StringPiece *counter_suffix,
uint32 *script_type);
// Checks if the given candidate is number, where candidate is considered as a
// number when satisfying one of the following conditions:
// 1) lid is number
// 2) lid is Kanji number
// 3) lid is general nound and content value consists of number and counter
// suffix, where counter suffix needs to be provided as a sorted array.
bool IsNumber(const CounterSuffixEntry *suffix_array, size_t suffix_array_size,
const POSMatcher &pos_matcher, const Segment::Candidate &cand);
} // namespace number_compound_util
} // namespace mozc
#endif // MOZC_REWRITER_NUMBER_COMPOUND_UTIL_H_