// blob: 62055df14faf27769fff2ff2798b8b6e14505753 [file] [log] [blame]
// Copyright 2010-2015, Google Inc.
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
// * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
// * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
// * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
#include "rewriter/normalization_rewriter.h"
#include <string>
#include "base/system_util.h"
#include "converter/conversion_request.h"
#include "converter/segments.h"
#include "testing/base/public/gunit.h"
DECLARE_string(test_tmpdir);
namespace mozc {
namespace {
void AddSegment(const string &key, const string &value,
Segments *segments) {
segments->Clear();
Segment *seg = segments->push_back_segment();
seg->set_key(key);
Segment::Candidate *candidate = seg->add_candidate();
candidate->Init();
candidate->value = value;
candidate->content_value = value;
}
} // namespace
// Fixture for the NormalizationRewriter tests. SetUp() passes
// FLAGS_test_tmpdir to SystemUtil::SetUserProfileDirectory() before each
// test body runs.
class NormalizationRewriterTest : public testing::Test {
 protected:
  NormalizationRewriterTest() {}
  virtual ~NormalizationRewriterTest() {}

  // Intentionally empty: the fixture has no per-test cleanup of its own.
  virtual void TearDown() {}

  virtual void SetUp() {
    SystemUtil::SetUserProfileDirectory(FLAGS_test_tmpdir);
  }
};
// Feeds single-candidate segments to NormalizationRewriter::Rewrite() and
// checks, for each case, both the boolean result and the candidate value
// left in the segment afterwards.
TEST_F(NormalizationRewriterTest, NormalizationTest) {
  // Fixture strings, spelled as UTF-8 byte escapes.
  const char kAsciiText[] = "test";
  // "きょうと"
  const char kKyotoKey[] =
      "\xE3\x81\x8D\xE3\x82\x87\xE3\x81\x86\xE3\x81\xA8";
  // "京都"
  const char kKyotoValue[] = "\xE4\xBA\xAC\xE9\x83\xBD";
  // "なみ"
  const char kNamiKey[] = "\xE3\x81\xAA\xE3\x81\xBF";
  // U+301C (wave dash)
  const char kWaveDash[] = "\xE3\x80\x9C";

  NormalizationRewriter rewriter;
  Segments segments;
  const ConversionRequest default_request;

  // Case 1: plain ASCII value. Expected: Rewrite() returns false and the
  // value is unchanged.
  segments.Clear();
  AddSegment(kAsciiText, kAsciiText, &segments);
  EXPECT_FALSE(rewriter.Rewrite(default_request, &segments));
  EXPECT_EQ(kAsciiText, segments.segment(0).candidate(0).value);

  // Case 2: kanji value. Expected: Rewrite() returns false and the value is
  // unchanged.
  segments.Clear();
  AddSegment(kKyotoKey, kKyotoValue, &segments);
  EXPECT_FALSE(rewriter.Rewrite(default_request, &segments));
  EXPECT_EQ(kKyotoValue, segments.segment(0).candidate(0).value);

  // Case 3: wave dash (U+301C). The expectation differs by platform.
  segments.Clear();
  AddSegment(kNamiKey, kWaveDash, &segments);
#ifdef OS_WIN
  // With OS_WIN defined, the candidate is expected to be rewritten to
  // U+FF5E.
  const char kFullwidthTilde[] = "\xEF\xBD\x9E";
  EXPECT_TRUE(rewriter.Rewrite(default_request, &segments));
  EXPECT_EQ(kFullwidthTilde, segments.segment(0).candidate(0).value);
#else
  // Without OS_WIN, U+301C is expected to be kept as is.
  EXPECT_FALSE(rewriter.Rewrite(default_request, &segments));
  EXPECT_EQ(kWaveDash, segments.segment(0).candidate(0).value);
#endif

  // Case 4: the same wave dash, but on a candidate flagged USER_DICTIONARY.
  // This expectation sits outside the #ifdef: Rewrite() must return false
  // and keep U+301C whether or not OS_WIN is defined.
  segments.Clear();
  AddSegment(kNamiKey, kWaveDash, &segments);
  Segment::Candidate *user_candidate =
      segments.mutable_segment(0)->mutable_candidate(0);
  user_candidate->attributes |= Segment::Candidate::USER_DICTIONARY;
  EXPECT_FALSE(rewriter.Rewrite(default_request, &segments));
  EXPECT_EQ(kWaveDash, segments.segment(0).candidate(0).value);
}
} // namespace mozc