1 // Copyright 2010-2018, Google Inc.
2 // All rights reserved.
3 //
4 // Redistribution and use in source and binary forms, with or without
5 // modification, are permitted provided that the following conditions are
6 // met:
7 //
8 //     * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer.
10 //     * Redistributions in binary form must reproduce the above
11 // copyright notice, this list of conditions and the following disclaimer
12 // in the documentation and/or other materials provided with the
13 // distribution.
14 //     * Neither the name of Google Inc. nor the names of its
15 // contributors may be used to endorse or promote products derived from
16 // this software without specific prior written permission.
17 //
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
21 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
22 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
23 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
24 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
28 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 
30 #ifndef MOZC_CONVERTER_SEGMENTER_H_
31 #define MOZC_CONVERTER_SEGMENTER_H_
32 
33 #include "base/port.h"
34 
35 namespace mozc {
36 
// Forward declarations. This header only names these types as const-reference
// parameters, so their complete definitions are not needed here.
37 class DataManagerInterface;
38 struct Node;
39 
// Segmenter exposes IsBoundary() predicates (over a pair of nodes or a pair
// of ids) and per-id prefix/suffix penalty lookups. Only declarations are
// visible in this header; the definitions live elsewhere.
//
// Every query method is const, and all data members are either const values
// or pointers to const data.
40 class Segmenter {
41  public:
     // Factory: builds a Segmenter from |data_manager| and returns it as a raw
     // pointer.
     // NOTE(review): ownership of the returned object is not stated in this
     // header -- presumably the caller owns it; confirm against the definition.
42   static Segmenter *CreateFromDataManager(
43       const DataManagerInterface &data_manager);
44 
45   // This class does not take the ownership of pointer parameters.
     // The arguments correspond one-to-one, by name, to the private members
     // declared below.
     // NOTE(review): presumably |l_num_elements| / |r_num_elements| are the
     // entry counts of |l_table| / |r_table|, and |bitarray_num_bytes| is the
     // byte length of |bitarray_data| -- confirm against the definition.
     // Since the pointers are not owned, the pointed-to buffers presumably must
     // outlive this object -- confirm how the definition uses them.
46   Segmenter(size_t l_num_elements, size_t r_num_elements,
47             const uint16 *l_table, const uint16 *r_table,
48             size_t bitarray_num_bytes, const char *bitarray_data,
49             const uint16 *boundary_data);
50   ~Segmenter();
51 
     // Boundary predicate for the pair (|lnode|, |rnode|).
     // NOTE(review): the exact effect of |is_single_segment| is not visible in
     // this header; see the definition.
52   bool IsBoundary(const Node &lnode, const Node &rnode,
53                   bool is_single_segment) const;
     // Boundary predicate on raw ids. Note the parameter order: |rid| comes
     // first, then |lid|.
     // NOTE(review): presumably |rid| is the right-side id of the left node and
     // |lid| the left-side id of the right node -- confirm against the
     // definition.
54   bool IsBoundary(uint16 rid, uint16 lid) const;
     // Penalty lookups keyed by id; both return a signed 32-bit value.
     // NOTE(review): presumably backed by |boundary_data_| -- confirm.
55   int32 GetPrefixPenalty(uint16 lid) const;
56   int32 GetSuffixPenalty(uint16 rid) const;
57 
58  private:
     // Mirrors of the constructor arguments. The pointers are non-owning (see
     // the constructor comment). Do not reorder these declarations without
     // checking the constructor definition: C++ initializes members in
     // declaration order.
59   const size_t l_num_elements_;
60   const size_t r_num_elements_;
61   const uint16 *l_table_;
62   const uint16 *r_table_;
63   const size_t bitarray_num_bytes_;
64   const char *bitarray_data_;
65   const uint16 *boundary_data_;
66 
     // Macro defined outside this file (base/port.h is the only include here);
     // by its name it presumably disables the copy constructor and copy
     // assignment for Segmenter.
67   DISALLOW_COPY_AND_ASSIGN(Segmenter);
68 };
69 
70 }  // namespace mozc
71 
72 #endif  // MOZC_CONVERTER_SEGMENTER_H_
73