tesseract  4.00.00dev
UNICHARMAP Class Reference

#include <unicharmap.h>

Public Member Functions

 UNICHARMAP ()
 
 ~UNICHARMAP ()
 
void insert (const char *const unichar_repr, UNICHAR_ID id)
 
UNICHAR_ID unichar_to_id (const char *const unichar_repr) const
 
UNICHAR_ID unichar_to_id (const char *const unichar_repr, int length) const
 
bool contains (const char *const unichar_repr) const
 
bool contains (const char *const unichar_repr, int length) const
 
int minmatch (const char *const unichar_repr) const
 
void clear ()
 

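Detailed Description

UNICHARMAP maps the string representation of a unichar to its UNICHAR_ID. As the listings below show, the map is stored as a byte-indexed trie: each level is an array of 256 UNICHARMAP_NODE entries, indexed by the next byte of the string, and each entry holds an id and a pointer to its children.

Definition at line 27 of file unicharmap.h.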

Constructor & Destructor Documentation

◆ UNICHARMAP()

UNICHARMAP::UNICHARMAP ( )

Definition at line 25 of file unicharmap.cpp.

25  :
26 nodes(0) {
27 }

◆ ~UNICHARMAP()

UNICHARMAP::~UNICHARMAP ( )

Definition at line 29 of file unicharmap.cpp.

29  {
30  if (nodes != 0)
31  delete[] nodes;
32 }

Member Function Documentation

◆ clear()

void UNICHARMAP::clear ( )

Definition at line 154 of file unicharmap.cpp.

154  {
155  if (nodes != 0)
156  {
157  delete[] nodes;
158  nodes = 0;
159  }
160 }

◆ contains() [1/2]

bool UNICHARMAP::contains ( const char *const  unichar_repr) const

Definition at line 101 of file unicharmap.cpp.

101  {
102  if (unichar_repr == NULL || *unichar_repr == '\0') return false;
103 
104  const char* current_char = unichar_repr;
105  UNICHARMAP_NODE* current_nodes = nodes;
106 
107  while (current_nodes != 0 && *(current_char + 1) != '\0') {
108  current_nodes =
109  current_nodes[static_cast<unsigned char>(*current_char)].children;
110  ++current_char;
111  }
112  return current_nodes != 0 && *(current_char + 1) == '\0' &&
113  current_nodes[static_cast<unsigned char>(*current_char)].id >= 0;
114 }

◆ contains() [2/2]

bool UNICHARMAP::contains ( const char *const  unichar_repr,
int  length 
) const

Definition at line 120 of file unicharmap.cpp.

121  {
122  if (unichar_repr == NULL || *unichar_repr == '\0') return false;
123  if (length <= 0 || length > UNICHAR_LEN) return false;
124 
125  const char* current_char = unichar_repr;
126  UNICHARMAP_NODE* current_nodes = nodes;
127 
128  while (current_nodes != 0 && (length > 1 && *(current_char + 1) != '\0')) {
129  current_nodes =
130  current_nodes[static_cast<unsigned char>(*current_char)].children;
131  --length;
132  ++current_char;
133  }
134  return current_nodes != 0 && (length == 1 || *(current_char + 1) == '\0') &&
135  current_nodes[static_cast<unsigned char>(*current_char)].id >= 0;
136 }
References UNICHAR_LEN (macro defined at unichar.h:30).

◆ insert()

void UNICHARMAP::insert ( const char *const  unichar_repr,
UNICHAR_ID  id 
)

Definition at line 76 of file unicharmap.cpp.

76  {
77  const char* current_char = unichar_repr;
78  UNICHARMAP_NODE** current_nodes_pointer = &nodes;
79 
80  assert(*unichar_repr != '\0');
81  assert(id >= 0);
82 
83  do {
84  if (*current_nodes_pointer == 0)
85  *current_nodes_pointer = new UNICHARMAP_NODE[256];
86  if (*(current_char + 1) == '\0') {
87  (*current_nodes_pointer)
88  [static_cast<unsigned char>(*current_char)].id = id;
89  return;
90  }
91  current_nodes_pointer =
92  &((*current_nodes_pointer)
93  [static_cast<unsigned char>(*current_char)].children);
94  ++current_char;
95  } while (true);
96 }

◆ minmatch()

int UNICHARMAP::minmatch ( const char *const  unichar_repr) const

Definition at line 140 of file unicharmap.cpp.

140  {
141  const char* current_char = unichar_repr;
142  UNICHARMAP_NODE* current_nodes = nodes;
143 
144  while (current_nodes != NULL && *current_char != '\0') {
145  if (current_nodes[static_cast<unsigned char>(*current_char)].id >= 0)
146  return current_char + 1 - unichar_repr;
147  current_nodes =
148  current_nodes[static_cast<unsigned char>(*current_char)].children;
149  ++current_char;
150  }
151  return 0;
152 }

◆ unichar_to_id() [1/2]

UNICHAR_ID UNICHARMAP::unichar_to_id ( const char *const  unichar_repr) const

Definition at line 36 of file unicharmap.cpp.

36  {
37  const char* current_char = unichar_repr;
38  UNICHARMAP_NODE* current_nodes = nodes;
39 
40  assert(*unichar_repr != '\0');
41 
42  do {
43  if (*(current_char + 1) == '\0')
44  return current_nodes[static_cast<unsigned char>(*current_char)].id;
45  current_nodes =
46  current_nodes[static_cast<unsigned char>(*current_char)].children;
47  ++current_char;
48  } while (true);
49 }

◆ unichar_to_id() [2/2]

UNICHAR_ID UNICHARMAP::unichar_to_id ( const char *const  unichar_repr,
int  length 
) const

Definition at line 54 of file unicharmap.cpp.

55  {
56  const char* current_char = unichar_repr;
57  UNICHARMAP_NODE* current_nodes = nodes;
58 
59  assert(*unichar_repr != '\0');
60  assert(length > 0 && length <= UNICHAR_LEN);
61 
62  do {
63  if (length == 1 || *(current_char + 1) == '\0')
64  return current_nodes[static_cast<unsigned char>(*current_char)].id;
65  current_nodes =
66  current_nodes[static_cast<unsigned char>(*current_char)].children;
67  ++current_char;
68  --length;
69  } while (true);
70 }
References UNICHAR_LEN (macro defined at unichar.h:30).

The documentation for this class was generated from the following files: