blob: fbb387fdafdac757cac7903074257c837559ac09 [file] [log] [blame]
/*
* Copyright (C) 2008,2009 OMRON SOFTWARE Co., Ltd.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "nj_lib.h"
#include "nj_err.h"
#include "nj_ext.h"
#include "nj_dic.h"
#include "njd.h"
#define NODE_TERM(x) ((NJ_UINT8)(0x80 & (*(x))))
#define NODE_LEFT_EXIST(x) ((NJ_UINT8)(0x40 & (*(x))))
#define NODE_DATA_EXIST(x) ((NJ_UINT8)(0x20 & (*(x))))
#define NODE_IDX_EXIST(x) ((NJ_UINT8)(0x10 & (*(x))))
#define NODE_IDX_CNT(x) ((NJ_UINT8)((0x0f & (*(x))) + 2))
#define STEM_TERMINETER(x) ((NJ_UINT8)(0x80 & (*(x))))
#define STEM_NO_CONV_FLG(x) ((NJ_UINT8)(0x40 & (*(x))))
#define TERM_BIT (1)
#define INDEX_BIT (8)
#define APPEND_YOMI_FLG(h) ((NJ_UINT8)(0x80 & (*((h) + 0x1C))))
#define HINSI_NO_TOP_ADDR(h) ((NJ_UINT8*)((h) + NJ_INT32_READ((h) + 0x1D)))
#define FHINSI_NO_CNT(h) ((NJ_INT16)(NJ_INT16_READ((h) + 0x21)))
#define BHINSI_NO_CNT(h) ((NJ_INT16)(NJ_INT16_READ((h) + 0x23)))
#define HINSI_NO_BYTE(h) ((NJ_UINT8)(*((h) + 0x25)))
#define HINDO_NO_TOP_ADDR(h) ((NJ_UINT8*)((h) + NJ_INT32_READ((h) + 0x26)))
#define HINDO_NO_CNT(h) ((NJ_UINT8)(*((h) + 0x2A)))
#define STEM_AREA_TOP_ADDR(h) ((NJ_UINT8*)((h) + NJ_INT32_READ((h) + 0x2B)))
#define BIT_CANDIDATE_LEN(h) ((NJ_UINT8)(*((h) + 0x2F)))
#define BIT_FHINSI(h) ((NJ_UINT8)(*((h) + 0x30)))
#define BIT_BHINSI(h) ((NJ_UINT8)(*((h) + 0x31)))
#define BIT_HINDO_LEN(h) ((NJ_UINT8)(*((h) + 0x32)))
#define BIT_MUHENKAN_LEN(h) ((NJ_UINT8)(*((h) + 0x33)))
#define BIT_YOMI_LEN(h) ((NJ_UINT8)(*((h) + 0x35)))
#define YOMI_INDX_TOP_ADDR(h) ((NJ_UINT8*)((h) + NJ_INT32_READ((h) + 0x42)))
#define YOMI_INDX_CNT(h) ((NJ_INT16)(*((h) + 0x46)))
#define YOMI_INDX_SIZE(h) ((NJ_INT8)(*((h) + 0x47)))
#define NODE_AREA_TOP_ADDR(h) ((NJ_UINT8*)((h) + NJ_INT32_READ((h) + 0x48)))
#define BIT_NODE_AREA_DATA_LEN(h) ((NJ_UINT8)(*((h) + 0x4C)))
#define BIT_NODE_AREA_LEFT_LEN(h) ((NJ_UINT8)(*((h) + 0x4D)))
#define NODE_AREA_MID_ADDR(h) ((NJ_UINT32)(NJ_INT32_READ((h) + 0x4E)))
#define CAND_IDX_AREA_TOP_ADDR(h) ((NJ_UINT8*)((h) + NJ_INT32_READ((h) + 0x52)))
#define CAND_IDX_AREA_CNT(h) ((NJ_UINT32)(((NJ_INT32_READ((h) + 0x56)) >> 8) & 0x00FFFFFF))
#define CAND_IDX_AREA_SIZE(h) ((NJ_UINT8)(*((h) + 0x59)))
#define WORD_LEN(x) ((NJ_UINT16)(0x007F & (x)))
#define CURRENT_INFO_SET ((NJ_UINT8)(0x10))
#define COMP_DIC_FREQ_DIV 63
#define LOC_CURRENT_NO_ENTRY 0xffffffffU
typedef struct {
NJ_UINT16 stem_size;
NJ_UINT16 term;
NJ_UINT16 no_conv_flg;
NJ_HINDO hindo;
NJ_UINT16 hindo_jitu;
NJ_UINT16 candidate_size;
NJ_UINT16 yomi_size;
NJ_UINT16 fhinsi;
NJ_UINT16 bhinsi;
NJ_UINT16 fhinsi_jitu;
NJ_UINT16 bhinsi_jitu;
} STEM_DATA_SET;
static NJ_INT16 get_stem_next(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data);
static void get_stem_word(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data, STEM_DATA_SET *stem_set, NJ_UINT8 check);
static void get_stem_cand_data(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data, STEM_DATA_SET *stem_set);
static NJ_UINT16 get_stem_yomi_data(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data,STEM_DATA_SET *stem_set);
static NJ_UINT16 get_stem_yomi_size(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data, NJ_UINT16 yomi_size);
static NJ_UINT16 get_stem_yomi_string(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data, NJ_CHAR *yomi, NJ_UINT16 yomi_pos, NJ_UINT16 yomi_size, NJ_UINT16 size);
static NJ_INT16 search_node(NJ_SEARCH_CONDITION *condition, NJ_SEARCH_LOCATION_SET *loctset);
static NJ_INT16 bdic_search_data(NJ_SEARCH_CONDITION *condition, NJ_SEARCH_LOCATION_SET *loctset);
static NJ_INT16 bdic_search_fore_data(NJ_SEARCH_CONDITION *condition, NJ_SEARCH_LOCATION_SET *loctset);
static NJ_HINDO get_stem_hindo(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data);
static NJ_INT16 search_node2(NJ_SEARCH_CONDITION *condition, NJ_SEARCH_LOCATION_SET *loctset,
NJ_UINT16 hidx);
static NJ_INT16 bdic_search_fore_data2(NJ_SEARCH_CONDITION *condition,
NJ_SEARCH_LOCATION_SET *loctset, NJ_UINT16 hidx);
static NJ_INT16 search_yomi_node(NJ_UINT8 operation, NJ_UINT8 *node,
NJ_UINT8 *now, NJ_UINT16 idx_no,
NJ_CHAR *yomi, NJ_UINT16 yomilen,
NJ_UINT8 *root, NJ_UINT8 *node_mid,
NJ_UINT16 bit_left, NJ_UINT16 bit_data,
NJ_UINT8 *data_top,
NJ_INT16 ytbl_cnt, NJ_UINT16 y,
NJ_UINT8 *ytbl_top, NJ_CACHE_INFO *storebuf,
NJ_UINT8 **con_node, NJ_UINT32 *data_offset);
static NJ_INT16 get_node_bottom(NJ_CHAR *yomi, NJ_UINT8 *now, NJ_UINT8 *node_mid,
NJ_UINT8 *data_top, NJ_UINT16 bit_left,
NJ_UINT16 bit_data, NJ_UINT32 top,
NJ_DIC_HANDLE handle, NJ_UINT32 *ret_bottom);
static NJ_INT16 bdic_get_next_data(NJ_UINT8 *data_top, NJ_UINT8 *data_end,
NJ_SEARCH_LOCATION_SET *loctset,
NJ_SEARCH_CACHE *psrhCache, NJ_UINT16 abIdx);
static NJ_INT16 bdic_get_word_freq(NJ_UINT8 *data_top, NJ_SEARCH_LOCATION_SET *loctset,
NJ_SEARCH_CACHE *psrhCache, NJ_UINT16 abIdx);
static NJ_HINDO get_stem_hindo(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data)
{
NJ_UINT8 flg_bit;
NJ_UINT16 data;
NJ_UINT16 pos, j, bit_all;
flg_bit = BIT_MUHENKAN_LEN(hdl);
if (NJ_GET_DIC_FMT(hdl) != NJ_DIC_FMT_KANAKAN) {
flg_bit++;
}
if (BIT_HINDO_LEN(hdl)) {
bit_all = (NJ_UINT16)(TERM_BIT + flg_bit);
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(stem_data + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
return GET_BITFIELD_16(data, j, BIT_HINDO_LEN(hdl));
} else {
return 0;
}
}
static NJ_INT16 get_stem_next(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data)
{
NJ_UINT8 flg_bit;
NJ_UINT16 data;
NJ_UINT16 pos, j, bit_all;
NJ_UINT16 stem_size, cand_bit, yomi_bit;
NJ_UINT16 candidate_size, yomi_size;
flg_bit = BIT_MUHENKAN_LEN(hdl);
if (NJ_GET_DIC_FMT(hdl) != NJ_DIC_FMT_KANAKAN) {
flg_bit++;
}
bit_all = (NJ_UINT16)(TERM_BIT + flg_bit +
BIT_HINDO_LEN(hdl) +
BIT_FHINSI(hdl) +
BIT_BHINSI(hdl));
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(stem_data + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
cand_bit = BIT_CANDIDATE_LEN(hdl);
candidate_size = GET_BITFIELD_16(data, j, cand_bit);
bit_all += cand_bit;
if (APPEND_YOMI_FLG(hdl) && STEM_TERMINETER(stem_data)) {
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(stem_data + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
yomi_bit = BIT_YOMI_LEN(hdl);
yomi_size = GET_BITFIELD_16(data, j, yomi_bit);
bit_all += yomi_bit;
} else {
yomi_size = 0;
}
stem_size = GET_BIT_TO_BYTE(bit_all);
stem_size += candidate_size;
stem_size += yomi_size;
return stem_size;
}
static void get_stem_word(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data, STEM_DATA_SET *stem_set, NJ_UINT8 check)
{
NJ_UINT8 flg_bit;
NJ_UINT16 data;
NJ_UINT16 pos, j, bit_all = 0;
NJ_UINT16 bit;
NJ_UINT16 dpos = 0;
NJ_INT16 next;
NJ_UINT8 b;
NJ_UINT8 *wkc;
flg_bit = BIT_MUHENKAN_LEN(hdl);
if (NJ_GET_DIC_FMT(hdl) != NJ_DIC_FMT_KANAKAN) {
flg_bit++;
}
if (BIT_HINDO_LEN(hdl)) {
bit_all = (NJ_UINT16)(TERM_BIT + flg_bit);
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(stem_data + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
stem_set->hindo = GET_BITFIELD_16(data, j, BIT_HINDO_LEN(hdl));
} else {
stem_set->hindo = 0;
}
stem_set->hindo_jitu = (NJ_UINT16)(*(HINDO_NO_TOP_ADDR(hdl) + stem_set->hindo));
if (BIT_FHINSI(hdl)) {
bit_all = (NJ_UINT16)(TERM_BIT + flg_bit + BIT_HINDO_LEN(hdl));
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(stem_data + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
stem_set->fhinsi = GET_BITFIELD_16(data, j, BIT_FHINSI(hdl));
} else {
stem_set->fhinsi = 0;
}
b = HINSI_NO_BYTE(hdl);
wkc = (NJ_UINT8*)(HINSI_NO_TOP_ADDR(hdl) + (b * (NJ_UINT16)(stem_set->fhinsi)));
if (b == 2) {
stem_set->fhinsi_jitu = (NJ_UINT16)(NJ_INT16_READ(wkc));
} else {
stem_set->fhinsi_jitu = (NJ_UINT16)*wkc;
}
if (BIT_BHINSI(hdl)) {
bit_all = (NJ_UINT16)(TERM_BIT + flg_bit + BIT_HINDO_LEN(hdl) + BIT_FHINSI(hdl));
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(stem_data + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
stem_set->bhinsi = GET_BITFIELD_16(data, j, BIT_BHINSI(hdl));
} else {
stem_set->bhinsi = 0;
}
wkc = (NJ_UINT8*)(HINSI_NO_TOP_ADDR(hdl)
+ (b * (FHINSI_NO_CNT(hdl) + (NJ_UINT16)(stem_set->bhinsi))));
if (b == 2) {
stem_set->bhinsi_jitu = (NJ_UINT16)(NJ_INT16_READ(wkc));
} else {
stem_set->bhinsi_jitu = (NJ_UINT16)*wkc;
}
if (check != 1) {
bit_all = (NJ_UINT16)(TERM_BIT + flg_bit +
BIT_HINDO_LEN(hdl) +
BIT_FHINSI(hdl) +
BIT_BHINSI(hdl));
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(stem_data + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
bit = BIT_CANDIDATE_LEN(hdl);
stem_set->candidate_size = GET_BITFIELD_16(data, j, bit);
bit_all += bit;
}
if (check == 0) {
stem_set->yomi_size = 0;
if (APPEND_YOMI_FLG(hdl) && STEM_TERMINETER(stem_data)) {
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(stem_data + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
bit = BIT_YOMI_LEN(hdl);
stem_set->yomi_size = GET_BITFIELD_16(data, j, bit);
bit_all += bit;
dpos = GET_BIT_TO_BYTE(bit_all);
dpos += stem_set->candidate_size;
} else if (APPEND_YOMI_FLG(hdl)) {
while (!(STEM_TERMINETER(stem_data))) {
next = get_stem_next(hdl, stem_data);
stem_data += next;
}
dpos = get_stem_yomi_data(hdl, stem_data, stem_set);
}
if (stem_set->yomi_size) {
stem_set->yomi_size = get_stem_yomi_size(hdl, stem_data + dpos, stem_set->yomi_size);
}
}
}
static void get_stem_cand_data(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data, STEM_DATA_SET *stem_set)
{
NJ_UINT8 flg_bit;
NJ_UINT16 data;
NJ_UINT16 pos, j, bit_all;
NJ_UINT16 cand_bit, yomi_bit;
flg_bit = BIT_MUHENKAN_LEN(hdl);
if (NJ_GET_DIC_FMT(hdl) != NJ_DIC_FMT_KANAKAN) {
flg_bit++;
}
bit_all = (NJ_UINT16)(TERM_BIT + flg_bit +
BIT_HINDO_LEN(hdl) +
BIT_FHINSI(hdl) +
BIT_BHINSI(hdl));
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(stem_data + pos));
cand_bit = BIT_CANDIDATE_LEN(hdl);
j = (NJ_UINT16)(bit_all & 0x0007);
stem_set->candidate_size = GET_BITFIELD_16(data, j, cand_bit);
bit_all += cand_bit;
if (APPEND_YOMI_FLG(hdl) && STEM_TERMINETER(stem_data)) {
yomi_bit = BIT_YOMI_LEN(hdl);
bit_all += yomi_bit;
}
stem_set->stem_size = GET_BIT_TO_BYTE(bit_all);
}
static NJ_UINT16 get_stem_yomi_data(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data,STEM_DATA_SET *stem_set)
{
NJ_UINT16 flg_bit;
NJ_UINT16 data;
NJ_UINT16 cand_bit, yomi_bit;
NJ_UINT16 pos, j, bit_all;
NJ_UINT16 yomi_pos;
NJ_UINT16 candidate_size;
flg_bit = BIT_MUHENKAN_LEN(hdl);
if (NJ_GET_DIC_FMT(hdl) != NJ_DIC_FMT_KANAKAN) {
flg_bit++;
}
bit_all = (NJ_UINT16)(TERM_BIT + flg_bit + BIT_HINDO_LEN(hdl) +
BIT_FHINSI(hdl) + BIT_BHINSI(hdl));
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(stem_data + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
cand_bit = BIT_CANDIDATE_LEN(hdl);
candidate_size = GET_BITFIELD_16(data, j, cand_bit);
bit_all += cand_bit;
if (APPEND_YOMI_FLG(hdl) && STEM_TERMINETER(stem_data)) {
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(stem_data + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
yomi_bit = BIT_YOMI_LEN(hdl);
stem_set->yomi_size = GET_BITFIELD_16(data, j, yomi_bit);
bit_all += yomi_bit;
} else {
stem_set->yomi_size = 0;
}
yomi_pos = GET_BIT_TO_BYTE(bit_all);
yomi_pos += candidate_size;
return yomi_pos;
}
static NJ_UINT16 get_stem_yomi_size(NJ_DIC_HANDLE hdl, NJ_UINT8 *ydata, NJ_UINT16 yomi_size)
{
NJ_INT16 ytbl_cnt;
NJ_INT8 ysize;
NJ_UINT8 *ytbl_top;
NJ_UINT8 *ytbl;
NJ_UINT8 yidx;
NJ_UINT16 i;
NJ_UINT16 len;
ytbl_cnt = YOMI_INDX_CNT(hdl);
if (ytbl_cnt) {
ysize = YOMI_INDX_SIZE(hdl);
ytbl_top = YOMI_INDX_TOP_ADDR(hdl);
len = 0;
for (i = 0; i < yomi_size; i++) {
if (ysize == 2) {
yidx = *(ydata+i);
ytbl = ytbl_top + ((yidx-1) * ysize);
len += UTL_CHAR(ytbl);
} else {
len++;
}
}
return len * sizeof(NJ_CHAR);
} else {
return yomi_size;
}
}
static NJ_UINT16 get_stem_yomi_string(NJ_DIC_HANDLE hdl, NJ_UINT8 *stem_data, NJ_CHAR *yomi, NJ_UINT16 yomi_pos, NJ_UINT16 yomi_size, NJ_UINT16 size)
{
NJ_INT16 ytbl_cnt;
NJ_INT8 ysize;
NJ_UINT8 *ytbl_top, *ytbl;
NJ_UINT8 *ydata;
NJ_UINT8 yidx;
NJ_UINT16 i;
NJ_UINT16 copy_len;
NJ_UINT16 char_len;
ytbl_cnt = YOMI_INDX_CNT(hdl);
ysize = YOMI_INDX_SIZE(hdl);
ytbl_top = YOMI_INDX_TOP_ADDR(hdl);
ydata = stem_data + yomi_pos;
if (ytbl_cnt) {
copy_len = 0;
for (i = 0; i < yomi_size; i++) {
yidx = *(ydata + i);
ytbl = ytbl_top + ((yidx - 1) * ysize);
if (ysize == 2) {
char_len = UTL_CHAR(ytbl);
if (((copy_len + char_len + NJ_TERM_LEN) * sizeof(NJ_CHAR)) > size) {
return size;
}
while (char_len > 0) {
NJ_CHAR_COPY(yomi + copy_len, ytbl);
copy_len++;
char_len--;
ytbl += sizeof(NJ_CHAR);
}
} else {
if (((copy_len + 1 + NJ_TERM_LEN) * sizeof(NJ_CHAR)) > size) {
return size;
}
*(yomi + copy_len) = (NJ_CHAR)(*ytbl);
copy_len++;
}
}
} else {
if ((yomi_size + (NJ_TERM_LEN * sizeof(NJ_CHAR))) > size) {
return size;
}
nj_memcpy((NJ_UINT8*)yomi, ydata, yomi_size);
copy_len = yomi_size / sizeof(NJ_CHAR);
}
*(yomi + copy_len) = NJ_CHAR_NUL;
return copy_len;
}
static NJ_INT16 search_node(NJ_SEARCH_CONDITION *condition, NJ_SEARCH_LOCATION_SET *loctset)
{
NJ_UINT8 *root, *now, *node, *node_mid;
NJ_UINT8 index;
NJ_UINT8 *byomi;
NJ_UINT8 *wkc;
NJ_UINT8 idx_no;
NJ_INT16 idx;
NJ_INT16 char_size;
NJ_INT16 left, right, mid;
NJ_INT16 ytbl_cnt;
NJ_UINT16 c, d;
NJ_UINT8 c1 = 0, c2 = 0;
NJ_UINT16 y;
NJ_UINT16 ysize = (condition->ylen * sizeof(NJ_CHAR));
NJ_UINT8 *ytbl_top;
NJ_UINT16 idx_cnt;
NJ_UINT16 nd_index;
NJ_UINT16 bit_left, bit_data;
NJ_UINT32 data_offset;
NJ_UINT16 data;
NJ_UINT16 pos, j, bit_all, bit_tmp, bit_idx;
NJ_UINT32 data_l;
NJ_UINT8 restart_flg = 0;
NJ_UINT8 bottom_flg = 0;
NJ_UINT8 *data_top, *stem_data;
NJ_UINT16 hindo, hindo_max;
NJ_UINT32 current,hindo_max_data, bottom, next;
node = NULL;
byomi = (NJ_UINT8*)(condition->yomi);
root = NODE_AREA_TOP_ADDR(loctset->loct.handle);
node_mid = root + NODE_AREA_MID_ADDR(loctset->loct.handle);
now = node_mid;
idx_no = 0;
idx_cnt = 1;
bit_left = BIT_NODE_AREA_LEFT_LEN(loctset->loct.handle);
bit_data = BIT_NODE_AREA_DATA_LEN(loctset->loct.handle);
ytbl_cnt = YOMI_INDX_CNT(loctset->loct.handle);
y = YOMI_INDX_SIZE(loctset->loct.handle);
ytbl_top = YOMI_INDX_TOP_ADDR(loctset->loct.handle);
data_top = STEM_AREA_TOP_ADDR(loctset->loct.handle);
if ((condition->operation == NJ_CUR_OP_FORE) &&
NJ_CHAR_STRLEN_IS_0(condition->yomi)) {
ysize = 0;
node = root;
}
while (ysize > 0) {
if (ytbl_cnt != 0) {
char_size = UTL_CHAR(byomi) * sizeof(NJ_CHAR);
if (char_size > 2) {
loctset->loct.status = NJ_ST_SEARCH_END_EXT;
return 0;
}
if (char_size == 2) {
if (y == 1) {
return 0;
}
c1 = *byomi;
c2 = *(byomi + 1);
c = (NJ_UINT16)((c1 << 8) | c2);
} else {
c1 = *byomi;
c2 = 0x00;
c = (NJ_UINT16)(*byomi);
}
idx = -1;
left = 0;
right = ytbl_cnt;
if (y == 2) {
while (left <= right) {
mid = (left + right) >> 1;
wkc = ytbl_top + (mid << 1);
if (c1 == *wkc) {
if (c2 == *(wkc + 1)) {
idx = (NJ_UINT16)(mid + 1);
break;
}
if (c2 < *(wkc + 1)) {
right = mid - 1;
} else {
left = mid + 1;
}
} else if (c1 < *wkc) {
right = mid - 1;
} else {
left = mid + 1;
}
}
} else {
while (left <= right) {
mid = (left + right) >> 1;
wkc = ytbl_top + (mid * y);
d = (NJ_UINT16)(*wkc);
if (c == d) {
idx = (NJ_UINT16)(mid + 1);
break;
}
if (c < d) {
right = mid - 1;
} else {
left = mid + 1;
}
}
}
if (idx < 0) {
loctset->loct.status = NJ_ST_SEARCH_END_EXT;
return 0;
}
index = (NJ_UINT8)idx;
} else {
index = *byomi;
char_size = 1;
}
byomi += char_size;
ysize -= char_size;
while (now < data_top) {
if (NODE_IDX_EXIST(now)) {
bit_idx = 8;
idx_cnt = NODE_IDX_CNT(now);
} else {
bit_idx = 4;
idx_cnt = 1;
}
bit_all = bit_idx;
if (NODE_LEFT_EXIST(now)) {
bit_all += bit_left;
}
if (NODE_DATA_EXIST(now)) {
bit_all += bit_data;
}
bit_tmp = bit_all;
bit_all += (NJ_UINT16)(idx_no << 3);
pos = (NJ_UINT16)(bit_all >> 3);
data = (NJ_UINT16)(NJ_INT16_READ(now + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
nd_index = GET_BITFIELD_16(data, j, INDEX_BIT);
if (index == (NJ_UINT8)nd_index) {
break;
} else {
if ((!NODE_TERM(now)) && (index > (NJ_UINT8)nd_index) && (idx_no == 0)) {
now += GET_BIT_TO_BYTE(bit_tmp + (idx_cnt * 8));
if (now == node_mid) {
loctset->loct.status = NJ_ST_SEARCH_END_EXT;
return 0;
}
continue;
} else {
if ((now == node_mid) && (restart_flg == 0) &&
(index < (NJ_UINT8)nd_index) && (idx_no == 0) &&
(root != node_mid)) {
now = root;
idx_no = 0;
restart_flg = 1;
continue;
}
loctset->loct.status = NJ_ST_SEARCH_END_EXT;
return 0;
}
}
}
if ( (idx_cnt > (NJ_UINT16)(idx_no + 1))) {
if (ysize == 0) {
if (condition->operation == NJ_CUR_OP_FORE) {
node = now;
break;
}
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
idx_no++;
continue;
}
node = now;
idx_no = 0;
if (ysize == 0) {
break;
} else {
if (!(NODE_LEFT_EXIST(now))) {
loctset->loct.status = NJ_ST_SEARCH_END_EXT;
return 0;
}
}
if (NODE_IDX_EXIST(now)) {
bit_idx = 8;
} else {
bit_idx = 4;
}
pos = (NJ_UINT16)(bit_idx >> 3);
data_l = (NJ_UINT32)(NJ_INT32_READ(now + pos));
j = (NJ_UINT16)(bit_idx & 0x0007);
now += GET_BITFIELD_32(data_l, j, bit_left);
}
now = node;
if ((node == NULL) || !(NODE_DATA_EXIST(node))) {
if ((condition->operation == NJ_CUR_OP_FORE) &&
(node != NULL)) {
while (!NODE_DATA_EXIST(node)) {
if (!(NODE_LEFT_EXIST(node))) {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
if (NODE_IDX_EXIST(node)) {
bit_idx = 8;
} else {
bit_idx = 4;
}
pos = (NJ_UINT16)(bit_idx >> 3);
data_l = (NJ_UINT32)(NJ_INT32_READ(node + pos));
j = (NJ_UINT16)(bit_idx & 0x0007);
node += GET_BITFIELD_32(data_l, j, bit_left);
}
} else {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
}
if (NODE_IDX_EXIST(node)) {
bit_idx = 8;
} else {
bit_idx = 4;
}
if (NODE_LEFT_EXIST(node)) {
bit_all = bit_idx + bit_left;
} else {
bit_all = bit_idx;
}
pos = (NJ_UINT16)(bit_all >> 3);
data_l = (NJ_UINT32)(NJ_INT32_READ(node + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
data_offset = GET_BITFIELD_32(data_l, j, bit_data);
loctset->loct.top = data_offset;
loctset->loct.current = 0;
if (condition->operation == NJ_CUR_OP_FORE) {
bottom = loctset->loct.top;
if (NJ_CHAR_STRLEN_IS_0(condition->yomi)) {
node = node_mid;
} else {
node = now;
if (NODE_LEFT_EXIST(node)) {
if (NODE_IDX_EXIST(node)) {
bit_all = 8;
} else {
bit_all = 4;
}
pos = (NJ_UINT16)(bit_all >> 3);
data_l = (NJ_UINT32)(NJ_INT32_READ(node + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
node += GET_BITFIELD_32(data_l, j, bit_left);
} else {
bottom_flg = 1;
}
}
if (!bottom_flg) {
while (node < data_top) {
if (!NODE_TERM(node)) {
if (NODE_IDX_EXIST(node)) {
bit_all = 8;
idx_cnt = NODE_IDX_CNT(node);
} else {
bit_all = 4;
idx_cnt = 1;
}
if (NODE_LEFT_EXIST(node)) {
bit_all += bit_left;
}
if (NODE_DATA_EXIST(node)) {
bit_all += bit_data;
}
node += GET_BIT_TO_BYTE(bit_all + (idx_cnt * 8));
} else {
if (!NODE_LEFT_EXIST(node)) {
if (NODE_DATA_EXIST(node)) {
if (NODE_IDX_EXIST(node)) {
bit_all = 8;
} else {
bit_all = 4;
}
pos = (NJ_UINT16)(bit_all >> 3);
data_l = (NJ_UINT32)(NJ_INT32_READ(node + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
data_offset = GET_BITFIELD_32(data_l, j, bit_data);
bottom = data_offset;
break;
} else {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_SEARCH_WORD, NJ_ERR_DIC_BROKEN);
}
} else {
if (NODE_IDX_EXIST(node)) {
bit_all = 8;
} else {
bit_all = 4;
}
pos = (NJ_UINT16)(bit_all >> 3);
data_l = (NJ_UINT32)(NJ_INT32_READ(node + pos));
j = (NJ_UINT16)(bit_all & 0x0007);
node += GET_BITFIELD_32(data_l, j, bit_left);
}
}
}
}
stem_data = data_top + bottom;
while (!(STEM_TERMINETER(stem_data))) {
next = get_stem_next(loctset->loct.handle, stem_data);
stem_data += next;
}
loctset->loct.bottom = (NJ_UINT32)(stem_data - data_top);
stem_data = data_top + loctset->loct.top;
hindo = (NJ_UINT16) *((NJ_UINT8*)(HINDO_NO_TOP_ADDR(loctset->loct.handle)
+ get_stem_hindo(loctset->loct.handle, stem_data)));
hindo_max = hindo;
hindo_max_data = 0;
if (condition->mode == NJ_CUR_MODE_FREQ) {
j = get_stem_next(loctset->loct.handle, stem_data);
current = j;
stem_data += j;
while (stem_data <= (data_top + loctset->loct.bottom)) {
hindo = (NJ_UINT16) *((NJ_UINT8*)(HINDO_NO_TOP_ADDR(loctset->loct.handle)
+ get_stem_hindo(loctset->loct.handle, stem_data)));
if (hindo > hindo_max) {
hindo_max = hindo;
hindo_max_data = current;
}
j = get_stem_next(loctset->loct.handle, stem_data);
current += j;
stem_data += j;
}
}
loctset->cache_freq = CALCULATE_HINDO(hindo_max, loctset->dic_freq.base,
loctset->dic_freq.high, COMP_DIC_FREQ_DIV);
loctset->loct.current = hindo_max_data;
}
return 1;
}
static NJ_INT16 bdic_search_data(NJ_SEARCH_CONDITION *condition, NJ_SEARCH_LOCATION_SET *loctset)
{
NJ_UINT8 *data, *data_end;
NJ_INT16 i, current = 0;
NJ_UINT16 hindo;
data = STEM_AREA_TOP_ADDR(loctset->loct.handle);
data += loctset->loct.top + loctset->loct.current;
if (GET_LOCATION_STATUS(loctset->loct.status) != NJ_ST_SEARCH_NO_INIT) {
if (STEM_TERMINETER(data)) {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
i = get_stem_next(loctset->loct.handle, data);
data += i;
current += i;
}
if (NJ_GET_DIC_FMT(loctset->loct.handle) == NJ_DIC_FMT_KANAKAN) {
data_end = loctset->loct.handle
+ NJ_DIC_COMMON_HEADER_SIZE
+ NJ_INT32_READ(loctset->loct.handle + NJ_DIC_POS_DATA_SIZE)
+ NJ_INT32_READ(loctset->loct.handle + NJ_DIC_POS_EXT_SIZE)
- NJ_DIC_ID_LEN;
} else {
data_end = CAND_IDX_AREA_TOP_ADDR(loctset->loct.handle);
}
if (data < data_end) {
loctset->loct.status = NJ_ST_SEARCH_READY;
loctset->loct.current += current;
hindo = (NJ_UINT16) *((NJ_UINT8*)(HINDO_NO_TOP_ADDR(loctset->loct.handle) +
get_stem_hindo(loctset->loct.handle, data)));
loctset->cache_freq = CALCULATE_HINDO(hindo, loctset->dic_freq.base,
loctset->dic_freq.high, COMP_DIC_FREQ_DIV);
return 1;
}
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
static NJ_INT16 bdic_search_fore_data(NJ_SEARCH_CONDITION *condition, NJ_SEARCH_LOCATION_SET *loctset)
{
NJ_UINT8 *data, *data_top, *bottom, *data_end;
NJ_INT16 i = 0;
NJ_INT16 hindo = 0;
NJ_INT16 hindo_max = -1;
NJ_UINT8 no_hit = 0;
NJ_UINT32 current = loctset->loct.current;
NJ_UINT8 *current_org;
NJ_UINT32 hindo_data = 0;
if (GET_LOCATION_STATUS(loctset->loct.status) == NJ_ST_SEARCH_NO_INIT) {
loctset->loct.status = NJ_ST_SEARCH_READY;
loctset->loct.current_info = CURRENT_INFO_SET;
return 1;
}
data_top = STEM_AREA_TOP_ADDR(loctset->loct.handle);
data = data_top + loctset->loct.top + loctset->loct.current;
current_org = data;
bottom = data_top + loctset->loct.bottom;
if (NJ_GET_DIC_FMT(loctset->loct.handle) == NJ_DIC_FMT_KANAKAN) {
data_end = loctset->loct.handle
+ NJ_DIC_COMMON_HEADER_SIZE
+ NJ_INT32_READ(loctset->loct.handle + NJ_DIC_POS_DATA_SIZE)
+ NJ_INT32_READ(loctset->loct.handle + NJ_DIC_POS_EXT_SIZE)
- NJ_DIC_ID_LEN;
} else {
data_end = CAND_IDX_AREA_TOP_ADDR(loctset->loct.handle);
}
if (condition->mode == NJ_CUR_MODE_FREQ) {
while (data < data_end) {
i = get_stem_next(loctset->loct.handle, data);
data += i;
current += i;
if (data > bottom) {
if (loctset->cache_freq == 0) {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
} else if (no_hit == 1) {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
loctset->cache_freq -= 1;
data = data_top + loctset->loct.top;
current = 0;
no_hit = 1;
}
if ((hindo_max != -1) && (data == current_org)) {
loctset->loct.status = NJ_ST_SEARCH_READY;
loctset->loct.current_info = CURRENT_INFO_SET;
loctset->loct.current = hindo_data;
loctset->cache_freq = hindo_max;
return 1;
}
hindo = (NJ_INT16) *((NJ_UINT8*)(HINDO_NO_TOP_ADDR(loctset->loct.handle) + get_stem_hindo(loctset->loct.handle, data)));
hindo = CALCULATE_HINDO(hindo, loctset->dic_freq.base,
loctset->dic_freq.high, COMP_DIC_FREQ_DIV);
if (hindo == loctset->cache_freq) {
loctset->loct.status = NJ_ST_SEARCH_READY;
loctset->loct.current_info = CURRENT_INFO_SET;
loctset->loct.current = current;
return 1;
}
if (hindo < loctset->cache_freq) {
if (((hindo == hindo_max) && (current < hindo_data)) ||
(hindo > hindo_max)) {
hindo_max = hindo;
hindo_data = current;
}
}
}
} else {
i = get_stem_next(loctset->loct.handle, data);
data += i;
current += i;
if (data > bottom) {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
hindo = (NJ_INT16) *((NJ_UINT8*)(HINDO_NO_TOP_ADDR(loctset->loct.handle)
+ get_stem_hindo(loctset->loct.handle, data)));
loctset->cache_freq = CALCULATE_HINDO(hindo, loctset->dic_freq.base,
loctset->dic_freq.high, COMP_DIC_FREQ_DIV);
loctset->loct.status = NJ_ST_SEARCH_READY;
loctset->loct.current_info = CURRENT_INFO_SET;
loctset->loct.current = current;
return 1;
}
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
NJ_INT16 njd_b_search_word(NJ_SEARCH_CONDITION *con, NJ_SEARCH_LOCATION_SET *loctset)
{
NJ_INT16 ret;
NJ_DIC_INFO *pdicinfo;
NJ_UINT16 hIdx;
switch (con->operation) {
case NJ_CUR_OP_COMP:
if (con->mode != NJ_CUR_MODE_FREQ) {
loctset->loct.status = NJ_ST_SEARCH_END_EXT;
return 0;
}
break;
case NJ_CUR_OP_FORE:
if (APPEND_YOMI_FLG(loctset->loct.handle) == 0) {
loctset->loct.status = NJ_ST_SEARCH_END_EXT;
return 0;
}
if ((NJ_GET_DIC_TYPE_EX(loctset->loct.type, loctset->loct.handle) != NJ_DIC_TYPE_CUSTOM_COMPRESS)
&& NJ_CHAR_STRLEN_IS_0(con->yomi)) {
loctset->loct.status = NJ_ST_SEARCH_END_EXT;
return 0;
}
break;
default:
loctset->loct.status = NJ_ST_SEARCH_END_EXT;
return 0;
}
if (con->ylen > NJ_GET_MAX_YLEN(loctset->loct.handle)) {
loctset->loct.status = NJ_ST_SEARCH_END_EXT;
return 0;
}
if (GET_LOCATION_STATUS(loctset->loct.status) == NJ_ST_SEARCH_NO_INIT) {
switch (con->operation) {
case NJ_CUR_OP_COMP:
ret = search_node(con, loctset);
if (ret < 1) {
return ret;
}
ret = bdic_search_data(con, loctset);
if (ret < 1) {
loctset->loct.status = NJ_ST_SEARCH_END;
}
break;
case NJ_CUR_OP_FORE:
pdicinfo = con->ds->dic;
for (hIdx = 0; (hIdx < NJ_MAX_DIC) && (pdicinfo->handle != loctset->loct.handle); hIdx++) {
pdicinfo++;
}
if (hIdx == NJ_MAX_DIC) {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
if ((con->ds->dic[hIdx].srhCache == NULL) || (con->ylen == 0) ||
!(con->ds->mode & 0x0001)) {
ret = search_node(con, loctset);
if (ret < 1) {
return ret;
}
ret = bdic_search_fore_data(con, loctset);
} else {
ret = search_node2(con, loctset, hIdx);
if (ret == NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_SEARCH_WORD, NJ_ERR_CACHE_NOT_ENOUGH)) {
NJ_SET_CACHEOVER_TO_SCACHE(con->ds->dic[hIdx].srhCache);
ret = search_node2(con, loctset, hIdx);
}
if (ret < 1) {
return ret;
}
ret = bdic_search_fore_data2(con, loctset, hIdx);
}
if (ret < 1) {
loctset->loct.status = NJ_ST_SEARCH_END;
}
break;
default:
loctset->loct.status = NJ_ST_SEARCH_END_EXT;
return 0;
}
} else if (GET_LOCATION_STATUS(loctset->loct.status) == NJ_ST_SEARCH_READY) {
switch (con->operation) {
case NJ_CUR_OP_COMP:
ret = bdic_search_data(con, loctset);
if (ret < 1) {
loctset->loct.status = NJ_ST_SEARCH_END;
}
break;
case NJ_CUR_OP_FORE:
pdicinfo = con->ds->dic;
for (hIdx = 0; (hIdx < NJ_MAX_DIC) && (pdicinfo->handle != loctset->loct.handle); hIdx++) {
pdicinfo++;
}
if (hIdx == NJ_MAX_DIC) {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
if ((con->ds->dic[hIdx].srhCache == NULL) || (con->ylen == 0) ||
!(con->ds->mode & 0x0001)) {
ret = bdic_search_fore_data(con, loctset);
} else {
ret = bdic_search_fore_data2(con, loctset, hIdx);
}
if (ret < 1) {
loctset->loct.status = NJ_ST_SEARCH_END;
}
break;
default:
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
} else {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
return ret;
}
NJ_INT16 njd_b_get_word(NJ_SEARCH_LOCATION_SET *loctset, NJ_WORD *word)
{
NJ_UINT8 *data;
STEM_DATA_SET stem_set;
NJ_UINT8 check;
if (GET_LOCATION_STATUS(loctset->loct.status) == NJ_ST_SEARCH_END) {
return 0;
}
if (GET_LOCATION_OPERATION(loctset->loct.status) == NJ_CUR_OP_FORE) {
data = STEM_AREA_TOP_ADDR(loctset->loct.handle);
data += loctset->loct.top + loctset->loct.current;
check = 0;
} else {
data = STEM_AREA_TOP_ADDR(loctset->loct.handle);
data += loctset->loct.top + loctset->loct.current;
check = 2;
}
get_stem_word(loctset->loct.handle, data, &stem_set, check);
if (GET_LOCATION_OPERATION(loctset->loct.status) == NJ_CUR_OP_FORE) {
word->stem.info1 = (NJ_UINT16)(stem_set.yomi_size / sizeof(NJ_CHAR));
}
word->stem.info1 = WORD_LEN(word->stem.info1);
word->stem.info1 |= (NJ_UINT16)(stem_set.fhinsi_jitu << 7);
if (check != 1) {
if (stem_set.candidate_size == 0) {
if (GET_LOCATION_OPERATION(loctset->loct.status) == NJ_CUR_OP_FORE) {
word->stem.info2 = (NJ_UINT16)(stem_set.yomi_size / sizeof(NJ_CHAR));
} else {
word->stem.info2 = (NJ_UINT16)NJ_GET_YLEN_FROM_STEM(word);
}
} else {
word->stem.info2 = (NJ_UINT16)(stem_set.candidate_size / sizeof(NJ_CHAR));
}
} else {
word->stem.info2 = (NJ_UINT16)NJ_GET_YLEN_FROM_STEM(word);
}
word->stem.info2 = WORD_LEN(word->stem.info2);
word->stem.info2 |= (NJ_UINT16)(stem_set.bhinsi_jitu << 7);
word->stem.hindo = CALCULATE_HINDO(stem_set.hindo_jitu, loctset->dic_freq.base,
loctset->dic_freq.high, COMP_DIC_FREQ_DIV);
word->stem.loc = loctset->loct;
return 1;
}
NJ_INT16 njd_b_get_candidate(NJ_WORD *word, NJ_CHAR *candidate, NJ_UINT16 size)
{
NJ_SEARCH_LOCATION *loc;
NJ_CHAR *wkc, *cand;
NJ_UINT8 *wkd;
NJ_UINT8 *data;
NJ_UINT8 *data_org;
NJ_UINT16 len, j;
STEM_DATA_SET stem_set;
NJ_INT16 next;
NJ_UINT16 yomi_pos;
NJ_CHAR ybuf[NJ_MAX_LEN + NJ_TERM_LEN];
if ((GET_LOCATION_OPERATION(word->stem.loc.status) == NJ_CUR_OP_COMP) ||
(GET_LOCATION_OPERATION(word->stem.loc.status) == NJ_CUR_OP_FORE)) {
loc = &word->stem.loc;
data = STEM_AREA_TOP_ADDR(loc->handle);
data += loc->top + loc->current;
get_stem_cand_data(loc->handle, data, &stem_set);
len = stem_set.candidate_size / sizeof(NJ_CHAR);
} else {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_GET_CANDIDATE, NJ_ERR_INVALID_RESULT);
}
if (len == 0) {
data_org = data;
if (GET_LOCATION_OPERATION(word->stem.loc.status) == NJ_CUR_OP_COMP) {
len = WORD_LEN(word->stem.info1);
if (size < ((len + NJ_TERM_LEN) * sizeof(NJ_CHAR))) {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_GET_CANDIDATE, NJ_ERR_BUFFER_NOT_ENOUGH);
}
wkc = word->yomi;
} else {
while (!(STEM_TERMINETER(data))) {
next = get_stem_next(loc->handle, data);
data += next;
}
yomi_pos = get_stem_yomi_data(loc->handle, data, &stem_set);
wkc = ybuf;
len = get_stem_yomi_string(loc->handle, data, wkc,
yomi_pos, stem_set.yomi_size,
size);
if (size < ((len + NJ_TERM_LEN) * sizeof(NJ_CHAR))) {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_GET_CANDIDATE, NJ_ERR_BUFFER_NOT_ENOUGH);
}
}
if (STEM_NO_CONV_FLG(data_org) == 0) {
cand = candidate;
for (j = 0; j < len; j++) {
*cand++ = *wkc++;
}
*cand = NJ_CHAR_NUL;
} else {
nje_convert_hira_to_kata(wkc, candidate, len);
}
} else {
if (size < (stem_set.candidate_size + (NJ_TERM_LEN*sizeof(NJ_CHAR)))) {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_GET_CANDIDATE, NJ_ERR_BUFFER_NOT_ENOUGH);
}
wkc = candidate;
wkd = data + stem_set.stem_size;
for (j = 0; j < len; j++) {
NJ_CHAR_COPY(wkc, wkd);
wkd += sizeof(NJ_CHAR);
wkc++;
}
*wkc = NJ_CHAR_NUL;
}
return len;
}
NJ_INT16 njd_b_get_stroke(NJ_WORD *word, NJ_CHAR *stroke, NJ_UINT16 size)
{
NJ_SEARCH_LOCATION *loc;
NJ_UINT8 *data;
NJ_INT16 len;
NJ_INT16 next;
NJ_UINT16 yomi_pos;
STEM_DATA_SET stem_set;
if (GET_LOCATION_OPERATION(word->stem.loc.status) == NJ_CUR_OP_FORE) {
if (NJ_GET_YLEN_FROM_STEM(word) == 0) {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_GET_STROKE, NJ_ERR_INVALID_RESULT);
}
loc = &word->stem.loc;
data = STEM_AREA_TOP_ADDR(loc->handle);
data += loc->top + loc->current;
} else {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_GET_STROKE, NJ_ERR_INVALID_RESULT);
}
while (!(STEM_TERMINETER(data))) {
next = get_stem_next(loc->handle, data);
data += next;
}
yomi_pos = get_stem_yomi_data(loc->handle, data, &stem_set);
if (stem_set.yomi_size == 0) {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_GET_STROKE, NJ_ERR_INVALID_RESULT);
}
len = get_stem_yomi_string(loc->handle, data, stroke,
yomi_pos, stem_set.yomi_size,
size);
if (size < (NJ_UINT16)((len+NJ_TERM_LEN)*sizeof(NJ_CHAR))) {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_GET_STROKE, NJ_ERR_BUFFER_NOT_ENOUGH);
}
*(stroke + len) = NJ_CHAR_NUL;
return len;
}
static NJ_INT16 search_node2(NJ_SEARCH_CONDITION *condition, NJ_SEARCH_LOCATION_SET *loctset, NJ_UINT16 hidx)
{
NJ_UINT8 *root, *now, *node, *node_mid;
NJ_CHAR *yomi;
NJ_INT16 ytbl_cnt;
NJ_UINT16 y;
NJ_UINT8 *ytbl_top;
NJ_UINT16 bit_left, bit_data;
NJ_UINT32 data_offset;
NJ_UINT16 j;
NJ_UINT8 *data_top, *stem_data;
NJ_UINT16 hindo, hindo_max, hindo_tmp;
NJ_UINT32 current, hindo_max_data, hindo_tmp_data;
NJ_SEARCH_CACHE *psrhCache = condition->ds->dic[hidx].srhCache;
NJ_CHAR *key;
NJ_UINT8 cmpflg;
NJ_UINT8 endflg;
NJ_UINT16 abPtrIdx;
NJ_UINT16 key_len;
NJ_UINT16 i, l, m;
NJ_UINT16 abIdx;
NJ_UINT16 abIdx_current;
NJ_UINT16 abIdx_old;
NJ_UINT16 addcnt = 0;
NJ_CHAR char_tmp[NJ_MAX_LEN + NJ_TERM_LEN];
NJ_UINT16 tmp_len;
NJ_UINT16 endIdx;
NJ_INT16 ret;
NJ_UINT8 *con_node;
NJ_UINT16 yomi_clen;
NJ_UINT8 aimai_flg = 0x01;
NJ_CHAR key_tmp[NJ_MAX_CHAR_LEN + NJ_TERM_LEN];
NJ_CACHE_INFO tmpbuff;
if (NJ_GET_CACHEOVER_FROM_SCACHE(psrhCache)) {
aimai_flg = 0x00;
}
node = NULL;
yomi = condition->yomi;
root = NODE_AREA_TOP_ADDR(loctset->loct.handle);
node_mid = root + NODE_AREA_MID_ADDR(loctset->loct.handle);
now = node_mid;
bit_left = BIT_NODE_AREA_LEFT_LEN(loctset->loct.handle);
bit_data = BIT_NODE_AREA_DATA_LEN(loctset->loct.handle);
ytbl_cnt = YOMI_INDX_CNT(loctset->loct.handle);
y = YOMI_INDX_SIZE(loctset->loct.handle);
ytbl_top = YOMI_INDX_TOP_ADDR(loctset->loct.handle);
data_top = STEM_AREA_TOP_ADDR(loctset->loct.handle);
endflg = 0x00;
cmpflg = 0x00;
abPtrIdx = 0;
key = condition->ds->keyword;
yomi_clen = condition->yclen;
for (i = 0; i < yomi_clen; i++) {
abPtrIdx = i;
if (!cmpflg) {
if (((abPtrIdx != 0) && (psrhCache->keyPtr[abPtrIdx] == 0))
|| (psrhCache->keyPtr[abPtrIdx + 1] == 0)) {
cmpflg = 0x01;
} else {
}
}
addcnt = 0;
if (cmpflg) {
if (abPtrIdx == 0) {
abIdx = 0;
nj_charncpy(key_tmp, yomi, 1);
key_len = nj_strlen(key_tmp);
node = NULL;
now = node_mid;
psrhCache->keyPtr[0] = 0;
ret = search_yomi_node(condition->operation,
node, now, 0, key_tmp, key_len,
root, node_mid, bit_left, bit_data,
data_top, ytbl_cnt, y, ytbl_top,
&tmpbuff,
&con_node, &data_offset);
if (ret < 0) {
} else {
psrhCache->storebuff[abIdx] = tmpbuff;
now = con_node;
psrhCache->storebuff[abIdx].top = data_offset;
if (condition->operation == NJ_CUR_OP_FORE) {
ret = get_node_bottom(key_tmp, now, node_mid, data_top,
bit_left, bit_data,
psrhCache->storebuff[abIdx].top,
loctset->loct.handle,
&(psrhCache->storebuff[abIdx].bottom));
if (ret < 0) {
return ret;
}
}
addcnt++;
abIdx++;
}
if ((condition->charset != NULL) && aimai_flg) {
for (l = 0; l < condition->charset->charset_count; l++) {
if (nj_charncmp(key, condition->charset->from[l], 1) == 0) {
nj_strcpy(char_tmp, condition->charset->to[l]);
tmp_len = nj_strlen(char_tmp);
node = NULL;
now = node_mid;
ret = search_yomi_node(condition->operation,
node, now, 0, char_tmp, tmp_len,
root, node_mid, bit_left, bit_data,
data_top, ytbl_cnt, y, ytbl_top,
&tmpbuff,
&con_node, &data_offset);
if (ret < 0) {
} else {
if (abIdx >= NJ_SEARCH_CACHE_SIZE) {
psrhCache->keyPtr[abPtrIdx+1] = 0;
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_SEARCH_WORD, NJ_ERR_CACHE_NOT_ENOUGH);
}
psrhCache->storebuff[abIdx] = tmpbuff;
now = con_node;
psrhCache->storebuff[abIdx].top = data_offset;
if (condition->operation == NJ_CUR_OP_FORE) {
ret = get_node_bottom(key_tmp, now,
node_mid, data_top,
bit_left, bit_data,
psrhCache->storebuff[abIdx].top,
loctset->loct.handle,
&(psrhCache->storebuff[abIdx].bottom));
if (ret < 0) {
return ret;
}
}
addcnt++;
abIdx++;
}
}
}
}
psrhCache->keyPtr[abPtrIdx + 1] = abIdx;
} else {
nj_charncpy(key_tmp, yomi, 1);
key_len = nj_strlen(key_tmp);
if (psrhCache->keyPtr[abPtrIdx] == psrhCache->keyPtr[abPtrIdx - 1]) {
psrhCache->keyPtr[abPtrIdx+1] = psrhCache->keyPtr[abPtrIdx-1];
endflg = 0x01;
} else {
endIdx = psrhCache->keyPtr[abPtrIdx];
abIdx_old = psrhCache->keyPtr[abPtrIdx - 1];
if (NJ_GET_CACHEOVER_FROM_SCACHE(psrhCache)) {
abIdx = psrhCache->keyPtr[abPtrIdx - 1];
psrhCache->keyPtr[abPtrIdx] = abIdx;
} else {
abIdx = psrhCache->keyPtr[abPtrIdx];
}
if ((abIdx > NJ_SEARCH_CACHE_SIZE) || (abIdx_old >= NJ_SEARCH_CACHE_SIZE)
|| (endIdx > NJ_SEARCH_CACHE_SIZE)) {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_SEARCH_WORD, NJ_ERR_CACHE_BROKEN);
}
for (m = abIdx_old; m < endIdx; m++) {
node = psrhCache->storebuff[m].node;
now = psrhCache->storebuff[m].now;
if ((node == now) && (psrhCache->storebuff[m].idx_no == 0)) {
continue;
}
ret = search_yomi_node(condition->operation,
node, now, psrhCache->storebuff[m].idx_no,
key_tmp, key_len, root,
node_mid, bit_left, bit_data,
data_top, ytbl_cnt, y, ytbl_top,
&tmpbuff,
&con_node, &data_offset);
if (ret < 0) {
} else {
if (abIdx >= NJ_SEARCH_CACHE_SIZE) {
psrhCache->keyPtr[abPtrIdx+1] = 0;
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_SEARCH_WORD, NJ_ERR_CACHE_NOT_ENOUGH);
}
psrhCache->storebuff[abIdx] = tmpbuff;
now = con_node;
psrhCache->storebuff[abIdx].top = data_offset;
if (condition->operation == NJ_CUR_OP_FORE) {
ret = get_node_bottom(key_tmp, now, node_mid, data_top,
bit_left, bit_data,
psrhCache->storebuff[abIdx].top,
loctset->loct.handle,
&(psrhCache->storebuff[abIdx].bottom));
if (ret < 0) {
return ret;
}
}
addcnt++;
abIdx++;
}
if ((condition->charset != NULL) && aimai_flg) {
for (l = 0; l < condition->charset->charset_count; l++) {
if (nj_charncmp(key, condition->charset->from[l], 1) == 0) {
nj_strcpy(char_tmp, condition->charset->to[l]);
tmp_len = nj_strlen(char_tmp);
node = psrhCache->storebuff[m].node;
now = psrhCache->storebuff[m].now;
ret = search_yomi_node(condition->operation,
node, now,
psrhCache->storebuff[m].idx_no,
char_tmp, tmp_len,
root, node_mid,
bit_left, bit_data, data_top,
ytbl_cnt, y, ytbl_top,
&tmpbuff,
&con_node, &data_offset);
if (ret < 0) {
} else {
if (abIdx >= NJ_SEARCH_CACHE_SIZE) {
psrhCache->keyPtr[abPtrIdx+1] = 0;
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_SEARCH_WORD, NJ_ERR_CACHE_NOT_ENOUGH);
}
psrhCache->storebuff[abIdx] = tmpbuff;
now = con_node;
psrhCache->storebuff[abIdx].top = data_offset;
if (condition->operation == NJ_CUR_OP_FORE) {
ret = get_node_bottom(key_tmp, now, node_mid,
data_top, bit_left, bit_data,
psrhCache->storebuff[abIdx].top,
loctset->loct.handle,
&(psrhCache->storebuff[abIdx].bottom));
if (ret < 0) {
return ret;
}
}
addcnt++;
abIdx++;
}
}
}
}
}
psrhCache->keyPtr[abPtrIdx + 1] = abIdx;
}
}
}
yomi += UTL_CHAR(yomi);
key += UTL_CHAR(key);
}
if ((addcnt == 0) && (psrhCache->keyPtr[yomi_clen - 1] == psrhCache->keyPtr[yomi_clen])) {
endflg = 0x01;
}
if (endflg) {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
loctset->loct.current = 0;
abPtrIdx = condition->yclen;
abIdx = psrhCache->keyPtr[abPtrIdx];
abIdx_old = psrhCache->keyPtr[abPtrIdx - 1];
if ((abIdx > NJ_SEARCH_CACHE_SIZE) || (abIdx_old >= NJ_SEARCH_CACHE_SIZE)) {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_SEARCH_WORD, NJ_ERR_CACHE_BROKEN);
}
if (condition->mode == NJ_CUR_MODE_FREQ) {
hindo_max = 0;
hindo_max_data = 0;
abIdx_current = abIdx_old;
stem_data = data_top + psrhCache->storebuff[abIdx_current].top;
hindo = (NJ_UINT16) *((NJ_UINT8 *)(HINDO_NO_TOP_ADDR(loctset->loct.handle) +
get_stem_hindo(loctset->loct.handle, stem_data)));
hindo_tmp = 0;
hindo_tmp_data = 0;
current = 0;
while (stem_data <= (data_top + psrhCache->storebuff[abIdx_current].bottom)) {
if (hindo > hindo_tmp) {
hindo_tmp = hindo;
hindo_tmp_data = current;
}
j = get_stem_next(loctset->loct.handle, stem_data);
current += j;
stem_data += j;
hindo = (NJ_UINT16) *((NJ_UINT8 *) (HINDO_NO_TOP_ADDR(loctset->loct.handle) +
get_stem_hindo(loctset->loct.handle, stem_data)));
}
psrhCache->storebuff[abIdx_current].current = hindo_tmp_data;
if (hindo_tmp > hindo_max) {
hindo_max = hindo_tmp;
hindo_max_data = hindo_tmp_data;
}
} else {
abIdx_current = abIdx_old;
stem_data = data_top + psrhCache->storebuff[abIdx_current].top;
hindo = (NJ_UINT16) *((NJ_UINT8 *)(HINDO_NO_TOP_ADDR(loctset->loct.handle)
+ get_stem_hindo(loctset->loct.handle, stem_data)));
hindo_max = hindo;
hindo_max_data = 0;
}
loctset->loct.top = psrhCache->storebuff[abIdx_current].top;
loctset->loct.bottom = psrhCache->storebuff[abIdx_current].bottom;
loctset->cache_freq = CALCULATE_HINDO(hindo_max, loctset->dic_freq.base,
loctset->dic_freq.high, COMP_DIC_FREQ_DIV);
loctset->loct.current = hindo_max_data;
loctset->loct.current_cache = (NJ_UINT8)abIdx_current;
psrhCache->viewCnt = 1;
NJ_SET_AIMAI_TO_SCACHE(psrhCache);
return 1;
}
static NJ_INT16 search_yomi_node(NJ_UINT8 operation, NJ_UINT8 *node, NJ_UINT8 *now,
NJ_UINT16 idx_no, NJ_CHAR *yomi, NJ_UINT16 yomilen,
NJ_UINT8 * root, NJ_UINT8 * node_mid,
NJ_UINT16 bit_left, NJ_UINT16 bit_data,
NJ_UINT8 * data_top,
NJ_INT16 ytbl_cnt, NJ_UINT16 y, NJ_UINT8 * ytbl_top,
NJ_CACHE_INFO * storebuf,
NJ_UINT8 ** con_node,
NJ_UINT32 * data_offset)
{
NJ_UINT8 index;
NJ_UINT8 *wkc;
NJ_UINT8 *byomi;
NJ_INT16 idx;
NJ_INT16 char_size;
NJ_INT16 left, right, mid;
NJ_UINT16 c, d;
NJ_UINT8 c1 = 0, c2 = 0;
NJ_UINT16 ysize = yomilen * sizeof(NJ_CHAR);
NJ_UINT16 idx_cnt;
NJ_UINT16 nd_index;
NJ_UINT16 data;
NJ_UINT16 pos, j, bit_all, bit_tmp, bit_idx;
NJ_UINT32 data_l;
NJ_UINT8 restart_flg = 0;
*con_node = NULL;
idx_cnt = 1;
storebuf->idx_no = 0;
byomi = (NJ_UINT8*)yomi;
while (ysize > 0) {
if (ytbl_cnt != 0) {
char_size = UTL_CHAR(byomi) * sizeof(NJ_CHAR);
if (char_size > 2) {
return -1;
}
if (char_size == 2) {
if (y == 1) {
return -1;
}
c1 = *byomi;
c2 = *(byomi + 1);
c = (NJ_UINT16)((c1 << 8) | c2);
} else {
c1 = *byomi;
c2 = 0x00;
c = (NJ_UINT16)(*byomi);
}
idx = -1;
left = 0;
right = ytbl_cnt;
if (y == 2) {
while (left <= right) {
mid = (left + right) >> 1;
wkc = ytbl_top + (mid << 1);
if (c1 == *wkc) {
if (c2 == *(wkc + 1)) {
idx = (NJ_UINT16) (mid + 1);
break;
}
if (c2 < *(wkc + 1)) {
right = mid - 1;
} else {
left = mid + 1;
}
} else if (c1 < *wkc) {
right = mid - 1;
} else {
left = mid + 1;
}
}
} else {
while (left <= right) {
mid = (left + right) >> 1;
wkc = ytbl_top + (mid * y);
d = (NJ_UINT16) (*wkc);
if (c == d) {
idx = (NJ_UINT16) (mid + 1);
break;
}
if (c < d) {
right = mid - 1;
} else {
left = mid + 1;
}
}
}
if (idx < 0) {
return -1;
}
index = (NJ_UINT8) idx;
} else {
index = *byomi;
char_size = 1;
}
byomi += char_size;
ysize -= char_size;
while (now < data_top) {
if (NODE_IDX_EXIST(now)) {
bit_idx = 8;
idx_cnt = NODE_IDX_CNT(now);
} else {
bit_idx = 4;
idx_cnt = 1;
}
bit_all = bit_idx;
if (NODE_LEFT_EXIST(now)) {
bit_all += bit_left;
}
if (NODE_DATA_EXIST(now)) {
bit_all += bit_data;
}
bit_tmp = bit_all;
bit_all += (NJ_UINT16) (idx_no << 3);
pos = (NJ_UINT16) (bit_all >> 3);
data = (NJ_UINT16) (NJ_INT16_READ(now + pos));
j = (NJ_UINT16) (bit_all & 0x0007);
nd_index = GET_BITFIELD_16(data, j, INDEX_BIT);
if (index == (NJ_UINT8) nd_index) {
break;
} else {
if ((!NODE_TERM(now)) && (index > (NJ_UINT8) nd_index) && (idx_no == 0)) {
now += GET_BIT_TO_BYTE(bit_tmp + (idx_cnt * 8));
if (now == node_mid) {
return -1;
}
continue;
} else {
if ((now == node_mid) && (restart_flg == 0)
&& (index < (NJ_UINT8) nd_index) && (idx_no == 0)
&& (root != node_mid)) {
now = root;
idx_no = 0;
restart_flg = 1;
continue;
}
return -1;
}
}
}
if ( (idx_cnt > (NJ_UINT16) (idx_no + 1))) {
if (ysize == 0) {
if (operation == NJ_CUR_OP_FORE) {
storebuf->node = now;
storebuf->now = now;
storebuf->idx_no = idx_no + 1;
node = now;
break;
}
return -2;
}
idx_no++;
continue;
}
node = now;
storebuf->node = now;
idx_no = 0;
if (ysize == 0) {
*con_node = now;
} else {
if (!(NODE_LEFT_EXIST(now))) {
return -1;
}
}
if (NODE_LEFT_EXIST(now)) {
if (NODE_IDX_EXIST(now)) {
bit_idx = 8;
} else {
bit_idx = 4;
}
pos = (NJ_UINT16) (bit_idx >> 3);
data_l = (NJ_UINT32) (NJ_INT32_READ(now + pos));
j = (NJ_UINT16) (bit_idx & 0x0007);
now += GET_BITFIELD_32(data_l, j, bit_left);
storebuf->now = now;
} else {
storebuf->now = now;
}
}
if (*con_node == NULL) {
*con_node = now;
}
if ((node == NULL) || !(NODE_DATA_EXIST(node))) {
if ((operation == NJ_CUR_OP_FORE) && (node != NULL)) {
while (!NODE_DATA_EXIST(node)) {
if (!(NODE_LEFT_EXIST(node))) {
return -2;
}
if (NODE_IDX_EXIST(node)) {
bit_idx = 8;
} else {
bit_idx = 4;
}
pos = (NJ_UINT16) (bit_idx >> 3);
data_l = (NJ_UINT32) (NJ_INT32_READ(node + pos));
j = (NJ_UINT16) (bit_idx & 0x0007);
node += GET_BITFIELD_32(data_l, j, bit_left);
}
} else {
return -2;
}
}
if (NODE_IDX_EXIST(node)) {
bit_idx = 8;
} else {
bit_idx = 4;
}
if (NODE_LEFT_EXIST(node)) {
bit_all = bit_idx + bit_left;
} else {
bit_all = bit_idx;
}
pos = (NJ_UINT16) (bit_all >> 3);
data_l = (NJ_UINT32) (NJ_INT32_READ(node + pos));
j = (NJ_UINT16) (bit_all & 0x0007);
*data_offset = GET_BITFIELD_32(data_l, j, bit_data);
return 1;
}
static NJ_INT16 get_node_bottom(NJ_CHAR * yomi, NJ_UINT8 * now, NJ_UINT8 * node_mid,
NJ_UINT8 * data_top, NJ_UINT16 bit_left, NJ_UINT16 bit_data,
NJ_UINT32 top, NJ_DIC_HANDLE handle,
NJ_UINT32 * ret_bottom)
{
NJ_UINT8 *node;
NJ_UINT16 idx_cnt;
NJ_UINT32 data_offset;
NJ_UINT16 pos, j, bit_all;
NJ_UINT32 data_l;
NJ_UINT8 bottom_flg = 0;
NJ_UINT8 *stem_data;
NJ_UINT32 bottom, next;
bottom = top;
if (NJ_CHAR_STRLEN_IS_0(yomi)) {
node = node_mid;
} else {
node = now;
if (NODE_LEFT_EXIST(node)) {
if (NODE_IDX_EXIST(node)) {
bit_all = 8;
} else {
bit_all = 4;
}
pos = (NJ_UINT16) (bit_all >> 3);
data_l = (NJ_UINT32) (NJ_INT32_READ(node + pos));
j = (NJ_UINT16) (bit_all & 0x0007);
node += GET_BITFIELD_32(data_l, j, bit_left);
} else {
bottom_flg = 1;
}
}
if (!bottom_flg) {
while (node < data_top) {
if (!NODE_TERM(node)) {
if (NODE_IDX_EXIST(node)) {
bit_all = 8;
idx_cnt = NODE_IDX_CNT(node);
} else {
bit_all = 4;
idx_cnt = 1;
}
if (NODE_LEFT_EXIST(node)) {
bit_all += bit_left;
}
if (NODE_DATA_EXIST(node)) {
bit_all += bit_data;
}
node += GET_BIT_TO_BYTE(bit_all + (idx_cnt * 8));
} else {
if (!NODE_LEFT_EXIST(node)) {
if (NODE_DATA_EXIST(node)) {
if (NODE_IDX_EXIST(node)) {
bit_all = 8;
} else {
bit_all = 4;
}
pos = (NJ_UINT16) (bit_all >> 3);
data_l = (NJ_UINT32) (NJ_INT32_READ(node + pos));
j = (NJ_UINT16) (bit_all & 0x0007);
data_offset = GET_BITFIELD_32(data_l, j, bit_data);
bottom = data_offset;
break;
} else {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_SEARCH_WORD, NJ_ERR_DIC_BROKEN);
}
} else {
if (NODE_IDX_EXIST(node)) {
bit_all = 8;
} else {
bit_all = 4;
}
pos = (NJ_UINT16) (bit_all >> 3);
data_l = (NJ_UINT32) (NJ_INT32_READ(node + pos));
j = (NJ_UINT16) (bit_all & 0x0007);
node += GET_BITFIELD_32(data_l, j, bit_left);
}
}
}
}
stem_data = data_top + bottom;
while (!(STEM_TERMINETER(stem_data))) {
next = get_stem_next(handle, stem_data);
stem_data += next;
}
*ret_bottom = (NJ_UINT32) (stem_data - data_top);
return 1;
}
static NJ_INT16 bdic_search_fore_data2(NJ_SEARCH_CONDITION *condition, NJ_SEARCH_LOCATION_SET *loctset, NJ_UINT16 hidx)
{
NJ_UINT8 *data, *data_top, *bottom, *data_end;
NJ_INT16 i = 0;
NJ_INT16 hindo = 0;
NJ_UINT32 current = loctset->loct.current;
NJ_SEARCH_CACHE *psrhCache = condition->ds->dic[hidx].srhCache;
NJ_UINT16 top_abIdx;
NJ_UINT16 bottom_abIdx;
NJ_UINT16 count_abIdx;
NJ_UINT16 current_abIdx;
NJ_UINT16 old_abIdx;
NJ_UINT8 freq_flag = 0;
NJ_INT16 save_hindo = 0;
NJ_UINT16 save_abIdx = 0;
NJ_UINT16 abPtrIdx;
NJ_UINT16 m;
NJ_INT16 ret;
NJ_INT16 loop_check;
NJ_UINT16 abIdx;
NJ_UINT16 abIdx_old;
NJ_UINT16 hindo_max, hindo_tmp;
NJ_UINT32 hindo_max_data, hindo_tmp_data;
NJ_UINT16 abIdx_current;
if (GET_LOCATION_STATUS(loctset->loct.status) == NJ_ST_SEARCH_NO_INIT) {
loctset->loct.status = NJ_ST_SEARCH_READY;
loctset->loct.current_info = CURRENT_INFO_SET;
return 1;
}
if (NJ_GET_AIMAI_FROM_SCACHE(psrhCache)) {
NJ_UNSET_AIMAI_TO_SCACHE(psrhCache);
data_top = STEM_AREA_TOP_ADDR(loctset->loct.handle);
if (condition->operation == NJ_CUR_OP_FORE) {
if (condition->ylen) {
abPtrIdx = condition->yclen;
abIdx = psrhCache->keyPtr[abPtrIdx];
abIdx_old = psrhCache->keyPtr[abPtrIdx - 1];
if ((abIdx > NJ_SEARCH_CACHE_SIZE) || (abIdx_old >= NJ_SEARCH_CACHE_SIZE)) {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_SEARCH_WORD, NJ_ERR_CACHE_BROKEN);
}
if (condition->mode == NJ_CUR_MODE_FREQ) {
hindo_max = 0;
hindo_max_data = 0;
abIdx_current = abIdx_old;
for (m = abIdx_old; m < abIdx; m++) {
data = data_top + psrhCache->storebuff[m].top;
hindo = (NJ_UINT16) *((NJ_UINT8 *)(HINDO_NO_TOP_ADDR(loctset->loct.handle) +
get_stem_hindo(loctset->loct.handle, data)));
hindo_tmp = 0;
hindo_tmp_data = 0;
current = 0;
while (data <= (data_top + psrhCache->storebuff[m].bottom)) {
if (hindo > hindo_tmp) {
hindo_tmp = hindo;
hindo_tmp_data = current;
}
i = get_stem_next(loctset->loct.handle, data);
current += i;
data += i;
hindo = (NJ_UINT16) *((NJ_UINT8 *) (HINDO_NO_TOP_ADDR(loctset->loct.handle) +
get_stem_hindo(loctset->loct.handle, data)));
}
psrhCache->storebuff[m].current = hindo_tmp_data;
if (hindo_tmp > hindo_max) {
hindo_max = hindo_tmp;
hindo_max_data = hindo_tmp_data;
abIdx_current = m;
}
}
} else {
abIdx_current = abIdx_old;
data = data_top + psrhCache->storebuff[abIdx_current].top;
hindo = (NJ_UINT16) *((NJ_UINT8 *)(HINDO_NO_TOP_ADDR(loctset->loct.handle)
+ get_stem_hindo(loctset->loct.handle, data)));
hindo_max = hindo;
hindo_max_data = 0;
}
loctset->loct.top = psrhCache->storebuff[abIdx_current].top;
loctset->loct.bottom = psrhCache->storebuff[abIdx_current].bottom;
loctset->cache_freq = CALCULATE_HINDO(hindo_max, loctset->dic_freq.base,
loctset->dic_freq.high, COMP_DIC_FREQ_DIV);
loctset->loct.current = hindo_max_data;
loctset->loct.current_cache = (NJ_UINT8)abIdx_current;
psrhCache->viewCnt = 1;
} else {
data = data_top + loctset->loct.top;
hindo = (NJ_UINT16) *((NJ_UINT8 *)(HINDO_NO_TOP_ADDR(loctset->loct.handle) +
get_stem_hindo(loctset->loct.handle, data)));
hindo_max = hindo;
hindo_max_data = 0;
if (condition->mode == NJ_CUR_MODE_FREQ) {
i = get_stem_next(loctset->loct.handle, data);
current = i;
data += i;
while (data <= (data_top + loctset->loct.bottom)) {
hindo = (NJ_UINT16)*((NJ_UINT8 *)(HINDO_NO_TOP_ADDR(loctset->loct.handle) +
get_stem_hindo(loctset->loct.handle, data)));
if (hindo > hindo_max) {
hindo_max = hindo;
hindo_max_data = current;
}
i = get_stem_next(loctset->loct.handle, data);
current += i;
data += i;
}
}
loctset->cache_freq = CALCULATE_HINDO(hindo_max,
loctset->dic_freq.base,
loctset->dic_freq.high, COMP_DIC_FREQ_DIV);
loctset->loct.current = hindo_max_data;
}
}
return 1;
}
data_top = STEM_AREA_TOP_ADDR(loctset->loct.handle);
data = data_top + loctset->loct.top + loctset->loct.current;
bottom = data_top + loctset->loct.bottom;
if (NJ_GET_DIC_FMT(loctset->loct.handle) == NJ_DIC_FMT_KANAKAN) {
data_end = loctset->loct.handle
+ NJ_DIC_COMMON_HEADER_SIZE
+ NJ_INT32_READ(loctset->loct.handle + NJ_DIC_POS_DATA_SIZE)
+ NJ_INT32_READ(loctset->loct.handle + NJ_DIC_POS_EXT_SIZE)
- NJ_DIC_ID_LEN;
} else {
data_end = CAND_IDX_AREA_TOP_ADDR(loctset->loct.handle);
}
if (condition->mode == NJ_CUR_MODE_FREQ) {
abPtrIdx = condition->yclen;
bottom_abIdx = psrhCache->keyPtr[abPtrIdx];
top_abIdx = psrhCache->keyPtr[abPtrIdx - 1];
if ((bottom_abIdx > NJ_SEARCH_CACHE_SIZE) || (top_abIdx >= NJ_SEARCH_CACHE_SIZE)) {
return NJ_SET_ERR_VAL(NJ_FUNC_NJD_B_SEARCH_WORD, NJ_ERR_CACHE_BROKEN);
}
count_abIdx = bottom_abIdx - top_abIdx;
if (!count_abIdx) {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
old_abIdx = loctset->loct.current_cache;
loop_check = 0;
ret = bdic_get_next_data(data_top, data_end, loctset, psrhCache, old_abIdx);
if (ret == loctset->cache_freq) {
psrhCache->viewCnt++;
if (psrhCache->viewCnt <= NJ_CACHE_VIEW_CNT) {
loctset->loct.status = NJ_ST_SEARCH_READY;
loctset->loct.current_info = CURRENT_INFO_SET;
loctset->loct.current = psrhCache->storebuff[old_abIdx].current;
loctset->loct.current_cache = (NJ_UINT8)old_abIdx;
return 1;
} else {
freq_flag = 1;
psrhCache->viewCnt = 0;
}
} else {
if (ret == -1) {
loop_check++;
}
save_hindo = ret;
save_abIdx = old_abIdx;
}
current_abIdx = old_abIdx + 1;
if (current_abIdx >= bottom_abIdx) {
current_abIdx = top_abIdx;
}
while (loop_check != count_abIdx) {
ret = bdic_get_word_freq(data_top, loctset, psrhCache, current_abIdx);
if ((ret == loctset->cache_freq) &&
(loctset->loct.top == psrhCache->storebuff[current_abIdx].top) &&
(loctset->loct.current == psrhCache->storebuff[current_abIdx].current)) {
ret = bdic_get_next_data(data_top, data_end, loctset, psrhCache, current_abIdx);
}
if (ret == loctset->cache_freq) {
loctset->loct.status = NJ_ST_SEARCH_READY;
loctset->loct.current_info = CURRENT_INFO_SET;
loctset->loct.top = psrhCache->storebuff[current_abIdx].top;
loctset->loct.bottom = psrhCache->storebuff[current_abIdx].bottom;
loctset->loct.current = psrhCache->storebuff[current_abIdx].current;
loctset->loct.current_cache = (NJ_UINT8)current_abIdx;
psrhCache->viewCnt = 1;
return 1;
} else {
if (ret == -1) {
loop_check++;
}
if (save_hindo < ret) {
save_hindo = ret;
save_abIdx = current_abIdx;
}
}
current_abIdx++;
if (current_abIdx >= bottom_abIdx) {
current_abIdx = top_abIdx;
}
if (current_abIdx == old_abIdx) {
if (freq_flag == 1) {
loctset->loct.status = NJ_ST_SEARCH_READY;
loctset->loct.current_info = CURRENT_INFO_SET;
loctset->loct.top = psrhCache->storebuff[current_abIdx].top;
loctset->loct.bottom = psrhCache->storebuff[current_abIdx].bottom;
loctset->loct.current = psrhCache->storebuff[current_abIdx].current;
loctset->loct.current_cache = (NJ_UINT8)current_abIdx;
psrhCache->viewCnt = 1;
return 1;
} else if (save_hindo != -1) {
loctset->cache_freq = save_hindo;
loctset->loct.status = NJ_ST_SEARCH_READY;
loctset->loct.current_info = CURRENT_INFO_SET;
loctset->loct.top = psrhCache->storebuff[save_abIdx].top;
loctset->loct.bottom = psrhCache->storebuff[save_abIdx].bottom;
loctset->loct.current = psrhCache->storebuff[save_abIdx].current;
loctset->loct.current_cache = (NJ_UINT8)save_abIdx;
psrhCache->viewCnt = 1;
return 1;
}
}
}
} else {
i = get_stem_next(loctset->loct.handle, data);
data += i;
current += i;
if (data > bottom) {
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
hindo = (NJ_INT16)*((NJ_UINT8 *)(HINDO_NO_TOP_ADDR(loctset->loct.handle)
+ get_stem_hindo(loctset->loct.handle, data)));
loctset->cache_freq = CALCULATE_HINDO(hindo, loctset->dic_freq.base,
loctset->dic_freq.high, COMP_DIC_FREQ_DIV);
loctset->loct.status = NJ_ST_SEARCH_READY;
loctset->loct.current_info = CURRENT_INFO_SET;
loctset->loct.current = current;
return 1;
}
loctset->loct.status = NJ_ST_SEARCH_END;
return 0;
}
static NJ_INT16 bdic_get_next_data(NJ_UINT8 *data_top, NJ_UINT8 *data_end,
NJ_SEARCH_LOCATION_SET *loctset,
NJ_SEARCH_CACHE *psrhCache,
NJ_UINT16 abIdx)
{
NJ_UINT8 *data, *bottom;
NJ_INT16 i = 0;
NJ_INT16 hindo = 0;
NJ_INT16 hindo_max = -1;
NJ_UINT8 no_hit = 0;
NJ_UINT32 current = psrhCache->storebuff[abIdx].current;
NJ_UINT8 *current_org;
NJ_UINT32 hindo_data = 0;
NJ_INT16 freq_org = loctset->cache_freq;
if (psrhCache->storebuff[abIdx].current == LOC_CURRENT_NO_ENTRY) {
return (-1);
}
data = data_top + psrhCache->storebuff[abIdx].top + psrhCache->storebuff[abIdx].current;
current_org = data;
bottom = data_top + psrhCache->storebuff[abIdx].bottom;
while (data < data_end) {
i = get_stem_next(loctset->loct.handle, data);
data += i;
current += i;
if (data > bottom) {
if ((freq_org == 0) || (no_hit == 1)) {
psrhCache->storebuff[abIdx].current = LOC_CURRENT_NO_ENTRY;
return -1;
}
freq_org -= 1;
data = data_top + psrhCache->storebuff[abIdx].top;
current = 0;
no_hit = 1;
}
if ((hindo_max != -1) && (data == current_org)) {
psrhCache->storebuff[abIdx].current = hindo_data;
return hindo_max;
}
hindo = (NJ_INT16)*((NJ_UINT8 *)(HINDO_NO_TOP_ADDR(loctset->loct.handle)
+ get_stem_hindo(loctset->loct.handle, data)));
hindo = CALCULATE_HINDO(hindo, loctset->dic_freq.base, loctset->dic_freq.high, COMP_DIC_FREQ_DIV);
if (hindo == freq_org) {
psrhCache->storebuff[abIdx].current = current;
return hindo;
}
if (hindo < freq_org) {
if ((hindo > hindo_max) || ((hindo == hindo_max) && (current < hindo_data))) {
hindo_max = hindo;
hindo_data = current;
}
}
}
psrhCache->storebuff[abIdx].current = LOC_CURRENT_NO_ENTRY;
return -1;
}
static NJ_INT16 bdic_get_word_freq(NJ_UINT8 * data_top, NJ_SEARCH_LOCATION_SET * loctset,
NJ_SEARCH_CACHE * psrhCache, NJ_UINT16 abIdx)
{
NJ_UINT8 *data;
NJ_INT16 hindo = 0;
if (psrhCache->storebuff[abIdx].current != LOC_CURRENT_NO_ENTRY) {
data = data_top + psrhCache->storebuff[abIdx].top + psrhCache->storebuff[abIdx].current;
hindo = (NJ_INT16)*((NJ_UINT8 *)(HINDO_NO_TOP_ADDR(loctset->loct.handle)
+ get_stem_hindo(loctset->loct.handle, data)));
hindo = CALCULATE_HINDO(hindo, loctset->dic_freq.base, loctset->dic_freq.high, COMP_DIC_FREQ_DIV);
} else {
hindo = -1;
}
return hindo;
}