#define xzero(lvalue) ((void) memset (&(lvalue), '\0', sizeof (lvalue)))
+CHISE_Char_ID
+chise_char_id_parse_c_string (unsigned char *str, int len)
+{
+ int i = 0;
+
+ if ( (len >= 2) && (str[i++] == '?') )
+ {
+ unsigned char c = str[i++];
+ int counter;
+ CHISE_Char_ID cid;
+
+ if (c == '\\')
+ {
+ if (len < 3)
+ return -1;
+ c = str[i++];
+ if (c == '^')
+ {
+ if (len < 4)
+ return -1;
+ c = str[i++];
+ if (c == '?')
+ return 0x7F;
+ else
+ return c & (0x80 | 0x1F);
+ }
+ }
+ if ( c < 0xC0 )
+ {
+ cid = c;
+ counter = 0;
+ }
+ else if ( c < 0xE0 )
+ {
+ cid = c & 0x1f;
+ counter = 1;
+ }
+ else if ( c < 0xF0 )
+ {
+ cid = c & 0x0f;
+ counter = 2;
+ }
+ else if ( c < 0xF8 )
+ {
+ cid = c & 0x07;
+ counter = 3;
+ }
+ else if ( c < 0xFC )
+ {
+ cid = c & 0x03;
+ counter = 4;
+ }
+ else
+ {
+ cid = c & 0x01;
+ counter = 5;
+ }
+
+ if (counter + 2 <= len)
+ {
+ int j;
+
+ for (j = 0; j < counter; j++)
+ cid = (cid << 6) | (str[j + i] & 0x3F);
+ return cid;
+ }
+ }
+ return -1;
+}
int
chise_open_data_source (CHISE_DS *ds, CHISE_DS_Type type, char *location)
unsigned char *str
= (unsigned char *)chise_value_data (&valdatum);
int len = strnlen (str, chise_value_size (&valdatum));
- int i = 0;
-
- if ( (len >= 2) && (str[i++] == '?') )
- {
- unsigned char c = str[i++];
- int counter;
- CHISE_Char_ID cid;
-
- if (c == '\\')
- {
- if (len < 3)
- return -1;
- c = str[i++];
- if (c == '^')
- {
- if (len < 4)
- return -1;
- c = str[i++];
- if (c == '?')
- return 0x7F;
- else
- return c & (0x80 | 0x1F);
- }
- }
- if ( c < 0xC0 )
- {
- cid = c;
- counter = 0;
- }
- else if ( c < 0xE0 )
- {
- cid = c & 0x1f;
- counter = 1;
- }
- else if ( c < 0xF0 )
- {
- cid = c & 0x0f;
- counter = 2;
- }
- else if ( c < 0xF8 )
- {
- cid = c & 0x07;
- counter = 3;
- }
- else if ( c < 0xFC )
- {
- cid = c & 0x03;
- counter = 4;
- }
- else
- {
- cid = c & 0x01;
- counter = 5;
- }
- if (counter + 2 <= len)
- {
- int j;
-
- for (j = 0; j < counter; j++)
- cid = (cid << 6) | (str[j + i] & 0x3F);
- return cid;
- }
- }
+ return chise_char_id_parse_c_string (str, len);
}
return -1;
}
unsigned char key_buf[8];
key_buf[0] = '?';
- if (cid <= 0x7f)
+ if (cid == '\t')
+ {
+ key_buf[1] = '\\';
+ key_buf[2] = 't';
+ key_buf[3] = '\0';
+ }
+ else if (cid == '\n')
+ {
+ key_buf[1] = '\\';
+ key_buf[2] = 'n';
+ key_buf[3] = '\0';
+ }
+ else if (cid == '\r')
+ {
+ key_buf[1] = '\\';
+ key_buf[2] = 'r';
+ key_buf[3] = '\0';
+ }
+ else if (cid == 0x1C)
+ {
+ key_buf[1] = '\\';
+ key_buf[2] = '^';
+ key_buf[3] = '\\';
+ key_buf[4] = '\\';
+ key_buf[5] = '\0';
+ }
+ else if (cid <= 0x1F)
+ {
+ key_buf[1] = '\\';
+ key_buf[2] = '^';
+ key_buf[3] = '@' + cid;
+ key_buf[4] = '\0';
+ }
+ else if ( (cid == ' ') || (cid == '"') ||
+ (cid == '#') || (cid == '\'') ||
+ (cid == '(') || (cid == ')') ||
+ (cid == ',') || (cid == '.') ||
+ (cid == ';') || (cid == '?') ||
+ (cid == '[') || (cid == '\\') ||
+ (cid == ']') || (cid == '`') )
+ {
+ key_buf[1] = '\\';
+ key_buf[2] = cid;
+ key_buf[3] = '\0';
+ }
+ else if (cid <= 0x7E)
{
key_buf[1] = cid;
key_buf[2] = '\0';
}
- else if (cid <= 0x7ff)
+ else if (cid == 0x7F)
+ {
+ key_buf[1] = '\\';
+ key_buf[2] = '^';
+ key_buf[3] = '?';
+ key_buf[4] = '\0';
+ }
+ else if (cid <= 0x9F)
+ {
+ key_buf[1] = '\\';
+ key_buf[2] = '^';
+ key_buf[3] = ((cid + '@') >> 6) | 0xC0;
+ key_buf[4] = ((cid + '@') & 0x3F) | 0x80;
+ key_buf[5] = '\0';
+
+ }
+ else if (cid <= 0x7FF)
{
- key_buf[1] = (cid >> 6) | 0xc0;
- key_buf[2] = (cid & 0x3f) | 0x80;
+ key_buf[1] = (cid >> 6) | 0xC0;
+ key_buf[2] = (cid & 0x3F) | 0x80;
key_buf[3] = '\0';
}
- else if (cid <= 0xffff)
+ else if (cid <= 0xFFFF)
{
- key_buf[1] = (cid >> 12) | 0xe0;
- key_buf[2]= ((cid >> 6) & 0x3f) | 0x80;
- key_buf[3]= (cid & 0x3f) | 0x80;
+ key_buf[1] = (cid >> 12) | 0xE0;
+ key_buf[2]= ((cid >> 6) & 0x3F) | 0x80;
+ key_buf[3]= (cid & 0x3F) | 0x80;
key_buf[4] = '\0';
}
- else if (cid <= 0x1fffff)
+ else if (cid <= 0x1FFFFF)
{
- key_buf[1]= (cid >> 18) | 0xf0;
- key_buf[2]= ((cid >> 12) & 0x3f) | 0x80;
- key_buf[3]= ((cid >> 6) & 0x3f) | 0x80;
- key_buf[4]= (cid & 0x3f) | 0x80;
+ key_buf[1]= (cid >> 18) | 0xF0;
+ key_buf[2]= ((cid >> 12) & 0x3F) | 0x80;
+ key_buf[3]= ((cid >> 6) & 0x3F) | 0x80;
+ key_buf[4]= (cid & 0x3F) | 0x80;
key_buf[5] = '\0';
}
- else if (cid <= 0x3ffffff)
+ else if (cid <= 0x3FFFFFF)
{
- key_buf[1]= (cid >> 24) | 0xf8;
- key_buf[2]= ((cid >> 18) & 0x3f) | 0x80;
- key_buf[3]= ((cid >> 12) & 0x3f) | 0x80;
- key_buf[4]= ((cid >> 6) & 0x3f) | 0x80;
- key_buf[5]= (cid & 0x3f) | 0x80;
+ key_buf[1]= (cid >> 24) | 0xF8;
+ key_buf[2]= ((cid >> 18) & 0x3F) | 0x80;
+ key_buf[3]= ((cid >> 12) & 0x3F) | 0x80;
+ key_buf[4]= ((cid >> 6) & 0x3F) | 0x80;
+ key_buf[5]= (cid & 0x3F) | 0x80;
key_buf[6] = '\0';
}
else
{
- key_buf[1]= (cid >> 30) | 0xfc;
- key_buf[2]= ((cid >> 24) & 0x3f) | 0x80;
- key_buf[3]= ((cid >> 18) & 0x3f) | 0x80;
- key_buf[4]= ((cid >> 12) & 0x3f) | 0x80;
- key_buf[5]= ((cid >> 6) & 0x3f) | 0x80;
- key_buf[6]= (cid & 0x3f) | 0x80;
+ key_buf[1]= (cid >> 30) | 0xFC;
+ key_buf[2]= ((cid >> 24) & 0x3F) | 0x80;
+ key_buf[3]= ((cid >> 18) & 0x3F) | 0x80;
+ key_buf[4]= ((cid >> 12) & 0x3F) | 0x80;
+ key_buf[5]= ((cid >> 6) & 0x3F) | 0x80;
+ key_buf[6]= (cid & 0x3F) | 0x80;
key_buf[7] = '\0';
}
return
chise_get_attribute_table (db, key_buf, valdatum);
}
+void
+chise_ft_iterate (CHISE_Feature_Table *dbp,
+ int (*func) (CHISE_Feature_Table *db,
+ CHISE_Char_ID cid, CHISE_Value *valdatum))
+{
+ DBT keydatum, valdatum;
+ DBC *dbcp;
+ int status;
+
+ xzero (keydatum);
+ xzero (valdatum);
+
+ status = dbp->cursor (dbp, NULL, &dbcp, 0);
+ for (status = dbcp->c_get (dbcp, &keydatum, &valdatum, DB_FIRST);
+ status == 0;
+ status = dbcp->c_get (dbcp, &keydatum, &valdatum, DB_NEXT))
+ {
+ unsigned char *key_str = (unsigned char *)keydatum.data;
+ int key_len = strnlen (key_str, keydatum.size);
+ CHISE_Char_ID key = chise_char_id_parse_c_string (key_str, key_len);
+ int ret;
+
+ if (ret = func (dbp, key, &valdatum))
+ break;
+ }
+ dbcp->c_close (dbcp);
+}
int
chise_open_attribute_table (CHISE_Attribute_Table **db,