Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
M
mariadb
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
Analytics
Analytics
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Commits
Issue Boards
Open sidebar
Kirill Smelkov
mariadb
Commits
5c4b54f4
Commit
5c4b54f4
authored
Mar 22, 2004
by
bar@bar.intranet.mysql.r18.ru
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
uca-dump.c:
new file
parent
d82d09b6
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
258 additions
and
0 deletions
+258
-0
strings/uca-dump.c
strings/uca-dump.c
+258
-0
No files found.
strings/uca-dump.c
0 → 100644
View file @
5c4b54f4
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
typedef
unsigned
char
uchar
;
typedef
unsigned
short
uint16
;
struct
uca_item_st
{
uchar
num
;
uint16
weight
[
4
][
8
];
};
#if 1
#define MY_UCA_NPAGES 1024
#define MY_UCA_NCHARS 64
#define MY_UCA_CMASK 63
#define MY_UCA_PSHIFT 6
#else
#define MY_UCA_NPAGES 256
#define MY_UCA_NCHARS 256
#define MY_UCA_CMASK 255
#define MY_UCA_PSHIFT 8
#endif
int
main
(
int
ac
,
char
**
av
)
{
char
str
[
256
];
char
*
weights
[
64
];
struct
uca_item_st
uca
[
64
*
1024
];
size_t
code
,
page
,
w
;
int
pagemaxlen
[
MY_UCA_NPAGES
];
bzero
(
uca
,
sizeof
(
uca
));
while
(
fgets
(
str
,
sizeof
(
str
),
stdin
))
{
char
*
comment
;
char
*
weight
;
char
*
s
;
size_t
codenum
;
code
=
strtol
(
str
,
NULL
,
16
);
if
(
str
[
0
]
==
'#'
||
(
code
>
0xFFFF
))
continue
;
if
((
comment
=
strchr
(
str
,
'#'
)))
{
*
comment
++=
'\0'
;
for
(
;
*
comment
==
' '
;
comment
++
);
}
else
continue
;
if
((
weight
=
strchr
(
str
,
';'
)))
{
*
weight
++=
'\0'
;
for
(
;
*
weight
==
' '
;
weight
++
);
}
else
continue
;
codenum
=
0
;
s
=
strtok
(
str
,
"
\t
"
);
while
(
s
)
{
s
=
strtok
(
NULL
,
"
\t
"
);
codenum
++
;
}
if
(
codenum
>
1
)
{
/* Multi-character weight */
continue
;
}
uca
[
code
].
num
=
0
;
s
=
strtok
(
weight
,
" []"
);
while
(
s
)
{
weights
[
uca
[
code
].
num
]
=
s
;
s
=
strtok
(
NULL
,
" []"
);
uca
[
code
].
num
++
;
}
for
(
w
=
0
;
w
<
uca
[
code
].
num
;
w
++
)
{
size_t
partnum
;
partnum
=
0
;
s
=
weights
[
w
];
while
(
*
s
)
{
char
*
endptr
;
size_t
part
;
part
=
strtol
(
s
+
1
,
&
endptr
,
16
);
uca
[
code
].
weight
[
partnum
][
w
]
=
part
;
s
=
endptr
;
partnum
++
;
}
}
}
/* Now set implicit weights */
for
(
code
=
0
;
code
<=
0xFFFF
;
code
++
)
{
size_t
base
,
aaaa
,
bbbb
;
if
(
uca
[
code
].
num
)
continue
;
/*
3400;<CJK Ideograph Extension A, First>
4DB5;<CJK Ideograph Extension A, Last>
4E00;<CJK Ideograph, First>
9FA5;<CJK Ideograph, Last>
*/
if
(
code
>=
0x3400
&&
code
<=
0x4DB5
)
base
=
0xFB80
;
else
if
(
code
>=
0x4E00
&&
code
<=
0x9FA5
)
base
=
0xFB40
;
else
base
=
0xFBC0
;
aaaa
=
base
+
(
code
>>
15
);
bbbb
=
(
code
&
0x7FFF
)
|
0x8000
;
uca
[
code
].
weight
[
0
][
0
]
=
aaaa
;
uca
[
code
].
weight
[
0
][
1
]
=
bbbb
;
uca
[
code
].
weight
[
1
][
0
]
=
0x0020
;
uca
[
code
].
weight
[
1
][
1
]
=
0x0000
;
uca
[
code
].
weight
[
2
][
0
]
=
0x0002
;
uca
[
code
].
weight
[
2
][
1
]
=
0x0000
;
uca
[
code
].
weight
[
3
][
0
]
=
0x0001
;
uca
[
code
].
weight
[
3
][
2
]
=
0x0000
;
uca
[
code
].
num
=
2
;
}
printf
(
"#include
\"
my_uca.h
\"\n
"
);
printf
(
"#define MY_UCA_NPAGES %d
\n
"
,
MY_UCA_NPAGES
);
printf
(
"#define MY_UCA_NCHARS %d
\n
"
,
MY_UCA_NCHARS
);
printf
(
"#define MY_UCA_CMASK %d
\n
"
,
MY_UCA_CMASK
);
printf
(
"#define MY_UCA_PSHIFT %d
\n
"
,
MY_UCA_PSHIFT
);
for
(
w
=
0
;
w
<
1
;
w
++
)
{
for
(
page
=
0
;
page
<
MY_UCA_NPAGES
;
page
++
)
{
size_t
offs
;
size_t
maxnum
=
0
;
size_t
nchars
=
0
;
size_t
mchars
;
/*
Calculate maximum weight
length for this page
*/
for
(
offs
=
0
;
offs
<
MY_UCA_NCHARS
;
offs
++
)
{
size_t
i
,
num
;
code
=
page
*
MY_UCA_NCHARS
+
offs
;
/* Calculate only non-zero weights */
num
=
0
;
for
(
i
=
0
;
i
<
uca
[
code
].
num
;
i
++
)
if
(
uca
[
code
].
weight
[
w
][
i
])
num
++
;
maxnum
=
maxnum
<
num
?
num
:
maxnum
;
}
if
(
!
maxnum
)
maxnum
=
1
;
switch
(
maxnum
)
{
case
0
:
mchars
=
8
;
break
;
case
1
:
mchars
=
8
;
break
;
case
2
:
mchars
=
8
;
break
;
case
3
:
mchars
=
9
;
break
;
case
4
:
mchars
=
8
;
break
;
default:
mchars
=
uca
[
code
].
num
;
}
pagemaxlen
[
page
]
=
maxnum
;
printf
(
"uint16 page%03Xdata[]= { /* %04X (%d weights per char) */
\n
"
,
page
,
page
*
MY_UCA_NCHARS
,
maxnum
);
/*
Now print this page
*/
for
(
offs
=
0
;
offs
<
MY_UCA_NCHARS
;
offs
++
)
{
uint16
weight
[
8
];
size_t
num
,
i
;
code
=
page
*
MY_UCA_NCHARS
+
offs
;
bzero
(
weight
,
sizeof
(
weight
));
/* Copy non-zero weights */
for
(
num
=
0
,
i
=
0
;
i
<
uca
[
code
].
num
;
i
++
)
{
if
(
uca
[
code
].
weight
[
w
][
i
])
{
weight
[
num
]
=
uca
[
code
].
weight
[
w
][
i
];
num
++
;
}
}
for
(
i
=
0
;
i
<
maxnum
;
i
++
)
{
printf
(
"0x%04X"
,(
int
)
weight
[
i
]);
if
((
offs
+
1
!=
MY_UCA_NCHARS
)
||
(
i
+
1
!=
maxnum
))
printf
(
","
);
nchars
++
;
}
if
(
nchars
>=
mchars
)
{
printf
(
"
\n
"
);
nchars
=
0
;
}
else
{
printf
(
" "
);
}
}
printf
(
"};
\n\n
"
);
}
}
printf
(
"uchar ucal[%d]={
\n
"
,
MY_UCA_NPAGES
);
for
(
page
=
0
;
page
<
MY_UCA_NPAGES
;
page
++
)
{
printf
(
"%d%s%s"
,
pagemaxlen
[
page
],
page
<
MY_UCA_NPAGES
-
1
?
","
:
""
,(
page
+
1
)
%
16
?
""
:
"
\n
"
);
}
printf
(
"};
\n
"
);
printf
(
"uint16 *ucaw[%d]={
\n
"
,
MY_UCA_NPAGES
);
for
(
page
=
0
;
page
<
MY_UCA_NPAGES
;
page
++
)
{
printf
(
"page%03Xdata%s%s"
,
page
,
page
<
MY_UCA_NPAGES
-
1
?
","
:
""
,
(
page
+
1
)
%
4
?
""
:
"
\n
"
);
}
printf
(
"};
\n
"
);
printf
(
"int main(void){ return 0;};
\n
"
);
return
0
;
}
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment