Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
M
mariadb
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
Analytics
Analytics
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Commits
Issue Boards
Open sidebar
Kirill Smelkov
mariadb
Commits
8aa866d9
Commit
8aa866d9
authored
Mar 22, 2004
by
unknown
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
uca-dump.c:
new file
parent
fb5d4bb5
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
258 additions
and
0 deletions
+258
-0
strings/uca-dump.c
strings/uca-dump.c
+258
-0
No files found.
strings/uca-dump.c
0 → 100644
View file @
8aa866d9
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
/* Short aliases for the unsigned integer types used by the dump tool. */
typedef unsigned char uchar;
typedef unsigned short uint16;

/*
  Collation data collected for one code point.

  num    - number of collation elements stored for the character
  weight - weight[level][n] is the weight of the n-th collation
           element on the given level (4 levels, up to 8 elements)
*/
struct uca_item_st
{
  uchar num;
  uint16 weight[4][8];
};
/*
  Page geometry of the generated tables.

  The 0x0000..0xFFFF code range is cut into MY_UCA_NPAGES pages of
  MY_UCA_NCHARS characters each.  In both variants below
    MY_UCA_NPAGES * MY_UCA_NCHARS == 65536,
    MY_UCA_CMASK  == MY_UCA_NCHARS - 1,
    MY_UCA_NCHARS == 1 << MY_UCA_PSHIFT.
  main() emits one weight array per page and also prints these four
  values as #define lines into its output.

  "#if 1" selects the 1024 x 64 layout; change it to "#if 0" to get the
  256 x 256 layout instead.
*/
#if 1
#define MY_UCA_NPAGES 1024
#define MY_UCA_NCHARS 64
#define MY_UCA_CMASK 63
#define MY_UCA_PSHIFT 6
#else
#define MY_UCA_NPAGES 256
#define MY_UCA_NCHARS 256
#define MY_UCA_CMASK 255
#define MY_UCA_PSHIFT 8
#endif
int
main
(
int
ac
,
char
**
av
)
{
char
str
[
256
];
char
*
weights
[
64
];
struct
uca_item_st
uca
[
64
*
1024
];
size_t
code
,
page
,
w
;
int
pagemaxlen
[
MY_UCA_NPAGES
];
bzero
(
uca
,
sizeof
(
uca
));
while
(
fgets
(
str
,
sizeof
(
str
),
stdin
))
{
char
*
comment
;
char
*
weight
;
char
*
s
;
size_t
codenum
;
code
=
strtol
(
str
,
NULL
,
16
);
if
(
str
[
0
]
==
'#'
||
(
code
>
0xFFFF
))
continue
;
if
((
comment
=
strchr
(
str
,
'#'
)))
{
*
comment
++=
'\0'
;
for
(
;
*
comment
==
' '
;
comment
++
);
}
else
continue
;
if
((
weight
=
strchr
(
str
,
';'
)))
{
*
weight
++=
'\0'
;
for
(
;
*
weight
==
' '
;
weight
++
);
}
else
continue
;
codenum
=
0
;
s
=
strtok
(
str
,
"
\t
"
);
while
(
s
)
{
s
=
strtok
(
NULL
,
"
\t
"
);
codenum
++
;
}
if
(
codenum
>
1
)
{
/* Multi-character weight */
continue
;
}
uca
[
code
].
num
=
0
;
s
=
strtok
(
weight
,
" []"
);
while
(
s
)
{
weights
[
uca
[
code
].
num
]
=
s
;
s
=
strtok
(
NULL
,
" []"
);
uca
[
code
].
num
++
;
}
for
(
w
=
0
;
w
<
uca
[
code
].
num
;
w
++
)
{
size_t
partnum
;
partnum
=
0
;
s
=
weights
[
w
];
while
(
*
s
)
{
char
*
endptr
;
size_t
part
;
part
=
strtol
(
s
+
1
,
&
endptr
,
16
);
uca
[
code
].
weight
[
partnum
][
w
]
=
part
;
s
=
endptr
;
partnum
++
;
}
}
}
/* Now set implicit weights */
for
(
code
=
0
;
code
<=
0xFFFF
;
code
++
)
{
size_t
base
,
aaaa
,
bbbb
;
if
(
uca
[
code
].
num
)
continue
;
/*
3400;<CJK Ideograph Extension A, First>
4DB5;<CJK Ideograph Extension A, Last>
4E00;<CJK Ideograph, First>
9FA5;<CJK Ideograph, Last>
*/
if
(
code
>=
0x3400
&&
code
<=
0x4DB5
)
base
=
0xFB80
;
else
if
(
code
>=
0x4E00
&&
code
<=
0x9FA5
)
base
=
0xFB40
;
else
base
=
0xFBC0
;
aaaa
=
base
+
(
code
>>
15
);
bbbb
=
(
code
&
0x7FFF
)
|
0x8000
;
uca
[
code
].
weight
[
0
][
0
]
=
aaaa
;
uca
[
code
].
weight
[
0
][
1
]
=
bbbb
;
uca
[
code
].
weight
[
1
][
0
]
=
0x0020
;
uca
[
code
].
weight
[
1
][
1
]
=
0x0000
;
uca
[
code
].
weight
[
2
][
0
]
=
0x0002
;
uca
[
code
].
weight
[
2
][
1
]
=
0x0000
;
uca
[
code
].
weight
[
3
][
0
]
=
0x0001
;
uca
[
code
].
weight
[
3
][
2
]
=
0x0000
;
uca
[
code
].
num
=
2
;
}
printf
(
"#include
\"
my_uca.h
\"\n
"
);
printf
(
"#define MY_UCA_NPAGES %d
\n
"
,
MY_UCA_NPAGES
);
printf
(
"#define MY_UCA_NCHARS %d
\n
"
,
MY_UCA_NCHARS
);
printf
(
"#define MY_UCA_CMASK %d
\n
"
,
MY_UCA_CMASK
);
printf
(
"#define MY_UCA_PSHIFT %d
\n
"
,
MY_UCA_PSHIFT
);
for
(
w
=
0
;
w
<
1
;
w
++
)
{
for
(
page
=
0
;
page
<
MY_UCA_NPAGES
;
page
++
)
{
size_t
offs
;
size_t
maxnum
=
0
;
size_t
nchars
=
0
;
size_t
mchars
;
/*
Calculate maximum weight
length for this page
*/
for
(
offs
=
0
;
offs
<
MY_UCA_NCHARS
;
offs
++
)
{
size_t
i
,
num
;
code
=
page
*
MY_UCA_NCHARS
+
offs
;
/* Calculate only non-zero weights */
num
=
0
;
for
(
i
=
0
;
i
<
uca
[
code
].
num
;
i
++
)
if
(
uca
[
code
].
weight
[
w
][
i
])
num
++
;
maxnum
=
maxnum
<
num
?
num
:
maxnum
;
}
if
(
!
maxnum
)
maxnum
=
1
;
switch
(
maxnum
)
{
case
0
:
mchars
=
8
;
break
;
case
1
:
mchars
=
8
;
break
;
case
2
:
mchars
=
8
;
break
;
case
3
:
mchars
=
9
;
break
;
case
4
:
mchars
=
8
;
break
;
default:
mchars
=
uca
[
code
].
num
;
}
pagemaxlen
[
page
]
=
maxnum
;
printf
(
"uint16 page%03Xdata[]= { /* %04X (%d weights per char) */
\n
"
,
page
,
page
*
MY_UCA_NCHARS
,
maxnum
);
/*
Now print this page
*/
for
(
offs
=
0
;
offs
<
MY_UCA_NCHARS
;
offs
++
)
{
uint16
weight
[
8
];
size_t
num
,
i
;
code
=
page
*
MY_UCA_NCHARS
+
offs
;
bzero
(
weight
,
sizeof
(
weight
));
/* Copy non-zero weights */
for
(
num
=
0
,
i
=
0
;
i
<
uca
[
code
].
num
;
i
++
)
{
if
(
uca
[
code
].
weight
[
w
][
i
])
{
weight
[
num
]
=
uca
[
code
].
weight
[
w
][
i
];
num
++
;
}
}
for
(
i
=
0
;
i
<
maxnum
;
i
++
)
{
printf
(
"0x%04X"
,(
int
)
weight
[
i
]);
if
((
offs
+
1
!=
MY_UCA_NCHARS
)
||
(
i
+
1
!=
maxnum
))
printf
(
","
);
nchars
++
;
}
if
(
nchars
>=
mchars
)
{
printf
(
"
\n
"
);
nchars
=
0
;
}
else
{
printf
(
" "
);
}
}
printf
(
"};
\n\n
"
);
}
}
printf
(
"uchar ucal[%d]={
\n
"
,
MY_UCA_NPAGES
);
for
(
page
=
0
;
page
<
MY_UCA_NPAGES
;
page
++
)
{
printf
(
"%d%s%s"
,
pagemaxlen
[
page
],
page
<
MY_UCA_NPAGES
-
1
?
","
:
""
,(
page
+
1
)
%
16
?
""
:
"
\n
"
);
}
printf
(
"};
\n
"
);
printf
(
"uint16 *ucaw[%d]={
\n
"
,
MY_UCA_NPAGES
);
for
(
page
=
0
;
page
<
MY_UCA_NPAGES
;
page
++
)
{
printf
(
"page%03Xdata%s%s"
,
page
,
page
<
MY_UCA_NPAGES
-
1
?
","
:
""
,
(
page
+
1
)
%
4
?
""
:
"
\n
"
);
}
printf
(
"};
\n
"
);
printf
(
"int main(void){ return 0;};
\n
"
);
return
0
;
}
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment