do not unaccent Bengali characters (process like the Hindi ones)
This commit is contained in:
parent
6ec7f92938
commit
91dc09bc3c
5 changed files with 1604 additions and 1698 deletions
1647
src/unac/unac.c
1647
src/unac/unac.c
File diff suppressed because it is too large
Load diff
|
@ -35,7 +35,7 @@ extern "C" {
|
||||||
#define UNAC_BLOCK_SHIFT 3
|
#define UNAC_BLOCK_SHIFT 3
|
||||||
#define UNAC_BLOCK_MASK ((1 << UNAC_BLOCK_SHIFT) - 1)
|
#define UNAC_BLOCK_MASK ((1 << UNAC_BLOCK_SHIFT) - 1)
|
||||||
#define UNAC_BLOCK_SIZE (1 << UNAC_BLOCK_SHIFT)
|
#define UNAC_BLOCK_SIZE (1 << UNAC_BLOCK_SHIFT)
|
||||||
#define UNAC_BLOCK_COUNT 714
|
#define UNAC_BLOCK_COUNT 713
|
||||||
#define UNAC_INDEXES_SIZE (0x10000 >> UNAC_BLOCK_SHIFT)
|
#define UNAC_INDEXES_SIZE (0x10000 >> UNAC_BLOCK_SHIFT)
|
||||||
/* Generated by builder. Do not modify. End defines */
|
/* Generated by builder. Do not modify. End defines */
|
||||||
|
|
||||||
|
@ -893,7 +893,6 @@ extern unsigned short unac_data709[];
|
||||||
extern unsigned short unac_data710[];
|
extern unsigned short unac_data710[];
|
||||||
extern unsigned short unac_data711[];
|
extern unsigned short unac_data711[];
|
||||||
extern unsigned short unac_data712[];
|
extern unsigned short unac_data712[];
|
||||||
extern unsigned short unac_data713[];
|
|
||||||
/* Generated by builder. Do not modify. End declarations */
|
/* Generated by builder. Do not modify. End declarations */
|
||||||
|
|
||||||
#ifdef __cplusplus
|
#ifdef __cplusplus
|
||||||
|
|
|
@ -97,6 +97,8 @@ sub main {
|
||||||
# Hindi Devanagari
|
# Hindi Devanagari
|
||||||
&& !(hex $code_value >= 0x0900 && hex $code_value <= 0x097f)
|
&& !(hex $code_value >= 0x0900 && hex $code_value <= 0x097f)
|
||||||
&& !(hex $code_value >= 0xa8e0 && hex $code_value <= 0xa8ff)
|
&& !(hex $code_value >= 0xa8e0 && hex $code_value <= 0xa8ff)
|
||||||
|
# Bengali
|
||||||
|
&& !(hex $code_value >= 0x0980 && hex $code_value <= 0x09ff)
|
||||||
) {
|
) {
|
||||||
# If a decomposition exists, record it
|
# If a decomposition exists, record it
|
||||||
if($character_decomposition_mapping =~ /(<.*>)?\s*(.+)/) {
|
if($character_decomposition_mapping =~ /(<.*>)?\s*(.+)/) {
|
||||||
|
|
1647
unac/unac.c
1647
unac/unac.c
File diff suppressed because it is too large
Load diff
|
@ -35,7 +35,7 @@ extern "C" {
|
||||||
#define UNAC_BLOCK_SHIFT 3
|
#define UNAC_BLOCK_SHIFT 3
|
||||||
#define UNAC_BLOCK_MASK ((1 << UNAC_BLOCK_SHIFT) - 1)
|
#define UNAC_BLOCK_MASK ((1 << UNAC_BLOCK_SHIFT) - 1)
|
||||||
#define UNAC_BLOCK_SIZE (1 << UNAC_BLOCK_SHIFT)
|
#define UNAC_BLOCK_SIZE (1 << UNAC_BLOCK_SHIFT)
|
||||||
#define UNAC_BLOCK_COUNT 714
|
#define UNAC_BLOCK_COUNT 713
|
||||||
#define UNAC_INDEXES_SIZE (0x10000 >> UNAC_BLOCK_SHIFT)
|
#define UNAC_INDEXES_SIZE (0x10000 >> UNAC_BLOCK_SHIFT)
|
||||||
/* Generated by builder. Do not modify. End defines */
|
/* Generated by builder. Do not modify. End defines */
|
||||||
|
|
||||||
|
@ -893,7 +893,6 @@ extern unsigned short unac_data709[];
|
||||||
extern unsigned short unac_data710[];
|
extern unsigned short unac_data710[];
|
||||||
extern unsigned short unac_data711[];
|
extern unsigned short unac_data711[];
|
||||||
extern unsigned short unac_data712[];
|
extern unsigned short unac_data712[];
|
||||||
extern unsigned short unac_data713[];
|
|
||||||
/* Generated by builder. Do not modify. End declarations */
|
/* Generated by builder. Do not modify. End declarations */
|
||||||
|
|
||||||
#ifdef __cplusplus
|
#ifdef __cplusplus
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue