4
0
mirror of git://sourceware.org/git/newlib-cygwin.git synced 2025-01-19 04:49:25 +08:00
Jeff Johnston 01e0a77749 2004-01-27 Artem B. Bityuckiy <abitytsky@softminecorp.com>
* configure.in: Add support to generate iconv converter flags
	for newlib.h
	* newlib.hin: Add iconv converter flags.
	* configure: Regenerated.
	* libc/Makefile.in: Ditto.
	* libc/configure.in: Moved iconv converter parsing logic to
	top level newlib configure.in.
	* libc/configure: Regenerated.
	* libc/iconv/Makefile.in: Ditto.
	* libc/iconv/README.TODO
	* libc/iconv/charset.aliases: Remove wrong BE aliases for
	UCS2/UCS4/UTF8.
	* libc/iconv/ccs/Makefile.am: Remove C flag setting now that
	newlib.h can be used.
	* libc/iconv/ces/Makefile.am: Ditto.
	* libc/iconv/lib/Makefile.am: Ditto.
	* libc/iconv/ccs/Makefile.in: Regenerated.
	* libc/iconv/ces/Makefile.in: Ditto.
	* libc/iconv/lib/Makefile.in: Ditto.
	* libc/iconv/ccs/README.CCS.SOURCES: Updated.
	* libc/iconv/ccs/iconv_mktbl: Don't write junk strings to binaries.
	* libc/iconv/ccs/big5.c: Switch to use new underscored flags
	defined in newlib.h.
	* libc/iconv/ccs/cns11643_plane1.c: Ditto.
	* libc/iconv/ccs/cns11643_plane14.c: Ditto.
	* libc/iconv/ccs/cns11643_plane2.c: Ditto.
	* libc/iconv/ccs/cp775.c: Ditto.
	* libc/iconv/ccs/cp850.c: Ditto.
	* libc/iconv/ccs/cp852.c: Ditto.
	* libc/iconv/ccs/cp855.c: Ditto.
	* libc/iconv/ccs/cp866.c: Ditto.
	* libc/iconv/ccs/gb_2312_80.c: Ditto.
	* libc/iconv/ccs/iso_8859_1.c: Ditto.
	* libc/iconv/ccs/iso_8859_15.c: Ditto.
	* libc/iconv/ccs/iso_8859_2.c: Ditto.
	* libc/iconv/ccs/iso_8859_4.c: Ditto.
	* libc/iconv/ccs/iso_8859_5.c: Ditto.
	* libc/iconv/ccs/jis_x0201.c: Ditto.
	* libc/iconv/ccs/jis_x0208_1983.c: Ditto.
	* libc/iconv/ccs/jis_x0212_1990.c: Ditto.
	* libc/iconv/ccs/koi8_r.c: Ditto.
	* libc/iconv/ccs/koi8_u.c: Ditto.
	* libc/iconv/ccs/ksx1001.c: Ditto.
	* libc/iconv/ccs/shift_jis.c: Ditto.
	* libc/iconv/ccs/us_ascii.c: Ditto.
	* libc/iconv/ccs/binary/big5.cct: Newly generated.
	* libc/iconv/ccs/binary/cns11643_plane1.cct: Ditto.
	* libc/iconv/ccs/binary/cns11643_plane14.cct: Ditto.
	* libc/iconv/ccs/binary/cns11643_plane2.cct: Ditto.
	* libc/iconv/ccs/binary/cp775.cct: Ditto.
	* libc/iconv/ccs/binary/cp850.cct: Ditto.
	* libc/iconv/ccs/binary/cp852.cct: Ditto.
	* libc/iconv/ccs/binary/cp855.cct: Ditto.
	* libc/iconv/ccs/binary/cp866.cct: Ditto.
	* libc/iconv/ccs/binary/gb_2312_80.cct: Ditto.
	* libc/iconv/ccs/binary/iso_8859_1.cct: Ditto.
	* libc/iconv/ccs/binary/iso_8859_15.cct: Ditto.
	* libc/iconv/ccs/binary/iso_8859_2.cct: Ditto.
	* libc/iconv/ccs/binary/iso_8859_4.cct: Ditto.
	* libc/iconv/ccs/binary/iso_8859_5.cct: Ditto.
	* libc/iconv/ccs/binary/jis_x0201.cct: Ditto.
	* libc/iconv/ccs/binary/jis_x0208_1983.cct: Ditto.
	* libc/iconv/ccs/binary/jis_x0212_1990.cct: Ditto.
	* libc/iconv/ccs/binary/koi8_r.cct: Ditto.
	* libc/iconv/ccs/binary/koi8_u.cct: Ditto.
	* libc/iconv/ccs/binary/ksx1001.cct: Ditto.
	* libc/iconv/ccs/binary/shift_jis.cct: Ditto.
	* libc/iconv/ccs/binary/us_ascii.cct: Ditto.
	* libc/iconv/lib/bialiasesi.c: Sync with charset.aliases.
	* libc/iconv/ces/euc-jp.c: Use newlib.h macros.
	* libc/iconv/ces/euc-kr.c: Ditto.
	* libc/iconv/ces/euc-tw.c: Ditto.
	* libc/iconv/ces/gb2312.c: Ditto.
	* libc/iconv/ces/iso-10646-ucs-2.c: Ditto.
	* libc/iconv/ces/iso-10646-ucs-4.c: Ditto.
	* libc/iconv/ces/ucs-2-internal.c: Ditto.
	* libc/iconv/ces/ucs-4-internal.c: Ditto.
	* libc/iconv/ces/utf-16.c: Ditto.
	* libc/iconv/ces/utf-8.c: Ditto.
	* libc/iconv/lib/aliases.c: Ditto.
	* libc/iconv/lib/biccs.c: Ditto.
	* libc/iconv/lib/bices.c: Ditto.
	* libc/iconv/lib/ccs.c: Ditto.
	* libc/iconv/lib/ces.c: Ditto.
	* libc/iconv/lib/ces_euc.c: Ditto.
	* libc/iconv/lib/ces_iso2022.c: Ditto.
	* libc/iconv/lib/ces_table.c: Ditto.
	* libc/iconv/lib/converter.c: Ditto.
	* libc/iconv/lib/deps.h: Ditto.
	* libc/iconv/lib/endian.h: Ditto.
	* libc/iconv/lib/iconv.c: Ditto.
	* libc/iconv/lib/loaddata.c: Ditto.
	* libc/iconv/lib/local.h: Include newlib.h.
	* libc/argz/Makefile.in: Regenerated.
	* libc/ctype/Makefile.in: Ditto.
	* libc/errno/Makefile.in: Ditto.
	* libc/iconv/ccs/binary/Makefile.in: Ditto.
	* libc/locale/Makefile.in: Ditto.
	* libc/misc/Makefile.in: Ditto.
	* libc/posix/Makefile.in: Ditto.
	* libc/reent/Makefile.in: Ditto.
	* libc/search/Makefile.in: Ditto.
	* libc/signal/Makefile.in: Ditto.
	* libc/stdio/Makefile.in: Ditto.
	* libc/stdio64/Makefile.in: Ditto.
	* libc/stdlib/Makefile.in: Ditto.
	* libc/string/Makefile.in: Ditto.
	* libc/syscalls/Makefile.in: Ditto.
	* libc/time/Makefile.in: Ditto.
	* libc/unix/Makefile.in: Ditto.
	* testsuite/newlib.iconv/iconv.exp: New file.
	* testsuite/newlib.iconv/iconvjp.c: Ditto.
	* testsuite/newlib.iconv/iconvnm.c: Ditto.
	* testsuite/newlib.iconv/iconvru.c: Ditto.
2004-01-27 23:26:26 +00:00

270 lines
7.5 KiB
Perl

#! /usr/bin/perl
#
# Copyright (c) 1999, 2000
# Konstantin Chuguev. All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
# 1. Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
# 2. Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in the
# documentation and/or other materials provided with the distribution.
#
# THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
# ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
# ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
# OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
# HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
# OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
# SUCH DAMAGE.
#
# iconv (Charset Conversion Library) v2.0
#
require 'getopts.pl';
use integer;
sub pack_hex {
"_$_[0](" . join(", ", map sprintf("0x%02X", $_), unpack('C4', $_[1]))
. ")";
}
sub pack_array {
my($size, $format, $array_ref) = @_;
return pack("$format$size", @$array_ref) unless $opt_C;
my($res, $i);
if ($format eq 'N') {
for ($i = 0; $i < $size; $i += 2) {
$res .= "\t"
. &pack_hex('1l', pack("N", $$array_ref[$i]))
. ", "
. &pack_hex('1l', pack("N", $$array_ref[$i+1]))
. ",\n";
}
$array_size += $size * 4;
} else {
for ($i = 0; $i < $size; $i += 4) {
$res .= "\t"
. &pack_hex('2s', pack("n2", $$array_ref[$i], $$array_ref[$i+1]))
. ", "
. &pack_hex('2s', pack("n2", $$array_ref[$i+2], $$array_ref[$i+3]))
. ",\n";
}
$array_size += $size * 2;
}
return $res;
}
# create an array of short/long values in network byte order
sub build_array {
my($size, $format, $default, $array_ref) = @_;
my($i);
for $i (0 .. $size-1) {
$$array_ref[$i] = $default unless defined($$array_ref[$i]);
}
return &pack_array($size, $format, $array_ref);
}
sub build_table1 {
my($size, $array_ref) = @_;
return &build_array($size, "n", 0xFFFE, $array_ref);
}
sub build_table2 {
my($size, $array_ref) = @_;
my($offset, $n, $i, @offs) = ($size * 4, 0);
for $i (0 .. $size-1) {
next unless defined($$array_ref[$i]);
$offs[$i] = $offset;
$offset += $size * 2;
}
my($data) = (&build_array($size, "N", 0, \@offs));
for $i (0 .. $size-1) {
next unless defined($$array_ref[$i]);
$n ++;
$data .= &build_table1($size, $$array_ref[$i]);
}
printf STDERR "%d subtables.\n", $n;
return $data;
}
$control0 = 0;
$control1 = 0;
$delete = 0;
@to_ucs;
@from_ucs;
# set a value in two charset conversion tables; update charset properties
# ($cs, $ucs) = (local charset code, Unicode)
#
sub set_val {
my($cs, $ucs) = @_;
return if $opt_a && $cs > 0x7F;
$to_ucs[$cs >> 8][$cs & 0xFF] = $ucs;
$from_ucs[$ucs >> 8][$ucs & 0xFF] = $cs;
if (($cs & 0x60) == 0) {
if($cs & 0x80) {
$control1 = 1;
} else {
$control0 = 1;
}
}
$delete = 1 if $cs == 0x7F;
if ($cs < 0x80) {
$_7bit = 1;
} elsif ($cs < 0x100) {
$_8bit = 1;
} elsif ($cs & 0x8080) {
$_16bit = 1;
} else {
$_14bit = 1;
}
}
# set a range of equal codes to charset conversion tables
#
sub set_range {
for (@_) {
&set_val($_, $_);
}
}
&Getopts('aCc:Mm:o:p:u:');
# ||| || | | +- u N: field number for Unicode character codes
# ||| || | +--- p str: prefix
# ||| || +----- o file: output file name
# ||| |+------- m file: character mnemonic table from RFC1345
# ||| +-------- M: Macintosh newline (<LF> only)
# ||+---------- c N: field number for charset character codes
# |+----------- C: make C source file
# +------------ a: ignore 8 bit (for ASCII)
$opt_c = 0 unless defined($opt_c);
$opt_p = '0x' unless defined($opt_p);
$opt_u = 1 unless defined($opt_u);
if ($opt_o) {
$opt_o =~ tr/-/_/;
open(STDOUT, ">$opt_o");
$opt_o =~ s/.c$//;
}
%map;
if ($opt_M) {
$/ = "\cM";
}
if ($opt_m) {
open(MAP, $opt_m);
while(<MAP>) {
chop;
next unless /^ [^ ]/;
next if 2 > split;
$map{$_[0]} = $_[1];
}
close(MAP);
local($code) = 0;
while (<>) {
chop;
s/^ *//;
if (/^&[a-z]/) {
split(' ', substr($_, 1));
if ($_[0] eq 'code') {
$code = $_[1];
}
} else {
foreach (split) {
&set_val($code, hex "0x$map{$_}") if $_ ne '??';
$code ++;
}
}
}
} else {
while (<>) {
s/[#\n].*//;
next if 2 > split; # too few fields
next if ($_[$opt_c] =~ s/^$opt_p/0x/o) != 1;
# local charset code prefix is invalid
&set_val(hex $_[$opt_c], hex $_[$opt_u]);
}
}
if (!$_16bit && !$_14bit) {
if ($_8bit) {
print STDERR "8bit charset";
if (!$control0) {
&set_range(0 .. 0x1F);
print STDERR "; control0 chars added";
}
if (!$control1) {
&set_range(0x80 .. 0x9F);
print STDERR "; control1 chars added";
}
if (!$delete) {
&set_range(0x7F);
print STDERR "; delete char added";
}
$nbits = 8;
$type = 1;
} else {
print STDERR "7bit charset";
$nbits = 7;
$type = 0;
}
print STDERR ".\n";
$to = &build_table1($_8bit ? 256 : 128, $to_ucs[0]);
} elsif ($_16bit) {
print STDERR "16bit charset";
if (!$_7bit && !$_8bit) {
&set_range(0 .. 0x7F);
print STDERR "; ASCII subset added";
} elsif (!$control0) {
&set_range(0 .. 0x1F);
print STDERR "; control0 chars added";
}
print STDERR ".\n";
$to = &build_table2(256, \@to_ucs);
$nbits = 16;
$type = 3;
} else {
print STDERR "14bit charset.\n";
$to = &build_table2(128, \@to_ucs);
$nbits = 14;
$type = 2;
}
$to_size = $opt_C ? $array_size : length($to);
$from = &build_table2(256, \@from_ucs);
if ($opt_C) {
die "-o option is mandatory with -C" unless $opt_o;
$opt_o =~ s/\.c$//;
$opt_o =~ tr/-/_/;
$name = $opt_o;
$name =~ tr/[a-z]/[A-Z]/;
print "#include \"..\/lib\/deps.h\"\n\n";
print "#ifdef _ICONV_CONVERTER_$name\n";
print "#include \"..\/lib\/endian.h\"\n\n";
print "_CONST unsigned char _iconv_ccs_table_$opt_o" . "[] = {\n";
print "\t3, 'C', 'S', 'C', 'T', ICONV_ORDER, $nbits, $type,\n";
print &pack_array(2, 'N', [8, 8 + $to_size]);
print $to;
print $from;
print "};\n\n";
print "#endif /* #ifdef _ICONV_CONVERTER_$name */\n\n";
} else {
print pack("A5CCCNN", "\003CSCT", 0, $nbits, $type, 8, 8 + $to_size);
print $to;
print $from;
}