b4c522fabd
ChangeLog: * Makefile.def (target_modules): Add libphobos. (flags_to_pass): Add GDC, GDCFLAGS, GDC_FOR_TARGET and GDCFLAGS_FOR_TARGET. (dependencies): Make libphobos depend on libatomic, libbacktrace configure, and zlib configure. (language): Add language d. * Makefile.in: Rebuild. * Makefile.tpl (BUILD_EXPORTS): Add GDC and GDCFLAGS. (HOST_EXPORTS): Add GDC. (POSTSTAGE1_HOST_EXPORTS): Add GDC and GDC_FOR_BUILD. (BASE_TARGET_EXPORTS): Add GDC. (GDC_FOR_BUILD, GDC, GDCFLAGS): New variables. (GDC_FOR_TARGET, GDC_FLAGS_FOR_TARGET): New variables. (EXTRA_HOST_FLAGS): Add GDC. (STAGE1_FLAGS_TO_PASS): Add GDC. (EXTRA_TARGET_FLAGS): Add GDC and GDCFLAGS. * config-ml.in: Treat GDC and GDCFLAGS like other compiler/flag environment variables. * configure: Rebuild. * configure.ac: Add target-libphobos to target_libraries. Set and substitute GDC_FOR_BUILD and GDC_FOR_TARGET. config/ChangeLog: * multi.m4: Set GDC. gcc/ChangeLog: * Makefile.in (tm_d_file_list, tm_d_include_list): New variables. (TM_D_H, D_TARGET_DEF, D_TARGET_H, D_TARGET_OBJS): New variables. (tm_d.h, cs-tm_d.h, default-d.o): New rules. (d/d-target-hooks-def.h, s-d-target-hooks-def-h): New rules. (s-tm-texi): Also check timestamp on d-target.def. (generated_files): Add TM_D_H and d-target-hooks-def.h. (build/genhooks.o): Also depend on D_TARGET_DEF. * config.gcc (tm_d_file, d_target_objs, target_has_targetdm): New variables. * config/aarch64/aarch64-d.c: New file. * config/aarch64/aarch64-linux.h (GNU_USER_TARGET_D_CRITSEC_SIZE): Define. * config/aarch64/aarch64-protos.h (aarch64_d_target_versions): New prototype. * config/aarch64/aarch64.h (TARGET_D_CPU_VERSIONS): Define. * config/aarch64/t-aarch64 (aarch64-d.o): New rule. * config/arm/arm-d.c: New file. * config/arm/arm-protos.h (arm_d_target_versions): New prototype. * config/arm/arm.h (TARGET_D_CPU_VERSIONS): Define. * config/arm/linux-eabi.h (EXTRA_TARGET_D_OS_VERSIONS): Define. * config/arm/t-arm (arm-d.o): New rule. * config/default-d.c: New file. 
* config/glibc-d.c: New file. * config/gnu.h (GNU_USER_TARGET_D_OS_VERSIONS): Define. * config/i386/i386-d.c: New file. * config/i386/i386-protos.h (ix86_d_target_versions): New prototype. * config/i386/i386.h (TARGET_D_CPU_VERSIONS): Define. * config/i386/linux-common.h (EXTRA_TARGET_D_OS_VERSIONS): Define. (GNU_USER_TARGET_D_CRITSEC_SIZE): Define. * config/i386/t-i386 (i386-d.o): New rule. * config/kfreebsd-gnu.h (GNU_USER_TARGET_D_OS_VERSIONS): Define. * config/kopensolaris-gnu.h (GNU_USER_TARGET_D_OS_VERSIONS): Define. * config/linux-android.h (ANDROID_TARGET_D_OS_VERSIONS): Define. * config/linux.h (GNU_USER_TARGET_D_OS_VERSIONS): Define. * config/mips/linux-common.h (EXTRA_TARGET_D_OS_VERSIONS): Define. * config/mips/mips-d.c: New file. * config/mips/mips-protos.h (mips_d_target_versions): New prototype. * config/mips/mips.h (TARGET_D_CPU_VERSIONS): Define. * config/mips/t-mips (mips-d.o): New rule. * config/powerpcspe/linux.h (GNU_USER_TARGET_D_OS_VERSIONS): Define. * config/powerpcspe/linux64.h (GNU_USER_TARGET_D_OS_VERSIONS): Define. * config/powerpcspe/powerpcspe-d.c: New file. * config/powerpcspe/powerpcspe-protos.h (rs6000_d_target_versions): New prototype. * config/powerpcspe/powerpcspe.c (rs6000_output_function_epilogue): Support GNU D by using 0 as the language type. * config/powerpcspe/powerpcspe.h (TARGET_D_CPU_VERSIONS): Define. * config/powerpcspe/t-powerpcspe (powerpcspe-d.o): New rule. * config/riscv/riscv-d.c: New file. * config/riscv/riscv-protos.h (riscv_d_target_versions): New prototype. * config/riscv/riscv.h (TARGET_D_CPU_VERSIONS): Define. * config/riscv/t-riscv (riscv-d.o): New rule. * config/rs6000/linux.h (GNU_USER_TARGET_D_OS_VERSIONS): Define. * config/rs6000/linux64.h (GNU_USER_TARGET_D_OS_VERSIONS): Define. * config/rs6000/rs6000-d.c: New file. * config/rs6000/rs6000-protos.h (rs6000_d_target_versions): New prototype. * config/rs6000/rs6000.c (rs6000_output_function_epilogue): Support GNU D by using 0 as the language type. 
* config/rs6000/rs6000.h (TARGET_D_CPU_VERSIONS): Define. * config/rs6000/t-rs6000 (rs6000-d.o): New rule. * config/s390/s390-d.c: New file. * config/s390/s390-protos.h (s390_d_target_versions): New prototype. * config/s390/s390.h (TARGET_D_CPU_VERSIONS): Define. * config/s390/t-s390 (s390-d.o): New rule. * config/sparc/sparc-d.c: New file. * config/sparc/sparc-protos.h (sparc_d_target_versions): New prototype. * config/sparc/sparc.h (TARGET_D_CPU_VERSIONS): Define. * config/sparc/t-sparc (sparc-d.o): New rule. * config/t-glibc (glibc-d.o): New rule. * configure: Regenerated. * configure.ac (tm_d_file): New variable. (tm_d_file_list, tm_d_include_list, d_target_objs): Add substitutes. * doc/contrib.texi (Contributors): Add self for the D frontend. * doc/frontends.texi (G++ and GCC): Mention D as a supported language. * doc/install.texi (Configuration): Mention libphobos as an option for --enable-shared. Mention d as an option for --enable-languages. (Testing): Mention check-d as a target. * doc/invoke.texi (Overall Options): Mention .d, .dd, and .di as file name suffixes. Mention d as a -x option. * doc/sourcebuild.texi (Top Level): Mention libphobos. * doc/standards.texi (Standards): Add section on D language. * doc/tm.texi: Regenerated. * doc/tm.texi.in: Add @node for D language and ABI, and @hook for TARGET_CPU_VERSIONS, TARGET_D_OS_VERSIONS, and TARGET_D_CRITSEC_SIZE. * dwarf2out.c (is_dlang): New function. (gen_compile_unit_die): Use DW_LANG_D for D. (declare_in_namespace): Return module die for D, instead of adding extra declarations into the namespace. (gen_namespace_die): Generate DW_TAG_module for D. (gen_decl_die): Handle CONST_DECLSs for D. (dwarf2out_decl): Likewise. (prune_unused_types_walk_local_classes): Handle DW_tag_interface_type. (prune_unused_types_walk): Handle DW_tag_interface_type same as other kinds of aggregates. * gcc.c (default_compilers): Add entries for .d, .dd and .di. * genhooks.c: Include d/d-target.def. 
gcc/po/ChangeLog: * EXCLUDES: Add sources from d/dmd. gcc/testsuite/ChangeLog: * gcc.misc-tests/help.exp: Add D to option descriptions check. * gdc.dg/asan/asan.exp: New file. * gdc.dg/asan/gdc272.d: New test. * gdc.dg/compilable.d: New test. * gdc.dg/dg.exp: New file. * gdc.dg/gdc254.d: New test. * gdc.dg/gdc260.d: New test. * gdc.dg/gdc270a.d: New test. * gdc.dg/gdc270b.d: New test. * gdc.dg/gdc282.d: New test. * gdc.dg/gdc283.d: New test. * gdc.dg/imports/gdc170.d: New test. * gdc.dg/imports/gdc231.d: New test. * gdc.dg/imports/gdc239.d: New test. * gdc.dg/imports/gdc241a.d: New test. * gdc.dg/imports/gdc241b.d: New test. * gdc.dg/imports/gdc251a.d: New test. * gdc.dg/imports/gdc251b.d: New test. * gdc.dg/imports/gdc253.d: New test. * gdc.dg/imports/gdc254a.d: New test. * gdc.dg/imports/gdc256.d: New test. * gdc.dg/imports/gdc27.d: New test. * gdc.dg/imports/gdcpkg256/package.d: New test. * gdc.dg/imports/runnable.d: New test. * gdc.dg/link.d: New test. * gdc.dg/lto/lto.exp: New file. * gdc.dg/lto/ltotests_0.d: New test. * gdc.dg/lto/ltotests_1.d: New test. * gdc.dg/runnable.d: New test. * gdc.dg/simd.d: New test. * gdc.test/gdc-test.exp: New file. * lib/gdc-dg.exp: New file. * lib/gdc.exp: New file. libphobos/ChangeLog: * Makefile.am: New file. * Makefile.in: New file. * acinclude.m4: New file. * aclocal.m4: New file. * config.h.in: New file. * configure: New file. * configure.ac: New file. * d_rules.am: New file. * libdruntime/Makefile.am: New file. * libdruntime/Makefile.in: New file. * libdruntime/__entrypoint.di: New file. * libdruntime/__main.di: New file. * libdruntime/gcc/attribute.d: New file. * libdruntime/gcc/backtrace.d: New file. * libdruntime/gcc/builtins.d: New file. * libdruntime/gcc/config.d.in: New file. * libdruntime/gcc/deh.d: New file. * libdruntime/gcc/libbacktrace.d.in: New file. * libdruntime/gcc/unwind/arm.d: New file. * libdruntime/gcc/unwind/arm_common.d: New file. * libdruntime/gcc/unwind/c6x.d: New file. 
* libdruntime/gcc/unwind/generic.d: New file. * libdruntime/gcc/unwind/package.d: New file. * libdruntime/gcc/unwind/pe.d: New file. * m4/autoconf.m4: New file. * m4/druntime.m4: New file. * m4/druntime/cpu.m4: New file. * m4/druntime/libraries.m4: New file. * m4/druntime/os.m4: New file. * m4/gcc_support.m4: New file. * m4/gdc.m4: New file. * m4/libtool.m4: New file. * src/Makefile.am: New file. * src/Makefile.in: New file. * src/libgphobos.spec.in: New file. * testsuite/Makefile.am: New file. * testsuite/Makefile.in: New file. * testsuite/config/default.exp: New file. * testsuite/lib/libphobos-dg.exp: New file. * testsuite/lib/libphobos.exp: New file. * testsuite/testsuite_flags.in: New file. From-SVN: r265573
959 lines
24 KiB
D
959 lines
24 KiB
D
/**
 * This code handles decoding UTF strings for foreach_reverse loops.  There are
 * 6 combinations of conversions between char, wchar, and dchar, and 2 of each
 * of those.
 *
 * Copyright: Copyright Digital Mars 2004 - 2010.
 * License:   $(WEB www.boost.org/LICENSE_1_0.txt, Boost License 1.0).
 * Authors:   Walter Bright, Sean Kelly
 */
|
|
|
|
/*          Copyright Digital Mars 2004 - 2010.
 * Distributed under the Boost Software License, Version 1.0.
 *    (See accompanying file LICENSE or copy at
 *          http://www.boost.org/LICENSE_1_0.txt)
 */
|
|
module rt.aApplyR;
|
|
|
|
/* This code handles decoding UTF strings for foreach_reverse loops.
 * There are 6 combinations of conversions between char, wchar,
 * and dchar, and 2 of each of those.
 */
|
|
|
|
private import rt.util.utf;
|
|
|
|
/**********************************************/
|
|
/* 1 argument versions */
|
|
|
|
// dg is D, but _aApplyRcd() is C
|
|
/// Loop-body delegate used by the one-argument helpers in this file
/// (_aApplyRcd1 and friends).  Each helper calls it with a pointer to the
/// current element and stops iterating as soon as it returns non-zero.
extern (D) alias int delegate(void *) dg_t;
|
|
|
|
/**
 * Reverse iteration over a UTF-8 array yielding one dchar per code point.
 *
 * The array is walked from its last code unit towards its first.  A
 * multi-byte sequence is decoded backwards (trail bytes first, lead byte
 * last) and a pointer to the resulting code point is passed to `dg`.
 *
 * Malformed input is reported through onUnicodeError with the index of the
 * offending code unit: a trail byte with nothing in front of it, an ASCII
 * byte inside a sequence, more than three trail bytes, a lead byte whose
 * length marker does not match the number of trail bytes, or a value above
 * U+10FFFF.  Only the structure is checked; overlong forms are not rejected.
 *
 * Params:
 *  aa = UTF-8 code units to iterate over
 *  dg = loop body, called with a pointer to the decoded dchar
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRcd1(in char[] aa, dg_t dg)
{
    int result;

    debug(apply) printf("_aApplyRcd1(), len = %d\n", aa.length);
    for (size_t i = aa.length; i != 0; )
    {
        i--;
        dchar d = aa[i];
        if (d & 0x80)
        {
            char c = cast(char)d;
            uint j;             // bit position of the next 6-bit payload group
            uint m = 0x3F;      // lead-byte payload mask, narrowed once per trail byte
            d = 0;
            while ((c & 0xC0) != 0xC0)
            {
                // c has to be a trail byte (10xxxxxx) with at least one byte
                // in front of it, and a sequence holds at most three of them.
                // The last test also keeps the shift count below 32.
                if (i == 0 || (c & 0x80) == 0 || j == 18)
                    onUnicodeError("Invalid UTF-8 sequence", i);
                i--;
                d |= (c & 0x3F) << j;
                j += 6;
                m >>= 1;
                c = aa[i];
            }
            // The bits of the lead byte above its payload must read 1...10,
            // i.e. announce exactly the number of trail bytes consumed.
            immutable uint hdr = ~m & 0xFF;
            if ((c & hdr) != ((hdr << 1) & 0xFF))
                onUnicodeError("Invalid UTF-8 sequence", i);
            d |= (c & m) << j;
            if (d > 0x10FFFF)
                onUnicodeError("Invalid UTF-8 sequence", i);
        }
        result = dg(cast(void *)&d);
        if (result)
            break;
    }
    return result;
}
|
|
|
|
// foreach_reverse (dchar; char[]): code points must arrive last-to-first.
unittest
{
    debug(apply) printf("_aApplyRcd1.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable dchar[] wantAscii = "olleh"d;
    static immutable dchar[] wantMixed = ['b', '\U000A0456', '\u1234', 'a'];

    auto s = "hello"c[];
    int i;

    foreach_reverse (dchar d; s)
    {
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    // One-, three- and four-byte sequences mixed together.
    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (dchar d; s)
    {
        assert(i < wantMixed.length);
        assert(d == wantMixed[i]);
        i++;
    }
    assert(i == 4);
}
|
|
|
|
/*****************************/
|
|
|
|
/**
 * Reverse iteration over a UTF-16 array yielding one dchar per code point.
 *
 * The array is walked from its last code unit towards its first.  When a
 * low surrogate is met, the unit in front of it must be a high surrogate;
 * the pair is combined into a single code point.  A pointer to the code
 * point is passed to `dg`.
 *
 * Unpaired surrogates (a low surrogate without a preceding high surrogate,
 * or a high surrogate that is not followed by a low one) are reported
 * through onUnicodeError with the index of the offending code unit.
 *
 * Params:
 *  aa = UTF-16 code units to iterate over
 *  dg = loop body, called with a pointer to the decoded dchar
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRwd1(in wchar[] aa, dg_t dg)
{
    int result;

    debug(apply) printf("_aApplyRwd1(), len = %d\n", aa.length);
    for (size_t i = aa.length; i != 0; )
    {
        i--;
        dchar d = aa[i];
        if (d >= 0xDC00 && d <= 0xDFFF)
        {
            // Low surrogate: its partner is the unit just before it.
            if (i == 0)
                onUnicodeError("Invalid UTF-16 sequence", 0);
            i--;
            immutable wchar hi = aa[i];
            if (hi < 0xD800 || hi > 0xDBFF)
                onUnicodeError("Invalid UTF-16 sequence", i);
            // 0xD7C0 == 0xD800 - (0x10000 >> 10): folds the +0x10000 bias in.
            d = ((hi - 0xD7C0) << 10) + (d - 0xDC00);
        }
        else if (d >= 0xD800 && d <= 0xDBFF)
        {
            // High surrogate that was not consumed as part of a pair.
            onUnicodeError("Invalid UTF-16 sequence", i);
        }
        result = dg(cast(void *)&d);
        if (result)
            break;
    }
    return result;
}
|
|
|
|
// foreach_reverse (dchar; wchar[]): surrogate pairs collapse to one code point.
unittest
{
    debug(apply) printf("_aApplyRwd1.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable dchar[] wantAscii = "olleh"d;
    static immutable dchar[] wantMixed = ['b', '\U000A0456', '\u1234', 'a'];

    auto s = "hello"w[];
    int i;

    foreach_reverse (dchar d; s)
    {
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    // BMP characters plus one supplementary-plane character.
    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (dchar d; s)
    {
        assert(i < wantMixed.length);
        assert(d == wantMixed[i]);
        i++;
    }
    assert(i == 4);
}
|
|
|
|
/*****************************/
|
|
|
|
/**
 * Reverse iteration over a UTF-8 array yielding UTF-16 code units.
 *
 * The array is walked from its last code unit towards its first and each
 * code point is decoded backwards.  Code points up to U+FFFF are passed to
 * `dg` as one wchar; larger ones are passed as two calls, high surrogate
 * first and low surrogate second.
 *
 * Malformed input is reported through onUnicodeError with the index of the
 * offending code unit: a trail byte with nothing in front of it, an ASCII
 * byte inside a sequence, more than three trail bytes, a lead byte whose
 * length marker does not match the number of trail bytes, or a value above
 * U+10FFFF.  Only the structure is checked; overlong forms are not rejected.
 *
 * Params:
 *  aa = UTF-8 code units to iterate over
 *  dg = loop body, called with a pointer to a wchar
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRcw1(in char[] aa, dg_t dg)
{
    int result;

    debug(apply) printf("_aApplyRcw1(), len = %d\n", aa.length);
    for (size_t i = aa.length; i != 0; )
    {
        i--;
        wchar w = aa[i];
        if (w & 0x80)
        {
            char c = cast(char)w;
            uint j;             // bit position of the next 6-bit payload group
            uint m = 0x3F;      // lead-byte payload mask, narrowed once per trail byte
            dchar d = 0;
            while ((c & 0xC0) != 0xC0)
            {
                // c has to be a trail byte (10xxxxxx) with at least one byte
                // in front of it, and a sequence holds at most three of them.
                // The last test also keeps the shift count below 32.
                if (i == 0 || (c & 0x80) == 0 || j == 18)
                    onUnicodeError("Invalid UTF-8 sequence", i);
                i--;
                d |= (c & 0x3F) << j;
                j += 6;
                m >>= 1;
                c = aa[i];
            }
            // The bits of the lead byte above its payload must read 1...10,
            // i.e. announce exactly the number of trail bytes consumed.
            immutable uint hdr = ~m & 0xFF;
            if ((c & hdr) != ((hdr << 1) & 0xFF))
                onUnicodeError("Invalid UTF-8 sequence", i);
            d |= (c & m) << j;
            if (d > 0x10FFFF)
                onUnicodeError("Invalid UTF-8 sequence", i);

            if (d <= 0xFFFF)
                w = cast(wchar) d;
            else
            {
                // Needs a surrogate pair: deliver the high half now, the low
                // half through the common call below.
                w = cast(wchar) ((((d - 0x10000) >> 10) & 0x3FF) + 0xD800);
                result = dg(cast(void *)&w);
                if (result)
                    break;
                w = cast(wchar) (((d - 0x10000) & 0x3FF) + 0xDC00);
            }
        }
        result = dg(cast(void *)&w);
        if (result)
            break;
    }
    return result;
}
|
|
|
|
// foreach_reverse (wchar; char[]): a 4-byte sequence arrives as a surrogate pair.
unittest
{
    debug(apply) printf("_aApplyRcw1.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable wchar[] wantAscii = "olleh"w;
    static immutable wchar[] wantMixed = ['b', 0xDA41, 0xDC56, 0x1234, 'a'];

    auto s = "hello"c[];
    int i;

    foreach_reverse (wchar d; s)
    {
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    // U+A0456 is delivered as high surrogate, then low surrogate.
    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (wchar d; s)
    {
        assert(i < wantMixed.length);
        assert(d == wantMixed[i]);
        i++;
    }
    assert(i == 5);
}
|
|
|
|
/*****************************/
|
|
|
|
/**
 * Reverse iteration over a UTF-16 array yielding UTF-8 code units.
 *
 * The array is walked from its last code unit towards its first.  Each code
 * point (a surrogate pair counts as one) is re-encoded with toUTF8 and its
 * bytes are passed to `dg` one call at a time, lead byte first.
 *
 * Unpaired surrogates (a low surrogate without a preceding high surrogate,
 * or a high surrogate that is not followed by a low one) are reported
 * through onUnicodeError with the index of the offending code unit.
 *
 * Params:
 *  aa = UTF-16 code units to iterate over
 *  dg = loop body, called with a pointer to a char
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRwc1(in wchar[] aa, dg_t dg)
{
    int result;

    debug(apply) printf("_aApplyRwc1(), len = %d\n", aa.length);
    for (size_t i = aa.length; i != 0; )
    {
        i--;
        dchar d = aa[i];
        if (d >= 0xDC00 && d <= 0xDFFF)
        {
            // Low surrogate: its partner is the unit just before it.
            if (i == 0)
                onUnicodeError("Invalid UTF-16 sequence", 0);
            i--;
            immutable wchar hi = aa[i];
            if (hi < 0xD800 || hi > 0xDBFF)
                onUnicodeError("Invalid UTF-16 sequence", i);
            // 0xD7C0 == 0xD800 - (0x10000 >> 10): folds the +0x10000 bias in.
            d = ((hi - 0xD7C0) << 10) + (d - 0xDC00);
        }
        else if (d >= 0xD800 && d <= 0xDBFF)
        {
            // High surrogate that was not consumed as part of a pair.
            onUnicodeError("Invalid UTF-16 sequence", i);
        }

        if (d & ~0x7F)
        {
            // Non-ASCII: hand out every byte of the UTF-8 encoding.
            char[4] buf;

            auto b = toUTF8(buf, d);
            foreach (char c2; b)
            {
                result = dg(cast(void *)&c2);
                if (result)
                    return result;
            }
            continue;
        }
        char c = cast(char)d;
        result = dg(cast(void *)&c);
        if (result)
            break;
    }
    return result;
}
|
|
|
|
// foreach_reverse (char; wchar[]): each code point arrives as its UTF-8 bytes.
unittest
{
    debug(apply) printf("_aApplyRwc1.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable char[] wantAscii = "olleh";
    static immutable char[] wantMixed =
        ['b', 0xF2, 0xA0, 0x91, 0x96, 0xE1, 0x88, 0xB4, 'a'];

    auto s = "hello"w[];
    int i;

    foreach_reverse (char d; s)
    {
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    // Characters are visited back to front, but the bytes of each one
    // come out lead byte first.
    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (char d; s)
    {
        assert(i < wantMixed.length);
        assert(d == wantMixed[i]);
        i++;
    }
    assert(i == 9);
}
|
|
|
|
/*****************************/
|
|
|
|
/**
 * Reverse iteration over a UTF-32 array yielding UTF-8 code units.
 *
 * Elements are visited from last to first.  An element below 0x80 is passed
 * to `dg` as a single char; any other element is encoded with toUTF8 and its
 * bytes are passed one call at a time, lead byte first.
 *
 * Params:
 *  aa = code points to iterate over
 *  dg = loop body, called with a pointer to a char
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRdc1(in dchar[] aa, dg_t dg)
{
    debug(apply) printf("_aApplyRdc1(), len = %d\n", aa.length);

    int status;
    size_t pos = aa.length;
    while (pos != 0)
    {
        pos--;
        dchar cp = aa[pos];

        if ((cp & ~0x7F) == 0)
        {
            // Plain ASCII: one code unit.
            char unit = cast(char)cp;
            status = dg(cast(void *)&unit);
            if (status != 0)
                return status;
        }
        else
        {
            char[4] storage;
            auto encoded = toUTF8(storage, cp);
            foreach (char unit; encoded)
            {
                status = dg(cast(void *)&unit);
                if (status != 0)
                    return status;
            }
        }
    }
    return status;
}
|
|
|
|
// foreach_reverse (char; dchar[]): each code point arrives as its UTF-8 bytes.
unittest
{
    debug(apply) printf("_aApplyRdc1.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable char[] wantAscii = "olleh";
    static immutable char[] wantMixed =
        ['b', 0xF2, 0xA0, 0x91, 0x96, 0xE1, 0x88, 0xB4, 'a'];

    auto s = "hello"d[];
    int i;

    foreach_reverse (char d; s)
    {
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    // Characters are visited back to front, but the bytes of each one
    // come out lead byte first.
    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (char d; s)
    {
        assert(i < wantMixed.length);
        assert(d == wantMixed[i]);
        i++;
    }
    assert(i == 9);
}
|
|
|
|
/*****************************/
|
|
|
|
/**
 * Reverse iteration over a UTF-32 array yielding UTF-16 code units.
 *
 * Elements are visited from last to first.  An element up to 0xFFFF is
 * passed to `dg` as one wchar; a larger one is split into a surrogate pair
 * and passed as two calls, high surrogate first.
 *
 * Params:
 *  aa = code points to iterate over
 *  dg = loop body, called with a pointer to a wchar
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRdw1(in dchar[] aa, dg_t dg)
{
    debug(apply) printf("_aApplyRdw1(), len = %d\n", aa.length);

    int status;
    size_t pos = aa.length;
    while (pos != 0)
    {
        pos--;
        dchar cp = aa[pos];
        wchar unit;

        if (cp > 0xFFFF)
        {
            immutable uint offset = cp - 0x10000;

            // High surrogate goes out first ...
            unit = cast(wchar) (((offset >> 10) & 0x3FF) + 0xD800);
            status = dg(cast(void *)&unit);
            if (status != 0)
                return status;
            // ... the low one through the shared call below.
            unit = cast(wchar) ((offset & 0x3FF) + 0xDC00);
        }
        else
        {
            unit = cast(wchar) cp;
        }

        status = dg(cast(void *)&unit);
        if (status != 0)
            return status;
    }
    return status;
}
|
|
|
|
// foreach_reverse (wchar; dchar[]): supplementary characters become pairs.
unittest
{
    debug(apply) printf("_aApplyRdw1.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable wchar[] wantAscii = "olleh"w;
    static immutable wchar[] wantMixed = ['b', 0xDA41, 0xDC56, 0x1234, 'a'];

    auto s = "hello"d[];
    int i;

    foreach_reverse (wchar d; s)
    {
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    // U+A0456 is delivered as high surrogate, then low surrogate.
    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (wchar d; s)
    {
        assert(i < wantMixed.length);
        assert(d == wantMixed[i]);
        i++;
    }
    assert(i == 5);
}
|
|
|
|
|
|
/****************************************************************************/
|
|
/* 2 argument versions */
|
|
|
|
// dg is D, but _aApplyRcd2() is C
|
|
/// Loop-body delegate used by the two-argument helpers in this file
/// (_aApplyRcd2 and friends).  Each helper calls it with a pointer to its
/// size_t position in the source array and a pointer to the current element,
/// and stops iterating as soon as it returns non-zero.
extern (D) alias int delegate(void *, void *) dg2_t;
|
|
|
|
/**
 * Reverse iteration over a UTF-8 array yielding index and dchar.
 *
 * The array is walked from its last code unit towards its first.  A
 * multi-byte sequence is decoded backwards (trail bytes first, lead byte
 * last).  `dg` receives a pointer to the index of the sequence's first code
 * unit and a pointer to the decoded code point.
 *
 * Malformed input is reported through onUnicodeError with the index of the
 * offending code unit: a trail byte with nothing in front of it, an ASCII
 * byte inside a sequence, more than three trail bytes, a lead byte whose
 * length marker does not match the number of trail bytes, or a value above
 * U+10FFFF.  Only the structure is checked; overlong forms are not rejected.
 *
 * Params:
 *  aa = UTF-8 code units to iterate over
 *  dg = loop body, called with pointers to the index and the decoded dchar
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRcd2(in char[] aa, dg2_t dg)
{
    int result;
    size_t len = aa.length;

    debug(apply) printf("_aApplyRcd2(), len = %d\n", len);
    for (size_t i = len; i != 0; )
    {
        i--;
        dchar d = aa[i];
        if (d & 0x80)
        {
            char c = cast(char)d;
            uint j;             // bit position of the next 6-bit payload group
            uint m = 0x3F;      // lead-byte payload mask, narrowed once per trail byte
            d = 0;
            while ((c & 0xC0) != 0xC0)
            {
                // c has to be a trail byte (10xxxxxx) with at least one byte
                // in front of it, and a sequence holds at most three of them.
                // The last test also keeps the shift count below 32.
                if (i == 0 || (c & 0x80) == 0 || j == 18)
                    onUnicodeError("Invalid UTF-8 sequence", i);
                i--;
                d |= (c & 0x3F) << j;
                j += 6;
                m >>= 1;
                c = aa[i];
            }
            // The bits of the lead byte above its payload must read 1...10,
            // i.e. announce exactly the number of trail bytes consumed.
            immutable uint hdr = ~m & 0xFF;
            if ((c & hdr) != ((hdr << 1) & 0xFF))
                onUnicodeError("Invalid UTF-8 sequence", i);
            d |= (c & m) << j;
            if (d > 0x10FFFF)
                onUnicodeError("Invalid UTF-8 sequence", i);
        }
        result = dg(&i, cast(void *)&d);
        if (result)
            break;
    }
    return result;
}
|
|
|
|
// foreach_reverse (k, dchar; char[]): k is the index of each lead byte.
unittest
{
    debug(apply) printf("_aApplyRcd2.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable dchar[]  wantAscii = "olleh"d;
    static immutable dchar[]  wantMixed = ['b', '\U000A0456', '\u1234', 'a'];
    static immutable size_t[] wantIndex = [8, 4, 1, 0];

    auto s = "hello"c[];
    int i;

    foreach_reverse (k, dchar d; s)
    {
        assert(k == 4 - i);
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (k, dchar d; s)
    {
        assert(i < wantMixed.length);
        assert(d == wantMixed[i]);
        assert(k == wantIndex[i]);
        i++;
    }
    assert(i == 4);
}
|
|
|
|
/*****************************/
|
|
|
|
/**
 * Reverse iteration over a UTF-16 array yielding index and dchar.
 *
 * The array is walked from its last code unit towards its first.  When a
 * low surrogate is met, the unit in front of it must be a high surrogate;
 * the pair is combined into a single code point.  `dg` receives a pointer
 * to the index of the code point's first code unit and a pointer to the
 * code point.
 *
 * Unpaired surrogates (a low surrogate without a preceding high surrogate,
 * or a high surrogate that is not followed by a low one) are reported
 * through onUnicodeError with the index of the offending code unit.
 *
 * Params:
 *  aa = UTF-16 code units to iterate over
 *  dg = loop body, called with pointers to the index and the decoded dchar
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRwd2(in wchar[] aa, dg2_t dg)
{
    int result;

    debug(apply) printf("_aApplyRwd2(), len = %d\n", aa.length);
    for (size_t i = aa.length; i != 0; )
    {
        i--;
        dchar d = aa[i];
        if (d >= 0xDC00 && d <= 0xDFFF)
        {
            // Low surrogate: its partner is the unit just before it.
            if (i == 0)
                onUnicodeError("Invalid UTF-16 sequence", 0);
            i--;
            immutable wchar hi = aa[i];
            if (hi < 0xD800 || hi > 0xDBFF)
                onUnicodeError("Invalid UTF-16 sequence", i);
            // 0xD7C0 == 0xD800 - (0x10000 >> 10): folds the +0x10000 bias in.
            d = ((hi - 0xD7C0) << 10) + (d - 0xDC00);
        }
        else if (d >= 0xD800 && d <= 0xDBFF)
        {
            // High surrogate that was not consumed as part of a pair.
            onUnicodeError("Invalid UTF-16 sequence", i);
        }
        result = dg(&i, cast(void *)&d);
        if (result)
            break;
    }
    return result;
}
|
|
|
|
// foreach_reverse (k, dchar; wchar[]): k is the index of each first code unit.
unittest
{
    debug(apply) printf("_aApplyRwd2.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable dchar[]  wantAscii = "olleh"d;
    static immutable dchar[]  wantMixed = ['b', '\U000A0456', '\u1234', 'a'];
    static immutable size_t[] wantIndex = [4, 2, 1, 0];

    auto s = "hello"w[];
    int i;

    foreach_reverse (k, dchar d; s)
    {
        assert(k == 4 - i);
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (k, dchar d; s)
    {
        assert(i < wantMixed.length);
        assert(k == wantIndex[i]);
        assert(d == wantMixed[i]);
        i++;
    }
    assert(i == 4);
}
|
|
|
|
/*****************************/
|
|
|
|
/**
 * Reverse iteration over a UTF-8 array yielding index and UTF-16 code units.
 *
 * The array is walked from its last code unit towards its first and each
 * code point is decoded backwards.  Code points up to U+FFFF are passed to
 * `dg` as one wchar; larger ones are passed as two calls, high surrogate
 * first and low surrogate second.  Every call also receives a pointer to
 * the index of the sequence's first code unit.
 *
 * Malformed input is reported through onUnicodeError with the index of the
 * offending code unit: a trail byte with nothing in front of it, an ASCII
 * byte inside a sequence, more than three trail bytes, a lead byte whose
 * length marker does not match the number of trail bytes, or a value above
 * U+10FFFF.  Only the structure is checked; overlong forms are not rejected.
 *
 * Params:
 *  aa = UTF-8 code units to iterate over
 *  dg = loop body, called with pointers to the index and a wchar
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRcw2(in char[] aa, dg2_t dg)
{
    int result;

    debug(apply) printf("_aApplyRcw2(), len = %d\n", aa.length);
    for (size_t i = aa.length; i != 0; )
    {
        i--;
        wchar w = aa[i];
        if (w & 0x80)
        {
            char c = cast(char)w;
            uint j;             // bit position of the next 6-bit payload group
            uint m = 0x3F;      // lead-byte payload mask, narrowed once per trail byte
            dchar d = 0;
            while ((c & 0xC0) != 0xC0)
            {
                // c has to be a trail byte (10xxxxxx) with at least one byte
                // in front of it, and a sequence holds at most three of them.
                // The last test also keeps the shift count below 32.
                if (i == 0 || (c & 0x80) == 0 || j == 18)
                    onUnicodeError("Invalid UTF-8 sequence", i);
                i--;
                d |= (c & 0x3F) << j;
                j += 6;
                m >>= 1;
                c = aa[i];
            }
            // The bits of the lead byte above its payload must read 1...10,
            // i.e. announce exactly the number of trail bytes consumed.
            immutable uint hdr = ~m & 0xFF;
            if ((c & hdr) != ((hdr << 1) & 0xFF))
                onUnicodeError("Invalid UTF-8 sequence", i);
            d |= (c & m) << j;
            if (d > 0x10FFFF)
                onUnicodeError("Invalid UTF-8 sequence", i);

            if (d <= 0xFFFF)
                w = cast(wchar) d;
            else
            {
                // Needs a surrogate pair: deliver the high half now, the low
                // half through the common call below.
                w = cast(wchar) ((((d - 0x10000) >> 10) & 0x3FF) + 0xD800);
                result = dg(&i, cast(void *)&w);
                if (result)
                    break;
                w = cast(wchar) (((d - 0x10000) & 0x3FF) + 0xDC00);
            }
        }
        result = dg(&i, cast(void *)&w);
        if (result)
            break;
    }
    return result;
}
|
|
|
|
// foreach_reverse (k, wchar; char[]): both surrogates report the same index.
unittest
{
    debug(apply) printf("_aApplyRcw2.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable wchar[]  wantAscii = "olleh"w;
    static immutable wchar[]  wantMixed = ['b', 0xDA41, 0xDC56, 0x1234, 'a'];
    static immutable size_t[] wantIndex = [8, 4, 4, 1, 0];

    auto s = "hello"c[];
    int i;

    foreach_reverse (k, wchar d; s)
    {
        assert(k == 4 - i);
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (k, wchar d; s)
    {
        assert(i < wantMixed.length);
        assert(k == wantIndex[i]);
        assert(d == wantMixed[i]);
        i++;
    }
    assert(i == 5);
}
|
|
|
|
/*****************************/
|
|
|
|
/**
 * Reverse iteration over a UTF-16 array yielding index and UTF-8 code units.
 *
 * The array is walked from its last code unit towards its first.  Each code
 * point (a surrogate pair counts as one) is re-encoded with toUTF8 and its
 * bytes are passed to `dg` one call at a time, lead byte first.  Every call
 * also receives a pointer to the index of the code point's first code unit.
 *
 * Unpaired surrogates (a low surrogate without a preceding high surrogate,
 * or a high surrogate that is not followed by a low one) are reported
 * through onUnicodeError with the index of the offending code unit.
 *
 * Params:
 *  aa = UTF-16 code units to iterate over
 *  dg = loop body, called with pointers to the index and a char
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRwc2(in wchar[] aa, dg2_t dg)
{
    int result;

    debug(apply) printf("_aApplyRwc2(), len = %d\n", aa.length);
    for (size_t i = aa.length; i != 0; )
    {
        i--;
        dchar d = aa[i];
        if (d >= 0xDC00 && d <= 0xDFFF)
        {
            // Low surrogate: its partner is the unit just before it.
            if (i == 0)
                onUnicodeError("Invalid UTF-16 sequence", 0);
            i--;
            immutable wchar hi = aa[i];
            if (hi < 0xD800 || hi > 0xDBFF)
                onUnicodeError("Invalid UTF-16 sequence", i);
            // 0xD7C0 == 0xD800 - (0x10000 >> 10): folds the +0x10000 bias in.
            d = ((hi - 0xD7C0) << 10) + (d - 0xDC00);
        }
        else if (d >= 0xD800 && d <= 0xDBFF)
        {
            // High surrogate that was not consumed as part of a pair.
            onUnicodeError("Invalid UTF-16 sequence", i);
        }

        if (d & ~0x7F)
        {
            // Non-ASCII: hand out every byte of the UTF-8 encoding.
            char[4] buf;

            auto b = toUTF8(buf, d);
            foreach (char c2; b)
            {
                result = dg(&i, cast(void *)&c2);
                if (result)
                    return result;
            }
            continue;
        }
        char c = cast(char)d;
        result = dg(&i, cast(void *)&c);
        if (result)
            break;
    }
    return result;
}
|
|
|
|
// foreach_reverse (k, char; wchar[]): all bytes of a character share one index.
unittest
{
    debug(apply) printf("_aApplyRwc2.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable char[]   wantAscii = "olleh";
    static immutable char[]   wantMixed =
        ['b', 0xF2, 0xA0, 0x91, 0x96, 0xE1, 0x88, 0xB4, 'a'];
    static immutable size_t[] wantIndex = [4, 2, 2, 2, 2, 1, 1, 1, 0];

    auto s = "hello"w[];
    int i;

    foreach_reverse (k, char d; s)
    {
        assert(k == 4 - i);
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (k, char d; s)
    {
        assert(i < wantMixed.length);
        assert(k == wantIndex[i]);
        assert(d == wantMixed[i]);
        i++;
    }
    assert(i == 9);
}
|
|
|
|
/*****************************/
|
|
|
|
/**
 * Reverse iteration over a UTF-32 array yielding index and UTF-8 code units.
 *
 * Elements are visited from last to first.  An element below 0x80 is passed
 * to `dg` as a single char; any other element is encoded with toUTF8 and its
 * bytes are passed one call at a time, lead byte first.  Every call also
 * receives a pointer to the element's index.
 *
 * Params:
 *  aa = code points to iterate over
 *  dg = loop body, called with pointers to the index and a char
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRdc2(in dchar[] aa, dg2_t dg)
{
    debug(apply) printf("_aApplyRdc2(), len = %d\n", aa.length);

    int status;
    size_t pos = aa.length;
    while (pos != 0)
    {
        pos--;
        dchar cp = aa[pos];

        if ((cp & ~0x7F) == 0)
        {
            // Plain ASCII: one code unit.
            char unit = cast(char)cp;
            status = dg(&pos, cast(void *)&unit);
            if (status != 0)
                return status;
        }
        else
        {
            char[4] storage;
            auto encoded = toUTF8(storage, cp);
            foreach (char unit; encoded)
            {
                status = dg(&pos, cast(void *)&unit);
                if (status != 0)
                    return status;
            }
        }
    }
    return status;
}
|
|
|
|
// foreach_reverse (k, char; dchar[]): all bytes of a character share one index.
unittest
{
    debug(apply) printf("_aApplyRdc2.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable char[]   wantAscii = "olleh";
    static immutable char[]   wantMixed =
        ['b', 0xF2, 0xA0, 0x91, 0x96, 0xE1, 0x88, 0xB4, 'a'];
    static immutable size_t[] wantIndex = [3, 2, 2, 2, 2, 1, 1, 1, 0];

    auto s = "hello"d[];
    int i;

    foreach_reverse (k, char d; s)
    {
        assert(k == 4 - i);
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (k, char d; s)
    {
        assert(i < wantMixed.length);
        assert(k == wantIndex[i]);
        assert(d == wantMixed[i]);
        i++;
    }
    assert(i == 9);
}
|
|
|
|
/*****************************/
|
|
|
|
/**
 * Reverse iteration over a UTF-32 array yielding index and UTF-16 code units.
 *
 * Elements are visited from last to first.  An element up to 0xFFFF is
 * passed to `dg` as one wchar; a larger one is split into a surrogate pair
 * and passed as two calls, high surrogate first.  Every call also receives
 * a pointer to the element's index.
 *
 * Params:
 *  aa = code points to iterate over
 *  dg = loop body, called with pointers to the index and a wchar
 *
 * Returns: 0 after a complete walk, otherwise the first non-zero value
 *          returned by `dg`, which ends the walk early.
 */
extern (C) int _aApplyRdw2(in dchar[] aa, dg2_t dg)
{
    debug(apply) printf("_aApplyRdw2(), len = %d\n", aa.length);

    int status;
    size_t pos = aa.length;
    while (pos != 0)
    {
        pos--;
        dchar cp = aa[pos];
        wchar unit;

        if (cp > 0xFFFF)
        {
            immutable uint offset = cp - 0x10000;

            // High surrogate goes out first ...
            unit = cast(wchar) (((offset >> 10) & 0x3FF) + 0xD800);
            status = dg(&pos, cast(void *)&unit);
            if (status != 0)
                return status;
            // ... the low one through the shared call below.
            unit = cast(wchar) ((offset & 0x3FF) + 0xDC00);
        }
        else
        {
            unit = cast(wchar) cp;
        }

        status = dg(&pos, cast(void *)&unit);
        if (status != 0)
            return status;
    }
    return status;
}
|
|
|
|
// foreach_reverse (k, wchar; dchar[]): both surrogates report the same index.
unittest
{
    debug(apply) printf("_aApplyRdw2.unittest\n");

    // Expected values, in the order the reverse walk produces them.
    static immutable wchar[]  wantAscii = "olleh"w;
    static immutable wchar[]  wantMixed = ['b', 0xDA41, 0xDC56, 0x1234, 'a'];
    static immutable size_t[] wantIndex = [3, 2, 2, 1, 0];

    auto s = "hello"d[];
    int i;

    foreach_reverse (k, wchar d; s)
    {
        assert(k == 4 - i);
        assert(i < wantAscii.length);
        assert(d == wantAscii[i]);
        i++;
    }
    assert(i == 5);

    s = "a\u1234\U000A0456b";
    i = 0;
    foreach_reverse (k, wchar d; s)
    {
        assert(i < wantMixed.length);
        assert(k == wantIndex[i]);
        assert(d == wantMixed[i]);
        i++;
    }
    assert(i == 5);
}
|