cb41b9e70e
This imports readline 8.0. readline/ChangeLog.gdb 2019-08-12 Tom Tromey <tom@tromey.com> * Imported readline 8.0.
291 lines
6.8 KiB
C
291 lines
6.8 KiB
C
/* nls.c -- skeletal internationalization code. */
|
|
|
|
/* Copyright (C) 1996-2017 Free Software Foundation, Inc.
|
|
|
|
This file is part of the GNU Readline Library (Readline), a library
|
|
for reading lines of text with interactive input and history editing.
|
|
|
|
Readline is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
Readline is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with Readline. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#define READLINE_LIBRARY
|
|
|
|
#if defined (HAVE_CONFIG_H)
|
|
# include <config.h>
|
|
#endif
|
|
|
|
#include <sys/types.h>
|
|
|
|
#include <stdio.h>
|
|
|
|
#if defined (HAVE_UNISTD_H)
|
|
# include <unistd.h>
|
|
#endif /* HAVE_UNISTD_H */
|
|
|
|
#if defined (HAVE_STDLIB_H)
|
|
# include <stdlib.h>
|
|
#else
|
|
# include "ansi_stdlib.h"
|
|
#endif /* HAVE_STDLIB_H */
|
|
|
|
#if defined (HAVE_LOCALE_H)
|
|
# include <locale.h>
|
|
#endif
|
|
|
|
#if defined (HAVE_LANGINFO_CODESET)
|
|
# include <langinfo.h>
|
|
#endif
|
|
|
|
#include <ctype.h>
|
|
|
|
#include "rldefs.h"
|
|
#include "readline.h"
|
|
#include "rlshell.h"
|
|
#include "rlprivate.h"
|
|
|
|
static int utf8locale PARAMS((char *));
|
|
|
|
#if !defined (HAVE_SETLOCALE)
|
|
/* A list of legal values for the LANG or LC_CTYPE environment variables.
|
|
If a locale name in this list is the value for the LC_ALL, LC_CTYPE,
|
|
or LANG environment variable (using the first of those with a value),
|
|
readline eight-bit mode is enabled. */
|
|
static char *legal_lang_values[] =
|
|
{
|
|
"iso88591",
|
|
"iso88592",
|
|
"iso88593",
|
|
"iso88594",
|
|
"iso88595",
|
|
"iso88596",
|
|
"iso88597",
|
|
"iso88598",
|
|
"iso88599",
|
|
"iso885910",
|
|
"koi8r",
|
|
"utf8",
|
|
0
|
|
};
|
|
|
|
static char *normalize_codeset PARAMS((char *));
|
|
#endif /* !HAVE_SETLOCALE */
|
|
|
|
static char *find_codeset PARAMS((char *, size_t *));
|
|
|
|
static char *_rl_get_locale_var PARAMS((const char *));
|
|
|
|
static char *
|
|
_rl_get_locale_var (const char *v)
|
|
{
|
|
char *lspec;
|
|
|
|
lspec = sh_get_env_value ("LC_ALL");
|
|
if (lspec == 0 || *lspec == 0)
|
|
lspec = sh_get_env_value (v);
|
|
if (lspec == 0 || *lspec == 0)
|
|
lspec = sh_get_env_value ("LANG");
|
|
|
|
return lspec;
|
|
}
|
|
|
|
static int
|
|
utf8locale (char *lspec)
|
|
{
|
|
char *cp;
|
|
size_t len;
|
|
|
|
#if HAVE_LANGINFO_CODESET
|
|
cp = nl_langinfo (CODESET);
|
|
return (STREQ (cp, "UTF-8") || STREQ (cp, "utf8"));
|
|
#else
|
|
cp = find_codeset (lspec, &len);
|
|
|
|
if (cp == 0 || len < 4 || len > 5)
|
|
return 0;
|
|
return ((len == 5) ? strncmp (cp, "UTF-8", len) == 0 : strncmp (cp, "utf8", 4) == 0);
|
|
#endif
|
|
}
|
|
|
|
/* Query the right environment variables and call setlocale() to initialize
|
|
the C library locale settings. */
|
|
char *
|
|
_rl_init_locale (void)
|
|
{
|
|
char *ret, *lspec;
|
|
|
|
/* Set the LC_CTYPE locale category from environment variables. */
|
|
lspec = _rl_get_locale_var ("LC_CTYPE");
|
|
/* Since _rl_get_locale_var queries the right environment variables,
|
|
we query the current locale settings with setlocale(), and, if
|
|
that doesn't return anything, we set lspec to the empty string to
|
|
force the subsequent call to setlocale() to define the `native'
|
|
environment. */
|
|
if (lspec == 0 || *lspec == 0)
|
|
lspec = setlocale (LC_CTYPE, (char *)NULL);
|
|
if (lspec == 0)
|
|
lspec = "";
|
|
ret = setlocale (LC_CTYPE, lspec); /* ok, since it does not change locale */
|
|
|
|
_rl_utf8locale = (ret && *ret) ? utf8locale (ret) : 0;
|
|
|
|
return ret;
|
|
}
|
|
|
|
/* Check for LC_ALL, LC_CTYPE, and LANG and use the first with a value
|
|
to decide the defaults for 8-bit character input and output. Returns
|
|
1 if we set eight-bit mode. */
|
|
int
|
|
_rl_init_eightbit (void)
|
|
{
|
|
/* If we have setlocale(3), just check the current LC_CTYPE category
|
|
value, and go into eight-bit mode if it's not C or POSIX. */
|
|
#if defined (HAVE_SETLOCALE)
|
|
char *lspec, *t;
|
|
|
|
t = _rl_init_locale (); /* returns static pointer */
|
|
|
|
if (t && *t && (t[0] != 'C' || t[1]) && (STREQ (t, "POSIX") == 0))
|
|
{
|
|
_rl_meta_flag = 1;
|
|
_rl_convert_meta_chars_to_ascii = 0;
|
|
_rl_output_meta_chars = 1;
|
|
return (1);
|
|
}
|
|
else
|
|
return (0);
|
|
|
|
#else /* !HAVE_SETLOCALE */
|
|
char *lspec, *t;
|
|
int i;
|
|
|
|
/* We don't have setlocale. Finesse it. Check the environment for the
|
|
appropriate variables and set eight-bit mode if they have the right
|
|
values. */
|
|
lspec = _rl_get_locale_var ("LC_CTYPE");
|
|
|
|
if (lspec == 0 || (t = normalize_codeset (lspec)) == 0)
|
|
return (0);
|
|
for (i = 0; t && legal_lang_values[i]; i++)
|
|
if (STREQ (t, legal_lang_values[i]))
|
|
{
|
|
_rl_meta_flag = 1;
|
|
_rl_convert_meta_chars_to_ascii = 0;
|
|
_rl_output_meta_chars = 1;
|
|
break;
|
|
}
|
|
|
|
_rl_utf8locale = *t ? STREQ (t, "utf8") : 0;
|
|
|
|
xfree (t);
|
|
return (legal_lang_values[i] ? 1 : 0);
|
|
#endif /* !HAVE_SETLOCALE */
|
|
}
|
|
|
|
#if !defined (HAVE_SETLOCALE)
|
|
static char *
|
|
normalize_codeset (char *codeset)
|
|
{
|
|
size_t namelen, i;
|
|
int len, all_digits;
|
|
char *wp, *retval;
|
|
|
|
codeset = find_codeset (codeset, &namelen);
|
|
|
|
if (codeset == 0)
|
|
return (codeset);
|
|
|
|
all_digits = 1;
|
|
for (len = 0, i = 0; i < namelen; i++)
|
|
{
|
|
if (ISALNUM ((unsigned char)codeset[i]))
|
|
{
|
|
len++;
|
|
all_digits &= _rl_digit_p (codeset[i]);
|
|
}
|
|
}
|
|
|
|
retval = (char *)malloc ((all_digits ? 3 : 0) + len + 1);
|
|
if (retval == 0)
|
|
return ((char *)0);
|
|
|
|
wp = retval;
|
|
/* Add `iso' to beginning of an all-digit codeset */
|
|
if (all_digits)
|
|
{
|
|
*wp++ = 'i';
|
|
*wp++ = 's';
|
|
*wp++ = 'o';
|
|
}
|
|
|
|
for (i = 0; i < namelen; i++)
|
|
if (ISALPHA ((unsigned char)codeset[i]))
|
|
*wp++ = _rl_to_lower (codeset[i]);
|
|
else if (_rl_digit_p (codeset[i]))
|
|
*wp++ = codeset[i];
|
|
*wp = '\0';
|
|
|
|
return retval;
|
|
}
|
|
#endif /* !HAVE_SETLOCALE */
|
|
|
|
/* Isolate codeset portion of locale specification. */
|
|
static char *
|
|
find_codeset (char *name, size_t *lenp)
|
|
{
|
|
char *cp, *language, *result;
|
|
|
|
cp = language = name;
|
|
result = (char *)0;
|
|
|
|
while (*cp && *cp != '_' && *cp != '@' && *cp != '+' && *cp != ',')
|
|
cp++;
|
|
|
|
/* This does not make sense: language has to be specified. As
|
|
an exception we allow the variable to contain only the codeset
|
|
name. Perhaps there are funny codeset names. */
|
|
if (language == cp)
|
|
{
|
|
*lenp = strlen (language);
|
|
result = language;
|
|
}
|
|
else
|
|
{
|
|
/* Next is the territory. */
|
|
if (*cp == '_')
|
|
do
|
|
++cp;
|
|
while (*cp && *cp != '.' && *cp != '@' && *cp != '+' && *cp != ',' && *cp != '_');
|
|
|
|
/* Now, finally, is the codeset. */
|
|
result = cp;
|
|
if (*cp == '.')
|
|
do
|
|
++cp;
|
|
while (*cp && *cp != '@');
|
|
|
|
if (cp - result > 2)
|
|
{
|
|
result++;
|
|
*lenp = cp - result;
|
|
}
|
|
else
|
|
{
|
|
*lenp = strlen (language);
|
|
result = language;
|
|
}
|
|
}
|
|
|
|
return result;
|
|
}
|