/*
* CDDL HEADER START
*
* The contents of this file are subject to the terms of the
* Common Development and Distribution License (the "License").
* You may not use this file except in compliance with the License.
*
* You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
* See the License for the specific language governing permissions
* and limitations under the License.
*
* When distributing Covered Code, include this CDDL HEADER in each
* file and include the License file at usr/src/OPENSOLARIS.LICENSE.
* If applicable, add the following below this CDDL HEADER, with the
* fields enclosed by brackets "[]" replaced with your own identifying
* information: Portions Copyright [yyyy] [name of copyright owner]
*
* CDDL HEADER END
*/
/*
*/
#include "lint.h"
#include <stdlib.h>
#include <stdio.h>
#include <dlfcn.h>
#include <fcntl.h>
#include <unistd.h>
#include <string.h>
#include <errno.h>
#include <alloca.h>
#include <langinfo.h>
#include "iconv.h"
#include "iconvP.h"
#include "../i18n/_loc_path.h"
static iconv_t iconv_open_real(const char *, const char *, int);
static iconv_p iconv_open_all(char *, char *, char *, int, int);
static iconv_p iconv_open_private(const char *, const char *, int, int);
static iconv_p iconv_search_alias(char **, char **, const char *,
const char *, char *, int, int);
size_t *);
static int passthru_icv_iconvctl(iconv_t, int, void *);
static void passthru_icv_close(iconv_t);
static char *process_conv_modifier_and_special_names(const char *, int *);
static void free_names(char *, const char *, char *, const char *);
/*
* These functions are mainly implemented by using a shared object and
* the dlopen() functions. The actual conversion algorithm for a particular
* conversion is implemented via a shared object as a loadable conversion
* module which is linked dynamically at run time.
*
* The loadable conversion module resides as either:
*
*	/usr/lib/iconv/geniconvtbl.so
*
* if the conversion is supported through a geniconvtbl code conversion
* binary table or as a module that directly specifies the conversion at:
*
*	/usr/lib/iconv/fromcode%tocode.so
*
* where fromcode is the source encoding and tocode is the target encoding.
* The modules have three must-have entries, _icv_open(), _icv_iconv(), and
* _icv_close(), and three optional entries, _icv_open_attr(), _icv_iconvctl(),
* and _icv_iconvstr().
*
* If there is no code conversion supported and if the fromcode and the tocode
* are specifying the same codeset, then, the byte-by-byte, pass-through code
* conversion that is embedded in the libc is used instead.
*
* The following are the related PSARC cases:
*
* PSARC/1993/153 iconv/iconv_open/iconv_close
* PSARC/1999/292 Addition of geniconvtbl(1)
* PSARC/2001/072 GNU gettext support
* PSARC/2009/561 Pass-through iconv code conversion
* PSARC/2010/160 Libc iconv enhancement
*
*/
{
}
static iconv_t
{
char *ipath;
char *from;
char *from_canonical;
char *to;
char *to_canonical;
int flag;
flag = 0;
return ((iconv_t)-1);
}
return ((iconv_t)-1);
}
return ((iconv_t)-1);
}
/*
*/
return ((iconv_t)-1);
}
/* found a valid module for this conversion */
return (cd);
}
/*
* Now, try using the encoding name aliasing table
*/
/*
* As the last resort, check if the tocode and the fromcode
* are referring to the same codeset name or not. If so,
* assign the embedded pass-through code conversion.
*/
/*
* No valid conversion is available. Return failure
* with the errno set by iconv_search_alias().
*/
return ((iconv_t)-1);
}
/*
* For a pass-through byte-by-byte code conversion, allocate
* an internal conversion descriptor and initialize the data
* fields appropriately and we are done.
*/
return ((iconv_t)-1);
}
return ((iconv_t)-1);
}
}
/* found a valid module for this conversion */
return (cd);
}
static size_t
{
char *p, *sp, *q;
p = addr;
while (q > p) {
if (*p == '#') {
/*
* Line beginning with '#' is a comment
*/
p++;
while ((q > p) && (*p++ != '\n'))
;
continue;
}
/* skip leading spaces */
while ((q > p) &&
((*p == ' ') || (*p == '\t')))
p++;
if (q <= p)
break;
sp = p;
while ((q > p) && (*p != ' ') &&
(*p != '\t') && (*p != '\n'))
p++;
if (q <= p) {
/* invalid entry */
break;
}
if (*p == '\n') {
/* invalid entry */
p++;
continue;
}
/*
* didn't match
*/
/* skip remaining chars in this line */
p++;
while ((q > p) && (*p++ != '\n'))
;
continue;
}
/* matching entry found */
/* skip spaces */
while ((q > p) &&
((*p == ' ') || (*p == '\t')))
p++;
if (q <= p)
break;
sp = p;
while ((q > p) && (*p != ' ') &&
(*p != '\t') && (*p != '\n'))
p++;
if (can_len == 0) {
while ((q > p) && (*p++ != '\n'))
;
continue;
}
return (can_len);
/* NOTREACHED */
}
return (0);
}
static iconv_p
{
int len;
/*
* First, try using the geniconvtbl conversion, which is
* performed by /usr/lib/iconv/geniconvtbl.so with
* the conversion table file:
* /usr/lib/iconv/geniconvtbl/binarytables/fromcode%tocode.bt
*
* If the geniconvtbl conversion cannot be done,
* try the conversion by the individual shared object.
*/
/*
* from%to.bt exists in the table dir
*/
flag, string_based);
/* found a valid module for this conversion */
return (cv);
}
}
/*
* errno will be set by iconv_open_private on error
*/
}
/* no valid module for this conversion found */
return ((iconv_p)-1);
}
static iconv_p
int flag, int string_based)
{
char *p;
int fd;
*to_canonical = (char *)tocode;
*from_canonical = (char *)fromcode;
if (fd == -1) {
/*
* if no alias file found,
* errno will be set to EINVAL.
*/
return ((iconv_p)-1);
}
/* use errno set by fstat64 */
return ((iconv_p)-1);
}
if (addr == MAP_FAILED) {
/* use errno set by mmap */
return ((iconv_p)-1);
}
p = (char *)addr;
if (tolen) {
if (*to_canonical == NULL) {
*to_canonical = (char *)tocode;
return ((iconv_p)-1);
}
}
p = (char *)addr;
if (fromlen) {
if (*from_canonical == NULL) {
*from_canonical = (char *)fromcode;
return ((iconv_p)-1);
}
}
return ((iconv_p)-1);
}
flag, string_based);
/* errno set by iconv_open_all on error */
return (cv);
}
static iconv_p
{
return ((iconv_p)-1);
}
goto ICONV_OPEN_ERR_TWO;
/*
* If this is called from iconvstr(), get the address of
* _icv_iconvstr and return since that's all we need.
*/
if (string_based) {
if ((cdpath->_icv_iconvstr =
goto ICONV_OPEN_ERR_ONE;
return (cdpath);
}
/*
* Get address of _icv_open or _icv_open_attr depending on whether
* we have at least a value defined in the flag.
*/
if (flag == 0) {
goto ICONV_OPEN_ERR_ONE;
goto ICONV_OPEN_ERR_ONE;
}
/*
* gets address of _icv_iconv in the loadable conversion module
* and stores it in cdpath->_icv_iconv
*/
"_icv_iconv")) == NULL)
goto ICONV_OPEN_ERR_ONE;
/*
* gets address of _icv_close in the loadable conversion module
* and stores it in cdpath->_icv_close
*/
"_icv_close")) == NULL)
goto ICONV_OPEN_ERR_ONE;
/*
* Get the address of _icv_iconvctl() from the module.
* Getting NULL back from dlsym() is normal here; it simply means
* that the module does not support iconvctl().
*/
/*
* Initialize the state of the _icv_iconv conversion routine by
* calling _icv_open() or _icv_open_attr().
*
* For all regular iconv modules, NULL will be passed for the tbl
* argument although the iconv_open() of the module won't use that.
*/
if (flag == 0) {
} else {
}
return (cdpath);
return ((iconv_p)-1);
}
int
{
return (-1);
}
return (0);
}
static void
{
}
{
/* check if cd is valid */
return ((size_t)-1);
}
/* direct conversion */
}
static size_t
/*LINTED E_FUNC_ARG_UNUSED*/
{
/* For any state reset request, return success. */
return (0);
/*
* Initialize internally used variables for a better performance
* and prepare for a couple of the return values before the actual
* copying of the bytes.
*/
obl = *outbufleft;
} else {
ret_val = 0;
}
/*
* Do the copy using memmove(). No EILSEQ or EINVAL checks are
* needed since this is a simple copy.
*/
/* Update the return values related to the buffers then do return. */
return (ret_val);
}
int
{
int flag;
return (-1);
}
return (-1);
}
return (-1);
}
if (req == ICONV_SET_CONVERSION_BEHAVIOR) {
if ((flag & ICONV_CONV_ILLEGAL_DISCARD) != 0)
if ((flag & ICONV_CONV_NON_IDENTICAL_DISCARD) != 0)
if ((flag & ICONV_CONV_NON_IDENTICAL_REPLACE_HEX) != 0)
}
}
static int
{
int a;
long f;
a = *((int *)arg);
f = *((int *)cd);
switch (req) {
a = f;
break;
case ICONV_GET_DISCARD_ILSEQ:
if ((f & ICONV_CONV_ILLEGAL_DISCARD) != 0 &&
(f & ICONV_CONV_NON_IDENTICAL_DISCARD) != 0)
a = 1;
else
a = 0;
break;
case ICONV_GET_TRANSLITERATE:
if ((f & ICONV_CONV_NON_IDENTICAL_TRANSLITERATE) != 0)
a = 1;
else
a = 0;
break;
f = a;
break;
case ICONV_SET_DISCARD_ILSEQ:
if (a == 0)
f &= ~(ICONV_CONV_ILLEGAL_DISCARD |
else
f |= ICONV_CONV_ILLEGAL_DISCARD |
break;
case ICONV_SET_TRANSLITERATE:
if (a == 0)
else
break;
case ICONV_TRIVIALP:
a = 1;
break;
}
*((int *)cd) = f;
*((int *)arg) = a;
return (0);
}
{
size_t r;
return ((size_t)-1);
}
return (r);
}
static size_t
{
char *np;
if ((flag & ICONV_IGNORE_NULL) == 0 &&
else
} else {
ret_val = 0;
}
return (ret_val);
}
/*
* The following function maps "", "char", and "wchar_t" into some
* uniquely identifiable names as specified in the iconv-l10n-guide.txt at
* the materials directory of PSARC/2010/160.
*
* For any other names, if requested, it duplicates the name into
* a new memory block and returns.
*/
static char *
{
char *s;
s = nl_langinfo(CODESET);
return (NULL);
}
if (no_malloc)
return (name);
return (NULL);
s[len] = '\0';
return (s);
}
/*
* The min and max lengths of all indicators at this point are 6 of "IGNORE"
* and 27 of "NON_IDENTICAL_TRANSLITERATE", respectively.
*/
/*
* The following function clears any prior flag values that
* conflict with the new value requested in "s" and then sets the new
* one in the flag.
*/
static int
{
return (flag);
if (SAME_STR(s, "ILLEGAL_REPLACE_HEX"))
else if (SAME_STR(s, "ILLEGAL_RESTORE_HEX"))
if (SAME_STR(s, "NON_IDENTICAL_REPLACE_HEX"))
else if (SAME_STR(s, "NON_IDENTICAL_RESTORE_HEX"))
if (SAME_STR(s, "REPLACE_HEX"))
else if (SAME_STR(s, "RESTORE_HEX"))
}
return (flag);
}
/*
* The following function separates the
* code conversion behavior modification indicators, if any, and the actual
* codeset name from the name and sets the flag. It also processes special
* names by calling process_special_names().
*/
static char *
{
char *start;
char *prev_start;
char *end;
break;
start++;
}
continue;
}
}
}
static void
{
}