/*
 * Copyright 2002, 2004 by Paul Mattes.
 *  Permission to use, copy, modify, and distribute this software and its
 *  documentation for any purpose and without fee is hereby granted,
 *  provided that the above copyright notice appear in all copies and that
 *  both that copyright notice and this permission notice appear in
 *  supporting documentation.
 *
 * x3270 is distributed in the hope that it will be useful, but WITHOUT ANY
 * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
 * FOR A PARTICULAR PURPOSE.  See the file LICENSE for more details.
 */

/*
 *	wide.c
 *		A 3270 Terminal Emulator for X11
 *		Wide character translation functions.
 */

#include "globals.h"
#include <errno.h>
#include <locale.h>
#include <langinfo.h>

#include "3270ds.h"
#if !defined(PR3287) /*[*/
#include "appres.h"
#endif /*]*/

#include "popupsc.h"
#include "tablesc.h"
#include "trace_dsc.h"
#if !defined(PR3287) /*[*/
#include "utilc.h"
#endif /*]*/

#include "widec.h"

#define ICU_DATA	"ICU_DATA"

char *local_encoding = CN;

static UConverter *dbcs_converter = NULL;
static char *dbcs_converter_name = CN;
static UConverter *sbcs_converter = NULL;
static char *sbcs_converter_name = CN;
static UConverter *local_converter = NULL;
#if defined(X3270_DISPLAY) /*[*/
static UConverter *wdisplay_converter = NULL;
#endif /*]*/
static Boolean same_converter = False;

/* Initialize, or reinitialize the EBCDIC DBCS converters. */
int
wide_init(char *converter_names, char *local_name)
{
	UErrorCode err = U_ZERO_ERROR;
	char *cur_path = CN;
	Boolean lib_ok = False;
	Boolean dot_ok = False;
	char *cn_copy, *buf, *token;
	char *sbcs_converters = NULL;
	char *dbcs_converters = NULL;
	int n_converter_sets = 0;
	int n_sbcs_converters = 0;
	int n_dbcs_converters = 0;

	/* This may be a reinit. */
	if (local_converter != NULL) {
		ucnv_close(local_converter);
		local_converter = NULL;
	}
	Replace(local_encoding, CN);
	if (sbcs_converter != NULL) {
		ucnv_close(sbcs_converter);
		sbcs_converter = NULL;
	}
	Replace(sbcs_converter_name, CN);
	if (dbcs_converter != NULL) {
		ucnv_close(dbcs_converter);
		dbcs_converter = NULL;
	}
	Replace(dbcs_converter_name, CN);
#if defined(X3270_DISPLAY) /*[*/
	if (wdisplay_converter != NULL) {
		ucnv_close(wdisplay_converter);
		wdisplay_converter = NULL;
	}
#endif /*]*/
	same_converter = False;

	/* Make sure that $ICU_DATA has LIBX3270DIR and . in it. */
	cur_path = getenv(ICU_DATA);
	if (cur_path != CN) {
		char *t = NewString(cur_path);
		char *token;
		char *buf = t;

		while (!(lib_ok && dot_ok) &&
		       (token = strtok(buf, ":")) != CN) {
			buf = CN;
			if (!strcmp(token, LIBX3270DIR)) {
				lib_ok = True;
			} else if (!strcmp(token, ".")) {
				dot_ok = True;
			}
		}
		Free(t);
	}
	if (!lib_ok || !dot_ok) {
		char *s, *new_path;

		s = new_path = Malloc(strlen(ICU_DATA) +
		    (cur_path? strlen(cur_path): 0) + 
		    strlen(LIBX3270DIR) + 5 /* ICU_DATA=*:*:.\n */);

		s += sprintf(s, "%s=", ICU_DATA);
		if (cur_path != CN)
			s += sprintf(s, "%s", cur_path);
		if (!lib_ok) {
			if (s[-1] != '=' && s[-1] != ':')
				*s++ = ':';
			s += sprintf(s, "%s", LIBX3270DIR);
		}
		if (!dot_ok) {
			if (s[-1] != '=' && s[-1] != ':')
				*s++ = ':';
			*s++ = '.';
		}
		*s = '\0';
		if (putenv(new_path) < 0) {
			popup_an_errno(errno, "putenv for " ICU_DATA " failed");
			return -1;
		}
	}

	/* Decode local converter name. */
	if (local_name == CN) {
		(void) setlocale(LC_CTYPE, "");
		local_name = nl_langinfo(CODESET);
	}
	if (local_name != CN) {
		err = U_ZERO_ERROR;
		local_converter = ucnv_open(local_name, &err);
		if (local_converter == NULL) {
			popup_an_error("Cannot find ICU converter for "
			    "local encoding:\n%s",
			    local_name);
		}
		Replace(local_encoding, NewString(local_name));
	}

	/* Decode host and display converter names. */
	if (converter_names == CN)
		return 0;

	/*
	 * Split into SBCS and DBCS converters, separated by '+'.  If only one
	 * converter is specified, it's the DBCS converter.
	 */
	n_converter_sets = 0;
	buf = cn_copy = NewString(converter_names);
	while ((token = strtok(buf, "+")) != CN) {
		buf = CN;
		switch (n_converter_sets) {
		case 0: /* DBCS or SBCS */
		    dbcs_converters = token;
		    break;
		case 1: /* DBCS */
		    sbcs_converters = dbcs_converters;
		    dbcs_converters = token;
		    break;
		default: /* extra */
		    popup_an_error("Extra converter set '%s' ignored", token);
		    break;
		}
		n_converter_sets++;
	}

	if (sbcs_converters != NULL) {
		n_sbcs_converters = 0;
		buf = sbcs_converters;
		while ((token = strtok(buf, ",")) != CN) {
			buf = CN;
			switch (n_sbcs_converters) {
			case 0: /* EBCDIC */
			    err = U_ZERO_ERROR;
			    sbcs_converter = ucnv_open(token, &err);
			    if (sbcs_converter == NULL) {
				    popup_an_error("Cannot find ICU converter "
					"for host SBCS:\n%s", token);
				    Free(cn_copy);
				    return -1;
			    }
			    Replace(sbcs_converter_name, NewString(token));
			    break;
			default: /* extra */
			    popup_an_error("Extra converter name '%s' ignored",
				token);
			    break;
			}
			n_sbcs_converters++;
		}
	}

	if (dbcs_converters != NULL) {
		n_dbcs_converters = 0;
		buf = dbcs_converters;
		while ((token = strtok(buf, ",")) != CN) {
			buf = CN;
			switch (n_dbcs_converters) {
			case 0: /* EBCDIC */
			    err = U_ZERO_ERROR;
			    dbcs_converter = ucnv_open(token, &err);
			    if (dbcs_converter == NULL) {
				    popup_an_error("Cannot find ICU converter "
					"for host DBCS:\n%s", token);
				    Free(cn_copy);
				    return -1;
			    }
			    Replace(dbcs_converter_name, NewString(token));
			    break;
			case 1: /* display */
#if defined(X3270_DISPLAY) /*[*/
			    err = U_ZERO_ERROR;
			    wdisplay_converter = ucnv_open(token, &err);
			    if (wdisplay_converter == NULL) {
				    popup_an_error("Cannot find ICU converter "
					"for display DBCS:\n%s", token);
				    Free(cn_copy);
				    return -1;
			    }
#endif /*]*/
			    break;
			default: /* extra */
			    popup_an_error("Extra converter name '%s' ignored",
				token);
			    break;
			}
			n_dbcs_converters++;
		}
	}

	Free(cn_copy);

	if (n_dbcs_converters < 2) {
		popup_an_error("Missing DBCS converter value");
		return -1;
	}
	if (dbcs_converter_name != CN &&
	    sbcs_converter_name != CN &&
	    !strcmp(dbcs_converter_name, sbcs_converter_name)) {
		same_converter = True;
	}

	return 0;
}

static void
xlate1(unsigned char from0, unsigned char from1, unsigned char to_buf[],
    UConverter *from_cnv, const char *from_name,
    UConverter *to_cnv, const char *to_name)
{
	UErrorCode err = U_ZERO_ERROR;
	UChar Ubuf[2];
	char from_buf[4];
	int from_len;
	char tmp_to_buf[3];
	int32_t len;
#if defined(WIDE_DEBUG) /*[*/
	int i;
#endif /*]*/

	/* Do something reasonable in case of failure. */
	to_buf[0] = to_buf[1] = 0;

	/* Convert string from source to Unicode. */
	if (same_converter) {
		from_buf[0] = EBC_so;
		from_buf[1] = from0;
		from_buf[2] = from1;
		from_buf[3] = EBC_si;
		from_len = 4;
	} else {
		from_buf[0] = from0;
		from_buf[1] = from1;
		from_len = 2;
	}
	len = ucnv_toUChars(from_cnv, Ubuf, 2, from_buf, from_len, &err);
	if (err != U_ZERO_ERROR) {
		trace_ds("[%s toUnicode of DBCS X'%02x%02x' failed, ICU "
		    "error %d]\n", from_name, from0, from1, (int)err);
		return;
	}
	if (Ubuf[0] == 0xfffd) {
		/* No translation. */
		trace_ds("[%s toUnicode of DBCS X'%02x%02x' failed]\n",
		    from_name, from0, from1);
		return;
	}
#if defined(WIDE_DEBUG) /*[*/
	printf("Got Unicode %x\n", Ubuf[0]);
#endif /*]*/

	if (to_cnv != NULL) {
		/* Convert string from Unicode to Destination. */
		len = ucnv_fromUChars(to_cnv, tmp_to_buf, 3, Ubuf, len, &err);
		if (err != U_ZERO_ERROR) {
			trace_ds("[fromUnicode of U+%04x to %s failed, ICU "
			    "error %d]\n", Ubuf[0], to_name, (int)err);
			return;
		}
		to_buf[0] = tmp_to_buf[0];
		to_buf[1] = tmp_to_buf[1];
#if defined(WIDE_DEBUG) /*[*/
		printf("Got %u %s characters:", len, to_name);
		for (i = 0; i < len; i++) {
			printf(" %02x", to_buf[i]);
		}
		printf("\n");
#endif /*]*/
	} else {
		to_buf[0] = (Ubuf[0] >> 8) & 0xff;
		to_buf[1] = Ubuf[0] & 0xff;
	}
}

#if defined(X3270_DISPLAY) /*[*/
/* Translate a DBCS EBCDIC character to a display character. */
void
dbcs_to_display(unsigned char ebc1, unsigned char ebc2, unsigned char c[])
{
	xlate1(ebc1, ebc2, c, dbcs_converter, "host DBCS", wdisplay_converter,
	    "wide display");
}
#endif /*]*/

/* Translate a DBCS EBCDIC character to a 2-byte Unicode character. */
void
dbcs_to_unicode16(unsigned char ebc1, unsigned char ebc2, unsigned char c[])
{
	xlate1(ebc1, ebc2, c, dbcs_converter, "host DBCS", NULL, NULL);
}

/*
 * Translate a DBCS EBCDIC character to a local multi-byte character.
 * Returns -1 for error, or the mb length.  NULL terminates.
 */
int
dbcs_to_mb(unsigned char ebc1, unsigned char ebc2, char *mb)
{
	UErrorCode err = U_ZERO_ERROR;
	unsigned char w[2];
	UChar Ubuf;
	int len;

	if (local_converter == NULL) {
		*mb = '?';
		*(mb + 1) = '\0';
		return 1;
	}

	/* Translate to Unicode first. */
	dbcs_to_unicode16(ebc1, ebc2, w);
	Ubuf = (w[0] << 8) | w[1];

	/* Then translate to the local encoding. */
	len = ucnv_fromUChars(local_converter, mb, 16, &Ubuf, 1, &err);
	if (err != U_ZERO_ERROR) {
		trace_ds("[fromUnicode of U+%04x to local failed, ICU "
		    "error %d]\n", Ubuf, (int)err);
		return -1;
	}
	return len;
}

/*
 * Translate an SBCS EBCDIC character to a local multi-byte character.
 * Returns -1 for error, or the mb length.  NULL terminates.
 */
int
sbcs_to_mb(unsigned char ebc, char *mb)
{
	UErrorCode err = U_ZERO_ERROR;
	UChar Ubuf;
	int len;

	if (sbcs_converter == NULL) {
		/* No SBCS converter, do EBCDIC to latin-1. */
		if (local_converter == NULL) {
			/* No local converter either, latin-1 is it. */
			*mb = ebc2asc[ebc];
			*(mb + 1) = '\0';
			return 1;
		}

		/* Have a local converter; use it below. */
		Ubuf = ebc2asc[ebc];
	} else {
		/* Have an SBCS converter.  Convert from SBCS to Unicode. */
		err = U_ZERO_ERROR;
		len = ucnv_toUChars(sbcs_converter, &Ubuf, 1, (char *)&ebc, 1,
				&err);
		if (err != U_ZERO_ERROR &&
				err != U_STRING_NOT_TERMINATED_WARNING) {
			trace_ds("[toUChars failed, ICU error %d]\n",
			    (int)err);
			return -1;
		}
	}

	/* Convert from Unicode to the local encoding. */
	len = ucnv_fromUChars(local_converter, mb, 16, &Ubuf, 1, &err);
	if (err != U_ZERO_ERROR) {
		trace_ds("[fromUnicode of U+%04x to local failed, ICU "
		    "error %d]\n", Ubuf, (int)err);
		return -1;
	}
	return len;
}

/*
 * Translate a local multi-byte string to Unicode characters.
 * Returns -1 for error, or the length.  NULL terminates.
 */
int
mb_to_unicode(char *mb, int mblen, UChar *u, int ulen, UErrorCode *err)
{
	UErrorCode local_err;
	int len;
	Boolean print_errs = False;

	if (local_converter == NULL) {
		int i;

		for (i = 0; i < mblen; i++) {
			u[i] = mb[i] & 0xff;
		}
		return mblen;
	}
	if (err == NULL) {
		err = &local_err;
		print_errs = True;
	}
	*err = U_ZERO_ERROR;
	len = ucnv_toUChars(local_converter, u, ulen, mb, mblen, err);
	if (*err != U_ZERO_ERROR && *err != U_STRING_NOT_TERMINATED_WARNING) {
		if (print_errs)
			trace_ds("[toUChars failed, ICU error %d]\n",
			    (int)*err);
		return -1;
	}
	return len;
}

/*
 * Try to map a Unicode character to the Host SBCS character set.
 * Returns ASCII in cp[0].
 */
int
dbcs_map8(UChar u, unsigned char *cp)
{
	UErrorCode err = U_ZERO_ERROR;
	int len;

	if (!(u & ~0xff)) {
		*cp = u;
		return 1;
	}
	if (sbcs_converter != NULL) {
		len = ucnv_fromUChars(sbcs_converter, (char *)cp, 1, &u, 1,
		    &err);
		if ((err != U_ZERO_ERROR &&
		     err != U_STRING_NOT_TERMINATED_WARNING) ||
		    (*cp == '?' && u != '?')) {
			*cp = ebc2asc[*cp];
			return 0;
		} else
			return 1;
	}
	return 0;
}

/*
 * Try to map a Unicode character to the Host DBCS character set.
 * Returns EBCDIC in cp[].
 */
int
dbcs_map16(UChar u, unsigned char *cp)
{
	UErrorCode err = U_ZERO_ERROR;
	int len;

	if (same_converter) {
		char tmp_cp[5];

		len = ucnv_fromUChars(dbcs_converter, tmp_cp, 5, &u, 1, &err);
		if (err != U_ZERO_ERROR ||
		    len < 3 ||
		    tmp_cp[0] != EBC_so)
			return 0;
		cp[0] = tmp_cp[1];
		cp[1] = tmp_cp[2];
		return 1;
	} else {
		len = ucnv_fromUChars(dbcs_converter, (char *)cp, 2, &u, 1,
				&err);
		return (err == U_ZERO_ERROR ||
			err == U_STRING_NOT_TERMINATED_WARNING);
	}
}


syntax highlighted by Code2HTML, v. 0.9.1