You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
269 lines
6.5 KiB
269 lines
6.5 KiB
/**
***     Transcoding support and wrappers.
***
***     See Copyright for the status of this software.
***
***     Author: Patrick Monnerat <pm@datasphere.ch>, DATASPHERE S.A.
**/
|
|
|
|
#define IN_LIBXML
|
|
#include "libxml.h"
|
|
|
|
#include <sys/types.h>
|
|
#include <iconv.h>
|
|
#include "libxml/xmlmemory.h"
|
|
#include "libxml/dict.h"
|
|
#include "transcode.h"
|
|
|
|
|
|
/**
|
|
*** Destroy a dictionary and mark as destroyed.
|
|
**/
|
|
|
|
void
|
|
xmlZapDict(xmlDictPtr * dict)
|
|
|
|
{
|
|
if (dict && *dict) {
|
|
xmlDictFree(*dict);
|
|
*dict = (xmlDictPtr) NULL;
|
|
}
|
|
}
|
|
|
|
|
|
/**
|
|
*** Support for inline conversion from/to UTF-8.
|
|
*** This is targeted to function parameter encoding conversion.
|
|
*** Method is:
|
|
*** - Convert string from/to UTF-8.
|
|
*** - Keep it in a dictionary.
|
|
*** - Free original string if a release procedure is provided.
|
|
*** Can also be called without dictionary to convert a string from/to UTF-8
|
|
*** into xmlMalloc'ed dynamic storage.
|
|
**/
|
|
|
|
const char *
|
|
xmlTranscodeResult(const xmlChar * s, const char * encoding,
|
|
xmlDictPtr * dict, void (*freeproc)(const void *))
|
|
|
|
{
|
|
size_t l;
|
|
iconv_t cd;
|
|
char * srcp;
|
|
char * dstp;
|
|
size_t srcc;
|
|
size_t dstc;
|
|
char * ts;
|
|
const char * ret;
|
|
int err;
|
|
static const int nullstring[] = { 0 };
|
|
|
|
/* Convert from UTF-8. */
|
|
|
|
if (!s)
|
|
return (const char *) NULL;
|
|
|
|
ret = (const char *) NULL;
|
|
ts = (char *) NULL;
|
|
err = 0;
|
|
l = xmlStrlen(s);
|
|
|
|
if (!l && dict)
|
|
ret = (const char *) nullstring;
|
|
else {
|
|
if (dict && !*dict)
|
|
err = !(*dict = xmlDictCreate());
|
|
|
|
if (!err)
|
|
err = !(ts = xmlMalloc(4 * l + 4));
|
|
|
|
dstp = ts;
|
|
dstc = 4 * l;
|
|
|
|
if (!err && l) {
|
|
if (!encoding)
|
|
encoding = "ibm-0"; /* Job's encoding. */
|
|
|
|
cd = iconv_open(encoding, "UTF-8");
|
|
|
|
if (cd == (iconv_t) -1)
|
|
err = 1;
|
|
else {
|
|
srcp = (char *) s;
|
|
srcc = l;
|
|
srcc = iconv(cd, &srcp, &srcc, &dstp, &dstc);
|
|
iconv_close(cd);
|
|
err = srcc == (size_t) -1;
|
|
}
|
|
}
|
|
|
|
if (!err) {
|
|
dstp[0] = dstp[1] = dstp[2] = dstp[3] = '\0';
|
|
|
|
if (!dict) {
|
|
if (dstc)
|
|
ts = xmlRealloc(ts, (dstp - ts) + 4);
|
|
|
|
ret = (const char *) ts;
|
|
ts = (char *) NULL;
|
|
}
|
|
else
|
|
ret = (char *) xmlDictLookup(*dict,
|
|
(xmlChar *) ts, dstp - ts + 1);
|
|
}
|
|
}
|
|
|
|
if (ts)
|
|
xmlFree(ts);
|
|
|
|
if (freeproc)
|
|
(*freeproc)(s);
|
|
|
|
return ret;
|
|
}
|
|
|
|
|
|
/**
|
|
*** Support for inline conversion to UTF-8.
|
|
*** Method is:
|
|
*** - Convert string to UTF-8.
|
|
*** - Keep it in a dictionary.
|
|
*** Can also be called without dictionary to convert a string to UTF-8 into
|
|
*** xmlMalloc'ed dynamic storage.
|
|
**/
|
|
|
|
static const xmlChar *
|
|
inTranscode(const char * s, size_t l, const char * encoding, xmlDictPtr * dict)
|
|
|
|
{
|
|
iconv_t cd;
|
|
char * srcp;
|
|
char * dstp;
|
|
size_t srcc;
|
|
size_t dstc;
|
|
xmlChar * ts;
|
|
const xmlChar * ret;
|
|
static const xmlChar nullstring[] = { 0 };
|
|
|
|
if (!l && dict)
|
|
return nullstring;
|
|
|
|
if (dict && !*dict)
|
|
if (!(*dict = xmlDictCreate()))
|
|
return (const xmlChar *) NULL;
|
|
|
|
ts = (xmlChar *) xmlMalloc(6 * l + 1);
|
|
|
|
if (!ts)
|
|
return (const xmlChar *) NULL;
|
|
|
|
dstp = (char *) ts;
|
|
dstc = 6 * l;
|
|
|
|
if (l) {
|
|
if (!encoding)
|
|
encoding = "ibm-0"; /* Use job's encoding. */
|
|
|
|
cd = iconv_open("UTF-8", encoding);
|
|
|
|
if (cd == (iconv_t) -1) {
|
|
xmlFree((char *) ts);
|
|
return (const xmlChar *) NULL;
|
|
}
|
|
|
|
srcp = (char *) s;
|
|
srcc = l;
|
|
srcc = iconv(cd, &srcp, &srcc, &dstp, &dstc);
|
|
iconv_close(cd);
|
|
|
|
if (srcc == (size_t) -1) {
|
|
xmlFree((char *) ts);
|
|
return (const xmlChar *) NULL;
|
|
}
|
|
}
|
|
|
|
*dstp = '\0';
|
|
|
|
if (!dict) {
|
|
if (dstc)
|
|
ts = xmlRealloc(ts, (dstp - ts) + 1);
|
|
|
|
return ts;
|
|
}
|
|
|
|
ret = xmlDictLookup(*dict, ts, dstp - ts + 1);
|
|
xmlFree((char *) ts);
|
|
return ret;
|
|
}
|
|
|
|
|
|
/**
|
|
*** Input 8-bit character string parameter.
|
|
**/
|
|
|
|
const xmlChar *
|
|
xmlTranscodeString(const char * s, const char * encoding, xmlDictPtr * dict)
|
|
|
|
{
|
|
if (!s)
|
|
return (const xmlChar *) NULL;
|
|
|
|
return inTranscode(s, xmlStrlen(s), encoding, dict);
|
|
}
|
|
|
|
|
|
/**
|
|
*** Input 16-bit character string parameter.
|
|
**/
|
|
|
|
const xmlChar *
|
|
xmlTranscodeWString(const char * s, const char * encoding, xmlDictPtr * dict)
|
|
|
|
{
|
|
size_t i;
|
|
|
|
if (!s)
|
|
return (const xmlChar *) NULL;
|
|
|
|
for (i = 0; s[i] && s[i + 1]; i += 2)
|
|
;
|
|
|
|
return inTranscode(s, i, encoding, dict);
|
|
}
|
|
|
|
|
|
/**
|
|
*** Input 32-bit character string parameter.
|
|
**/
|
|
|
|
const xmlChar *
|
|
xmlTranscodeHString(const char * s, const char * encoding, xmlDictPtr * dict)
|
|
|
|
{
|
|
size_t i;
|
|
|
|
if (!s)
|
|
return (const xmlChar *) NULL;
|
|
|
|
for (i = 0; s[i] && s[i + 1] && s[i + 2] && s[i + 3]; i += 4)
|
|
;
|
|
|
|
return inTranscode(s, i, encoding, dict);
|
|
}
|
|
|
|
|
|
/**
|
|
*** vasprintf() implementation with result transcoding.
|
|
**/
|
|
|
|
const char *
|
|
xmlVasprintf(xmlDictPtr * dict, const char * encoding,
|
|
const xmlChar * fmt, va_list args)
|
|
|
|
{
|
|
char * s = NULL;
|
|
|
|
vasprintf(&s, fmt, args);
|
|
return xmlTranscodeResult((const xmlChar *) s, encoding, dict, free);
|
|
}
|