/* try to guess how many bytes the identifier really is! */ static size_t cdata_one_character(yaz_marc_t mt, const char *buf) { if (mt->iconv_cd) { size_t i; for (i = 1; i<5; i++) { char outbuf[12]; size_t outbytesleft = sizeof(outbuf); char *outp = outbuf; const char *inp = buf; size_t inbytesleft = i; size_t r = yaz_iconv(mt->iconv_cd, (char**) &inp, &inbytesleft, &outp, &outbytesleft); yaz_iconv(mt->iconv_cd, 0, 0, &outp, &outbytesleft); if (r != (size_t) (-1)) return i; /* got a complete sequence */ } return 1; /* giving up */ } else { int error = 0; size_t no_read = 0; (void) yaz_read_UTF8_char((const unsigned char *) buf, strlen(buf), &no_read, &error); if (error == 0 && no_read > 0) return no_read; } return 1; /* we don't know */ }
static int tst_convert_l(yaz_iconv_t cd, size_t in_len, const char *in_buf, size_t expect_len, const char *expect_buf) { size_t r; char *inbuf= (char*) in_buf; size_t inbytesleft = in_len > 0 ? in_len : strlen(in_buf); char outbuf0[64]; char *outbuf = outbuf0; while (inbytesleft) { size_t outbytesleft = outbuf0 + sizeof(outbuf0) - outbuf; if (outbytesleft > 12) outbytesleft = 12; r = yaz_iconv(cd, &inbuf, &inbytesleft, &outbuf, &outbytesleft); if (r == (size_t) (-1)) { int e = yaz_iconv_error(cd); if (e != YAZ_ICONV_E2BIG) return 0; } else { yaz_iconv(cd, 0, 0, &outbuf, &outbytesleft); break; } } return compare_buffers("tsticonv 22", 0, expect_len, expect_buf, outbuf - outbuf0, outbuf0); }
static void dconvert(int mandatory, const char *tmpcode) { int i; int ret; yaz_iconv_t cd; for (i = 0; iso_8859_1_a[i]; i++) { size_t r; char *inbuf = (char*) iso_8859_1_a[i]; size_t inbytesleft = strlen(inbuf); char outbuf0[24]; char outbuf1[10]; char *outbuf = outbuf0; size_t outbytesleft = sizeof(outbuf0); cd = yaz_iconv_open(tmpcode, "ISO-8859-1"); YAZ_CHECK(cd || !mandatory); if (!cd) return; r = yaz_iconv(cd, &inbuf, &inbytesleft, &outbuf, &outbytesleft); YAZ_CHECK(r != (size_t) (-1)); r = yaz_iconv(cd, 0, 0, &outbuf, &outbytesleft); YAZ_CHECK(r != (size_t) (-1)); yaz_iconv_close(cd); if (r == (size_t) (-1)) return; cd = yaz_iconv_open("ISO-8859-1", tmpcode); YAZ_CHECK(cd || !mandatory); if (!cd) return; inbuf = outbuf0; inbytesleft = sizeof(outbuf0) - outbytesleft; outbuf = outbuf1; outbytesleft = sizeof(outbuf1); r = yaz_iconv(cd, &inbuf, &inbytesleft, &outbuf, &outbytesleft); YAZ_CHECK(r != (size_t) (-1)); r = yaz_iconv(cd, 0, 0, &outbuf, &outbytesleft); if (r == (size_t)(-1)) { fprintf(stderr, "failed\n"); } YAZ_CHECK(r != (size_t) (-1)); if (r != (size_t)(-1)) { ret = compare_buffers("dconvert", i, strlen(iso_8859_1_a[i]), iso_8859_1_a[i], sizeof(outbuf1) - outbytesleft, outbuf1); YAZ_CHECK(ret); } yaz_iconv_close(cd); } }
int utf8_check(unsigned c) { if (sizeof(c) >= 4) { size_t r; char src[4]; char dst[4]; char utf8buf[6]; char *inbuf = src; size_t inbytesleft = 4; char *outbuf = utf8buf; size_t outbytesleft = sizeof(utf8buf); int i; yaz_iconv_t cd = yaz_iconv_open("UTF-8", "UCS4LE"); if (!cd) return 0; for (i = 0; i<4; i++) src[i] = c >> (i*8); r = yaz_iconv(cd, &inbuf, &inbytesleft, &outbuf, &outbytesleft); yaz_iconv_close(cd); if (r == (size_t)(-1)) return 0; cd = yaz_iconv_open("UCS4LE", "UTF-8"); if (!cd) return 0; inbytesleft = sizeof(utf8buf) - outbytesleft; inbuf = utf8buf; outbuf = dst; outbytesleft = 4; r = yaz_iconv(cd, &inbuf, &inbytesleft, &outbuf, &outbytesleft); if (r == (size_t)(-1)) return 0; yaz_iconv_close(cd); if (memcmp(src, dst, 4)) return 0; }
CString CIconv::ConvertIconv(CString str) { if (m_hIconv == NULL) { #ifdef _UNICODE int nLen = _tcslen(m_TargetCharset); char *szTarget = new char[nLen+1]; int i; for (i = 0; i <= nLen; i++) szTarget[i] = (char)m_TargetCharset[i]; nLen = _tcslen(m_SourceCharset); char *szSource = new char[nLen+1]; for (i = 0; i <= nLen; i++) szSource[i] = (char)m_SourceCharset[i]; m_hIconv = yaz_iconv_open(szTarget, szSource); delete [] szTarget; delete [] szSource; #else m_hIconv = yaz_iconv_open(m_TargetCharset, m_SourceCharset); #endif #ifdef _DEBUG if (m_hIconv == NULL) TRACE2("CIconv::Convert(): iconv_open filed, source: %s; target: %s\n", m_SourceCharset, m_TargetCharset); #endif } if (!str.IsEmpty()) { if (m_hIconv != NULL) { CString out; size_t inleft = str.GetLength(); size_t outleft = 4 * inleft + 2; LPTSTR inbuff = str.GetBuffer(inleft); LPTSTR outbuff = out.GetBuffer(outleft); memset(outbuff, 0, outleft); size_t ret; #ifdef _UNICODE // FIXME ret = 0; #else ret = yaz_iconv(m_hIconv, &inbuff, &inleft, &outbuff, &outleft); #endif if (ret == (size_t)(-1)) { TRACE0("CIconv::Convert(): iconv failed\n"); return str; } outbuff -= ret; out.ReleaseBuffer(); return out; } } return str; }
static int tst_convert_x(yaz_iconv_t cd, const char *buf, const char *cmpbuf, int expect_error) { int ret = 1; WRBUF b = wrbuf_alloc(); char outbuf[16]; size_t inbytesleft = strlen(buf); const char *inp = buf; int rounds = 0; for (rounds = 0; inbytesleft && rounds < (int) sizeof(outbuf); rounds++) { size_t outbytesleft = sizeof(outbuf); char *outp = outbuf; size_t r = yaz_iconv(cd, (char**) &inp, &inbytesleft, &outp, &outbytesleft); wrbuf_write(b, outbuf, outp - outbuf); if (r == (size_t) (-1)) { int e = yaz_iconv_error(cd); if (e != YAZ_ICONV_E2BIG) { if (expect_error != -1) if (e != expect_error) ret = 0; break; } } else { size_t outbytesleft = sizeof(outbuf); char *outp = outbuf; r = yaz_iconv(cd, 0, 0, &outp, &outbytesleft); wrbuf_write(b, outbuf, outp - outbuf); if (expect_error != -1) if (expect_error) ret = 0; break; } } if (wrbuf_len(b) == strlen(cmpbuf) && !memcmp(cmpbuf, wrbuf_buf(b), wrbuf_len(b))) ; else { WRBUF w = wrbuf_alloc(); ret = 0; wrbuf_rewind(w); wrbuf_puts_escaped(w, buf); yaz_log(YLOG_LOG, "input %s", wrbuf_cstr(w)); wrbuf_rewind(w); wrbuf_write_escaped(w, wrbuf_buf(b), wrbuf_len(b)); yaz_log(YLOG_LOG, "got %s", wrbuf_cstr(w)); wrbuf_rewind(w); wrbuf_puts_escaped(w, cmpbuf); yaz_log(YLOG_LOG, "exp %s", wrbuf_cstr(w)); wrbuf_destroy(w); } wrbuf_destroy(b); return ret; }