X-Git-Url: http://www.project-moonshot.org/gitweb/?a=blobdiff_plain;f=xmltooling%2Funicode.cpp;h=b54d1ed2ddfcf66583006218424663ba50ba2341;hb=56a73c1c7b1e63f1ff1717b25a76ebd480594d5a;hp=dd8a45eff120de7582d8c5c392db8b432f318ed3;hpb=e7a65d784215bc04355f014141219b3e7ab4559a;p=shibboleth%2Fcpp-xmltooling.git diff --git a/xmltooling/unicode.cpp b/xmltooling/unicode.cpp index dd8a45e..b54d1ed 100644 --- a/xmltooling/unicode.cpp +++ b/xmltooling/unicode.cpp @@ -1,17 +1,21 @@ -/* - * Copyright 2001-2006 Internet2 - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at +/** + * Licensed to the University Corporation for Advanced Internet + * Development, Inc. (UCAID) under one or more contributor license + * agreements. See the NOTICE file distributed with this work for + * additional information regarding copyright ownership. + * + * UCAID licenses this file to you under the Apache License, + * Version 2.0 (the "License"); you may not use this file except + * in compliance with the License. You may obtain a copy of the + * License at * - * http://www.apache.org/licenses/LICENSE-2.0 + * http://www.apache.org/licenses/LICENSE-2.0 * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, + * either express or implied. See the License for the specific + * language governing permissions and limitations under the License. */ /** @@ -26,28 +30,49 @@ #include #include +using namespace xercesc; + static const XMLCh UTF8[]={ chLatin_U, chLatin_T, chLatin_F, chDigit_8, chNull }; -char* xmltooling::toUTF8(const XMLCh* src) +char* xmltooling::toUTF8(const XMLCh* src, bool use_malloc) { - unsigned int eaten; - unsigned int srclen=XMLString::stringLen(src); - XMLUTF8Transcoder t(UTF8, srclen*4 + 1); - char* buf=new char[srclen*4 + 1]; - memset(buf,0,srclen*4 + 1); - t.transcodeTo( - src,srclen, - reinterpret_cast(buf),srclen*4, - eaten,XMLTranscoder::UnRep_RepChar); - return buf; + xsecsize_t eaten,factor=1,bufsize; + xsecsize_t srclen=XMLString::stringLen(src); + XMLUTF8Transcoder t(UTF8, 4096); // block size isn't used any more anyway + do { + bufsize = factor*srclen + 10; + char* buf = use_malloc ? reinterpret_cast(malloc(bufsize)) : new char[bufsize]; + memset(buf,0,bufsize); + try { + t.transcodeTo( + src,srclen, + reinterpret_cast(buf),bufsize-1, + eaten, + XMLTranscoder::UnRep_Throw); + } + catch (XMLException&) { + if (use_malloc) + free(buf); + else + delete[] buf; + throw XMLToolingException("Source string contained an unrepresentable character."); + } + if (eaten >= srclen) + return buf; + if (use_malloc) + free(buf); + else + delete[] buf; + factor++; + } while (1); } -XMLCh* xmltooling::fromUTF8(const char* src) +XMLCh* xmltooling::fromUTF8(const char* src, bool use_malloc) { - unsigned int eaten; - unsigned int srclen=strlen(src); - XMLUTF8Transcoder t(UTF8, srclen + 1); - XMLCh* buf=new XMLCh[srclen + 1]; + xsecsize_t eaten; + xsecsize_t srclen=strlen(src); + XMLUTF8Transcoder t(UTF8, 4096); // block size isn't used any more anyway + XMLCh* buf = use_malloc ? reinterpret_cast(malloc((srclen+1)*sizeof(XMLCh))) : new XMLCh[srclen + 1]; unsigned char* sizes=new unsigned char[srclen]; memset(buf,0,(srclen+1)*sizeof(XMLCh)); t.transcodeFrom( @@ -57,3 +82,18 @@ XMLCh* xmltooling::fromUTF8(const char* src) delete[] sizes; return buf; } + +std::ostream& xmltooling::operator<<(std::ostream& ostr, const XMLCh* s) +{ + if (s) { + char* p=xmltooling::toUTF8(s); + ostr << p; + delete[] p; + } + return ostr; +} + +std::ostream& xmltooling::operator<<(std::ostream& ostr, const xstring& s) +{ + return ostr << s.c_str(); +}