169 lines
4.0 KiB
C++
169 lines
4.0 KiB
C++
//
|
|
// VMime library (http://www.vmime.org)
|
|
// Copyright (C) 2002-2013 Vincent Richard <vincent@vmime.org>
|
|
//
|
|
// This program is free software; you can redistribute it and/or
|
|
// modify it under the terms of the GNU General Public License as
|
|
// published by the Free Software Foundation; either version 3 of
|
|
// the License, or (at your option) any later version.
|
|
//
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
// General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU General Public License along
|
|
// with this program; if not, write to the Free Software Foundation, Inc.,
|
|
// 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
//
|
|
// Linking this library statically or dynamically with other modules is making
|
|
// a combined work based on this library. Thus, the terms and conditions of
|
|
// the GNU General Public License cover the whole combination.
|
|
//
|
|
|
|
#include "vmime/charsetConverter_idna.hpp"
|
|
|
|
#include "vmime/exception.hpp"
|
|
|
|
#include "vmime/utility/stringUtils.hpp"
|
|
#include "vmime/utility/streamUtils.hpp"
|
|
#include "vmime/utility/outputStreamStringAdapter.hpp"
|
|
|
|
|
|
extern "C"
|
|
{
|
|
|
|
#include "contrib/punycode/punycode.h"
|
|
#include "contrib/punycode/punycode.c"
|
|
|
|
}
|
|
|
|
#include "contrib/utf8/utf8.h"
|
|
|
|
|
|
namespace vmime
|
|
{
|
|
|
|
|
|
charsetConverter_idna::charsetConverter_idna
|
|
(const charset& source, const charset& dest, const charsetConverterOptions& opts)
|
|
: m_source(source), m_dest(dest), m_options(opts)
|
|
{
|
|
}
|
|
|
|
|
|
charsetConverter_idna::~charsetConverter_idna()
|
|
{
|
|
}
|
|
|
|
|
|
void charsetConverter_idna::convert(utility::inputStream& in, utility::outputStream& out)
|
|
{
|
|
// IDNA should be used for short strings, so it does not matter if we
|
|
// do not work directly on the stream
|
|
string inStr;
|
|
vmime::utility::outputStreamStringAdapter os(inStr);
|
|
vmime::utility::bufferedStreamCopy(in, os);
|
|
|
|
string outStr;
|
|
convert(inStr, outStr);
|
|
|
|
out << outStr;
|
|
}
|
|
|
|
|
|
void charsetConverter_idna::convert(const string& in, string& out)
|
|
{
|
|
if (m_source == m_dest)
|
|
{
|
|
// No conversion needed
|
|
out = in;
|
|
return;
|
|
}
|
|
|
|
out.clear();
|
|
|
|
if (m_dest == "idna")
|
|
{
|
|
if (utility::stringUtils::is7bit(in))
|
|
{
|
|
// No need to encode as Punycode
|
|
out = in;
|
|
return;
|
|
}
|
|
|
|
string inUTF8;
|
|
charset::convert(in, inUTF8, m_source, vmime::charsets::UTF_8);
|
|
|
|
const string::value_type* ch = inUTF8.c_str();
|
|
const string::value_type* end = inUTF8.c_str() + inUTF8.length();
|
|
|
|
std::vector <punycode_uint> unichars;
|
|
unichars.reserve(inUTF8.length());
|
|
|
|
while (ch < end)
|
|
{
|
|
const utf8::uint32_t uc = utf8::unchecked::next(ch);
|
|
unichars.push_back(uc);
|
|
}
|
|
|
|
std::vector <char> output(inUTF8.length() * 2);
|
|
punycode_uint outputLen = output.size();
|
|
|
|
const punycode_status status = punycode_encode
|
|
(unichars.size(), &unichars[0], /* case_flags */ NULL, &outputLen, &output[0]);
|
|
|
|
if (status == punycode_success)
|
|
{
|
|
out = string("xn--") + string(output.begin(), output.begin() + outputLen);
|
|
}
|
|
else
|
|
{
|
|
// TODO
|
|
}
|
|
}
|
|
else if (m_source == "idna")
|
|
{
|
|
if (in.length() < 5 || in.substr(0, 4) != "xn--")
|
|
{
|
|
// Not an IDNA string
|
|
out = in;
|
|
return;
|
|
}
|
|
|
|
std::vector <punycode_uint> output(in.length() - 4);
|
|
punycode_uint outputLen = output.size();
|
|
|
|
const punycode_status status = punycode_decode
|
|
(in.length() - 4, &in[4], &outputLen, &output[0], /* case_flags */ NULL);
|
|
|
|
if (status == punycode_success)
|
|
{
|
|
std::vector <string::value_type> outUTF8Bytes(outputLen * 4);
|
|
string::value_type* p = &outUTF8Bytes[0];
|
|
|
|
for (std::vector <punycode_uint>::const_iterator it = output.begin() ;
|
|
it != output.begin() + outputLen ; ++it)
|
|
{
|
|
p = utf8::unchecked::append(*it, p);
|
|
}
|
|
|
|
string outUTF8(&outUTF8Bytes[0], p);
|
|
charset::convert(outUTF8, out, vmime::charsets::UTF_8, m_dest);
|
|
}
|
|
else
|
|
{
|
|
// TODO
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
ref <utility::charsetFilteredOutputStream> charsetConverter_idna::getFilteredOutputStream(utility::outputStream& /* os */)
|
|
{
|
|
return NULL;
|
|
}
|
|
|
|
|
|
} // vmime
|