~ubuntu-branches/ubuntu/trusty/cajun/trusty

« back to all changes in this revision

Viewing changes to debian/patches/0001-Fix-for-embedded-unicode.patch

Committer: Package Import Robot
Author(s): Daniel Pocock
Date: 2013-09-26 14:03:24 UTC
mfrom: (1.1.1)
Revision ID: package-import@ubuntu.com-20130926140324-m8cerngq0ct7rfoj

Tags: 2.0.3-1

* New upstream release
* Upstream now includes UTF-8 fix, local patch removed

files added:
cajun-jsonapi.spec

files removed:
.pc/0001-Fix-for-embedded-unicode.patch

.pc/0001-Fix-for-embedded-unicode.patch/json

.pc/0001-Fix-for-embedded-unicode.patch/json/reader.inl

.pc/0001-Fix-for-embedded-unicode.patch/json/writer.inl

debian/patches

debian/patches/0001-Fix-for-embedded-unicode.patch

debian/patches/series

files modified:
.pc/applied-patches

Makefile

ReleaseNotes.txt

debian/changelog

debian/control

debian/copyright

debian/watch

Show diffs side-by-side

added added

removed removed

debian/patches/0001-Fix-for-embedded-unicode.patch

diff --git a/json/reader.inl b/json/reader.inl

index fc20833..60c1b93 100644

--- a/json/reader.inl

+++ b/json/reader.inl

@@ -35,7 +35,6 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

TODO:

* better documentation

-* unicode character decoding

@@ -308,7 +307,7 @@ inline std::string Reader::MatchString(InputStream& inputStream)

// escape?

if (c == '\\' &&

- inputStream.EOS() == false) // shouldn't have reached the end yet

+ inputStream.EOS() == false) // shouldn't have reached the end yet

{

c = inputStream.Get();

switch (c) {

@@ -320,7 +319,37 @@ inline std::string Reader::MatchString(InputStream& inputStream)

case 'n': string.push_back('\n'); break;

case 'r': string.push_back('\r'); break;

case 't': string.push_back('\t'); break;

- case 'u': string.push_back('\u'); break; // TODO: what do we do with this?

+ case 'u': { // convert unicode to UTF-8

+ int x = 0, i;

+ // next four characters should be hex

+ for (i = 0; i < 4; ++i) {

+ c = inputStream.Get();

+ if (c >= '0' && c <= '9') {

+ x = (x << 4) | (c - '0');

+ } else if (c >= 'a' && c <= 'f') {

+ x = (x << 4) | (c - 'a' + 10);

+ } else if (c >= 'A' && c <= 'F') {

+ x = (x << 4) | (c - 'A' + 10);

+ } else {

+ std::string sMessage = std::string("Unrecognized hexadecimal character found in string: ") + c;

+ throw ScanException(sMessage, inputStream.GetLocation());

+ }

+ }

+ // encode as UTF-8

+ if (x < 0x80) {

+ string.push_back(x);

+ } else if (x < 0x800) {

+ string.push_back(0xc0 | (x >> 6));

+ string.push_back(0x80 | (x & 0x3f));

+ } else {

+ string.push_back(0xe0 | (x >> 12));

+ string.push_back(0x80 | ((x >> 6) & 0x3f));

+ string.push_back(0x80 | (x & 0x3f));

+ }

+ break;

+ }

default: {

std::string sMessage = std::string("Unrecognized escape sequence found in string: \\") + c;

throw ScanException(sMessage, inputStream.GetLocation());

diff --git a/json/writer.inl b/json/writer.inl

index b16401b..27226b6 100644

--- a/json/writer.inl

+++ b/json/writer.inl

@@ -35,7 +35,6 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

TODO:

* better documentation

-* unicode character encoding

@@ -122,7 +121,7 @@ inline void Writer::Write_i(const Object& object)

inline void Writer::Write_i(const Number& numberElement)

{

- m_ostr << std::setprecision(20) << numberElement.Value();

+ m_ostr << std::dec << std::setprecision(20) << numberElement.Value();

}

inline void Writer::Write_i(const Boolean& booleanElement)

@@ -139,6 +138,48 @@ inline void Writer::Write_i(const String& stringElement)

itEnd(s.end());

for (; it != itEnd; ++it)

{

+ // check for UTF-8 unicode encoding

+ unsigned char u = static_cast<unsigned char>(*it);

+ if (u & 0xc0) {

+ if ((u & 0xe0) == 0xc0) {

+ // two-character sequence

+ int x = (*it & 0x1f) << 6;

+ if ((it + 1) == itEnd) {

+ m_ostr << *it; continue;

+ }

+ u = static_cast<unsigned char>(*(it + 1));

+ if ((u & 0xc0) == 0x80) {

+ x |= u & 0x3f;

+ m_ostr << "\\u" << std::hex << std::setfill('0')

+ << std::setw(4) << x;

+ ++it;

+ continue;

+ }

+ } else if ((u & 0xf0) == 0xe0) {

+ // three-character sequence

+ int x = (u & 0x0f) << 12;

+ if ((it + 1) == itEnd) {

+ m_ostr << *it; continue;

+ }

+ u = static_cast<unsigned char>(*(it + 1));

+ if ((u & 0xc0) == 0x80) {

+ x |= (u & 0x3f) << 6;

+ if ((it + 2) == itEnd) {

+ m_ostr << *it; continue;

+ }

+ u = static_cast<unsigned char>(*(it + 2));

+ if ((u & 0xc0) == 0x80) {

+ x |= u & 0x3f;

+ m_ostr << "\\u" << std::hex << std::setfill('0')

+ << std::setw(4) << x;

+ it = it + 2;

+ continue;

+ }

+ }

+ }

+ }

switch (*it)

{

case '"': m_ostr << "\\\""; break;

@@ -148,7 +189,6 @@ inline void Writer::Write_i(const String& stringElement)

case '\n': m_ostr << "\\n"; break;

case '\r': m_ostr << "\\r"; break;

case '\t': m_ostr << "\\t"; break;

- case '\u': m_ostr << "\\u"; break; // uh...

default: m_ostr << *it; break;

}

}

Older »