~ubuntu-branches/debian/wheezy/libnjb/wheezy

« back to all changes in this revision

Viewing changes to src/unicode.c

Committer: Bazaar Package Importer
Author(s): Shaun Jackman
Date: 2004-05-25 13:06:10 UTC
Revision ID: james.westby@ubuntu.com-20040525130610-vexcucw1qxq1g4dp

Tags: upstream-1.1

Import upstream version 1.1

files added:

AUTHORS

CHANGES

HACKING

INSTALL

LICENSE

Makefile.in

README

acconfig.h

aclocal.m4

config.guess

config.h.in

config.sub

configure

configure.in

debian

debian/changelog

debian/control

debian/copyright

debian/libnjb-dev.files

debian/libnjb-dev.links

debian/libnjb-dev.manpages

debian/libnjb0.docs

debian/libnjb0.files

debian/rules

debian/watch

distignore

hotplug.sh.in

install-sh

libnjb.spec

ltmain.sh

man/man3

man/man3/NJB_Adjust_Sound.3

man/man3/NJB_Capture.3

man/man3/NJB_Close.3

man/man3/NJB_Delete_Datafile.3

man/man3/NJB_Delete_Playlist.3

man/man3/NJB_Delete_Track.3

man/man3/NJB_Discover.3

man/man3/NJB_Get_Datafile_Tag.3

man/man3/NJB_Get_Disk_Usage.3

man/man3/NJB_Get_EAX.3

man/man3/NJB_Get_Extended_Tags.3

man/man3/NJB_Get_File.3

man/man3/NJB_Get_Owner_String.3

man/man3/NJB_Get_Playlist.3

man/man3/NJB_Get_Time.3

man/man3/NJB_Get_TmpDir.3

man/man3/NJB_Get_Track.3

man/man3/NJB_Get_Track_Tag.3

man/man3/NJB_Open.3

man/man3/NJB_Ping.3

man/man3/NJB_Play_Track.3

man/man3/NJB_Queue_Track.3

man/man3/NJB_Release.3

man/man3/NJB_Replace_Track_Tag.3

man/man3/NJB_Reset_Get_Datafile_Tag.3

man/man3/NJB_Reset_Get_Playlist.3

man/man3/NJB_Reset_Get_Track_Tag.3

man/man3/NJB_Send_File.3

man/man3/NJB_Send_Track.3

man/man3/NJB_Set_Owner_String.3

man/man3/NJB_Set_Time.3

man/man3/NJB_Set_TmpDir.3

man/man3/NJB_Set_Unicode.3

man/man3/NJB_Stop_Play.3

man/man3/NJB_Update_Playlist.3

man/man3/XferCallback.3

man/man3/datafile.3

man/man3/playlist.3

man/man3/songid.3

man/man3/template

nomad.usermap

nomadjukebox.in

sample

sample/Makefile.in

sample/cursesplay.c

sample/delfile.c

sample/deltr.c

sample/dumpeax.c

sample/dumptime.c

sample/files.c

sample/getfile.c

sample/getowner.c

sample/gettr.c

sample/getusage.c

sample/handshake.c

sample/pl.c

sample/play.c

sample/playlists.c

sample/sendfile.c

sample/sendtr.c

sample/setowner.c

sample/setpbm.c

sample/settime.c

sample/tagtr.c

sample/tracks.c

src/Makefile.in

src/base.c

src/base.h

src/byteorder.c

src/byteorder.h

src/datafile.c

src/defs.h

src/eax.c

src/ioutil.c

src/ioutil.h

src/libnjb.h.in

src/njb_error.c

src/njb_error.h

src/njbusb.h

src/playlist.c

src/procedure.c

src/procedure.h

src/protocol.c

src/protocol.h

src/protocol3.c

src/protocol3.h

src/songid.c

src/time.c

src/unicode.c

src/unicode.h

src/usb_io.c

src/usb_io.h

Show diffs side-by-side

added added

removed removed

src/unicode.c

#include "../config.h"

#include <stdlib.h>

#include <string.h>

#include <errno.h>

#include "libnjb.h"

#include "njbusb.h"

#include "protocol.h"

#include "protocol3.h"

#include "unicode.h"

#include "njb_error.h"

#include "usb_io.h"

#include "ioutil.h"

#include "defs.h"

#include "base.h"

/* Defined in another translation unit.
 * NOTE(review): presumably the nesting depth used by the __enter/__leave
 * trace macros -- confirm against the header that defines them. */
extern int __sub_depth;

/* Encoding selected for the 8-bit side of the conversions in this file.
 * Starts out as NJB_UC_8859 and is changed through njb_set_unicode(). */
int njb_unicode_flag = NJB_UC_8859;

/* Nominal maximum string length, in bytes, for fixed-size conversion buffers. */
#define MAX_STRING_LENGTH 512

/* Select the encoding used for ALL 8-bit strings converted by this
 * file: ISO 8859-1 or Unicode UTF-8.
 *
 * flag: the new value stored in njb_unicode_flag. The conversion
 *       routines compare it against NJB_UC_UTF8 and treat every other
 *       value as ISO 8859-1. */
void njb_set_unicode(int flag)
{
  njb_unicode_flag = flag;
}

/* Count the characters (two-byte units, not bytes) of a UCS-2 string.
 * The string ends at the first unit whose two bytes are both 0x00, so
 * the byte sequence 0x00 0x41 0x00 0x00 yields a length of 1. */
int ucs2strlen(const unsigned char *unicstr)
{
  __dsub= "ucs2strlen";
  const unsigned char *unit = unicstr;
  int length = 0;

  __enter;

  /* Walk one two-byte unit at a time until the double-zero terminator */
  while ((unit[0] | unit[1]) != '\0') {
    unit += 2;
    length++;
  }

  __leave;
  return length;
}

/* Compute how many bytes the given UCS-2 string (high byte first,
 * terminated by two zero bytes) occupies once encoded as UTF-8.
 * The terminating NUL of the UTF-8 string is not counted. */
static int ucs2utf8len(const unsigned char *unicstr)
{
  const unsigned char *unit;
  int total = 0;

  for (unit = unicstr; (unit[0] | unit[1]) != '\0'; unit += 2) {
    if (unit[0] >= 0x08) {
      /* U+0800 and above: three UTF-8 bytes */
      total += 3;
    } else if (unit[0] != 0x00 || unit[1] >= 0x80) {
      /* U+0080 .. U+07FF: two UTF-8 bytes */
      total += 2;
    } else {
      /* U+0001 .. U+007F: plain ASCII, one byte */
      total += 1;
    }
  }

  return total;
}

/* Create a newly allocated copy of a UCS-2 string, including its
 * two-byte 0x00 0x00 terminator.
 *
 * Returns the copy, which the caller must free(), or NULL if the
 * allocation failed. */
static unsigned char *ucs2strdup(const unsigned char *unicstr)
{
  /* Two bytes per character plus the two-byte terminator */
  size_t nbytes = (size_t) ucs2strlen(unicstr) * 2 + 2;
  unsigned char *copy = malloc(nbytes);

  if (copy == NULL)
    return NULL;

  memcpy(copy, unicstr, nbytes);
  return copy;
}

/* Convert a NUL-terminated ISO 8859-1 string to UTF-8.
 *
 * Bytes below 0x80 are copied unchanged; every other byte becomes the
 * two-byte UTF-8 sequence for the code point of the same value.
 *
 * Returns a newly allocated, NUL-terminated string that the caller
 * must free(), or NULL if memory could not be allocated. */
char *strtoutf8(const unsigned char *str)
{
  size_t srclen = strlen((const char *) str);
  unsigned char *utf8;
  size_t in;
  size_t out = 0;

  /* Worst case: every input byte is >= 0x80 and expands to two bytes.
   * Sizing from the input avoids overflowing a fixed-size buffer. */
  utf8 = malloc(2 * srclen + 1);
  if (utf8 == NULL)
    return NULL;

  for (in = 0; in < srclen; in++) {
    unsigned char c = str[in];

    if (c < 0x80) {
      utf8[out++] = c;
    } else {
      /* 110000xx 10xxxxxx: the top two bits go in the lead byte */
      utf8[out++] = (unsigned char) (0xC0 | ((c >> 6) & 0x03));
      utf8[out++] = (unsigned char) (0x80 | (c & 0x3F));
    }
  }
  utf8[out] = '\0';

  return (char *) utf8;
}

/* Approximate an ISO 8859-1 string from a UTF-8 string, leaving out
 * every character that has no ISO 8859-1 equivalent (code points
 * above U+00FF).
 *
 * The input is first converted with strtoucs2(), so it is only decoded
 * as UTF-8 while njb_unicode_flag is NJB_UC_UTF8; in any other mode
 * strtoucs2() treats the bytes as ISO 8859-1 already.
 *
 * Returns a newly allocated, NUL-terminated string that the caller
 * must free(). Returns NULL if the conversion or an allocation fails,
 * or if the converted input was non-empty but not a single character
 * could be represented. An empty input yields an empty string. */
char *utf8tostr(const unsigned char *str)
{
  unsigned char *ucs2string;
  char *result;
  size_t in;
  size_t out = 0;

  ucs2string = strtoucs2(str);
  if (ucs2string == NULL)
    return NULL;

  /* Find the terminator so the output can be sized from the input
   * instead of relying on a fixed-size stack buffer. */
  for (in = 0; (ucs2string[in] | ucs2string[in + 1]) != '\0'; in += 2)
    ;

  /* At most one output byte per UCS-2 character, plus the NUL */
  result = malloc(in / 2 + 1);
  if (result == NULL) {
    free(ucs2string);
    return NULL;
  }

  for (in = 0; (ucs2string[in] | ucs2string[in + 1]) != '\0'; in += 2) {
    /* Only U+0001..U+00FF (high byte zero) fit in ISO 8859-1 */
    if (ucs2string[in] == 0x00)
      result[out++] = (char) ucs2string[in + 1];
  }
  result[out] = '\0';

  free(ucs2string);

  /* Characters were present but none could be translated */
  if (out == 0 && in != 0) {
    free(result);
    return NULL;
  }

  return result;
}

/* Converts a unicode 2-byte string to a common string

134

* quick and dirty (japanese unicodes etc, that use all 16 bits

135

* will fail miserably) */

136

char *ucs2tostr(const unsigned char *unicstr){

137

138

__dsub= "ucs2tostr";

139

140

char *data = NULL;

141

int i = 0;

142

int l = 0;

143

144

__enter;

145

146

147

/* Real unicode support in UTF8 */

148

if (njb_unicode_flag == NJB_UC_UTF8) {

149

int length8 = ucs2utf8len(unicstr);

150

data= (char *) malloc(length8+1);

151

if ( data == NULL ) {

152

NJB_ERROR(EO_NOMEM);

153

__leave;

154

return NULL;

155

}

156

for(l=0;(unicstr[l] | unicstr[l+1])!='\0'; l+=2) {

157

if (unicstr[l] == 0x00 && unicstr[l+1] < 0x80) {

158

data[i]=unicstr[l+1];

159

i++;

160

} else if (unicstr[l] < 0x08) {

161

data[i] = 0xc0 | (unicstr[l]<<2 & 0x1C) | (unicstr[l+1]>>6 & 0x03);

162

data[i+1] = 0x80 | (unicstr[l+1] & 0x3F);

163

i+=2;

164

} else {

165

data[i] = 0xe0 | (unicstr[l]>>4 & 0x0F);

166

data[i+1] = 0x80 | (unicstr[l]<<2 & 0x3C) | (unicstr[l+1]>>6 & 0x03);

167

data[i+2] = 0x80 | (unicstr[l+1] & 0x3F);

168

i+=3;

169

}

170

}

171

/* Terminate string */

172

data[i]=0x00;

173

} else {

174

/* If we're running in ISO 8859-1 mode, approximate

175

* and concatenate, loosing any chars above 0xff */

176

int length=ucs2strlen(unicstr);

177

178

data= (char *) malloc(length+1);

179

if ( data == NULL ) {

180

NJB_ERROR(EO_NOMEM);

181

__leave;

182

return NULL;

183

}

184

185

l = 0;

186

for(i=0;l<length*2;){

187

if (unicstr[l] == 0x00) {

188

data[i]=unicstr[l+1];

189

i++;

190

}

191

l+=2;

192

}

193

/* Terminate string */

194

data[i]=0x00;

195

}

196

197

198

__leave;

199

return data;

200

}

201

202

/* Convert a simple ISO 8859-1 or a Unicode

203

* UTF8 string to a unicode UCS2 string */

204

unsigned char *strtoucs2(const unsigned char *str) {

205

206

__dsub= "strtoucs2";

207

208

unsigned char *data = NULL;

209

int i=0;

210

int l=0;

211

212

__enter;

213

214

/* Real unicode support in UTF8 */

215

if (njb_unicode_flag == NJB_UC_UTF8) {

216

unsigned char buffer[MAX_STRING_LENGTH*2];

217

218

int length=0;

219

int i;

220

221

for(i=0; str[i] != '\0';) {

222

if (str[i] < 0x80) {

223

buffer[length] = 0x00;

224

buffer[length+1] = str[i];

225

length += 2;

226

i++;

227

} else {

228

unsigned char numbytes = 0;

229

unsigned char lenbyte = 0;

230

231

/* Read the number of encoded bytes */

232

lenbyte = str[i];

233

while (lenbyte & 0x80) {

234

numbytes++;

235

lenbyte = lenbyte<<1;

236

}

237

/* UCS-2 can handle no more than 3 UTF-8 encoded bytes */

238

if (numbytes <= 3) {

239

if (numbytes == 2 && str[i+1] > 0x80) {

240

/* This character can always be handled correctly */

241

buffer[length] = (str[i]>>3 & 0x07);

242

buffer[length+1] = (str[i]<<6 & 0xC0) | (str[i+1] & 0x3F);

243

i += 2;

244

length += 2;

245

} else if (numbytes == 3 && str[i+1] > 0x80 && str[i+2] > 0x80) {

246

buffer[length] = (str[i]<<4 & 0xF0) | (str[i+1]>>2 & 0x0F);

247

buffer[length+1]= (str[i+1]<<6 & 0xC0) | (str[i+2] & 0x3F);

248

i += 3;

249

length += 2;

250

} else {

251

/* Abnormal string character, just skip */

252

i += numbytes;

253

}

254

} else {

255

/* Just skip that character */

256

i += numbytes;

257

}

258

}

259

}

260

/* Copy the buffer contents */

261

buffer[length] = 0x00;

262

buffer[length+1] = 0x00;

263

data = ucs2strdup(buffer);

264

if (data == NULL) {

265

NJB_ERROR(EO_NOMEM);

266

__leave;

267

return NULL;

268

}

269

} else {

270

/* If we're running in ISO 8859-1 mode, approximate

271

* and concatenate, loosing any chars above 0xff */

272

data= (unsigned char *) malloc(2*strlen(str)+2);

273

if ( data == NULL ) {

274

NJB_ERROR(EO_NOMEM);

275

__leave;

276

return NULL;

277

}

278

279

for(i=0;i<=strlen(str);i++){

280

data[l]=0x00;

281

data[l+1]=str[i];

282

l+=2;

283

}

284

}

285

286

__leave;

287

return data;

288

}

Older »