~ubuntu-branches/ubuntu/gutsy/icu/gutsy-updates

me->errln("error: Unicode::characterDirection(U+%04lx)==%u instead of %u (%s)\n", c, Unicode::characterDirection(c), me->MakeDir(fields[4][0]), fields[4][0]);

376

*pErrorCode = U_PARSE_ERROR;

377

return;

378

}

379

380

/* get uppercase mapping, field 12 */

381

if(fields[12][0]!=fields[12][1]) {

382

value=(uint32_t)uprv_strtoul(fields[12][0], &end, 16);

383

if(end!=fields[12][1]) {

384

me->errln("error: syntax error in field 12 at code 0x%lx\n", c);

385

*pErrorCode = U_PARSE_ERROR;

386

return;

387

}

388

if((UChar32)value!=Unicode::toUpperCase(c)) {

389

me->errln("error: Unicode::toUpperCase(U+%04lx)==U+%04lx instead of U+%04lx\n", c, Unicode::toUpperCase(c), value);

390

*pErrorCode = U_PARSE_ERROR;

391

return;

392

}

393

} else {

394

/* no case mapping: the API must map the code point to itself */

395

if(c!=Unicode::toUpperCase(c)) {

396

me->errln("error: U+%04lx does not have an uppercase mapping but Unicode::toUpperCase()==U+%04lx\n", c, Unicode::toUpperCase(c));

397

*pErrorCode = U_PARSE_ERROR;

398

return;

399

}

400

}

401

402

/* get lowercase mapping, field 13 */

403

if(fields[13][0]!=fields[13][1]) {

404

value=(uint32_t)uprv_strtoul(fields[13][0], &end, 16);

405

if(end!=fields[13][1]) {

406

me->errln("error: syntax error in field 13 at code 0x%lx\n", c);

407

*pErrorCode = U_PARSE_ERROR;

408

return;

409

}

410

if((UChar32)value!=Unicode::toLowerCase(c)) {

411

me->errln("error: Unicode::toLowerCase(U+%04lx)==U+%04lx instead of U+%04lx\n", c, Unicode::toLowerCase(c), value);

412

*pErrorCode = U_PARSE_ERROR;

413

return;

414

}

415

} else {

416

/* no case mapping: the API must map the code point to itself */

417

if(c!=Unicode::toLowerCase(c)) {

418

me->errln("error: U+%04lx does not have a lowercase mapping but Unicode::toLowerCase()==U+%04lx\n", c, Unicode::toLowerCase(c));

419

*pErrorCode = U_PARSE_ERROR;

420

return;

421

}

422

}

423

424

/* get titlecase mapping, field 14 */

425

if(fields[14][0]!=fields[14][1]) {

426

value=(uint32_t)uprv_strtoul(fields[14][0], &end, 16);

427

if(end!=fields[14][1]) {

428

me->errln("error: syntax error in field 14 at code 0x%lx\n", c);

429

*pErrorCode = U_PARSE_ERROR;

430

return;

431

}

432

if((UChar32)value!=Unicode::toTitleCase(c)) {

433

me->errln("error: Unicode::toTitleCase(U+%04lx)==U+%04lx instead of U+%04lx\n", c, Unicode::toTitleCase(c), value);

434

*pErrorCode = U_PARSE_ERROR;

435

return;

436

}

437

} else {

438

/* no case mapping: the API must map the code point to itself */

439

if(c!=Unicode::toTitleCase(c)) {

440

me->errln("error: U+%04lx does not have a titlecase mapping but Unicode::toTitleCase()==U+%04lx\n", c, Unicode::toTitleCase(c));

441

*pErrorCode = U_PARSE_ERROR;

442

return;

443

}

444

}

445

}

446

447

/* tests for several properties */

448

void UnicodeTest::TestUnicodeData()

449

{

450

char newPath[256];

451

char backupPath[256];

452

char *fields[15][2];

453

UErrorCode errorCode = U_ZERO_ERROR;

454

455

/* Look inside ICU_DATA first */

456

strcpy(newPath, u_getDataDirectory());

457

strcat(newPath, "unidata" U_FILE_SEP_STRING "UnicodeData.txt");

458

459

460

// As a fallback, try to guess where the source data was located

461

// at the time ICU was built, and look there.

462

# if defined (U_TOPSRCDIR)

463

strcpy(backupPath, U_TOPSRCDIR U_FILE_SEP_STRING "data");

464

# else

465

strcpy(backupPath, u_getDataDirectory());

466

strcat(backupPath, ".." U_FILE_SEP_STRING ".." U_FILE_SEP_STRING "data");

467

# endif

468

strcat(backupPath, U_FILE_SEP_STRING);

469

strcat(backupPath, "unidata" U_FILE_SEP_STRING "UnicodeData.txt");

470

471

u_parseDelimitedFile(newPath, ';', fields, 15, unicodeDataLineFn, this, &errorCode);

472

473

if(errorCode==U_FILE_ACCESS_ERROR) {

474

errorCode=U_ZERO_ERROR;

475

u_parseDelimitedFile(backupPath, ';', fields, 15, unicodeDataLineFn, this, &errorCode);

476

477

}

478

if(U_FAILURE(errorCode)) {

479

errln("error parsing UnicodeData.txt: %s\n" + UnicodeString(u_errorName(errorCode), ""));

480

return;

481

}

482

483

// test Unicode::getCharName()

484

// a more thorough test of u_charName() is in cintltst/cucdtst.c

485

char buffer[100];

486

int32_t length=Unicode::getCharName(0x284, buffer, (int32_t)sizeof(buffer));

487

488

// use invariant-character conversion to Unicode

489

UnicodeString name(buffer, length, "");

490

if(name!=UNICODE_STRING("LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK", 49)) {

491

errln("Unicode character name lookup failed\n");

492

}

493

494

// test Unicode::isMirrored() and charMirror()

495

// see also cintltst/cucdtest.c

496

if(!(Unicode::isMirrored(0x28) && Unicode::isMirrored(0xbb) && Unicode::isMirrored(0x2045) && Unicode::isMirrored(0x232a) &&

497

!Unicode::isMirrored(0x27) && !Unicode::isMirrored(0x61) && !Unicode::isMirrored(0x284) && !Unicode::isMirrored(0x3400)

498

)

499

) {

500

errln("Unicode::isMirrored() does not work correctly\n");

501

}

502

503

if(!(Unicode::charMirror(0x3c)==0x3e && Unicode::charMirror(0x5d)==0x5b && Unicode::charMirror(0x208d)==0x208e && Unicode::charMirror(0x3017)==0x3016 &&

504

Unicode::charMirror(0x2e)==0x2e && Unicode::charMirror(0x6f3)==0x6f3 && Unicode::charMirror(0x301c)==0x301c && Unicode::charMirror(0xa4ab)==0xa4ab

505

)

506

) {

507

errln("Unicode::charMirror() does not work correctly\n");

508

}

509

}

510

511

/*
 * Looks up str inside tagStrings and returns half of the byte offset at which
 * it was found (presumably the index of a two-character tag; tagStrings is
 * declared elsewhere in this file). When str does not occur at all, an error
 * is reported and 0 is returned.
 */
int32_t UnicodeTest::MakeProp(char* str)
{
    const char* const hit = strstr(tagStrings, str);

    if (hit == 0) {
        errln((UnicodeString)"unrecognized type letter " + str);
        return 0;
    }
    return (int32_t)((hit - tagStrings) / 2);
}

521

522

/*
 * Returns the index of the first of the leading 19 dirStrings entries that is
 * equal to str, or -1 when none of them matches.
 */
int32_t UnicodeTest::MakeDir(char* str)
{
    int32_t index = 0;

    while (index < 19) {
        if (strcmp(str, dirStrings[index]) == 0) {
            return index;
        }
        ++index;
    }
    return -1;
}

532

/*Tests added by Madhu*/

533

534

/* Tests for isSingle(), isLead(), isTrial(), isSurrogate */

535

void UnicodeTest::TestCodeUnit(){

536

const UChar codeunit[]={0x0000,0xe065,0x20ac,0xd7ff,0xd800,0xd841,0xd905,0xdbff,0xdc00,0xdc02,0xddee,0xdfff,0};

537

538

int32_t i;

539

540

for(i=0; i<(int32_t)(sizeof(codeunit)/sizeof(codeunit[0])); i++){

541

UChar c=codeunit[i];

542

UnicodeString msg;

543

msg.append((UChar32)c);

544

logln((UnicodeString)"Testing code unit value of " + prettify(msg));

545

if(i<4){

546

if(!(Unicode::isSingle(c)) || (Unicode::isLead(c)) || (Unicode::isTrail(c)) ||(Unicode::isSurrogate(c))){

547

errln((UnicodeString)"ERROR:" + prettify(msg) + " is a single");

548

}

549

550

}

551

if(i >= 4 && i< 8){

552

if(!(Unicode::isLead(c)) || Unicode::isSingle(c) || Unicode::isTrail(c) || !(Unicode::isSurrogate(c))){

553

errln((UnicodeString)"ERROR:" + prettify(msg) + " is a first surrogate");

554

}

555

}

556

if(i >= 8 && i< 12){

557

if(!(Unicode::isTrail(c)) || Unicode::isSingle(c) || Unicode::isLead(c) || !(Unicode::isSurrogate(c))){

558

errln((UnicodeString)"ERROR:" + prettify(msg) + " is a second surrogate");

559

}

560

}

561

}

562

563

}

564

/* Tests for isSurrogate(), isUnicodeChar(), isError(), isValid() */

565

void UnicodeTest::TestCodePoint(){

566

const UChar32 codePoint[]={

567

//surrogate, notvalid(codepoint), not a UnicodeChar, not Error

568

0xd800,

569

0xdbff,

570

0xdc00,

571

0xdfff,

572

0xdc04,

573

0xd821,

574

//not a surrogate, valid, isUnicodeChar , not Error

575

0x20ac,

576

0xd7ff,

577

0xe000,

578

0xe123,

579

0x0061,

580

0xe065,

581

0x20402,

582

0x24506,

583

0x23456,

584

0x20402,

585

0x10402,

586

0x23456,

587

//not a surrogate, not valid, isUnicodeChar, isError

588

0x0015,

589

0x009f,

590

//not a surrogate, not valid, not isUnicodeChar, isError

591

0xffff,

592

0xfffe,

593

};

594

int32_t i;

595

for(i=0; i<(int32_t)(sizeof(codePoint)/sizeof(codePoint[0])); i++){

596

UChar32 c=codePoint[i];

597

UnicodeString msg;

598

msg.append(c);

599

logln((UnicodeString)"Testing code Point value of " + prettify(msg));

600

if(i<6){

601

if(!Unicode::isSurrogate(c)){

602

errln((UnicodeString)"ERROR: isSurrogate() failed for" + prettify(msg));

603

}

604

if(Unicode::isValid(c)){

605

errln((UnicodeString)"ERROR: isValid() failed for "+ prettify(msg));

606

}

607

if(Unicode::isUnicodeChar(c)){

608

errln((UnicodeString)"ERROR: isUnicodeChar() failed for "+ prettify(msg));

609

}

610

if(Unicode::isError(c)){

611

errln((UnicodeString)"ERROR: isError() failed for "+ prettify(msg));

612

}

613

}else if(i >=6 && i<18){

614

if(Unicode::isSurrogate(c)){

615

errln((UnicodeString)"ERROR: isSurrogate() failed for" + prettify(msg));

616

}

617

if(!Unicode::isValid(c)){

618

errln((UnicodeString)"ERROR: isValid() failed for "+ prettify(msg));

619

}

620

if(!Unicode::isUnicodeChar(c)){

621

errln((UnicodeString)"ERROR: isUnicodeChar() failed for "+ prettify(msg));

622

}

623

if(Unicode::isError(c)){

624

errln((UnicodeString)"ERROR: isError() failed for "+ prettify(msg));

625

}

626

}else if(i >=18 && i<20){

627

if(Unicode::isSurrogate(c)){

628

errln((UnicodeString)"ERROR: isSurrogate() failed for" + prettify(msg));

629

}

630

if(Unicode::isValid(c)){

631

errln((UnicodeString)"ERROR: isValid() failed for "+ prettify(msg));

632

}

633

if(!Unicode::isUnicodeChar(c)){

634

errln((UnicodeString)"ERROR: isUnicodeChar() failed for "+ prettify(msg));

635

}

636

if(!Unicode::isError(c)){

637

errln((UnicodeString)"ERROR: isError() failed for "+ prettify(msg));

638

}

639

}

640

else if(i >=18 && i<(int32_t)(sizeof(codePoint)/sizeof(codePoint[0]))){

641

if(Unicode::isSurrogate(c)){

642

errln((UnicodeString)"ERROR: isSurrogate() failed for" + prettify(msg));

643

}

644

if(Unicode::isValid(c)){

645

errln((UnicodeString)"ERROR: isValid() failed for "+ prettify(msg));

646

}

647

if(Unicode::isUnicodeChar(c)){

648

errln((UnicodeString)"ERROR: isUnicodeChar() failed for "+ prettify(msg));

649

}

650

if(!Unicode::isError(c)){

651

errln((UnicodeString)"ERROR: isError() failed for "+ prettify(msg));

652

}

653

}

654

}

655

656

}

657

658

void UnicodeTest::TestCharLength()

659

{

660

const int32_t codepoint[]={

661

1, 0x0061,

662

1, 0xe065,

663

1, 0x20ac,

664

2, 0x20402,

665

2, 0x23456,

666

2, 0x24506,

667

2, 0x20402,

668

2, 0x10402,

669

1, 0xd7ff,

670

1, 0xe000

671

};

672

673

int32_t i;

674

UBool multiple;

675

for(i=0; i<(int32_t)(sizeof(codepoint)/sizeof(codepoint[0])); i=(int16_t)(i+2)){

676

UChar32 c=codepoint[i+1];

677

UnicodeString msg;

678

msg.append(c);

679

if(Unicode::charLength(c) != codepoint[i]){

680

errln((UnicodeString)"The no: of code units for" + prettify(msg)+

681

":- Expected: " + (int32_t)codepoint[i] + " Got: " + Unicode::charLength(c));

682

}else{

683

logln((UnicodeString)"The no: of code units for" + prettify(msg) + " is " + Unicode::charLength(c));

684

}

685

multiple=(UBool)(codepoint[i] == 1 ? FALSE : TRUE);

686

if(Unicode::needMultipleUChar(c) != multiple){

687

errln("ERROR: Unicode::needMultipleUChar() failed for" + prettify(msg));

688

}

689

}

690

}

691

692

693

Various script value testing.

694

This makes sure that the Unicode::EUnicodeScript

695

and UCharScript enum values are the same.

696

697

void UnicodeTest::TestScript()

698

{

699

if ((int32_t)Unicode::kScriptCount != (int32_t)UBLOCK_COUNT) {

700

errln("ERROR: Unicode::EUnicodeScript is not the same size as UCharScript");

701

}

702

703

if ((int32_t)Unicode::kBasicLatin != (int32_t)U_BASIC_LATIN) {

704

errln("ERROR: Different Basic Latin values in EUnicodeScript and UCharScript");

705

}

706

707

if ((int32_t)Unicode::kHighSurrogate != (int32_t)U_HIGH_SURROGATES) {

708

errln("ERROR: Different High Surrogate values in EUnicodeScript and UCharScript");

709

}

710

711

if ((int32_t)Unicode::kLowSurrogate != (int32_t)U_LOW_SURROGATES) {

712

errln("ERROR: Different Low Surrogate values in EUnicodeScript and UCharScript");

713

}

714

715

if ((int32_t)Unicode::kCJKRadicalsSupplement != (int32_t)U_CJK_RADICALS_SUPPLEMENT) {

716

errln("ERROR: Different CJK Radicals Supplement values in EUnicodeScript and UCharScript");

717

}

718

719

if ((int32_t)Unicode::kGreek != (int32_t)U_GREEK) {

720

errln("ERROR: Different Greek values in EUnicodeScript and UCharScript");

721

}

722

723

if ((int32_t)Unicode::kThai != (int32_t)U_THAI) {

724

errln("ERROR: Diffe rent Thai values in EUnicodeScript and UCharScript");

725

}

726

}

Older »