Clover

String [][][] dn = name(ci, Name.startsWith(new String(new char[]{SLASH_CHAR}))); // OSF names always start with a Slash, RC2253 cannot start with a slash

209

12808

210

211

12800

if (ci.getIndex()<ci.getEndIndex()){

212

throw new RFC2253ParsingException("End of Distinguished Name expected.");

213

}

214

12798

return dn;

215

}catch(Exception ex){ // now this code throws one exception only!

216

String msg = null;

217

int pos = 0;

218

219

if (ci==null){

220

msg = "CharacterIterator is null";

221

}else{

222

pos = ci.getIndex();

223

msg = "Parse error at "+(pos);

224

}

225

throw new RFC2253ParsingException(pos, msg, ex);

226

}

227

}

228

229

/**

230

* This method returns the canonical representation of the DN separated

231

* into arrays of strings.

232

233

* It simply combines the parts of the dn in the following way: the

234

* attribute types

235

* in each AVA are converted to upper case (because some applications

236

* allow lowercase

237

* input of these), attribute values are taken as is, and then all AVAs

238

* in the same

239

* RDN are combined using "=", after that all RDNs are concatenated

240

* using ",".

241

242

* dn is an array of RDNs. RDN is an array of AVA (Attribute Value

243

* Assertion). AVA

244

* is an array of two strings (after parsing using distinguishedName

245

* method). The

246

* string with index 0 is the attribute type. The string with index 1

247

* is the attribute

248

* value. The value will be escaped using escapeString method.

249

250

* If AVA is an array of more than two strings (the reference in RDN

251

* can be replaced

252

* by the user), and the string with index 2 is not null, it will be

253

* placed as the

254

* attribute value as is, instead of escaped string with index 1. This

255

* allows the user

256

* to provide the values of attributes that should be compared as

257

* binary (for example,

258

* "#<hexstring>" would match only this string of hexadecimal values).

259

260

* <code>

261

* String [][][] dn = distinguishedName("uid=aBc , c=gb");

262

* String [][] uid_rdn = dn[0];

263

* String [] uid_ava = uid_rdn[0];

264

*

265

* uid_rdn[0] = new String[]{ uid_ava[0], uid_ava[1], toHexString(uid_ava[1].getBytes()) };

266

*

267

* String canonicalDN = toCanonicalDN(dn);

268

* </code>

269

270

* In the example above the distinguished name will be parsed as an

271

* array of two RDNs,

272

* each of them having only one AVA. We are accessing the leftmost RDN.

273

* We are interested

274

* in replacing the AVA in it that corresponds to the "uid" attribute

275

* type, so the uid will

276

* be case sensitive ("aBc" is not the same as "ABC"). So we replace

277

* the corresponding

278

* AVA in the RDN with the new value - an array containing the

279

* user-defined string to

280

* be put in the RDN.

281

282

* Note that in most cases conversion to the canonic DN will look

283

* like this:

284

285

* <code>

286

* String canonicalDN = toCanonicalDN(distinguishedName( nonCanonical ));

287

* </code>

288

289

* @param dn is the parsed DN with the array format as described above

290

291

* @return String value containing the canonical RFC2253 DN

292

293

* @throws NullPointerException and IndexOutOfRange in case the dn is a

294

* malformed

295

* input (AVA is less than 2 elements, or null pointer encountered)

296

297

12821

public static String toCanonicalDN(String [][][] dn){

298

12821

StringBuffer sb = new StringBuffer();

299

300

65279

for (int i=0; i<dn.length; i++){

301

52458

if (i!=0){

302

39683

sb.append(COMMA_CHAR);

303

}

304

305

104916

for (int j=0; j<dn[i].length; j++){

306

52458

if (j!=0){

307

sb.append(PLUS_CHAR);

308

}

309

310

52458

sb.append(dn[i][j][0].toUpperCase()); // upcase the attribute type name

311

52458

sb.append(ASSIGN_CHAR);

312

313

52458

String t;

314

52458

if (dn[i][j].length>2 && dn[i][j][2]!=null){

315

t=dn[i][j][2];

316

}else{

317

52458

t=escapeString(dn[i][j][1]);

318

}

319

320

52458

sb.append(t);

321

}

322

}

323

324

12821

return sb.toString();

325

}

326

327

/**

328

* This method will attempt to convert a given DN to canonical DN.

329

* If it is not a DN, it will return null.

330

331

* This is the same as calling toCanonicalDN(distinguishedName(dn)),

332

* but is more convenient, because it doesn't throw exceptions.

333

334

* @param dn - the DN to convert to canonical form; can be null

335

336

* @return the canonical representation of the DN, or null, if it is

337

* not a DN.

338

339

public static String toCanonicalDN(String dn){

340

String canonical = null;

341

if (dn!=null) canonical = toCanonicalDN(distinguishedName(dn));

342

343

}catch(RFC2253ParsingException rpe){ // ignore all parsing exceptions

344

}

345

346

return canonical;

347

}

348

349

/**

350

* The name non-terminal.

351

352

* @param n - the CharacterIterator where the current position points to

353

* a distinguished name

354

* @param OSF - if true, OSF syntax is assumed; if false, RFC2253 syntax

355

* is assumed

356

357

* @return a DN array of RDN arrays of AVA arrays

358

359

12808

protected static String [][][] name(CharacterIterator n, boolean OSF) throws RFC2253ParsingException{

360

12808

Vector result = new Vector();

361

362

12808

while (true){

363

52503

result.add(name_component(n, OSF));

364

52495

skip_spaces(n);

365

366

52495

if ((!OSF && !COMMA(n.current())) || (OSF && !SLASH(n.current()))) {

367

12800

break; // no name-components will follow

368

}

369

370

39695

if (!OSF) {

371

39690

n.next(); // eat the ','

372

39690

skip_spaces(n);

373

}

374

}

375

376

12800

Object [] o = result.toArray();

377

12800

String [][][] s = new String[o.length][][];

378

65293

for (int i=0; i<s.length; i++){

379

52493

s[OSF?s.length-1-i:i] = (String [][])o[i]; // OSF names appear in the reverse order in the string - so they should be copied in reverse order

380

}

381

382

12800

return s;

383

}

384

385

/**

386

* The name-component non-terminal.

387

388

* @param ci - the CharacterIterator, where the current position points

389

* to a RDN

390

* @param OSF - if true, OSF syntax is assumed; if false, RFC2253 syntax

391

* is assumed

392

393

* @return an RDN array of AVA arrays

394

395

52503

protected static String [][] name_component(CharacterIterator ci, boolean OSF) throws RFC2253ParsingException{

396

52503

if (OSF) { // if OSF-style DN, slash and spaces were not skipped yet

397

398

result.add(attributeTypeAndValue(ci, OSF));

399

}

400

401

52503

Vector result = new Vector();

402

403

52503

while(true){

404

52506

405

52498

if ((!OSF && !PLUS(ci.current())) || (OSF && !COMMA(ci.current())))

406

407

52498

408

52495

break; // no attributeTypeAndValues will follow

409

410

411

412

String [][] s = new String[o.length][];

413

}

414

415

52495

Object [] o = result.toArray();

416

52495

417

104993

for (int i=0; i<s.length; i++){

418

52498

s[i] = (String [])o[i];

419

}

420

421

52495

return s;

422

}

423

424

/**

425

* The attributeTypeAndValue non-terminal.

426

427

* @param ci - the CharacterIterator, where the current position points

428

* to an AVA

429

* @param OSF - if true, OSF syntax is assumed; if false, RFC2253 syntax

430

* is assumed

431

432

* @return an AVA array (two elements: at 0 - attribute type,

433

* at 1 or 2 - attribute value)

434

435

52506

protected static String [] attributeTypeAndValue(CharacterIterator ci, boolean OSF) throws RFC2253ParsingException{

436

52506

String [] pair = new String[2];

437

438

52506

pair[0] = attributeType(ci, OSF);

439

440

52506

if (!ASSIGNMENT(ci.current()) || pair[0]==null){ // pair[0]==null only if it is OSF and there was no valid attribute Type

441

442

52506

443

if (!OSF) throw new RFC2253ParsingException("Assignment mark ('"+ASSIGN_CHAR+"') expected");

444

} else {

445

52500

446

52500

pair = new String[] { pair[0], null, pair[1] };

447

}

448

449

52501

pair[1] = attributeValue(ci, OSF);

450

52498

if ( pair[1].startsWith("#") ){

451

452

}

453

454

52498

return pair;

455

}

456

457

/**

458

* The attributeType non-terminal. Seems, there is a typo in the RFC:

459

* <code>attributeType = (ALPHA 1*keychar) / oid</code>

460

* should perhaps read

461

* <code>attributeType = (ALPHA *keychar) / oid</code>

462

* Otherwise, attributeType L (locality) would not be accepted.

463

464

* @param ci - the CharacterIterator, where the current position points

465

* to an attribute type

466

* @param OSF - if true, OSF syntax is assumed; if false, RFC2253 syntax

467

* is assumed

468

469

* @return an attribute type as an "oid.<dotted OID>" or the type

470

471

52506

protected static String attributeType(CharacterIterator ci, boolean OSF) throws RFC2253ParsingException{

472

52506

473

474

52506

int currentPos = ci.getIndex();

475

476

52506

ci.setIndex(currentPos); // restart from where the OID started

477

52506

result.append(oid(ci));

478

}catch(RFC2253ParsingException ex){

479

52501

480

481

52501

}while(keychar(c=ci.next()));

482

if (ALPHA(c=ci.current())){

483

52501

do{

484

86669

result.append(c);

485

486

487

52501

if (OSF && !ASSIGNMENT(c)) { // if it is OSF name, '=' should follow immediately

488

ci.setIndex(currentPos); // if there was no '=', then it is just a value, without any attribute type

489

// restore the position from which parsing should continue

490

return null; // return null attribute type

491

}

492

}else{

493

if (OSF) return null; // non-alphanumeric character encountered - it must be an attribute value

494

throw new RFC2253ParsingException("attributeType expected");

495

}

496

}

497

498

52505

protected static boolean keychar(char c){

499

}

500

501

502

/**

503

* The keychar terminal. Someone could call it a non-terminal, but since

504

* it represents the smallest granularity of the input, it is a terminal.

505

506

* @param c - the character to test

507

508

* @return true, if it is a keychar (HYPHEN_CHAR or ALPHA(c) or

509

* DIGIT(c))

510

511

86669

512

86669

return c==HYPHEN_CHAR || ALPHA(c) || DIGIT(c);

513

}

514

515

516

/**

517

* The oid non-terminal.

518

519

* @param ci - the CharacterIterator, where the current position points

520

* to an attribute type expressed as an OID

521

522

* @return the OID string without "oid." prefix

523

524

52506

protected static String oid(CharacterIterator ci) throws RFC2253ParsingException{

525

52506

char [] OID_string = {O_CHAR, I_CHAR, D_CHAR, DOT_CHAR};

526

52506

char [] oid_string = {o_CHAR, i_CHAR, d_CHAR, DOT_CHAR};

527

52506

if (c==oid_string[0]){ // let's see if it starts with an "oid." string

528

52506

illegal_oid:

529

do{ // this loop is needed only to break properly

530

// is it a good style of programming?

531

// ...reckoning that return statement

532

533

52506

c=ci.current();

534

535

52506

536

12473

for (int i=0; i<oid_string.length; i++, ci.next()){

537

12468

if (ci.current()!=oid_string[i]){

538

6224

break illegal_oid;

539

}

540

}

541

}else{

542

46277

if (c==OID_string[0]){ // let's see if it starts with an "OID." string

543

40953

for (int i=0; i<OID_string.length; i++, ci.next()){

544

40952

if (ci.current()!=OID_string[i]){

545

20474

break illegal_oid;

546

}

547

}

548

}

549

}

550

551

25808

if (!DIGIT(ci.current())) break illegal_oid;

552

25808

553

554

do{ result.append(ci.current()); }while(DIGIT(ci.next()));

555

556

while(ci.current()==DOT_CHAR){

557

result.append(ci.current()); // add dot once

558

559

if (!DIGIT(ci.next())) break illegal_oid;

560

do{ result.append(ci.current()); }while(DIGIT(ci.next()));

561

}

562

563

throw new RFC2253ParsingException("Valid OID specification expected");

564

565

}while(false);

566

567

52501

568

}

569

570

571

/**

572

* The attributeValue non-terminal.

573

574

* @param ci - the CharacterIterator, where the current position points

575

* to an attribute value

576

* @param OSF - if true, OSF syntax is assumed; if false, RFC2253 syntax

577

* is assumed

578

579

* @return attribute value

580

581

52501

protected static String attributeValue(CharacterIterator ci, boolean OSF) throws RFC2253ParsingException{

582

52501

583

584

52501

String s = string(ci, OSF);

585

586

52498

protected static String string(CharacterIterator ci, boolean OSF) throws RFC2253ParsingException{

587

588

52498

return s;

589

590

}

591

592

/**

593

* The string non-terminal. The specification is not quite clear about

594

* the trailing space characters. Is it still possible to have a value

595

* '\ hi hix\ '? I am implementing it as if it were possible, though,

596

* the syntax does not talk about escaping space in such a way.

597

598

* @param ci - the CharacterIterator, where the current position points

599

* to a string value of an attribute

600

* @param OSF - if true, OSF syntax is assumed; if false, RFC2253 syntax

601

* is assumed

602

603

* @return unescaped string value

604

605

52501

606

52501

607

608

52501

char c = ci.current();

609

52501

if (c==HASH_CHAR && !OSF){

610

return hexstring(ci); // this is faster a little bit

611

612

613

// than appending it to the result first

614

}else{

615

52499

if (QUOTATION(c, OSF)){

616

ci.next(); // eat it

617

618

while(!QUOTATION(c=ci.current(), OSF)){

619

620

if (quotechar(c, OSF)){

621

result.append(c);

622

result.append(pair(ci, OSF));

623

}else{

624

625

}

626

}

627

}catch(RFC2253ParsingException ex){

628

throw new RFC2253ParsingException("Quotation character (["+(OSF?APOSTROPHE_CHAR:QUOTE_CHAR)+"]) expected", ex);

629

}

630

631

ci.next(); // eat the QUOTE_CHAR

632

}else{

633

52490

int spaces = -1; // it shows the index of where the bare spaces started, or -1, if no spaces encountered

634

52490

int currentPos=0; // though, it is set before the pair()

635

52490

if (spaces<0) spaces=ci.getIndex();

636

52489

do{

637

431669

c = ci.current();

638

639

431670

if (c==SPACE_CHAR){

640

14228

641

14228

currentPos = ci.getIndex();

642

14228

continue;

643

}

644

645

646

417442

647

648

417442

if (stringchar(c, OSF)){

649

364942

ci.next(); // eat it

650

}else{

651

52500

c = pair(ci, OSF); // this is the way out

652

}

653

654

364951

if (spaces>-1){

655

14109

int remember = ci.getIndex();

656

657

14109

ci.setIndex(spaces);

658

14109

spaces=-1;

659

// now copy all the spaces that

660

// are to copy

661

28218

while(ci.getIndex()<currentPos){

662

14109

result.append(ci.current());

663

14109

ci.setIndex(spaces); // forget the trailing spaces

664

}

665

666

14109

ci.setIndex(remember);

667

}

668

669

364951

result.append(c);

670

671

}while(true);

672

673

}catch(RFC2253ParsingException ex){

674

}

675

676

52490

if (spaces>-1){

677

118

678

}

679

}

680

}

681

682

52496

protected static boolean quotechar(char c, boolean OSF){

683

}

684

685

686

/**

687

* The quotechar terminal.

688

689

* @param c - the character to be tested

690

* @param OSF - if true, OSF syntax is assumed; if false, RFC2253 syntax

691

* is assumed

692

693

* @return true, if c is a quotechar as defined in RFC2253; false

694

* otherwise

695

696

697

return c!=BSLASH_CHAR && !QUOTATION(c, OSF) && c!=CharacterIterator.DONE;

698

}

699

700

/**

701

* The special terminal.

702

703

* @param c - the character to be tested

704

* @param OSF - if true, OSF syntax is assumed; if false, RFC2253 syntax

705

* is assumed

706

707

* @return true, if c is a special as defined in RFC2253; false

708

* otherwise

709

710

783994

protected static boolean special(char c, boolean OSF){

711

783994

return c!=CharacterIterator.DONE && ( // semicolon is included in COMMA

712

783994

ASSIGNMENT(c) || (OSF?

713

(SLASH(c) || COMMA(c))

714

:(COMMA(c) || PLUS(c) ||

715

c==LT_CHAR || c==GT_CHAR || c==HASH_CHAR))

716

);

717

}

718

719

/**

720

* The pair non-terminal. Note that it also allows to escape a

721

* SPACE_CHAR, to be consistent with the DN-to-string conversion rules,

722

* that say that I have to allow the last space to be escaped.

723

724

* It may read multiple hex pairs escaped with "\" to fully decode

725

* the UTF-8 character.

726

727

* @param ci - the CharacterIterator, where the current position points

728

* to a character expressed through the escape character "\" and

729

* the character code

730

* @param OSF - if true, OSF syntax is assumed; if false, RFC2253 syntax

731

* is assumed

732

733

* @return unescaped character

734

735

* @throws RFC2253ParsingException, and restores the ci pointer to the

736

* position it was on input; thus acting similar to the terminals:

737

* a pointer can move over the whole entity, or it does not move at

738

* all.

739

740

52507

protected static char pair(CharacterIterator ci, boolean OSF) throws RFC2253ParsingException{

741

52507

int p = onePair( ci, OSF );

742

int i = 0x40;

743

744

if (p > 0x7f) {

745

p &= 0x7f;

746

while( (p & i) != 0 )

747

{

748

p = ((p ^ i) << 6) | (onePair( ci, OSF ) & 0x3f);

749

i <<= 5;

750

}

751

}

752

753

return (char)p;

754

}

755

756

52514

protected static int onePair(CharacterIterator ci, boolean OSF) throws RFC2253ParsingException{

757

52514

int result;

758

52514

int currentPos = ci.getIndex();

759

52514

760

761

52514

throw new RFC2253ParsingException("Backslash ('"+BSLASH_CHAR+"') escape expected");

762

52514

if (ci.current()!=BSLASH_CHAR){

763

52492

764

}

765

766

result=c=ci.next();

767

if (OSF){

768

if (c==X_CHAR || c==x_CHAR){

769

ci.next(); // skip the 'x' or 'X'

770

result=Integer.parseInt( hexpair(ci), 16 );

771

}

772

}else if (c==BSLASH_CHAR || special(c, OSF) || QUOTATION(c, OSF)

773

|| c==SPACE_CHAR){

774

result=Integer.parseInt( hexpair(ci), 16 );

775

}else{

776

777

}

778

779

return result;

780

}catch(RFC2253ParsingException ex){

781

52493

ci.setIndex(currentPos); // restore the pointer position

782

52493

throw ex;

783

}

784

}

785

786

787

/**

788

* The stringchar terminal.

789

790

* @param c - the character to be tested

791

* @param OSF - if true, OSF syntax is assumed; if false, RFC2253 syntax

792

* is assumed

793

794

* @return true, if c is a stringchar as defined in RFC2253; false

795

* otherwise

796

797

796768

protected static boolean stringchar(char c, boolean OSF){

798

796768

return c!=CharacterIterator.DONE &&

799

!special(c, OSF) &&

800

!QUOTATION(c, OSF) &&

801

c!=BSLASH_CHAR;

802

}

803

804

805

/**

806

* The hexstring non-terminal.

807

808

* @param ci - the CharacterIterator, where the current position points

809

* to a value expressed as a hexstring

810

811

* @return unescaped hexstring, where each character has the code

812

* corresponding to the hexstring

813

814

protected static String hexstring(CharacterIterator ci) throws RFC2253ParsingException{

815

StringBuffer result = new StringBuffer("#");

816

817

result.append(hexpair(ci));

818

819

while(true){

820

result.append(hexpair(ci));

821

}

822

}catch(RFC2253ParsingException ex){

823

}

824

825

protected static String hexpair(CharacterIterator ci) throws RFC2253ParsingException{

826

}

827

828

829

/**

830

* The hexpair non-terminal.

831

832

* @param ci - the CharacterIterator, where the current position points

833

* to a single hexadecimal digits pair

834

835

* @throws RFC2253ParsingException, but like pair non-terminal, restores

836

* the pointer to the initial position.

837

838

839

int currentPos = ci.getIndex();

840

841

842

if (hexchar(c=ci.current())){

843

char c1;

844

if (hexchar(c1=ci.next())){

845

return new String( new char[]{c, c1} );

846

847

}

848

}

849

850

ci.setIndex(currentPos);

851

throw new RFC2253ParsingException("Valid hexadecimal 8-bit number expected");

852

}

853

854

/**

855

* This is a utility method to return a value, corresponding to the char

856

* value.

857

* It is private, and I am sure I will use it correctly; you should

858

* not use it at all: it does not check if the input is correct.

859

860

private static int unhex(char c){

861

if (c<A_CHAR){ // it must be an ASCII '0'..'9'

862

return c-ZERO_CHAR;

863

}

864

865

if (c<a_CHAR){ // it must be an ASCII 'A'..'F'

866

return c-A_CHAR+10;

867

}

868

869

return c-a_CHAR+10; // here it is 'a'..'f'

870

}

871

872

873

/**

874

* The hexchar terminal.

875

876

* @param c - the character to be tested

877

878

* @return true, if c is a hexchar as defined in RFC2253; false

879

* otherwise

880

881

protected static boolean hexchar(char c){

882

return DIGIT(c) || (c>=A_CHAR && c<=F_CHAR) || (c>='a' && c<='f');

883

}

884

885

886

/**

887

* The DIGIT terminal.

888

889

* @param c - the character to be tested

890

891

* @return true, if c is a digit as defined in RFC2253; false

892

* otherwise

893

894

78382

protected static boolean DIGIT(char c){

895

78382

return c>=ZERO_CHAR && c<=NINE_CHAR; // 0-9

896

}

897

898

/**

899

* The ALPHA terminal.

900

901

* @param c - the character to be tested

902

903

* @return true, if c is an alpha as defined in RFC2253; false

904

* otherwise

905

906

139170

protected static boolean ALPHA(char c){

907

139170

return (c>=A_CHAR && c<=Z_CHAR) || (c>=a_CHAR && c<=z_CHAR);

908

// A-Z, a-z

909

}

910

911

/**

912

* The QUOTATION terminal.

913

914

* @param c - the character to be tested

915

* @param OSF - if true, OSF syntax is assumed; if false, RFC2253 syntax

916

* is assumed

917

918

* @return true, if c is a quotation as defined in RFC2253 or OSF; false

919

* otherwise

920

921

796853

protected static boolean QUOTATION(char c, boolean OSF){

922

796853

return c==(OSF?APOSTROPHE_CHAR:QUOTE_CHAR); // ' or "

923

}

924

925

926

/**

927

* The skip_spaces() non-terminal.

928

* <code>skip_spaces = *space</code>

929

930

* @param ci - the CharacterIterator, where the current position points

931

* to sequence of spaces

932

933

354700

protected static void skip_spaces(CharacterIterator ci){

934

354700

ci.previous();

935

358764

while(ci.next()==SPACE_CHAR);

936

}

937

938

939

/**

940

* The COMMA terminal.

941

* <code>COMMA = "," / ";"</code>

942

943

* @param c - the character to be tested

944

945

* @return true, if c is a comma as defined in RFC2253; false

946

* otherwise

947

948

836486

protected static boolean COMMA(char c){

949

836485

return c==COMMA_CHAR || c==SEMICOLON_CHAR;

950

}

951

952

953

/**

954

* The PLUS terminal.

955

* <code>PLUS = "+"</code>

956

957

* @param c - the character to be tested

958

959

* @return true, if c is a PLUS as defined in RFC2253; false

960

* otherwise

961

962

796741

protected static boolean PLUS(char c){

963

796741

return c==PLUS_CHAR;

964

}

965

966

967

/**

968

* The ASSIGNMENT terminal.

969

* <code>ASSIGNMENT = "="</code>

970

971

* @param c - the character to be tested

972

973

* @return true, if c is a assignment as defined in RFC2253; false

974

* otherwise

975

976

836510

protected static boolean ASSIGNMENT(char c){

977

836510

return c==ASSIGN_CHAR;

978

}

979

980

981

/**

982

* The SLASH terminal.

983

* <code>SLASH = "/"</code>

984

985

* @param c - the character to be tested

986

987

* @return true, if c is a slash as defined in RFC2253; false

988

* otherwise

989

990

protected static boolean SLASH(char c){

991

return c==SLASH_CHAR;

992

}

993

994

995

/**

996

* This routine converts a given byte array into a hexstring, prepended

997

* with a HASH_CHAR. The array can be empty, but not null; in the

998

* latter case an IllegalArgumentException is thrown, whilst in the

999

* former case an empty string is returned (see hexstring syntax spec).

1000

1001

* @param b - the byte array to be converted into a hexstring

1002

1003

* @return a hexstring with the leading "#", or an empty string, if

1004

* b has zero length

1005

1006

public static String toHexString(byte [] b){

1007

if (b==null) throw new IllegalArgumentException("Cannot convert null to hexstring");

1008

1009

if (b.length==0) return "";

1010

1011

StringBuffer result = new StringBuffer(HASH_CHAR);

1012

1013

for (int i=0; i<b.length; i++){

1014

result.append(intToHex(b[i]>>4));

1015

result.append(intToHex(b[i]));

1016

}

1017

1018

private static char intToHex(int a){ // don't touch this; it is mine

1019

}

1020

1021

/**

1022

* This method returns a character corresponding to a hexadecimal digit.

1023

1024

* @param a - a digit

1025

1026

* @return the ASCII character representing it

1027

1028

1029

a&=0xf;

1030

return (char)((a<10)?(ZERO_CHAR+a):

1031

(a_CHAR+a-10)); // I am using lowercase; do you mind? I find it neater.

1032

}

1033

1034

1035

/**

1036

* This routine gets a Unicode String on input, and converts any

1037

* character, that is outside latin alphabet and numbers, to hexpair,

1038

* and escapes all special characters.

1039

1040

* @param s - the string to convert

1041

1042

* @return the string where all characters outside latin alphabet have

1043

* been escaped, including spaces and other special characters

1044

1045

52492

public static String escapeString(String s){

1046

52492

char [] c = s.toCharArray();

1047

52492

if (!stringchar(c[i], false) || // thus we will escape ``=`` and ``#`` as well; but it says ``implementations MAY escape other symbols as well; though, this is for easier coding only, not for correct parsing

1048

1049

431818

for (int i=0; i<c.length; i++){

1050

379326

1051

(c[i]==SPACE_CHAR &&

1052

(i==0 || i==c.length-1)

1053

)

1054

){

1055

result.append(BSLASH_CHAR);

1056

}

1057

1058

379326

result.append(c[i]);

1059

}

1060

1061

52492

return toUTF8(result.toString());

1062

}

1063

1064

1065

/**

1066

* This routine converts the given Unicode string (in fact, even UCS-4)

1067

* into a UTF-8 representation of it, with back-slashes where

1068

* appropriate.

1069

1070

* @param s - the string to be converted into UTF-8

1071

1072

* @return a string where the characters outside latin alphabet have

1073

* been escaped with the UTF-8 code provided

1074

1075

* @see RFC2279

1076

1077

52492

private static String toUTF8(String s){

1078

52492

char [] c = s.toCharArray();

1079

52492

for (int j=0; j<a.length; j++){

1080

1081

431826

for (int i=0; i<c.length; i++){

1082

379334

if (c[i]<0x80){

1083

379320

result.append(c[i]);

1084

}else{

1085

byte [] a = toUTF8(c[i]);

1086

1087

result.append(BSLASH_CHAR);

1088

result.append(intToHex(a[j]>>4));

1089

result.append(intToHex(a[j]));

1090

}

1091

}

1092

}

1093

1094

52492