~ubuntu-branches/ubuntu/trusty/patch/trusty-security

Committer: Bazaar Package Importer
Author(s): Christoph Berg
Date: 2009-12-02 10:25:26 UTC
mfrom: (5.1.1 sid)
Revision ID: james.westby@ubuntu.com-20091202102526-5luk0zsqhghu58l2

Tags: 2.6-2

http://bugs.debian.org/558974

* Update watch file.
* Section: vcs.
* Suggests: diffutils-doc instead of diff-doc, thanks Christoph Anton
Mitterer for spotting. Closes: #558974.

files added:
VERSION

config.guess

config.sub

debian/NEWS

debian/README.source

debian/patches/558485-backupmode

debian/patches/lenny-options

gl/lib

gl/lib/argmatch.c

gl/lib/argmatch.h

gl/lib/backupfile.c

gl/lib/backupfile.h

gl/lib/basename.c

gl/lib/dirname.c

gl/lib/dirname.h

gl/lib/error.c

gl/lib/error.h

gl/lib/exitfail.c

gl/lib/exitfail.h

gl/lib/full-write.c

gl/lib/full-write.h

gl/lib/getopt.c

gl/lib/getopt.hin

gl/lib/getopt1.c

gl/lib/getopt_int.h

gl/lib/gettext.h

gl/lib/hash.c

gl/lib/hash.h

gl/lib/malloc.c

gl/lib/mbrtowc.c

gl/lib/memchr.c

gl/lib/minmax.h

gl/lib/quote.c

gl/lib/quote.h

gl/lib/quotearg.c

gl/lib/quotearg.h

gl/lib/realloc.c

gl/lib/rename.c

gl/lib/safe-read.c

gl/lib/safe-write.c

gl/lib/safe-write.h

gl/lib/stdbool.hin

gl/lib/strcasecmp.c

gl/lib/stripslash.c

gl/lib/strncasecmp.c

gl/lib/strndup.c

gl/lib/unlocked-io.h

gl/lib/verify.h

gl/lib/xalloc.h

gl/lib/xmalloc.c

gl/lib/xstrndup.c

gl/lib/xstrndup.h

gl/m4

gl/m4/argmatch.m4

gl/m4/backupfile.m4

gl/m4/d-ino.m4

gl/m4/dirname.m4

gl/m4/dos.m4

gl/m4/double-slash-root.m4

gl/m4/error.m4

gl/m4/exitfail.m4

gl/m4/extensions.m4

gl/m4/getopt.m4

gl/m4/gettext.m4

gl/m4/hash.m4

gl/m4/inline.m4

gl/m4/malloc.m4

gl/m4/mbrtowc.m4

gl/m4/mbstate_t.m4

gl/m4/memchr.m4

gl/m4/minmax.m4

gl/m4/onceonly.m4

gl/m4/quote.m4

gl/m4/quotearg.m4

gl/m4/realloc.m4

gl/m4/rename.m4

gl/m4/safe-write.m4

gl/m4/ssize_t.m4

gl/m4/stdbool.m4

gl/m4/strcase.m4

gl/m4/strndup.m4

gl/m4/unlocked-io.m4

gl/m4/utimbuf.m4

gl/m4/xalloc.m4

gl/m4/xstrndup.m4

src/bestmatch.h

src/common.h

src/diffseq.h

src/inp.c

src/inp.h

src/maketime.c

src/maketime.h

src/merge.c

src/partime.c

src/partime.h

src/patch.c

src/pch.c

src/pch.h

src/quotesys.c

src/quotesys.h

src/util.c

src/util.h

src/version.c

src/version.h

tests

tests/asymmetric-hunks

tests/backup-prefix-suffix

tests/corrupt-reject-files

tests/create-delete

tests/crlf-handling

tests/dash-o-append

tests/global-reject-files

tests/inname

tests/line-numbers

tests/merge

tests/munged-context-format

tests/need-filename

tests/no-newline-triggers-assert

tests/preserve-c-function-names

tests/preserve-mode-and-timestamp

tests/reject-format

tests/remember-backup-files

tests/remember-reject-files

tests/test-lib.sh

tests/unmodified-files

update-version.sh

files removed:
addext.c

argmatch.c

argmatch.h

backupfile.c

backupfile.h

basename.c

common.h

debian/patches/10_unified-reject-files

debian/patches/20_global-reject-file

debian/patches/30_manpage-char

dirname.c

dirname.h

error.c

error.h

getopt.c

getopt.h

getopt1.c

gettext.h

hash.c

hash.h

inp.c

inp.h

m4/backupfile.m4

m4/d-ino.m4

m4/dirname.m4

m4/dos.m4

m4/error.m4

m4/getopt.m4

m4/hash.m4

m4/malloc.m4

m4/mbrtowc.m4

m4/mbstate_t.m4

m4/memchr.m4

m4/nanosecond_stat.m4

m4/onceonly.m4

m4/quote.m4

m4/quotearg.m4

m4/realloc.m4

m4/rmdir.m4

m4/stdbool.m4

m4/unlocked-io.m4

m4/utimbuf.m4

m4/xalloc.m4

maketime.c

maketime.h

malloc.c

memchr.c

mkdir.c

partime.c

partime.h

patch.c

pch.c

pch.h

quote.c

quote.h

quotearg.c

quotearg.h

quotesys.c

quotesys.h

realloc.c

rmdir.c

stdbool.h.in

strcasecmp.c

strncasecmp.c

unlocked-io.h

util.c

util.h

version.c

version.h

xalloc.h

xmalloc.c

files modified:
AUTHORS

COPYING

ChangeLog

Makefile.in

NEWS

README

aclocal.m4

config.hin

configure

configure.ac

debian/changelog

debian/compat

debian/control

debian/patches/series

debian/rules

debian/watch

install-sh *

m4/mkdir.m4

m4/setmode.m4

mkinstalldirs *

patch.man

Show diffs side-by-side

added added

removed removed

gl/lib/hash.c

/* hash - hashing table processing.

Software Foundation, Inc.

Written by Jim Meyering, 1992.

This program is free software: you can redistribute it and/or modify

it under the terms of the GNU General Public License as published by

the Free Software Foundation; either version 3 of the License, or

(at your option) any later version.

This program is distributed in the hope that it will be useful,

but WITHOUT ANY WARRANTY; without even the implied warranty of

MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

GNU General Public License for more details.

You should have received a copy of the GNU General Public License

along with this program. If not, see <http://www.gnu.org/licenses/>. */

/* A generic hash table package. */

/* Define USE_OBSTACK to 1 if you want the allocator to use obstacks instead

of malloc. If you change USE_OBSTACK, you have to recompile! */

#include <config.h>

#include "hash.h"

#include "xalloc.h"

#include <limits.h>

#include <stdio.h>

#include <stdlib.h>

#if USE_OBSTACK

# include "obstack.h"

# ifndef obstack_chunk_alloc

# define obstack_chunk_alloc malloc

# endif

# ifndef obstack_chunk_free

# define obstack_chunk_free free

# endif

#endif

#ifndef SIZE_MAX

# define SIZE_MAX ((size_t) -1)

#endif

struct hash_table

{

/* The array of buckets starts at BUCKET and extends to BUCKET_LIMIT-1,

for a possibility of N_BUCKETS. Among those, N_BUCKETS_USED buckets

are not empty, there are N_ENTRIES active entries in the table. */

struct hash_entry *bucket;

struct hash_entry const *bucket_limit;

size_t n_buckets;

size_t n_buckets_used;

size_t n_entries;

/* Tuning arguments, kept in a physicaly separate structure. */

const Hash_tuning *tuning;

/* Three functions are given to `hash_initialize', see the documentation

block for this function. In a word, HASHER randomizes a user entry

into a number up from 0 up to some maximum minus 1; COMPARATOR returns

true if two user entries compare equally; and DATA_FREER is the cleanup

function for a user entry. */

Hash_hasher hasher;

Hash_comparator comparator;

Hash_data_freer data_freer;

/* A linked list of freed struct hash_entry structs. */

struct hash_entry *free_entry_list;

#if USE_OBSTACK

/* Whenever obstacks are used, it is possible to allocate all overflowed

entries into a single stack, so they all can be freed in a single

operation. It is not clear if the speedup is worth the trouble. */

struct obstack entry_stack;

#endif

};

/* A hash table contains many internal entries, each holding a pointer to

some user provided data (also called a user entry). An entry indistinctly

refers to both the internal entry and its associated user entry. A user

entry contents may be hashed by a randomization function (the hashing

function, or just `hasher' for short) into a number (or `slot') between 0

and the current table size. At each slot position in the hash table,

starts a linked chain of entries for which the user data all hash to this

slot. A bucket is the collection of all entries hashing to the same slot.

A good `hasher' function will distribute entries rather evenly in buckets.

In the ideal case, the length of each bucket is roughly the number of

entries divided by the table size. Finding the slot for a data is usually

done in constant time by the `hasher', and the later finding of a precise

entry is linear in time with the size of the bucket. Consequently, a

larger hash table size (that is, a larger number of buckets) is prone to

yielding shorter chains, *given* the `hasher' function behaves properly.

100

Long buckets slow down the lookup algorithm. One might use big hash table

101

sizes in hope to reduce the average length of buckets, but this might

102

become inordinate, as unused slots in the hash table take some space. The

103

best bet is to make sure you are using a good `hasher' function (beware

104

that those are not that easy to write! :-), and to use a table size

105

larger than the actual number of entries. */

106

107

/* If an insertion makes the ratio of nonempty buckets to table size larger

108

than the growth threshold (a number between 0.0 and 1.0), then increase

109

the table size by multiplying by the growth factor (a number greater than

110

1.0). The growth threshold defaults to 0.8, and the growth factor

111

defaults to 1.414, meaning that the table will have doubled its size

112

every second time 80% of the buckets get used. */

113

#define DEFAULT_GROWTH_THRESHOLD 0.8

114

#define DEFAULT_GROWTH_FACTOR 1.414

115

116

/* If a deletion empties a bucket and causes the ratio of used buckets to

117

table size to become smaller than the shrink threshold (a number between

118

0.0 and 1.0), then shrink the table by multiplying by the shrink factor (a

119

number greater than the shrink threshold but smaller than 1.0). The shrink

120

threshold and factor default to 0.0 and 1.0, meaning that the table never

121

shrinks. */

122

#define DEFAULT_SHRINK_THRESHOLD 0.0

123

#define DEFAULT_SHRINK_FACTOR 1.0

124

125

/* Use this to initialize or reset a TUNING structure to

126

some sensible values. */

127

static const Hash_tuning default_tuning =

128

{

129

DEFAULT_SHRINK_THRESHOLD,

130

DEFAULT_SHRINK_FACTOR,

131

DEFAULT_GROWTH_THRESHOLD,

132

DEFAULT_GROWTH_FACTOR,

133

false

134

};

135

136

/* Information and lookup. */

137

138

/* The following few functions provide information about the overall hash

139

table organization: the number of entries, number of buckets and maximum

140

length of buckets. */

141

142

/* Return the number of buckets in the hash table. The table size, the total

143

number of buckets (used plus unused), or the maximum number of slots, are

144

the same quantity. */

145

146

size_t

147

hash_get_n_buckets (const Hash_table *table)

148

{

149

return table->n_buckets;

150

}

151

152

/* Return the number of slots in use (non-empty buckets). */

153

154

size_t

155

hash_get_n_buckets_used (const Hash_table *table)

156

{

157

return table->n_buckets_used;

158

}

159

160

/* Return the number of active entries. */

161

162

size_t

163

hash_get_n_entries (const Hash_table *table)

164

{

165

return table->n_entries;

166

}

167

168

/* Return the length of the longest chain (bucket). */

169

170

size_t

171

hash_get_max_bucket_length (const Hash_table *table)

172

{

173

struct hash_entry const *bucket;

174

size_t max_bucket_length = 0;

175

176

for (bucket = table->bucket; bucket < table->bucket_limit; bucket++)

177

{

178

if (bucket->data)

179

{

180

struct hash_entry const *cursor = bucket;

181

size_t bucket_length = 1;

182

183

while (cursor = cursor->next, cursor)

184

bucket_length++;

185

186

if (bucket_length > max_bucket_length)

187

max_bucket_length = bucket_length;

188

}

189

}

190

191

return max_bucket_length;

192

}

193

194

/* Do a mild validation of a hash table, by traversing it and checking two

195

statistics. */

196

197

bool

198

hash_table_ok (const Hash_table *table)

199

{

200

struct hash_entry const *bucket;

201

size_t n_buckets_used = 0;

202

size_t n_entries = 0;

203

204

for (bucket = table->bucket; bucket < table->bucket_limit; bucket++)

205

{

206

if (bucket->data)

207

{

208

struct hash_entry const *cursor = bucket;

209

210

/* Count bucket head. */

211

n_buckets_used++;

212

n_entries++;

213

214

/* Count bucket overflow. */

215

while (cursor = cursor->next, cursor)

216

n_entries++;

217

}

218

}

219

220

if (n_buckets_used == table->n_buckets_used && n_entries == table->n_entries)

221

return true;

222

223

return false;

224

}

225

226

void

227

hash_print_statistics (const Hash_table *table, FILE *stream)

228

{

229

size_t n_entries = hash_get_n_entries (table);

230

size_t n_buckets = hash_get_n_buckets (table);

231

size_t n_buckets_used = hash_get_n_buckets_used (table);

232

size_t max_bucket_length = hash_get_max_bucket_length (table);

233

234

fprintf (stream, "# entries: %lu\n", (unsigned long int) n_entries);

235

fprintf (stream, "# buckets: %lu\n", (unsigned long int) n_buckets);

236

fprintf (stream, "# buckets used: %lu (%.2f%%)\n",

237

(unsigned long int) n_buckets_used,

238

(100.0 * n_buckets_used) / n_buckets);

239

fprintf (stream, "max bucket length: %lu\n",

240

(unsigned long int) max_bucket_length);

241

}

242

243

/* If ENTRY matches an entry already in the hash table, return the

244

entry from the table. Otherwise, return NULL. */

245

246

void *

247

hash_lookup (const Hash_table *table, const void *entry)

248

{

249

struct hash_entry const *bucket

250

= table->bucket + table->hasher (entry, table->n_buckets);

251

struct hash_entry const *cursor;

252

253

if (! (bucket < table->bucket_limit))

254

abort ();

255

256

if (bucket->data == NULL)

257

return NULL;

258

259

for (cursor = bucket; cursor; cursor = cursor->next)

260

if (table->comparator (entry, cursor->data))

261

return cursor->data;

262

263

return NULL;

264

}

265

266

/* Walking. */

267

268

/* The functions in this page traverse the hash table and process the

269

contained entries. For the traversal to work properly, the hash table

270

should not be resized nor modified while any particular entry is being

271

processed. In particular, entries should not be added or removed. */

272

273

/* Return the first data in the table, or NULL if the table is empty. */

274

275

void *

276

hash_get_first (const Hash_table *table)

277

{

278

struct hash_entry const *bucket;

279

280

if (table->n_entries == 0)

281

return NULL;

282

283

for (bucket = table->bucket; ; bucket++)

284

if (! (bucket < table->bucket_limit))

285

abort ();

286

else if (bucket->data)

287

return bucket->data;

288

}

289

290

/* Return the user data for the entry following ENTRY, where ENTRY has been

291

returned by a previous call to either `hash_get_first' or `hash_get_next'.

292

Return NULL if there are no more entries. */

293

294

void *

295

hash_get_next (const Hash_table *table, const void *entry)

296

{

297

struct hash_entry const *bucket

298

= table->bucket + table->hasher (entry, table->n_buckets);

299

struct hash_entry const *cursor;

300

301

if (! (bucket < table->bucket_limit))

302

abort ();

303

304

/* Find next entry in the same bucket. */

305

for (cursor = bucket; cursor; cursor = cursor->next)

306

if (cursor->data == entry && cursor->next)

307

return cursor->next->data;

308

309

/* Find first entry in any subsequent bucket. */

310

while (++bucket < table->bucket_limit)

311

if (bucket->data)

312

return bucket->data;

313

314

/* None found. */

315

return NULL;

316

}

317

318

/* Fill BUFFER with pointers to active user entries in the hash table, then

319

return the number of pointers copied. Do not copy more than BUFFER_SIZE

320

pointers. */

321

322

size_t

323

hash_get_entries (const Hash_table *table, void **buffer,

324

size_t buffer_size)

325

{

326

size_t counter = 0;

327

struct hash_entry const *bucket;

328

struct hash_entry const *cursor;

329

330

for (bucket = table->bucket; bucket < table->bucket_limit; bucket++)

331

{

332

if (bucket->data)

333

{

334

for (cursor = bucket; cursor; cursor = cursor->next)

335

{

336

if (counter >= buffer_size)

337

return counter;

338

buffer[counter++] = cursor->data;

339

}

340

}

341

}

342

343

return counter;

344

}

345

346

/* Call a PROCESSOR function for each entry of a hash table, and return the

347

number of entries for which the processor function returned success. A

348

pointer to some PROCESSOR_DATA which will be made available to each call to

349

the processor function. The PROCESSOR accepts two arguments: the first is

350

the user entry being walked into, the second is the value of PROCESSOR_DATA

351

as received. The walking continue for as long as the PROCESSOR function

352

returns nonzero. When it returns zero, the walking is interrupted. */

353

354

size_t

355

hash_do_for_each (const Hash_table *table, Hash_processor processor,

356

void *processor_data)

357

{

358

size_t counter = 0;

359

struct hash_entry const *bucket;

360

struct hash_entry const *cursor;

361

362

for (bucket = table->bucket; bucket < table->bucket_limit; bucket++)

363

{

364

if (bucket->data)

365

{

366

for (cursor = bucket; cursor; cursor = cursor->next)

367

{

368

if (!(*processor) (cursor->data, processor_data))

369

return counter;

370

counter++;

371

}

372

}

373

}

374

375

return counter;

376

}

377

378

/* Allocation and clean-up. */

379

380

/* Return a hash index for a NUL-terminated STRING between 0 and N_BUCKETS-1.

381

This is a convenience routine for constructing other hashing functions. */

382

383

#if USE_DIFF_HASH

384

385

/* About hashings, Paul Eggert writes to me (FP), on 1994-01-01: "Please see

386

B. J. McKenzie, R. Harries & T. Bell, Selecting a hashing algorithm,

387

Software--practice & experience 20, 2 (Feb 1990), 209-224. Good hash

388

algorithms tend to be domain-specific, so what's good for [diffutils'] io.c

389

may not be good for your application." */

390

391

size_t

392

hash_string (const char *string, size_t n_buckets)

393

{

394

# define ROTATE_LEFT(Value, Shift) \

395

((Value) << (Shift) | (Value) >> ((sizeof (size_t) * CHAR_BIT) - (Shift)))

396

# define HASH_ONE_CHAR(Value, Byte) \

397

((Byte) + ROTATE_LEFT (Value, 7))

398

399

size_t value = 0;

400

unsigned char ch;

401

402

for (; (ch = *string); string++)

403

value = HASH_ONE_CHAR (value, ch);

404

return value % n_buckets;

405

406

# undef ROTATE_LEFT

407

# undef HASH_ONE_CHAR

408

}

409

410

#else /* not USE_DIFF_HASH */

411

412

/* This one comes from `recode', and performs a bit better than the above as

413

per a few experiments. It is inspired from a hashing routine found in the

414

very old Cyber `snoop', itself written in typical Greg Mansfield style.

415

(By the way, what happened to this excellent man? Is he still alive?) */

416

417

size_t

418

hash_string (const char *string, size_t n_buckets)

419

{

420

size_t value = 0;

421

unsigned char ch;

422

423

for (; (ch = *string); string++)

424

value = (value * 31 + ch) % n_buckets;

425

return value;

426

}

427

428

#endif /* not USE_DIFF_HASH */

429

430

/* Return true if CANDIDATE is a prime number. CANDIDATE should be an odd

431

number at least equal to 11. */

432

433

static bool

434

is_prime (size_t candidate)

435

{

436

size_t divisor = 3;

437

size_t square = divisor * divisor;

438

439

while (square < candidate && (candidate % divisor))

440

{

441

divisor++;

442

square += 4 * divisor;

443

divisor++;

444

}

445

446

return (candidate % divisor ? true : false);

447

}

448

449

/* Round a given CANDIDATE number up to the nearest prime, and return that

450

prime. Primes lower than 10 are merely skipped. */

451

452

static size_t

453

next_prime (size_t candidate)

454

{

455

/* Skip small primes. */

456

if (candidate < 10)

457

candidate = 10;

458

459

/* Make it definitely odd. */

460

candidate |= 1;

461

462

while (!is_prime (candidate))

463

candidate += 2;

464

465

return candidate;

466

}

467

468

void

469

hash_reset_tuning (Hash_tuning *tuning)

470

{

471

*tuning = default_tuning;

472

}

473

474

/* For the given hash TABLE, check the user supplied tuning structure for

475

reasonable values, and return true if there is no gross error with it.

476

Otherwise, definitively reset the TUNING field to some acceptable default

477

in the hash table (that is, the user loses the right of further modifying

478

tuning arguments), and return false. */

479

480

static bool

481

check_tuning (Hash_table *table)

482

{

483

const Hash_tuning *tuning = table->tuning;

484

485

/* Be a bit stricter than mathematics would require, so that

486

rounding errors in size calculations do not cause allocations to

487

fail to grow or shrink as they should. The smallest allocation

488

is 11 (due to next_prime's algorithm), so an epsilon of 0.1

489

should be good enough. */

490

float epsilon = 0.1f;

491

492

if (epsilon < tuning->growth_threshold

493

&& tuning->growth_threshold < 1 - epsilon

494

&& 1 + epsilon < tuning->growth_factor

495

&& 0 <= tuning->shrink_threshold

496

&& tuning->shrink_threshold + epsilon < tuning->shrink_factor

497

&& tuning->shrink_factor <= 1

498

&& tuning->shrink_threshold + epsilon < tuning->growth_threshold)

499

return true;

500

501

table->tuning = &default_tuning;

502

return false;

503

}

504

505

/* Allocate and return a new hash table, or NULL upon failure. The initial

506

number of buckets is automatically selected so as to _guarantee_ that you

507

may insert at least CANDIDATE different user entries before any growth of

508

the hash table size occurs. So, if have a reasonably tight a-priori upper

509

bound on the number of entries you intend to insert in the hash table, you

510

may save some table memory and insertion time, by specifying it here. If

511

the IS_N_BUCKETS field of the TUNING structure is true, the CANDIDATE

512

argument has its meaning changed to the wanted number of buckets.

513

514

TUNING points to a structure of user-supplied values, in case some fine

515

tuning is wanted over the default behavior of the hasher. If TUNING is

516

NULL, the default tuning parameters are used instead.

517

518

The user-supplied HASHER function should be provided. It accepts two

519

arguments ENTRY and TABLE_SIZE. It computes, by hashing ENTRY contents, a

520

slot number for that entry which should be in the range 0..TABLE_SIZE-1.

521

This slot number is then returned.

522

523

The user-supplied COMPARATOR function should be provided. It accepts two

524

arguments pointing to user data, it then returns true for a pair of entries

525

that compare equal, or false otherwise. This function is internally called

526

on entries which are already known to hash to the same bucket index.

527

528

The user-supplied DATA_FREER function, when not NULL, may be later called

529

with the user data as an argument, just before the entry containing the

530

data gets freed. This happens from within `hash_free' or `hash_clear'.

531

You should specify this function only if you want these functions to free

532

all of your `data' data. This is typically the case when your data is

533

simply an auxiliary struct that you have malloc'd to aggregate several

534

values. */

535

536

Hash_table *

537

hash_initialize (size_t candidate, const Hash_tuning *tuning,

538

Hash_hasher hasher, Hash_comparator comparator,

539

Hash_data_freer data_freer)

540

{

541

Hash_table *table;

542

543

if (hasher == NULL || comparator == NULL)

544

return NULL;

545

546

table = malloc (sizeof *table);

547

if (table == NULL)

548

return NULL;

549

550

if (!tuning)

551

tuning = &default_tuning;

552

table->tuning = tuning;

553

if (!check_tuning (table))

554

{

555

/* Fail if the tuning options are invalid. This is the only occasion

556

when the user gets some feedback about it. Once the table is created,

557

if the user provides invalid tuning options, we silently revert to

558

using the defaults, and ignore further request to change the tuning

559

options. */

560

goto fail;

561

}

562

563

if (!tuning->is_n_buckets)

564

{

565

float new_candidate = candidate / tuning->growth_threshold;

566

if (SIZE_MAX <= new_candidate)

567

goto fail;

568

candidate = new_candidate;

569

}

570

571

if (xalloc_oversized (candidate, sizeof *table->bucket))

572

goto fail;

573

table->n_buckets = next_prime (candidate);

574

if (xalloc_oversized (table->n_buckets, sizeof *table->bucket))

575

goto fail;

576

577

table->bucket = calloc (table->n_buckets, sizeof *table->bucket);

578

if (table->bucket == NULL)

579

goto fail;

580

table->bucket_limit = table->bucket + table->n_buckets;

581

table->n_buckets_used = 0;

582

table->n_entries = 0;

583

584

table->hasher = hasher;

585

table->comparator = comparator;

586

table->data_freer = data_freer;

587

588

table->free_entry_list = NULL;

589

#if USE_OBSTACK

590

obstack_init (&table->entry_stack);

591

#endif

592

return table;

593

594

fail:

595

free (table);

596

return NULL;

597

}

598

599

/* Make all buckets empty, placing any chained entries on the free list.

600

Apply the user-specified function data_freer (if any) to the datas of any

601

affected entries. */

602

603

void

604

hash_clear (Hash_table *table)

605

{

606

struct hash_entry *bucket;

607

608

for (bucket = table->bucket; bucket < table->bucket_limit; bucket++)

609

{

610

if (bucket->data)

611

{

612

struct hash_entry *cursor;

613

struct hash_entry *next;

614

615

/* Free the bucket overflow. */

616

for (cursor = bucket->next; cursor; cursor = next)

617

{

618

if (table->data_freer)

619

(*table->data_freer) (cursor->data);

620

cursor->data = NULL;

621

622

next = cursor->next;

623

/* Relinking is done one entry at a time, as it is to be expected

624

that overflows are either rare or short. */

625

cursor->next = table->free_entry_list;

626

table->free_entry_list = cursor;

627

}

628

629

/* Free the bucket head. */

630

if (table->data_freer)

631

(*table->data_freer) (bucket->data);

632

bucket->data = NULL;

633

bucket->next = NULL;

634

}

635

}

636

637

table->n_buckets_used = 0;

638

table->n_entries = 0;

639

}

640

641

/* Reclaim all storage associated with a hash table. If a data_freer

642

function has been supplied by the user when the hash table was created,

643

this function applies it to the data of each entry before freeing that

644

entry. */

645

646

void

647

hash_free (Hash_table *table)

648

{

649

struct hash_entry *bucket;

650

struct hash_entry *cursor;

651

struct hash_entry *next;

652

653

/* Call the user data_freer function. */

654

if (table->data_freer && table->n_entries)

655

{

656

for (bucket = table->bucket; bucket < table->bucket_limit; bucket++)

657

{

658

if (bucket->data)

659

{

660

for (cursor = bucket; cursor; cursor = cursor->next)

661

{

662

(*table->data_freer) (cursor->data);

663

}

664

}

665

}

666

}

667

668

#if USE_OBSTACK

669

670

obstack_free (&table->entry_stack, NULL);

671

672

#else

673

674

/* Free all bucket overflowed entries. */

675

for (bucket = table->bucket; bucket < table->bucket_limit; bucket++)

676

{

677

for (cursor = bucket->next; cursor; cursor = next)

678

{

679

next = cursor->next;

680

free (cursor);

681

}

682

}

683

684

/* Also reclaim the internal list of previously freed entries. */

685

for (cursor = table->free_entry_list; cursor; cursor = next)

686

{

687

next = cursor->next;

688

free (cursor);

689

}

690

691

#endif

692

693

/* Free the remainder of the hash table structure. */

694

free (table->bucket);

695

free (table);

696

}

697

698

/* Insertion and deletion. */

699

700

/* Get a new hash entry for a bucket overflow, possibly by reclying a

701

previously freed one. If this is not possible, allocate a new one. */

702

703

static struct hash_entry *

704

allocate_entry (Hash_table *table)

705

{

706

struct hash_entry *new;

707

708

if (table->free_entry_list)

709

{

710

new = table->free_entry_list;

711

table->free_entry_list = new->next;

712

}

713

else

714

{

715

#if USE_OBSTACK

716

new = obstack_alloc (&table->entry_stack, sizeof *new);

717

#else

718

new = malloc (sizeof *new);

719

#endif

720

}

721

722

return new;

723

}

724

725

/* Free a hash entry which was part of some bucket overflow,

726

saving it for later recycling. */

727

728

static void

729

free_entry (Hash_table *table, struct hash_entry *entry)

730

{

731

entry->data = NULL;

732

entry->next = table->free_entry_list;

733

table->free_entry_list = entry;

734

}

735

736

/* This private function is used to help with insertion and deletion. When

737

ENTRY matches an entry in the table, return a pointer to the corresponding

738

user data and set *BUCKET_HEAD to the head of the selected bucket.

739

Otherwise, return NULL. When DELETE is true and ENTRY matches an entry in

740

the table, unlink the matching entry. */

741

742

static void *

743

hash_find_entry (Hash_table *table, const void *entry,

744

struct hash_entry **bucket_head, bool delete)

745

{

746

struct hash_entry *bucket

747

= table->bucket + table->hasher (entry, table->n_buckets);

748

struct hash_entry *cursor;

749

750

if (! (bucket < table->bucket_limit))

751

abort ();

752

753

*bucket_head = bucket;

754

755

/* Test for empty bucket. */

756

if (bucket->data == NULL)

757

return NULL;

758

759

/* See if the entry is the first in the bucket. */

760

if ((*table->comparator) (entry, bucket->data))

761

{

762

void *data = bucket->data;

763

764

if (delete)

765

{

766

if (bucket->next)

767

{

768

struct hash_entry *next = bucket->next;

769

770

/* Bump the first overflow entry into the bucket head, then save

771

the previous first overflow entry for later recycling. */

772

*bucket = *next;

773

free_entry (table, next);

774

}

775

else

776

{

777

bucket->data = NULL;

778

}

779

}

780

781

return data;

782

}

783

784

/* Scan the bucket overflow. */

785

for (cursor = bucket; cursor->next; cursor = cursor->next)

786

{

787

if ((*table->comparator) (entry, cursor->next->data))

788

{

789

void *data = cursor->next->data;

790

791

if (delete)

792

{

793

struct hash_entry *next = cursor->next;

794

795

/* Unlink the entry to delete, then save the freed entry for later

796

recycling. */

797

cursor->next = next->next;

798

free_entry (table, next);

799

}

800

801

return data;

802

}

803

}

804

805

/* No entry found. */

806

return NULL;

807

}

808

809

/* For an already existing hash table, change the number of buckets through

810

specifying CANDIDATE. The contents of the hash table are preserved. The

811

new number of buckets is automatically selected so as to _guarantee_ that

812

the table may receive at least CANDIDATE different user entries, including

813

those already in the table, before any other growth of the hash table size

814

occurs. If TUNING->IS_N_BUCKETS is true, then CANDIDATE specifies the

815

exact number of buckets desired. */

816

817

bool

818

hash_rehash (Hash_table *table, size_t candidate)

819

{

820

Hash_table *new_table;

821

struct hash_entry *bucket;

822

struct hash_entry *cursor;

823

struct hash_entry *next;

824

825

new_table = hash_initialize (candidate, table->tuning, table->hasher,

826

table->comparator, table->data_freer);

827

if (new_table == NULL)

828

return false;

829

830

/* Merely reuse the extra old space into the new table. */

831

#if USE_OBSTACK

832

obstack_free (&new_table->entry_stack, NULL);

833

new_table->entry_stack = table->entry_stack;

834

#endif

835

new_table->free_entry_list = table->free_entry_list;

836

837

for (bucket = table->bucket; bucket < table->bucket_limit; bucket++)

838

if (bucket->data)

839

for (cursor = bucket; cursor; cursor = next)

840

{

841

void *data = cursor->data;

842

struct hash_entry *new_bucket

843

= (new_table->bucket

844

+ new_table->hasher (data, new_table->n_buckets));

845

846

if (! (new_bucket < new_table->bucket_limit))

847

abort ();

848

849

next = cursor->next;

850

851

if (new_bucket->data)

852

{

853

if (cursor == bucket)

854

{

855

/* Allocate or recycle an entry, when moving from a bucket

856

header into a bucket overflow. */

857

struct hash_entry *new_entry = allocate_entry (new_table);

858

859

if (new_entry == NULL)

860

return false;

861

862

new_entry->data = data;

863

new_entry->next = new_bucket->next;

864

new_bucket->next = new_entry;

865

}

866

else

867

{

868

/* Merely relink an existing entry, when moving from a

869

bucket overflow into a bucket overflow. */

870

cursor->next = new_bucket->next;

871

new_bucket->next = cursor;

872

}

873

}

874

else

875

{

876

/* Free an existing entry, when moving from a bucket

877

overflow into a bucket header. Also take care of the

878

simple case of moving from a bucket header into a bucket

879

header. */

880

new_bucket->data = data;

881

new_table->n_buckets_used++;

882

if (cursor != bucket)

883

free_entry (new_table, cursor);

884

}

885

}

886

887

free (table->bucket);

888

table->bucket = new_table->bucket;

889

table->bucket_limit = new_table->bucket_limit;

890

table->n_buckets = new_table->n_buckets;

891

table->n_buckets_used = new_table->n_buckets_used;

892

table->free_entry_list = new_table->free_entry_list;

893

/* table->n_entries already holds its value. */

894

#if USE_OBSTACK

895

table->entry_stack = new_table->entry_stack;

896

#endif

897

free (new_table);

898

899

return true;

900

}

901

902

/* If ENTRY matches an entry already in the hash table, return the pointer

903

to the entry from the table. Otherwise, insert ENTRY and return ENTRY.

904

Return NULL if the storage required for insertion cannot be allocated. */

905

906

void *

907

hash_insert (Hash_table *table, const void *entry)

908

{

909

void *data;

910

struct hash_entry *bucket;

911

912

/* The caller cannot insert a NULL entry. */

913

if (! entry)

914

abort ();

915

916

/* If there's a matching entry already in the table, return that. */

917

if ((data = hash_find_entry (table, entry, &bucket, false)) != NULL)

918

return data;

919

920

/* ENTRY is not matched, it should be inserted. */

921

922

if (bucket->data)

923

{

924

struct hash_entry *new_entry = allocate_entry (table);

925

926

if (new_entry == NULL)

927

return NULL;

928

929

/* Add ENTRY in the overflow of the bucket. */

930

931

new_entry->data = (void *) entry;

932

new_entry->next = bucket->next;

933

bucket->next = new_entry;

934

table->n_entries++;

935

return (void *) entry;

936

}

937

938

/* Add ENTRY right in the bucket head. */

939

940

bucket->data = (void *) entry;

941

table->n_entries++;

942

table->n_buckets_used++;

943

944

/* If the growth threshold of the buckets in use has been reached, increase

945

the table size and rehash. There's no point in checking the number of

946

entries: if the hashing function is ill-conditioned, rehashing is not

947

likely to improve it. */

948

949

if (table->n_buckets_used

950

> table->tuning->growth_threshold * table->n_buckets)

951

{

952

/* Check more fully, before starting real work. If tuning arguments

953

became invalid, the second check will rely on proper defaults. */

954

check_tuning (table);

955

if (table->n_buckets_used

956

> table->tuning->growth_threshold * table->n_buckets)

957

{

958

const Hash_tuning *tuning = table->tuning;

959

float candidate =

960

(tuning->is_n_buckets

961

? (table->n_buckets * tuning->growth_factor)

962

: (table->n_buckets * tuning->growth_factor

963

* tuning->growth_threshold));

964

965

if (SIZE_MAX <= candidate)

966

return NULL;

967

968

/* If the rehash fails, arrange to return NULL. */

969

if (!hash_rehash (table, candidate))

970

entry = NULL;

971

}

972

}

973

974

return (void *) entry;

975

}

976

977

/* If ENTRY is already in the table, remove it and return the just-deleted

978

data (the user may want to deallocate its storage). If ENTRY is not in the

979

table, don't modify the table and return NULL. */

980

981

void *

982

hash_delete (Hash_table *table, const void *entry)

983

{

984

void *data;

985

struct hash_entry *bucket;

986

987

data = hash_find_entry (table, entry, &bucket, true);

988

if (!data)

989

return NULL;

990

991

table->n_entries--;

992

if (!bucket->data)

993

{

994

table->n_buckets_used--;

995

996

/* If the shrink threshold of the buckets in use has been reached,

997

rehash into a smaller table. */

998

999

if (table->n_buckets_used

1000

< table->tuning->shrink_threshold * table->n_buckets)

1001

{

1002

/* Check more fully, before starting real work. If tuning arguments

1003

became invalid, the second check will rely on proper defaults. */

1004

check_tuning (table);

1005

if (table->n_buckets_used

1006

< table->tuning->shrink_threshold * table->n_buckets)

1007

{

1008

const Hash_tuning *tuning = table->tuning;

1009

size_t candidate =

1010

(tuning->is_n_buckets

1011

? table->n_buckets * tuning->shrink_factor

1012

: (table->n_buckets * tuning->shrink_factor

1013

* tuning->growth_threshold));

1014

1015

hash_rehash (table, candidate);

1016

}

1017

}

1018

}

1019

1020

return data;

1021

}

1022

1023

/* Testing. */

1024

1025

#if TESTING

1026

1027

void

1028

hash_print (const Hash_table *table)

1029

{

1030

struct hash_entry const *bucket;

1031

1032

for (bucket = table->bucket; bucket < table->bucket_limit; bucket++)

1033

{

1034

struct hash_entry *cursor;

1035

1036

if (bucket)

1037

printf ("%lu:\n", (unsigned long int) (bucket - table->bucket));

1038

1039

for (cursor = bucket; cursor; cursor = cursor->next)

1040

{

1041

char const *s = cursor->data;

1042

/* FIXME */

1043

if (s)

1044

printf (" %s\n", s);

1045

}

1046

}

1047

}

1048

1049

#endif /* TESTING */

Older »