hashtable.c 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703
  1. /*
  2. * This implementation is based on code from uClibc-0.9.30.3 but was
  3. * modified and extended for use within U-Boot.
  4. *
  5. * Copyright (C) 2010 Wolfgang Denk <wd@denx.de>
  6. *
  7. * Original license header:
  8. *
  9. * Copyright (C) 1993, 1995, 1996, 1997, 2002 Free Software Foundation, Inc.
  10. * This file is part of the GNU C Library.
  11. * Contributed by Ulrich Drepper <drepper@gnu.ai.mit.edu>, 1993.
  12. *
  13. * The GNU C Library is free software; you can redistribute it and/or
  14. * modify it under the terms of the GNU Lesser General Public
  15. * License as published by the Free Software Foundation; either
  16. * version 2.1 of the License, or (at your option) any later version.
  17. *
  18. * The GNU C Library is distributed in the hope that it will be useful,
  19. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  20. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  21. * Lesser General Public License for more details.
  22. *
  23. * You should have received a copy of the GNU Lesser General Public
  24. * License along with the GNU C Library; if not, write to the Free
  25. * Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
  26. * 02111-1307 USA.
  27. */
  28. #include <errno.h>
  29. #include <malloc.h>
  30. #ifdef USE_HOSTCC /* HOST build */
  31. # include <string.h>
  32. # include <assert.h>
  33. # ifndef debug
  34. # ifdef DEBUG
  35. # define debug(fmt,args...) printf(fmt ,##args)
  36. # else
  37. # define debug(fmt,args...)
  38. # endif
  39. # endif
  40. #else /* U-Boot build */
  41. # include <common.h>
  42. # include <linux/string.h>
  43. #endif
  44. #ifndef CONFIG_ENV_MIN_ENTRIES /* minimum number of entries */
  45. #define CONFIG_ENV_MIN_ENTRIES 64
  46. #endif
  47. #ifndef CONFIG_ENV_MAX_ENTRIES /* maximum number of entries */
  48. #define CONFIG_ENV_MAX_ENTRIES 512
  49. #endif
  50. #include "search.h"
  51. /*
  52. * [Aho,Sethi,Ullman] Compilers: Principles, Techniques and Tools, 1986
  53. * [Knuth] The Art of Computer Programming, part 3 (6.4)
  54. */
  55. /*
  56. * The reentrant version has no static variables to maintain the state.
  57. * Instead the interface of all functions is extended to take an argument
  58. * which describes the current status.
  59. */
  60. typedef struct _ENTRY {
  61. unsigned int used;
  62. ENTRY entry;
  63. } _ENTRY;
  64. /*
  65. * hcreate()
  66. */
  67. /*
  68. * For the used double hash method the table size has to be a prime. To
  69. * correct the user given table size we need a prime test. This trivial
  70. * algorithm is adequate because
  71. * a) the code is (most probably) called a few times per program run and
  72. * b) the number is small because the table must fit in the core
  73. * */
  74. static int isprime(unsigned int number)
  75. {
  76. /* no even number will be passed */
  77. unsigned int div = 3;
  78. while (div * div < number && number % div != 0)
  79. div += 2;
  80. return number % div != 0;
  81. }
  82. /*
  83. * Before using the hash table we must allocate memory for it.
  84. * Test for an existing table are done. We allocate one element
  85. * more as the found prime number says. This is done for more effective
  86. * indexing as explained in the comment for the hsearch function.
  87. * The contents of the table is zeroed, especially the field used
  88. * becomes zero.
  89. */
  90. int hcreate_r(size_t nel, struct hsearch_data *htab)
  91. {
  92. /* Test for correct arguments. */
  93. if (htab == NULL) {
  94. __set_errno(EINVAL);
  95. return 0;
  96. }
  97. /* There is still another table active. Return with error. */
  98. if (htab->table != NULL)
  99. return 0;
  100. /* Change nel to the first prime number not smaller as nel. */
  101. nel |= 1; /* make odd */
  102. while (!isprime(nel))
  103. nel += 2;
  104. htab->size = nel;
  105. htab->filled = 0;
  106. /* allocate memory and zero out */
  107. htab->table = (_ENTRY *) calloc(htab->size + 1, sizeof(_ENTRY));
  108. if (htab->table == NULL)
  109. return 0;
  110. /* everything went alright */
  111. return 1;
  112. }
  113. /*
  114. * hdestroy()
  115. */
  116. /*
  117. * After using the hash table it has to be destroyed. The used memory can
  118. * be freed and the local static variable can be marked as not used.
  119. */
  120. void hdestroy_r(struct hsearch_data *htab)
  121. {
  122. int i;
  123. /* Test for correct arguments. */
  124. if (htab == NULL) {
  125. __set_errno(EINVAL);
  126. return;
  127. }
  128. /* free used memory */
  129. for (i = 1; i <= htab->size; ++i) {
  130. if (htab->table[i].used) {
  131. ENTRY *ep = &htab->table[i].entry;
  132. free(ep->key);
  133. free(ep->data);
  134. }
  135. }
  136. free(htab->table);
  137. /* the sign for an existing table is an value != NULL in htable */
  138. htab->table = NULL;
  139. }
  140. /*
  141. * hsearch()
  142. */
  143. /*
  144. * This is the search function. It uses double hashing with open addressing.
  145. * The argument item.key has to be a pointer to an zero terminated, most
  146. * probably strings of chars. The function for generating a number of the
  147. * strings is simple but fast. It can be replaced by a more complex function
  148. * like ajw (see [Aho,Sethi,Ullman]) if the needs are shown.
  149. *
  150. * We use an trick to speed up the lookup. The table is created by hcreate
  151. * with one more element available. This enables us to use the index zero
  152. * special. This index will never be used because we store the first hash
  153. * index in the field used where zero means not used. Every other value
  154. * means used. The used field can be used as a first fast comparison for
  155. * equality of the stored and the parameter value. This helps to prevent
  156. * unnecessary expensive calls of strcmp.
  157. *
  158. * This implementation differs from the standard library version of
  159. * this function in a number of ways:
  160. *
  161. * - While the standard version does not make any assumptions about
  162. * the type of the stored data objects at all, this implementation
  163. * works with NUL terminated strings only.
  164. * - Instead of storing just pointers to the original objects, we
  165. * create local copies so the caller does not need to care about the
  166. * data any more.
  167. * - The standard implementation does not provide a way to update an
  168. * existing entry. This version will create a new entry or update an
  169. * existing one when both "action == ENTER" and "item.data != NULL".
  170. * - Instead of returning 1 on success, we return the index into the
  171. * internal hash table, which is also guaranteed to be positive.
  172. * This allows us direct access to the found hash table slot for
  173. * example for functions like hdelete().
  174. */
  175. int hsearch_r(ENTRY item, ACTION action, ENTRY ** retval,
  176. struct hsearch_data *htab)
  177. {
  178. unsigned int hval;
  179. unsigned int count;
  180. unsigned int len = strlen(item.key);
  181. unsigned int idx;
  182. /* Compute an value for the given string. Perhaps use a better method. */
  183. hval = len;
  184. count = len;
  185. while (count-- > 0) {
  186. hval <<= 4;
  187. hval += item.key[count];
  188. }
  189. /*
  190. * First hash function:
  191. * simply take the modul but prevent zero.
  192. */
  193. hval %= htab->size;
  194. if (hval == 0)
  195. ++hval;
  196. /* The first index tried. */
  197. idx = hval;
  198. if (htab->table[idx].used) {
  199. /*
  200. * Further action might be required according to the
  201. * action value.
  202. */
  203. unsigned hval2;
  204. if (htab->table[idx].used == hval
  205. && strcmp(item.key, htab->table[idx].entry.key) == 0) {
  206. /* Overwrite existing value? */
  207. if ((action == ENTER) && (item.data != NULL)) {
  208. free(htab->table[idx].entry.data);
  209. htab->table[idx].entry.data =
  210. strdup(item.data);
  211. if (!htab->table[idx].entry.data) {
  212. __set_errno(ENOMEM);
  213. *retval = NULL;
  214. return 0;
  215. }
  216. }
  217. /* return found entry */
  218. *retval = &htab->table[idx].entry;
  219. return idx;
  220. }
  221. /*
  222. * Second hash function:
  223. * as suggested in [Knuth]
  224. */
  225. hval2 = 1 + hval % (htab->size - 2);
  226. do {
  227. /*
  228. * Because SIZE is prime this guarantees to
  229. * step through all available indices.
  230. */
  231. if (idx <= hval2)
  232. idx = htab->size + idx - hval2;
  233. else
  234. idx -= hval2;
  235. /*
  236. * If we visited all entries leave the loop
  237. * unsuccessfully.
  238. */
  239. if (idx == hval)
  240. break;
  241. /* If entry is found use it. */
  242. if ((htab->table[idx].used == hval)
  243. && strcmp(item.key, htab->table[idx].entry.key) == 0) {
  244. /* Overwrite existing value? */
  245. if ((action == ENTER) && (item.data != NULL)) {
  246. free(htab->table[idx].entry.data);
  247. htab->table[idx].entry.data =
  248. strdup(item.data);
  249. if (!htab->table[idx].entry.data) {
  250. __set_errno(ENOMEM);
  251. *retval = NULL;
  252. return 0;
  253. }
  254. }
  255. /* return found entry */
  256. *retval = &htab->table[idx].entry;
  257. return idx;
  258. }
  259. }
  260. while (htab->table[idx].used);
  261. }
  262. /* An empty bucket has been found. */
  263. if (action == ENTER) {
  264. /*
  265. * If table is full and another entry should be
  266. * entered return with error.
  267. */
  268. if (htab->filled == htab->size) {
  269. __set_errno(ENOMEM);
  270. *retval = NULL;
  271. return 0;
  272. }
  273. /*
  274. * Create new entry;
  275. * create copies of item.key and item.data
  276. */
  277. htab->table[idx].used = hval;
  278. htab->table[idx].entry.key = strdup(item.key);
  279. htab->table[idx].entry.data = strdup(item.data);
  280. if (!htab->table[idx].entry.key ||
  281. !htab->table[idx].entry.data) {
  282. __set_errno(ENOMEM);
  283. *retval = NULL;
  284. return 0;
  285. }
  286. ++htab->filled;
  287. /* return new entry */
  288. *retval = &htab->table[idx].entry;
  289. return 1;
  290. }
  291. __set_errno(ESRCH);
  292. *retval = NULL;
  293. return 0;
  294. }
  295. /*
  296. * hdelete()
  297. */
  298. /*
  299. * The standard implementation of hsearch(3) does not provide any way
  300. * to delete any entries from the hash table. We extend the code to
  301. * do that.
  302. */
  303. int hdelete_r(const char *key, struct hsearch_data *htab)
  304. {
  305. ENTRY e, *ep;
  306. int idx;
  307. debug("hdelete: DELETE key \"%s\"\n", key);
  308. e.key = (char *)key;
  309. if ((idx = hsearch_r(e, FIND, &ep, htab)) == 0) {
  310. __set_errno(ESRCH);
  311. return 0; /* not found */
  312. }
  313. /* free used ENTRY */
  314. debug("hdelete: DELETING key \"%s\"\n", key);
  315. free(ep->key);
  316. free(ep->data);
  317. htab->table[idx].used = 0;
  318. --htab->filled;
  319. return 1;
  320. }
  321. /*
  322. * hexport()
  323. */
  324. /*
  325. * Export the data stored in the hash table in linearized form.
  326. *
  327. * Entries are exported as "name=value" strings, separated by an
  328. * arbitrary (non-NUL, of course) separator character. This allows to
  329. * use this function both when formatting the U-Boot environment for
  330. * external storage (using '\0' as separator), but also when using it
  331. * for the "printenv" command to print all variables, simply by using
  332. * as '\n" as separator. This can also be used for new features like
  333. * exporting the environment data as text file, including the option
  334. * for later re-import.
  335. *
  336. * The entries in the result list will be sorted by ascending key
  337. * values.
  338. *
  339. * If the separator character is different from NUL, then any
  340. * separator characters and backslash characters in the values will
  341. * be escaped by a preceeding backslash in output. This is needed for
  342. * example to enable multi-line values, especially when the output
  343. * shall later be parsed (for example, for re-import).
  344. *
  345. * There are several options how the result buffer is handled:
  346. *
  347. * *resp size
  348. * -----------
  349. * NULL 0 A string of sufficient length will be allocated.
  350. * NULL >0 A string of the size given will be
  351. * allocated. An error will be returned if the size is
  352. * not sufficient. Any unused bytes in the string will
  353. * be '\0'-padded.
  354. * !NULL 0 The user-supplied buffer will be used. No length
  355. * checking will be performed, i. e. it is assumed that
  356. * the buffer size will always be big enough. DANGEROUS.
  357. * !NULL >0 The user-supplied buffer will be used. An error will
  358. * be returned if the size is not sufficient. Any unused
  359. * bytes in the string will be '\0'-padded.
  360. */
  361. static int cmpkey(const void *p1, const void *p2)
  362. {
  363. ENTRY *e1 = *(ENTRY **) p1;
  364. ENTRY *e2 = *(ENTRY **) p2;
  365. return (strcmp(e1->key, e2->key));
  366. }
  367. ssize_t hexport_r(struct hsearch_data *htab, const char sep,
  368. char **resp, size_t size)
  369. {
  370. ENTRY *list[htab->size];
  371. char *res, *p;
  372. size_t totlen;
  373. int i, n;
  374. /* Test for correct arguments. */
  375. if ((resp == NULL) || (htab == NULL)) {
  376. __set_errno(EINVAL);
  377. return (-1);
  378. }
  379. debug("EXPORT table = %p, htab.size = %d, htab.filled = %d, size = %d\n",
  380. htab, htab->size, htab->filled, size);
  381. /*
  382. * Pass 1:
  383. * search used entries,
  384. * save addresses and compute total length
  385. */
  386. for (i = 1, n = 0, totlen = 0; i <= htab->size; ++i) {
  387. if (htab->table[i].used) {
  388. ENTRY *ep = &htab->table[i].entry;
  389. list[n++] = ep;
  390. totlen += strlen(ep->key) + 2;
  391. if (sep == '\0') {
  392. totlen += strlen(ep->data);
  393. } else { /* check if escapes are needed */
  394. char *s = ep->data;
  395. while (*s) {
  396. ++totlen;
  397. /* add room for needed escape chars */
  398. if ((*s == sep) || (*s == '\\'))
  399. ++totlen;
  400. ++s;
  401. }
  402. }
  403. totlen += 2; /* for '=' and 'sep' char */
  404. }
  405. }
  406. #ifdef DEBUG
  407. /* Pass 1a: print unsorted list */
  408. printf("Unsorted: n=%d\n", n);
  409. for (i = 0; i < n; ++i) {
  410. printf("\t%3d: %p ==> %-10s => %s\n",
  411. i, list[i], list[i]->key, list[i]->data);
  412. }
  413. #endif
  414. /* Sort list by keys */
  415. qsort(list, n, sizeof(ENTRY *), cmpkey);
  416. /* Check if the user supplied buffer size is sufficient */
  417. if (size) {
  418. if (size < totlen + 1) { /* provided buffer too small */
  419. debug("### buffer too small: %d, but need %d\n",
  420. size, totlen + 1);
  421. __set_errno(ENOMEM);
  422. return (-1);
  423. }
  424. } else {
  425. size = totlen + 1;
  426. }
  427. /* Check if the user provided a buffer */
  428. if (*resp) {
  429. /* yes; clear it */
  430. res = *resp;
  431. memset(res, '\0', size);
  432. } else {
  433. /* no, allocate and clear one */
  434. *resp = res = calloc(1, size);
  435. if (res == NULL) {
  436. __set_errno(ENOMEM);
  437. return (-1);
  438. }
  439. }
  440. /*
  441. * Pass 2:
  442. * export sorted list of result data
  443. */
  444. for (i = 0, p = res; i < n; ++i) {
  445. char *s;
  446. s = list[i]->key;
  447. while (*s)
  448. *p++ = *s++;
  449. *p++ = '=';
  450. s = list[i]->data;
  451. while (*s) {
  452. if ((*s == sep) || (*s == '\\'))
  453. *p++ = '\\'; /* escape */
  454. *p++ = *s++;
  455. }
  456. *p++ = sep;
  457. }
  458. *p = '\0'; /* terminate result */
  459. return size;
  460. }
  461. /*
  462. * himport()
  463. */
  464. /*
  465. * Import linearized data into hash table.
  466. *
  467. * This is the inverse function to hexport(): it takes a linear list
  468. * of "name=value" pairs and creates hash table entries from it.
  469. *
  470. * Entries without "value", i. e. consisting of only "name" or
  471. * "name=", will cause this entry to be deleted from the hash table.
  472. *
  473. * The "flag" argument can be used to control the behaviour: when the
  474. * H_NOCLEAR bit is set, then an existing hash table will kept, i. e.
  475. * new data will be added to an existing hash table; otherwise, old
  476. * data will be discarded and a new hash table will be created.
  477. *
  478. * The separator character for the "name=value" pairs can be selected,
  479. * so we both support importing from externally stored environment
  480. * data (separated by NUL characters) and from plain text files
  481. * (entries separated by newline characters).
  482. *
  483. * To allow for nicely formatted text input, leading white space
  484. * (sequences of SPACE and TAB chars) is ignored, and entries starting
  485. * (after removal of any leading white space) with a '#' character are
  486. * considered comments and ignored.
  487. *
  488. * [NOTE: this means that a variable name cannot start with a '#'
  489. * character.]
  490. *
  491. * When using a non-NUL separator character, backslash is used as
  492. * escape character in the value part, allowing for example for
  493. * multi-line values.
  494. *
  495. * In theory, arbitrary separator characters can be used, but only
  496. * '\0' and '\n' have really been tested.
  497. */
  498. int himport_r(struct hsearch_data *htab,
  499. const char *env, size_t size, const char sep, int flag)
  500. {
  501. char *data, *sp, *dp, *name, *value;
  502. /* Test for correct arguments. */
  503. if (htab == NULL) {
  504. __set_errno(EINVAL);
  505. return 0;
  506. }
  507. /* we allocate new space to make sure we can write to the array */
  508. if ((data = malloc(size)) == NULL) {
  509. debug("himport_r: can't malloc %d bytes\n", size);
  510. __set_errno(ENOMEM);
  511. return 0;
  512. }
  513. memcpy(data, env, size);
  514. dp = data;
  515. if ((flag & H_NOCLEAR) == 0) {
  516. /* Destroy old hash table if one exists */
  517. debug("Destroy Hash Table: %p table = %p\n", htab,
  518. htab->table);
  519. if (htab->table)
  520. hdestroy_r(htab);
  521. }
  522. /*
  523. * Create new hash table (if needed). The computation of the hash
  524. * table size is based on heuristics: in a sample of some 70+
  525. * existing systems we found an average size of 39+ bytes per entry
  526. * in the environment (for the whole key=value pair). Assuming a
  527. * size of 8 per entry (= safety factor of ~5) should provide enough
  528. * safety margin for any existing environment definitions and still
  529. * allow for more than enough dynamic additions. Note that the
  530. * "size" argument is supposed to give the maximum enviroment size
  531. * (CONFIG_ENV_SIZE). This heuristics will result in
  532. * unreasonably large numbers (and thus memory footprint) for
  533. * big flash environments (>8,000 entries for 64 KB
  534. * envrionment size), so we clip it to a reasonable value.
  535. * On the other hand we need to add some more entries for free
  536. * space when importing very small buffers. Both boundaries can
  537. * be overwritten in the board config file if needed.
  538. */
  539. if (!htab->table) {
  540. int nent = CONFIG_ENV_MIN_ENTRIES + size / 8;
  541. if (nent > CONFIG_ENV_MAX_ENTRIES)
  542. nent = CONFIG_ENV_MAX_ENTRIES;
  543. debug("Create Hash Table: N=%d\n", nent);
  544. if (hcreate_r(nent, htab) == 0) {
  545. free(data);
  546. return 0;
  547. }
  548. }
  549. /* Parse environment; allow for '\0' and 'sep' as separators */
  550. do {
  551. ENTRY e, *rv;
  552. /* skip leading white space */
  553. while ((*dp == ' ') || (*dp == '\t'))
  554. ++dp;
  555. /* skip comment lines */
  556. if (*dp == '#') {
  557. while (*dp && (*dp != sep))
  558. ++dp;
  559. ++dp;
  560. continue;
  561. }
  562. /* parse name */
  563. for (name = dp; *dp != '=' && *dp && *dp != sep; ++dp)
  564. ;
  565. /* deal with "name" and "name=" entries (delete var) */
  566. if (*dp == '\0' || *(dp + 1) == '\0' ||
  567. *dp == sep || *(dp + 1) == sep) {
  568. if (*dp == '=')
  569. *dp++ = '\0';
  570. *dp++ = '\0'; /* terminate name */
  571. debug("DELETE CANDIDATE: \"%s\"\n", name);
  572. if (hdelete_r(name, htab) == 0)
  573. debug("DELETE ERROR ##############################\n");
  574. continue;
  575. }
  576. *dp++ = '\0'; /* terminate name */
  577. /* parse value; deal with escapes */
  578. for (value = sp = dp; *dp && (*dp != sep); ++dp) {
  579. if ((*dp == '\\') && *(dp + 1))
  580. ++dp;
  581. *sp++ = *dp;
  582. }
  583. *sp++ = '\0'; /* terminate value */
  584. ++dp;
  585. /* enter into hash table */
  586. e.key = name;
  587. e.data = value;
  588. hsearch_r(e, ENTER, &rv, htab);
  589. if (rv == NULL) {
  590. printf("himport_r: can't insert \"%s=%s\" into hash table\n",
  591. name, value);
  592. return 0;
  593. }
  594. debug("INSERT: table %p, filled %d/%d rv %p ==> name=\"%s\" value=\"%s\"\n",
  595. htab, htab->filled, htab->size,
  596. rv, name, value);
  597. } while ((dp < data + size) && *dp); /* size check needed for text */
  598. /* without '\0' termination */
  599. debug("INSERT: free(data = %p)\n", data);
  600. free(data);
  601. debug("INSERT: done\n");
  602. return 1; /* everything OK */
  603. }