Source code of Windows XP (NT5)
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

550 lines
20 KiB

  1. #include <precomp.h>
  2. #include "tracing.h"
  3. #include "utils.h"
  4. #include "hash.h"
  5. //~~~~~~~~~~~~~~~~~~~~~~~~ PRIVATE HASH FUNCTIONS ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  6. //
  7. // Matches the keys one against the other.
  8. UINT // [RET] number of matching chars
  9. HshPrvMatchKeys(
  10. LPWSTR wszKey1, // [IN] key 1
  11. LPWSTR wszKey2) // [IN] key 2
  12. {
  13. UINT i = 0;
  14. while (*wszKey1 != L'\0' && *wszKey1 == *wszKey2)
  15. {
  16. wszKey1++; wszKey2++;
  17. i++;
  18. }
  19. return i;
  20. }
  21. // deletes all the pHash tree - doesn't touch the pObjects from
  22. // within (if any)
  23. VOID
  24. HshDestructor(
  25. PHASH_NODE pHash) // [IN] hash tree to delete
  26. {
  27. // pHash should not be NULL -- but who knows what the caller is doing!
  28. if (pHash != NULL)
  29. {
  30. while(!IsListEmpty(&(pHash->lstDown)))
  31. {
  32. PHASH_NODE pChild;
  33. pChild = CONTAINING_RECORD(pHash->lstDown.Flink, HASH_NODE, lstHoriz);
  34. HshDestructor(pChild);
  35. }
  36. RemoveEntryList(&(pHash->lstHoriz));
  37. MemFree(pHash->wszKey);
  38. MemFree(pHash);
  39. }
  40. }
  41. //~~~~~~~~~~~~~~~~~~~~~~~~ PUBLIC HASH FUNCTIONS ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
  42. //
  43. // Initializes a HASH structure
  44. DWORD
  45. HshInitialize(PHASH pHash)
  46. {
  47. DWORD dwErr = ERROR_SUCCESS;
  48. if (pHash != NULL)
  49. {
  50. __try
  51. {
  52. InitializeCriticalSection(&(pHash->csMutex));
  53. pHash->bValid = TRUE;
  54. }
  55. __except(EXCEPTION_EXECUTE_HANDLER)
  56. {
  57. dwErr = GetExceptionCode();
  58. }
  59. pHash->pRoot = NULL;
  60. }
  61. else
  62. dwErr = ERROR_INVALID_PARAMETER;
  63. return dwErr;
  64. }
  65. // Cleans all resources referenced by a HASH structures
  66. VOID
  67. HshDestroy(PHASH pHash)
  68. {
  69. HshDestructor(pHash->pRoot);
  70. if (pHash->bValid)
  71. {
  72. DeleteCriticalSection(&(pHash->csMutex));
  73. pHash->bValid = FALSE;
  74. }
  75. }
  76. // Inserts an opaque object into the cache. The object is keyed on a wstring
  77. // The call could alter the structure of the hash, hence it returns the reference
  78. // to the updated hash.
  79. DWORD // [RET] win32 error code
  80. HshInsertObjectRef(
  81. PHASH_NODE pHash, // [IN] hash to operate on
  82. LPWSTR wszKey, // [IN] key of the object to insert
  83. LPVOID pObject, // [IN] object itself to insert in the cache
  84. PHASH_NODE *ppOutHash) // [OUT] pointer to the updated hash
  85. {
  86. DWORD dwErr = ERROR_SUCCESS;
  87. DbgPrint((TRC_HASH,"[HshInsertObject(%S)", wszKey));
  88. DbgAssert((ppOutHash != NULL, "No output hash expected??"));
  89. DbgAssert((wszKey != NULL, "Key info should not be NULL"));
  90. // if the node passed in is NULL this means a new node
  91. // has to be created
  92. if (pHash == NULL)
  93. {
  94. // this node is definitely not in the hash
  95. // allocate the new node
  96. pHash = MemCAlloc(sizeof(HASH_NODE));
  97. if (pHash == NULL)
  98. {
  99. dwErr = GetLastError();
  100. goto exit;
  101. }
  102. // allocate mem for the new key
  103. pHash->wszKey = MemCAlloc(sizeof(WCHAR)*(wcslen(wszKey)+1));
  104. if (pHash->wszKey == NULL)
  105. {
  106. dwErr = GetLastError();
  107. MemFree(pHash);
  108. goto exit;
  109. }
  110. // copy the new key
  111. wcscpy(pHash->wszKey, wszKey);
  112. // initialize the horizontal and down lists
  113. InitializeListHead(&(pHash->lstHoriz));
  114. InitializeListHead(&(pHash->lstDown));
  115. // copy the reference to the object associated with the key
  116. pHash->pObject = pObject;
  117. // at this point we have a standalone newly created node:
  118. // no links are defined either on the horizontal, downwards or upwards
  119. // these will be set up (if needed) by the caller.
  120. *ppOutHash = pHash;
  121. }
  122. // if the node passed in is not NULL, we need to match as many
  123. // characters between wszKey and the node's key. Based on who's shorter
  124. // we decide to either set the reference (if keys identical) or
  125. // break the branch (if wszKey is shorter than the current one) or
  126. // to recurse down the insertion.
  127. else
  128. {
  129. UINT nMatch;
  130. PHASH_NODE pChild;
  131. enum { MATCH, SUBSET, SUPERSET, UNDECIDED, RECURSE} nAnalysis;
  132. nMatch = HshPrvMatchKeys(wszKey, pHash->wszKey);
  133. // analyze the given key with respect to the current node;
  134. if (wszKey[nMatch] == L'\0' && pHash->wszKey[nMatch] == L'\0')
  135. // the key matches the current node
  136. nAnalysis = MATCH;
  137. else if (wszKey[nMatch] == L'\0')
  138. // the key is a subset of the current node
  139. nAnalysis = SUBSET;
  140. else
  141. {
  142. // so far undecided - further see if this translates to SUPERSET
  143. // or even better, if SUPERSET can be handled by a child, hence
  144. // RECURSE.
  145. nAnalysis = UNDECIDED;
  146. if (pHash->wszKey[nMatch] == L'\0')
  147. {
  148. PLIST_ENTRY pEntry;
  149. // the new key is a superset of the current nod
  150. nAnalysis = SUPERSET;
  151. // the new key could be covered by one of the existent children.
  152. // check then if it is the case to send the work down to some child
  153. for (pEntry = pHash->lstDown.Flink;
  154. pEntry != &(pHash->lstDown);
  155. pEntry = pEntry->Flink)
  156. {
  157. pChild = CONTAINING_RECORD(pEntry, HASH_NODE, lstHoriz);
  158. if (wszKey[nMatch] == pChild->wszKey[0])
  159. {
  160. // the child to follow up has been located and saved
  161. // in pChild. Set nAnalysis to UNDECIDED and break;
  162. nAnalysis = RECURSE;
  163. break;
  164. }
  165. }
  166. }
  167. }
  168. // if the key matches exactly the current node
  169. // then is only a matter of setting the object's reference
  170. if (nAnalysis == MATCH)
  171. {
  172. // if the node is already referencing an object..
  173. if (pHash->pObject != NULL)
  174. {
  175. // signal out ERROR_DUPLICATE_TAG
  176. dwErr = ERROR_DUPLICATE_TAG;
  177. }
  178. else
  179. {
  180. // just insert the reference and get out with success.
  181. pHash->pObject = pObject;
  182. // save the Out hash pointer
  183. *ppOutHash = pHash;
  184. }
  185. }
  186. // if a child has been identified, let pChild (saved previously)
  187. // to follow up
  188. else if (nAnalysis == RECURSE)
  189. {
  190. dwErr = HshInsertObjectRef(
  191. pChild,
  192. wszKey+nMatch,
  193. pObject,
  194. ppOutHash);
  195. if (dwErr == ERROR_SUCCESS)
  196. *ppOutHash = pHash;
  197. }
  198. // if any of SUBSET, SUPERSET or UNDECIDED
  199. else
  200. {
  201. PHASH_NODE pParent = NULL;
  202. LPWSTR wszTrailKey = NULL;
  203. UINT nTrailLen = 0;
  204. // [C = common part; c = current key; n = new key]
  205. // (SUBSET) (UNDECIDED)
  206. // current: CCCCCccc or current: CCCCCccc
  207. // new: CCCCC new: CCCCCnnnnn
  208. //
  209. // In both cases, the current node splits.
  210. // Create first a new node, containing just CCCCC
  211. if (nAnalysis != SUPERSET)
  212. {
  213. // get the number of chars in pHash's key that are not matching
  214. nTrailLen = wcslen(pHash->wszKey) - nMatch;
  215. // create first the trailing part of the key (allocate the number of
  216. // chars from the current node that didn't match)
  217. wszTrailKey = MemCAlloc(sizeof(WCHAR)*(nTrailLen+1));
  218. if (wszTrailKey == NULL)
  219. {
  220. // if anything went wrong, just go out with the error.
  221. // hash hasn't been modified.
  222. dwErr = GetLastError();
  223. goto exit;
  224. }
  225. // wcsncpy doesn't append the null terminator but the string
  226. // is already nulled out and it has the right size
  227. wcsncpy(wszTrailKey, pHash->wszKey+nMatch, nTrailLen);
  228. // create then the node that will act as the common parent
  229. pHash->wszKey[nMatch] = L'\0';
  230. dwErr = HshInsertObjectRef(
  231. NULL, // request a new node to be created
  232. pHash->wszKey, // common part of the current keys
  233. NULL, // this node is not referencing any object
  234. &pParent); // get back the newly created pointer.
  235. pHash->wszKey[nMatch] = wszTrailKey[0];
  236. // in case anything went wrong, the hash has not been altered,
  237. // we just need to bubble up the error.
  238. if (dwErr != ERROR_SUCCESS)
  239. {
  240. MemFree(wszTrailKey);
  241. goto exit;
  242. }
  243. // set the new parent up link
  244. pParent->pUpLink = pHash->pUpLink;
  245. }
  246. // (SUPERSET) (UNDECIDED)
  247. // current: CCCCC or current: CCCCCccccc
  248. // new: CCCCCnnn new: CCCCCnnn
  249. // In both cases a new node has to be created for the "nnn" part.
  250. if (nAnalysis != SUBSET)
  251. {
  252. dwErr = HshInsertObjectRef(
  253. NULL,
  254. wszKey + nMatch,
  255. pObject,
  256. &pChild);
  257. if (dwErr != ERROR_SUCCESS)
  258. {
  259. // second creation failed, clean up everything and bail out
  260. MemFree(wszTrailKey);
  261. if (pParent != NULL)
  262. {
  263. MemFree(pParent->wszKey);
  264. MemFree(pParent);
  265. }
  266. // hash structure is not altered at this point.
  267. goto exit;
  268. }
  269. // link it up to the corresponding parent.
  270. pChild->pUpLink = (nAnalysis == SUPERSET) ? pHash : pParent;
  271. }
  272. // NO WAY BACK FROM NOW ON - hash is about to be altered
  273. // success is guaranteed
  274. // at this point, pChild is a non null pointer, with all the
  275. // LIST_ENTRIES from within the HASH_NODE initialized correctly.
  276. // (SUBSET) (UNDECIDED)
  277. // current: CCCCCccccc or current: CCCCCccccc
  278. // new: CCCCC new: CCCCCnnn
  279. // if the node has split, put the new parent in its place
  280. if (nAnalysis != SUPERSET)
  281. {
  282. // set the current key to the shrinked unmatched trailing part
  283. MemFree(pHash->wszKey);
  284. pHash->wszKey = wszTrailKey;
  285. // set the current upLink to the new pParent node
  286. pHash->pUpLink = pParent;
  287. // insert the new parent into its place
  288. InsertHeadList(&(pHash->lstHoriz), &(pParent->lstHoriz));
  289. // remove the node from its previous parent
  290. RemoveEntryList(&(pHash->lstHoriz));
  291. // reset the current node's list
  292. InitializeListHead(&(pHash->lstHoriz));
  293. // insert the node to its new parent down list.
  294. InsertHeadList(&(pParent->lstDown), &(pHash->lstHoriz));
  295. }
  296. // (SUPERSET) (UNDECIDED)
  297. // current: CCCCC or current: CCCCCccccc
  298. // new: CCCCCnnn new: CCCCCnnn
  299. // if a new child node has been created, link it in the hash
  300. if (nAnalysis != SUBSET)
  301. {
  302. // if the given key was either a superset of the
  303. // current key or derived from the current key,
  304. // there is a separated node for it. Insert it in the down list
  305. if (nAnalysis == SUPERSET)
  306. {
  307. InsertTailList(&(pHash->lstDown), &(pChild->lstHoriz));
  308. }
  309. else
  310. {
  311. InsertTailList(&(pParent->lstDown), &(pChild->lstHoriz));
  312. }
  313. }
  314. else
  315. {
  316. // set the new parent's reference to this data.
  317. pParent->pObject = pObject;
  318. }
  319. *ppOutHash = (nAnalysis == SUPERSET) ? pHash : pParent;
  320. // and that's all - we're done successfully!
  321. }
  322. }
  323. exit:
  324. DbgPrint((TRC_HASH,"HshInsertObject]=%d", dwErr));
  325. return dwErr;
  326. }
  327. // Retrieves an object from the hash. The hash structure is not touched in
  328. // any manner.
  329. DWORD // [RET] win32 error code
  330. HshQueryObjectRef(
  331. PHASH_NODE pHash, // [IN] hash to operate on
  332. LPWSTR wszKey, // [IN] key of the object to retrieve
  333. PHASH_NODE *ppHashNode) // [OUT] hash node referencing the queried object
  334. {
  335. DWORD dwErr = ERROR_FILE_NOT_FOUND;
  336. INT nDiff;
  337. DbgPrint((TRC_HASH,"[HshQueryObjectRef(0x%p)", wszKey));
  338. if (wszKey == NULL)
  339. {
  340. dwErr = ERROR_INVALID_PARAMETER;
  341. goto exit;
  342. }
  343. if (pHash == NULL)
  344. {
  345. dwErr = ERROR_FILE_NOT_FOUND;
  346. goto exit;
  347. }
  348. nDiff = wcscmp(wszKey, pHash->wszKey);
  349. if (nDiff == 0)
  350. {
  351. // The key is identical with the one in this node
  352. if (pHash->pObject != NULL)
  353. {
  354. if (ppHashNode != NULL)
  355. {
  356. *ppHashNode = pHash;
  357. }
  358. dwErr = ERROR_SUCCESS;
  359. }
  360. // If there is no object in this node, this means
  361. // the query failed with FILE_NOT_FOUND
  362. }
  363. else if (nDiff > 0)
  364. {
  365. // The key is larger than the current node's key
  366. UINT nTrail = wcslen(pHash->wszKey);
  367. PLIST_ENTRY pEntry;
  368. // The trailing part of the key could be covered by one of
  369. // the children nodes. Scan then the Down list.
  370. for (pEntry = pHash->lstDown.Flink;
  371. pEntry != &(pHash->lstDown);
  372. pEntry = pEntry->Flink)
  373. {
  374. PHASH_NODE pChild;
  375. pChild = CONTAINING_RECORD(pEntry, HASH_NODE, lstHoriz);
  376. if (wszKey[nTrail] == pChild->wszKey[0])
  377. {
  378. // the child to follow up has been located and saved
  379. // in pChild. Try to match the trailing key against this node
  380. dwErr = HshQueryObjectRef(pChild, wszKey+nTrail, ppHashNode);
  381. break;
  382. }
  383. }
  384. // if no child has been located, dwErr is the default FILE_NOT_FOUND
  385. }
  386. // if nDiff < 0 - meaning key is included in the current node's key then
  387. // dwErr is the default FILE_NOT_FOUND which is good.
  388. exit:
  389. DbgPrint((TRC_HASH,"HshQueryObjectRef]=%d", dwErr));
  390. return dwErr;
  391. }
  392. // Removes the object referenced by the pHash node. This could lead to one or
  393. // more hash node removals (if a leaf node on an isolated branch) but it could
  394. // also let the hash node untouched (i.e. internal node).
  395. // It is the caller's responsibility to clean up the object pointed by ppObject
  396. DWORD // [RET] win32 error code
  397. HshRemoveObjectRef(
  398. PHASH_NODE pHash, // [IN] hash to operate on
  399. PHASH_NODE pRemoveNode, // [IN] hash node to clear the reference to pObject
  400. LPVOID *ppObject, // [OUT] pointer to the object whose reference has been cleared
  401. PHASH_NODE *ppOutHash) // [OUT] pointer to the updated hash
  402. {
  403. DWORD dwErr = ERROR_SUCCESS;
  404. PHASH_NODE pNewRoot = NULL;
  405. DbgPrint((TRC_HASH,"[HshRemoveObjectRef(%p)", pHash));
  406. DbgAssert((ppObject != NULL, "No output object expected??"));
  407. DbgAssert((ppOutHash != NULL, "No output hash expected??"));
  408. DbgAssert((pRemoveNode != NULL, "No node to remove??"));
  409. // if the node contains no reference, return FILE_NOT_FOUND
  410. if (pRemoveNode->pObject == NULL)
  411. {
  412. dwErr = ERROR_FILE_NOT_FOUND;
  413. goto exit;
  414. }
  415. // remove the reference to the object at this moment
  416. *ppObject = pRemoveNode->pObject;
  417. pRemoveNode->pObject = NULL;
  418. // now climb the tree up to the root (!! - well it's a reversed tree) and merge
  419. // whatever nodes can be merged.
  420. // Merging: A node not referencing any object and having 0 or at most 1
  421. // successor can be deleted from the hash tree structure.
  422. while ((pRemoveNode != NULL) &&
  423. (pRemoveNode->pObject == NULL) &&
  424. (pRemoveNode->lstDown.Flink->Flink == &(pRemoveNode->lstDown)))
  425. {
  426. PHASH_NODE pUp = pRemoveNode->pUpLink;
  427. // if there is exactly 1 successor, its key needs to be prefixed with
  428. // the key of the node that is about to be removed. The successor also
  429. // needs to replace its parent in the hash tree structure.
  430. if (!IsListEmpty(&(pRemoveNode->lstDown)))
  431. {
  432. PHASH_NODE pDown;
  433. LPWSTR wszNewKey;
  434. pDown = CONTAINING_RECORD(pRemoveNode->lstDown.Flink, HASH_NODE, lstHoriz);
  435. wszNewKey = MemCAlloc(sizeof(WCHAR)*(wcslen(pRemoveNode->wszKey)+wcslen(pDown->wszKey)+1));
  436. if (wszNewKey == NULL)
  437. {
  438. // if the allocation failed, bail out with the error code.
  439. // the reference had already been removed, the hash might
  440. // not be compacted but it is still valid!
  441. dwErr = GetLastError();
  442. goto exit;
  443. }
  444. wcscpy(wszNewKey, pRemoveNode->wszKey);
  445. wcscat(wszNewKey, pDown->wszKey);
  446. MemFree(pDown->wszKey);
  447. pDown->wszKey = wszNewKey;
  448. // now raise the child node as a replacement of its parent
  449. pDown->pUpLink = pRemoveNode->pUpLink;
  450. InsertHeadList(&(pRemoveNode->lstHoriz), &(pDown->lstHoriz));
  451. pNewRoot = pDown;
  452. }
  453. // remove the current node
  454. RemoveEntryList(&(pRemoveNode->lstHoriz));
  455. // cleanup all its memory
  456. MemFree(pRemoveNode->wszKey);
  457. MemFree(pRemoveNode);
  458. // finally go and check the upper level node (if there is any)
  459. pRemoveNode = pUp;
  460. }
  461. // if pRemoveNode ended up to be NULL, this means either the whole hash has been cleared
  462. // or a "brother" took the role of the root. pNewRoot has the right value in both cases
  463. // if pRemoveNode is not NULL, since it walked up the chain constantly it means pHash (the
  464. // original root) was not affected. Hence, return it out.
  465. *ppOutHash = (pRemoveNode == NULL) ? pNewRoot : pHash;
  466. exit:
  467. DbgPrint((TRC_HASH,"HshRemoveObjectRef]=%d", dwErr));
  468. return dwErr;
  469. }
  470. CHAR szBlanks[256];
  471. VOID
  472. HshDbgPrintHash (
  473. PHASH_NODE pHash,
  474. UINT nLevel)
  475. {
  476. memset(szBlanks,' ', sizeof(szBlanks));
  477. if (pHash == NULL)
  478. {
  479. sprintf(szBlanks+nLevel,"(null)");
  480. DbgPrint((TRC_GENERIC,"%s", szBlanks));
  481. }
  482. else
  483. {
  484. PLIST_ENTRY pEntry;
  485. sprintf(szBlanks+nLevel,"%p:\"%S~[%p]\", up:%p",
  486. pHash,
  487. pHash->wszKey,
  488. pHash->pObject,
  489. pHash->pUpLink);
  490. DbgPrint((TRC_GENERIC,"%s", szBlanks));
  491. for (pEntry = pHash->lstDown.Flink;
  492. pEntry != &(pHash->lstDown);
  493. pEntry = pEntry->Flink)
  494. {
  495. PHASH_NODE pChild;
  496. pChild = CONTAINING_RECORD(pEntry, HASH_NODE, lstHoriz);
  497. HshDbgPrintHash(pChild, nLevel+1);
  498. }
  499. }
  500. }