跟线性数组和链表不同。HashTable是高速查找的数据结构。本文中的HashTable使用链表处理数组。
该HashTable能够指定table的长度。提供了遍历的方法。
包含table的长度的选择也比較讲究。
其它c的数据结构实现。dyArray參考点击打开链接 treeStruct參考点击打开链接
cp_int32 nPrime[MAX_HASH_PRIME_ARRAY_NUM] = { 17, 37, 79, 163, 331, 673, 1361 };就是说table的长度来取自上面这个数组。比方用户设定了200。那么table的长度就是331,找到第一次比输入值大的数值。能够注意到上面的都是素数。
以下是详细的代码贴出来。共大家參考。
代码中有个接口是查到多个key使用到了动态数组dyArray。參考上一篇点击打开链接
// // cpPlatform.h // dataStruct // // Created by hherima on 14-7-29. // Copyright (c) 2014年 . All rights reserved. // #ifndef dataStruct_cpPlatform_h #define dataStruct_cpPlatform_h enum { CP_FALSE = 0, CP_TRUE = !CP_FALSE }; #define F_MALLOC_TYPE(s) (s*)f_malloc(sizeof(s)) #define FREEFUN free #define MIN_PRE_ALLOCATE_SIZE 10 //The initial size of the dynamic array. #define MEMSETFUN memset #define REALLOCFUN realloc #define MALLOCFUN malloc #define MEMCMPFUN memcmp #define MEMCPYFUN memcpy typedef unsigned char cp_bool; typedef signed int cp_int32; typedef char cp_int8; typedef unsigned int cp_uint32; #endif上面是数据类型的定义。为了跨平台使用
以下是hashtable的数据结构头文件
// // hashStruct.h // dataStruct // // Created by hherima on 14-7-29. // Copyright (c) 2014年 . All rights reserved. // #ifndef dataStruct_hashStruct_h #define dataStruct_hashStruct_h #include <stdlib.h> #include "cpPlatform.h" #include "dyArray.h" struct Node { cp_int8* m_pKey; //the hash key. cp_int32 m_nKeyLength; // the length of the hash key in bytes. void* m_pVal;//hash_node value struct Node* m_pNext; };//hash table,use link list to process conflict struct HashTable { cp_int32 m_nLength; //hash table's length. cp_int32 m_nEleNum; //hash table's element count. struct Node **m_ppHead;//the hash table's array to record all key's value. }; cp_int32 GetHashFileNum(cp_int8* pKey, cp_int32 nKeyLength); struct Node* HashFindOne(cp_int8* pKey,cp_int32 nKeyLength,struct HashTable *pTable);//search cp_int32 HashFindMultkeyredund(cp_int8* pKey,cp_int32 nKeyLength,struct HashTable *pTable,struct DynamicArray *pdestArray); void HashInsertOne(cp_int8* pKey,cp_int32 nKeyLength,void* pVal,struct HashTable *pTable);//insert void HashInsertOneKeyredund(char* pKey,cp_int32 nKeyLength,void* pVal,struct HashTable *pTable); void HashDelOne(struct HashTable * pTable,void (*pFreeFunc) (void *),cp_int8 *pKey,cp_int32 nKeyLength); struct HashTable * HashTableCreate(cp_int32 nKeyNum); struct Node* HashGetFirst(struct HashTable *pTable); struct Node* HashGetNext(struct HashTable *pTable,cp_int8* pKey,cp_int32 nKeyLength); cp_int32 HashGetLength(struct HashTable *pTable); void HashTableVisit(struct HashTable * pTable,void (*pVisitFunc) (void *,void *),void *pAgent); void HashTableReset(struct HashTable * pTable,void (*pFreeFunc) (void *)); void HashTableDestroy(struct HashTable * pTable,void (*pFreeFunc) (void *)); cp_int32 HashGetValue(cp_int8* pKey,cp_int32 nKeyLength,cp_int32 nTableLength); #endif
源文件
// // hashStruct.c // dataStruct // // Created by hherima on 14-7-29. // Copyright (c) 2014年 . All rights reserved. // #include "hashStruct.h" #define MAX_HASH_PRIME_ARRAY_NUM 7 /************************************************************************************************** function name: HashGetValue description: the hash arithmetic to get the position of the certain key. parameter: pKey: the exclusive symbol which is related to a data block in hash table. nKeyLength: the key string's length. nTableLength: the hash table's length. return value: the position of the certain key. ***************************************************************************************************/ cp_int32 HashGetValue(cp_int8* pKey,cp_int32 nKeyLength,cp_int32 nTableLength) { cp_uint32 h = 0; cp_uint32 g = 0; if(!pKey || nKeyLength<1 || nTableLength<1) //if the input parameter is invalid, return. { return -1; } while(nKeyLength--) // get each charactor and use it to compute hash value. { h = (h<<4) + *pKey++; g = h & 0xF0000000L; if(g) { h ^= g>>24; } h &= ~g; } return h % nTableLength; } /************************************************************************************************** function name: HashFindOne description: search the position's node of the certain key. parameter: pKey: the exclusive symbol which is related to a data block in hash table. nKeyLength: the key string's length. pTable: the hash table. return value: the node pointer or null. ***************************************************************************************************/ struct Node* HashFindOne(cp_int8* pKey,cp_int32 nKeyLength,struct HashTable *pTable)//search { cp_int32 nPos = 0; struct Node* pCur = NULL; //if the input parameter is invalid, return. if(!pTable || !pKey || nKeyLength<1) { return NULL; } nPos = HashGetValue(pKey,nKeyLength,pTable->m_nLength); if(nPos>=0) pCur = pTable->m_ppHead[nPos]; //cur = table->head[hash_get_value(key,key_length,table->length)]; while(pCur) // if has link list, visit all the list to find the right one. { if(pCur->m_nKeyLength == nKeyLength && MEMCMPFUN(pCur->m_pKey,pKey,nKeyLength) == 0) { return pCur; } pCur = pCur->m_pNext; } return NULL; } /************************************************************************************************** function name: HashFindMultkeyredund description: search the node of the certain key, there will be several one. parameter: pKey: the exclusive symbol which is related to several data block in hash table. nKeyLength: the key string's length. pTable: the hash table. pdestArray: the dynamic array which is used to save results and need be initilalized. return value: the node pointer or null. ***************************************************************************************************/ cp_int32 HashFindMultkeyredund(cp_int8* pKey,cp_int32 nKeyLength,struct HashTable *pTable,struct DynamicArray *pDestArray) //search ,the key is redundant. { int nResNum = 0; struct Node* pCur = NULL; //if the input parameter is invalid, return. if(!pTable || !pKey || nKeyLength<1 || !pDestArray) { return -1; } pCur = pTable->m_ppHead[HashGetValue(pKey,nKeyLength,pTable->m_nLength)]; while(pCur) //if has link list, visit all the list and find the right one. { if(pCur->m_nKeyLength == nKeyLength && MEMCMPFUN(pCur->m_pKey,pKey,nKeyLength) == 0) { DyArrayAppend(pDestArray, pCur->m_pVal); // put the right one to array. nResNum++; //return cur; } pCur = pCur->m_pNext; } return nResNum; } /************************************************************************************************** function name: hashExpand description: expand the array when it's too small.THIS FUNCTION CAN'T BE USED BECAUSE HASH VALUE IS CHANGED WHEN TABLE LENGTH CHANGED. parameter: pTable: the hash table. nNeed: the needed new size. return value: if succeed,return the true, else, return false. ***************************************************************************************************/ cp_bool HashExpand(struct HashTable * pTable, cp_int32 nNeed) { cp_int32 i; struct Node ** pData = NULL; cp_int32 nAllocSize = 0; cp_int32 nPrime[MAX_HASH_PRIME_ARRAY_NUM] = { 17, //0 37, //1 79, //2 163, //3 331, //4 673, //5 1361 //6 };//The prime table used to be the length of hash table to decrease conflict. //if the input parameter is invalid, return. if(!pTable || nNeed<1) { return CP_FALSE; } //if need, expand to one and half times of original size. if(((pTable->m_nEleNum + nNeed) + ((pTable->m_nEleNum + nNeed)>>1) ) > pTable->m_nLength) { nAllocSize = pTable->m_nLength + (pTable->m_nLength>>1); for(i=0; i<MAX_HASH_PRIME_ARRAY_NUM; i++) //find the nearest one of prime array. { if(nPrime[i] > nAllocSize) { nAllocSize = nPrime[i]; break; } } pData = (struct Node **)REALLOCFUN(pTable->m_ppHead, sizeof(struct Node *) * nAllocSize); if(pData != NULL) { // clear the expanded space. MEMSETFUN(pData+pTable->m_nLength,0,(nAllocSize-pTable->m_nLength)*sizeof(struct Node *)); pTable->m_ppHead = pData; pTable->m_nLength = nAllocSize; } } return ((pTable->m_nEleNum + nNeed) + ((pTable->m_nEleNum + nNeed)>>1) <= pTable->m_nLength) ? CP_TRUE : CP_FALSE; } /************************************************************************************************** function name: HashInsertOne description: insert the node of the certain key. parameter: pKey: the exclusive symbol which is related to a data block in hash table. nKeyLength: the key string's length. pVal: the node pointer of the certain key. pTable: the hash table. return value: none. ***************************************************************************************************/ void HashInsertOne(cp_int8* pKey,cp_int32 nKeyLength,void* pVal,struct HashTable *pTable)//insert { cp_int32 nPos = 0; struct Node** pNode = NULL; struct Node* pTmp = NULL; //if the input parameter is invalid, return. if(!pTable || !pKey || nKeyLength<1) { return ; } //comment it because when it expands, the same key's position changed and the original key position CAN'T be found. /*if((pTable->m_EleNum + 1) + ((pTable->m_EleNum + 1)>>1) > pTable->m_nLength) { HashExpand(pTable, 1); }*/ //compute the hash position. pTable->m_nEleNum++; nPos = HashGetValue(pKey,nKeyLength,pTable->m_nLength); pNode = &pTable->m_ppHead[nPos]; //if this key is NOT exist, insert it. if(HashFindOne(pKey,nKeyLength,pTable) == NULL) { //malloc a new node and set the value. pTmp=(struct Node*)MALLOCFUN(sizeof(struct Node)); MEMSETFUN(pTmp,0,sizeof(struct Node)); pTmp->m_pKey = (char*)MALLOCFUN(nKeyLength+2);//for Unicode, two bytes zero is needed. MEMSETFUN(pTmp->m_pKey,0,nKeyLength+2); MEMCPYFUN(pTmp->m_pKey,pKey,nKeyLength); pTmp->m_nKeyLength = nKeyLength; pTmp->m_pVal = pVal; pTmp->m_pNext=NULL; //if there is a list, then insert to the tail. while(*pNode) { pNode = &((*pNode)->m_pNext); } *pNode = pTmp; } } /************************************************************************************************** function name: HashInsertOneKeyredund description: insert the node of the certain key. parameter: pKey: the symbol which is related to a data block in hash table. nKeyLength: the key string's length. pVal: the node pointer of the certain key. pTable: the hash table. return value: none. ***************************************************************************************************/ void HashInsertOneKeyredund(cp_int8* pKey,cp_int32 nKeyLength,void* pVal,struct HashTable *pTable) //insert,key is redundant. { cp_int32 nPos = 0; struct Node** pNode = NULL; struct Node* pTmp = NULL; //if the input parameter is invalid, return. if(!pTable || !pKey || nKeyLength<1) { return ; } //comment it because when it expands, the same key's position changed and the original key position CAN'T be found. /*if((table->ele_num + 1) + ((table->ele_num + 1)>>1) > table->length) { hash_expand(table, 1); }*/ //compute the hash position. pTable->m_nEleNum++; nPos= HashGetValue(pKey,nKeyLength,pTable->m_nLength); pNode = &pTable->m_ppHead[nPos]; //compare with HashInsertOne, comment this line. if(hash_find_one(key,key_length,table) == NULL) { //malloc a new node and set the value. pTmp=(struct Node*)MALLOCFUN(sizeof(struct Node)); MEMSETFUN(pTmp,0,sizeof(struct Node)); pTmp->m_pKey = (char*)MALLOCFUN(nKeyLength+2);//for Unicode, two bytes zero is needed. MEMSETFUN(pTmp->m_pKey,0,nKeyLength+2); MEMCPYFUN(pTmp->m_pKey,pKey,nKeyLength); pTmp->m_nKeyLength = nKeyLength; pTmp->m_pVal = pVal; pTmp->m_pNext=NULL; //if has a link list, then insert the new node to the tail. while(*pNode) { pNode = &((*pNode)->m_pNext); } *pNode = pTmp; } } /************************************************************************************************** function name: HashTableCreate description: create the hash table when the program starts. parameter: nKeyNum: the key count of the program's data. return value: the hash table. ***************************************************************************************************/ struct HashTable * HashTableCreate(cp_int32 nKeyNum) { struct HashTable * pTable = NULL; cp_int32 i; cp_int32 nPrime[MAX_HASH_PRIME_ARRAY_NUM] = { 17, //0 37, //1 79, //2 163, //3 331, //4 673, //5 1361 //6 };//The prime table used to be the length of hash table to decrease conflict. //if the input parameter is invalid, return. if(nKeyNum < 1) { return NULL; } pTable = (struct HashTable *)MALLOCFUN(sizeof(struct HashTable)); if(!pTable) { return NULL; } MEMSETFUN(pTable,0,sizeof(struct HashTable)); //The default length is 1.5 times of key's number. pTable->m_nLength = nKeyNum + (nKeyNum<<1); //find the nearest size of prime array. for(i=0; i<MAX_HASH_PRIME_ARRAY_NUM; i++) { if(nPrime[i] > pTable->m_nLength) { pTable->m_nLength = nPrime[i]; break; } } pTable->m_ppHead = (struct Node **) MALLOCFUN(sizeof(struct Node *)*pTable->m_nLength); if(!pTable->m_ppHead) { FREEFUN(pTable); return NULL; } MEMSETFUN(pTable->m_ppHead,0,sizeof(struct Node *)*pTable->m_nLength); return pTable; } /************************************************************************************************** function name: HashTableVisit description: visit all the elements of the hash table. parameter: pTable: the hash table. pVisitFunc: the visit function for each element of the hash table, the first parameter is hash's element, the second parameter is 'agent' which is to pass to caller. pAgent: used to pass to the call back funtion. return value: none ***************************************************************************************************/ void HashTableVisit(struct HashTable * pTable,void (*pVisitFunc) (void *,void *),void *pAgent) { cp_int32 i; struct Node * pTmp = NULL; //if the input parameter is invalid, return. if(!pTable) { return ; } //visit each position if it's not null. for(i=0; i<pTable->m_nLength; i++) { if(pTable->m_ppHead[i] == NULL) { continue; } if(pTable->m_ppHead[i]->m_pKey) { if(pVisitFunc) { pVisitFunc(pTable->m_ppHead[i]->m_pVal,pAgent); } pTmp = pTable->m_ppHead[i]->m_pNext; //if has link list, then visit the whole list. while(pTmp) { if(pVisitFunc) { pVisitFunc(pTmp->m_pVal,pAgent); } pTmp = pTmp->m_pNext; } } } return ; } /************************************************************************************************** function name: HashGetFirst description: get the first element of the hash table. parameter: pTable: the hash table. return value: the first element ***************************************************************************************************/ struct Node* HashGetFirst(struct HashTable *pTable) { cp_int32 i; //if the input parameter is invalid, return. if(!pTable) { return NULL; } //find the first not null element of head array. for(i=0; i<pTable->m_nLength; i++) { if(pTable->m_ppHead[i] == NULL) { continue; } if(pTable->m_ppHead[i]->m_pKey) { return pTable->m_ppHead[i]; } } return NULL; } /************************************************************************************************** function name: HashGetNext description: get the next element of the current node which key is given. parameter: pTable: the hash table. pKey: the exclusive symbol which is related to a data block in hash table. nKeyLength: the key string's length. return value: the next element ***************************************************************************************************/ struct Node* HashGetNext(struct HashTable *pTable,cp_int8* pKey,cp_int32 nKeyLength) { struct Node* pNext = NULL; struct Node* pCur = NULL; cp_int32 nPos; cp_int32 i; //if the input parameter is invalid, return. if(!pTable) { return NULL; } //get the position of the key. nPos = HashGetValue(pKey,nKeyLength,pTable->m_nLength); if(nPos == -1) { return NULL; } pCur = pTable->m_ppHead[nPos]; if(!pCur) { return NULL;//the related node of the pKey is NOT exist, so return null. } //find the right one whose key is same with pKey. while(pCur) { if(pCur->m_nKeyLength == nKeyLength && MEMCMPFUN(pCur->m_pKey,pKey,nKeyLength) == 0) { break; } pCur = pCur->m_pNext; } //get the next pointer directly. if(pCur && pCur->m_pNext) { pNext = pCur->m_pNext; } else { //get the next not null one from the head array. nPos++; for(i=nPos; i<pTable->m_nLength; i++) { if(pTable->m_ppHead[i] == NULL) { continue; } if(pTable->m_ppHead[i]->m_pKey) { pNext = pTable->m_ppHead[i]; break; } } } return pNext; } /************************************************************************************************** function name: HashTableReset description: clear the hash table. parameter: pTable: the hash table. pFreeFunc: the free function for hash data "val" which is given by caller. return value: none ***************************************************************************************************/ void HashTableReset(struct HashTable * pTable,void (*pFreeFunc) (void *)) { cp_int32 i; struct Node * pTmp = NULL; struct Node * pTmp1 = NULL; //if the input parameter is invalid, return. if(!pTable) { return; } //reset each element of the head array and free related memory. for(i=0; i<pTable->m_nLength; i++) { if(pTable->m_ppHead[i] == NULL) { continue; } if(pTable->m_ppHead[i]->m_pKey) { FREEFUN(pTable->m_ppHead[i]->m_pKey); if(pFreeFunc) { pFreeFunc(pTable->m_ppHead[i]->m_pVal); } pTmp = pTable->m_ppHead[i]->m_pNext; FREEFUN(pTable->m_ppHead[i]); pTable->m_ppHead[i] = NULL; //free all the link list. while(pTmp) { FREEFUN(pTmp->m_pKey); if(pFreeFunc) { pFreeFunc(pTmp->m_pVal); } pTmp1 = pTmp; pTmp = pTmp->m_pNext; FREEFUN(pTmp1); } } } //clear the table. MEMSETFUN(pTable->m_ppHead,0,sizeof(struct Node *)*pTable->m_nLength); pTable->m_nEleNum = 0; return ; } /************************************************************************************************** function name: HashTableDestroy description: destroy the hash table when the program exits. parameter: pTable: the hash table. pFreeFunc: the free function for hash data "val" which is given by caller. return value: none ***************************************************************************************************/ void HashTableDestroy(struct HashTable * pTable,void (*pFreeFunc) (void *)) { cp_int32 i; struct Node * pTmp = NULL; struct Node * pTmp1 = NULL; //if the input parameter is invalid, return. if(!pTable) { return; } //clear each element and free its memory. for(i=0; i<pTable->m_nLength; i++) { if(pTable->m_ppHead[i] == NULL) { continue; } if(pTable->m_ppHead[i]->m_pKey) { FREEFUN(pTable->m_ppHead[i]->m_pKey); if(pFreeFunc) { pFreeFunc(pTable->m_ppHead[i]->m_pVal); } pTmp = pTable->m_ppHead[i]->m_pNext; FREEFUN(pTable->m_ppHead[i]); pTable->m_ppHead[i] = NULL; //free the link list. while(pTmp) { FREEFUN(pTmp->m_pKey); if(pFreeFunc) { pFreeFunc(pTmp->m_pVal); } pTmp1 = pTmp; pTmp = pTmp->m_pNext; FREEFUN(pTmp1); } } } //free the table. FREEFUN(pTable->m_ppHead); pTable->m_ppHead = NULL; FREEFUN(pTable); return ; } /************************************************************************************************** function name: HashDelOne description: delete one node of hash table. parameter: pTable: the hash table. pFreeFunc: the free function for hash data "val" which is given by caller. pKey: the exclusive symbol which is related to a data block in hash table. nKeyLength: the key string's length. return value: none ***************************************************************************************************/ void HashDelOne(struct HashTable * pTable,void (*pFreeFunc) (void *),char *pKey,cp_int32 nKeyLength) { cp_int32 nPos = 0; struct Node *pTmp = NULL; struct Node **pTmp1 = NULL; struct Node *pTmp2 = NULL; //if the input parameter is invalid, return. if(!pTable || !pKey || nKeyLength<1) { return; } //compute the hash position. nPos = HashGetValue(pKey,nKeyLength,pTable->m_nLength); if(!pTable->m_ppHead[nPos]) { return;//the related node of the key is NOT exist, return. } //the first one is the right one. if(pTable->m_ppHead[nPos]->m_nKeyLength == nKeyLength && MEMCMPFUN(pTable->m_ppHead[nPos]->m_pKey,pKey,nKeyLength) == 0) { pTable->m_nEleNum--; FREEFUN(pTable->m_ppHead[nPos]->m_pKey); pTable->m_ppHead[nPos]->m_pKey = NULL; if(pFreeFunc) pFreeFunc(pTable->m_ppHead[nPos]->m_pVal); pTable->m_ppHead[nPos]->m_pVal = NULL; if(pTable->m_ppHead[nPos]->m_pNext) { pTmp = pTable->m_ppHead[nPos]; pTable->m_ppHead[nPos] = pTable->m_ppHead[nPos]->m_pNext; FREEFUN(pTmp); } else { FREEFUN(pTable->m_ppHead[nPos]); pTable->m_ppHead[nPos] = NULL; } } else { //find the right one in the link list. pTmp1 = &(pTable->m_ppHead[nPos]->m_pNext); while(*pTmp1) { if((*pTmp1)->m_nKeyLength == nKeyLength && MEMCMPFUN((*pTmp1)->m_pKey,pKey,nKeyLength) == 0) { //find it, free it and relink the link list. pTable->m_nEleNum--; FREEFUN((*pTmp1)->m_pKey); (*pTmp1)->m_pKey = NULL; if(pFreeFunc) pFreeFunc((*pTmp1)->m_pVal); (*pTmp1)->m_pVal = NULL; if((*pTmp1)->m_pNext) { pTmp2 = *pTmp1; *pTmp1 = (*pTmp1)->m_pNext; FREEFUN(pTmp2); } else { FREEFUN(*pTmp1); *pTmp1 = NULL; } break; } else { pTmp1 = &((*pTmp1)->m_pNext); } } } return ; } /************************************************************************************************** function name: HashGetLength description: get the total length of the hash table. parameter: pTable: the hash table. return value: none ***************************************************************************************************/ cp_int32 HashGetLength(struct HashTable *pTable) { return pTable ? pTable->m_nEleNum : -1; }