Some Hashing Functions

2023-11-24 03:11:14

转自：http://digipen2.xmmg.com/dpweb/Courses/CS280/HashFunctions-1.html

unsigned ConstantHash(const char *Key, unsigned TableSize)
{return 1;
}unsigned ReflexiveHash(const char *Key, unsigned TableSize)
{return StrToInt(Key) % TableSize;
}unsigned PJWHash(const char *Key, unsigned TableSize)
{// Initial value of hashunsigned hash = 0;// Process each char in the stringwhile (*Key){// Shift hash left 4hash = (hash << 4);// Add in current charhash = hash + (*Key);// Get the four high-order bitsunsigned bits = hash & 0xF0000000;// If any of the four bits are non-zero,if (bits){// Shift the four bits right 24 positions (...bbbb0000)// and XOR them back in to the hashhash = hash ^ (bits >> 24);// Now, XOR the four bits back inhash = hash ^ bits;}// Next charKey++;}// Modulo so hash is within 0 - TableSizereturn hash % TableSize;
}unsigned SimpleHash(const char *Key, unsigned TableSize)
{// Initial value of hashunsigned hash = 0;// Process each char in the stringwhile (*Key){// Add in current charhash += *Key;// Next charKey++;}// Modulo so hash is within the tablereturn hash % TableSize;
}unsigned RSHash(const char *Key, unsigned TableSize)
{unsigned hash = 0;         // Initial value of hashunsigned multiplier = 127; // Prevent anomalies// Process each char in the stringwhile (*Key){// Adjust hash totalhash = hash * multiplier;// Add in current char and mod resulthash = (hash + *Key) % TableSize;// Next charKey++;}// Hash is within 0 - TableSizereturn hash;
}// Same as above but performing the modulo once at the end
unsigned RSHashMod(const char *Key, unsigned TableSize)
{unsigned hash = 0;         // Initial value of hashunsigned multiplier = 127; // Prevent anomalies// Process each char in the stringwhile (*Key){// Adjust hash totalhash = hash * multiplier;// Add in current char and mod resulthash = hash + *Key;// Next charKey++;}// Hash is within 0 - TableSizereturn hash % TableSize;;
}unsigned UHash(const char *Key, unsigned TableSize)
{unsigned hash = 0;       // Initial value of hashunsigned rand1 = 31415; // "Random" 1unsigned rand2 = 27183; // "Random" 2// Process each char in stringwhile (*Key){// Multiply hash by randomhash = hash * rand1;// Add in current char, keep within TableSizehash = (hash + *Key) % TableSize;// Update rand1 for next "random" numberrand1 = (rand1 * rand2) % (TableSize - 1);// Next charKey++;}// Hash value is within 0 - TableSize - 1return hash;
}// Same as above but performing the modulo once at the end
unsigned UHashMod(const char *Key, unsigned TableSize)
{unsigned hash = 0;       // Initial value of hashunsigned rand1 = 31415; // "Random" 1unsigned rand2 = 27183; // "Random" 2// Process each char in stringwhile (*Key){// Multiply hash by randomhash = hash * rand1;// Add in current char, keep within TableSizehash = (hash + *Key);// Update rand1 for next "random" numberrand1 = (rand1 * rand2);// Next charKey++;}// Hash value is within 0 - TableSize - 1return hash % TableSize;
}// Daniel J. Bernstein
/** DJBX33A (Daniel J. Bernstein, Times 33 with Addition)** This is Daniel J. Bernstein's popular `times 33' hash function as* posted by him years ago on comp.lang.c. It basically uses a function* like ``hash(i) = hash(i-1) * 33 + string[i]''. This is one of the* best hashing functions for strings. Because it is both computed very* fast and distributes very well.** The magic of the number 33, i.e. why it works better than many other* constants, prime or not, has never been adequately explained by* anyone. So I try an own RSE-explanation: if one experimentally tests* all multipliers between 1 and 256 (as I did it) one detects that* even numbers are not useable at all. The remaining 128 odd numbers* (except for the number 1) work more or less all equally well. They* all distribute in an acceptable way and this way fill a hash table* with an average percent of approx. 86%.** If one compares the Chi/2 values resulting of the various* multipliers, the 33 not even has the best value. But the 33 and a* few other equally good values like 17, 31, 63, 127 and 129 have* nevertheless a great advantage over the remaining values in the large* set of possible multipliers: their multiply operation can be replaced* by a faster operation based on just one bit-wise shift plus either a* single addition or subtraction operation. And because a hash function* has to both distribute good and has to be very fast to compute, those* few values should be preferred and seems to be also the reason why* Daniel J. Bernstein also preferred it.** Lawsuit here:* http://epic.org/crypto/export_controls/bernstein_decision_9_cir.html*///  Daniel J. Bernstein #1
unsigned DJB1Hash(const char *Key, unsigned TableSize)
{unsigned hash = 0;while (*Key){hash *= 33;hash += *Key;Key++;}return hash % TableSize;
}//  Daniel J. Bernstein  #2
unsigned DJB2Hash(const char *Key, unsigned TableSize)
{unsigned hash = 5381;while (*Key){hash <<= 5;hash += hash;hash += *Key;Key++;}return hash % TableSize;
}// Donald E. Knuth
unsigned DEKHash(const char *Key, unsigned TableSize)
{unsigned hash = (unsigned)strlen(Key);while (*Key){hash <<= 5;hash ^= (hash >> 27);hash ^= *Key;Key++;}return hash % TableSize;
}// K&R Hash page 144 in the white book (second edition)
unsigned KRHash(const char *Key, unsigned TableSize)
{unsigned seed = 31;unsigned hash = 0;while (*Key){hash *= seed;hash += *Key;Key++;}return hash % TableSize;
}// Fowler, Noll, Vo
// http://isthe.com/chongo/tech/comp/fnv/
unsigned FNVHash(const char *Key, unsigned TableSize)
{unsigned FNV_prime32 = 16777619;unsigned FNV_offset32 = 2166136261;unsigned hash = FNV_offset32;while (*Key){hash *= FNV_prime32;hash ^= *Key;Key++;}return hash % TableSize;
}// SuperFastHash by Paul Hsieh
// http://www.azillionmonkeys.com/qed/hash.html
#include  /* Replace with  if appropriate */
#undef get16bits
#if (defined(__GNUC__) && defined(__i386__)) || defined(__WATCOMC__) \|| defined(_MSC_VER) || defined (__BORLANDC__) || defined (__TURBOC__)
#define get16bits(d) (*((const uint16_t *) (d)))
#endif#if !defined (get16bits)
#define get16bits(d) ((((uint32_t)(((const uint8_t *)(d))[1])) << 8)\+(uint32_t)(((const uint8_t *)(d))[0]) )
#endifuint32_t SFHash (const char * data, unsigned TableSize)
{int len = strlen(data);uint32_t hash = len;uint32_t tmp;int rem;if (len <= 0 || data == NULL) return 0;rem = len & 3;len >>= 2;/* Main loop */for (;len > 0; len--) {hash  += get16bits (data);tmp    = (get16bits (data+2) << 11) ^ hash;hash   = (hash << 16) ^ tmp;data  += 2*sizeof (uint16_t);hash  += hash >> 11;}/* Handle end cases */switch (rem) {case 3: hash += get16bits (data);hash ^= hash << 16;hash ^= data[sizeof (uint16_t)] << 18;hash += hash >> 11;break;case 2: hash += get16bits (data);hash ^= hash << 11;hash += hash >> 17;break;case 1: hash += *data;hash ^= hash << 10;hash += hash >> 1;}/* Force "avalanching" of final 127 bits */hash ^= hash << 3;hash += hash >> 5;hash ^= hash << 4;hash += hash >> 17;hash ^= hash << 25;hash += hash >> 6;return hash % TableSize;
}// STLPort 4.6.2
unsigned STLPortHash(const char *Key, unsigned TableSize)
{unsigned hash = 0;while (*Key){hash = (hash * 5) + *Key;Key++;}return hash % TableSize;
}int GetRandom(int Low, int High)
{return rand() % (High - Low + 1) + Low;
}// Code to test the performance in the GUI.
void TOAHashMain::TestPerformance(HASHFUNC fn, const AnsiString& fname, int keysize, int iterations)
{srand(123);char *buffer = new char[keysize + 1];// Generate a random "key"for (int i = 0; i < keysize; i++){char c = (char)GetRandom(32, 255);buffer[i] = c;}buffer[keysize] = 0;char buf[100];// Time the performance of this hash functionclock_t start = clock();for (int i = 0; i < iterations; i++){fn(buffer, keysize);  // call hash functionif (FStopPerformanceTest)break;// Give the app a chance to respond to other events once in a whileif (!(i % 1000))Application->ProcessMessages();}clock_t end = clock();std::sprintf(buf, "%18s... %5.3f s", fname.c_str(), (end - start) / (double)CLOCKS_PER_SEC);mmoResults->Lines->Add(buf);delete [] buffer;
}

本文来自互联网用户投稿，文章观点仅代表作者本人，不代表本站立场，不承担相关法律责任。如若转载，请注明出处。 如若内容造成侵权/违法违规/事实不符，请点击【内容举报】进行投诉反馈！

标签：技术

上一篇 > cygwin编译的win32程序不需要cygwin1.dll库的方法(1)
下一篇 > MyBatis分页实现 - Oracle

Duilib中list控件支持ctrl和shif多行选中的实现

[ICML2015]Batch Normalization:Accelerating Deep Network Training by Reducing Internal Covariate Shif

win10系统微软输入法于eclipse ctrl+shif+f冲突间接处理办法

Codeforces Round #259 (Div. 2) B. Little Pony and Sort by Shif

读LDD3，内存映射与DMA--PAGE_SHIF…

VMware虚拟机安装XP【要先分区，再设置BOOT 启动CD，shif+上移】

更换iBus五笔的左与右Shif

sublime ctrl+shif+f 没用解决办法

idea 对 ctrl + z 的撤销是 ctrl + shif + z

计算机最早的设计师应用于,计算机应用基础选择题doc.doc

win10自带截图神器：Win+Shift+S

Python基础之文件目录操作

python简述目录_Python基础之文件目录操作(示例代码)

tp5 如何做数据采集

任务2-7(服务器字体+阿里巴巴矢量库)

html标签（1)：h1~h6,p,br,pre,hr

TI 电量计介绍与芯片选型指南

几款TI电源芯片简介

TI DSP芯片C2000系列读取FLASH数据

德州仪器(Ti)平台嵌入式开发基础

TI三相电机智能栅极驱动芯片特点分类

省选模拟（12.08） T3 圈圈圈圈圈圈圈圈

Hadoop生态圈技术栈（上）

大数据开发基础入门与项目实战（三）Hadoop核心及生态圈技术栈之6.Impala交互式查询

小猿圈之Linux下Mysql 操作命令

大数据Hadoop生态圈常用面试题

大数据开发基础入门与项目实战（三）Hadoop核心及生态圈技术栈之4.Hive DDL、DQL和数据操作

备战Noip2018模拟赛11（B组）T3 Monogatari 物语

【智能优化算法-圆圈搜索算法】基于圆圈搜索算法Circle Search Algorithm求解单目标优化问题附matlab代码

NYOJ 78 圈水池

递归问题跑道汽车绕圈问题 Python实现

Hadoop生态圈（三）：MapReduce

Some Hashing Functions

相关文章