redis7.2.2|Dict-编程知识

文章目录

Struct
- redisDB
- dict
- dictType
- dictEntry
宏定义
散列函数
散列冲突
dictEntry pointer bit tricks[指针位技巧]
API implementation
- _dictReset
- _dictInit
- dictCreate
- dictGetHash
- dictSetKey
- dictSetVal
- dictSetNext
- dictGetNext
- dictGetVal
- dictGetKey
- _dictClear
- dictEmpty
- dictRelease
扩容
- dictResize|dictExpand|_dictExpand|_dictNextExp
- 扩容触发条件
- - **dictAdd**
  - **dictAddRaw**
  - **dictFindPositionForInsert**
  - **_dictExpandIfNeeded**
  - **dictTypeExpandAllowed**
  - **扩容策略**
  - **扩容触发条件**
  - **dictInsertAtPosition**
缩容
- - dictDelete
  - htNeedsResize
  - 缩容条件
  - 缩容策略
迁移
- 迁移时机
- 迁移步骤
- - _dictRehashStep
  - dictRehash
- redis服务器定时任务----迁移数据
旧版本中dict的结构
总结

字典是Redis服务器中出现最为频繁的复合型数据结构，除了hash结构的数据会用到字典外，整个redis数据库的所有key和value也组成一个全局字典，还有带有过期时间的key集合也是一个字典。zet集合中存储value和score值的映射关系也是通过字典结构实现的。

先看一下redisDB的结构，它里面存储着数据字典和过期字典

Struct

redisDB

[redis-7.2.2\src\server.h]
redisDB

typedef struct redisDb {//全局数据字典dict *dict;                 /* The keyspace for this DB *///全局过期字典dict *expires;              /* Timeout of keys with a timeout set */dict *blocking_keys;        /* Keys with clients waiting for data (BLPOP)*/dict *blocking_keys_unblock_on_nokey;   /* Keys with clients waiting for* data, and should be unblocked if key is deleted (XREADEDGROUP).* This is a subset of blocking_keys*/dict *ready_keys;           /* Blocked keys that received a PUSH */dict *watched_keys;         /* WATCHED keys for MULTI/EXEC CAS *///当前的数据库IDint id;                     /* Database ID */long long avg_ttl;          /* Average TTL, just for stats */unsigned long expires_cursor; /* Cursor of the active expire cycle. */list *defrag_later;         /* List of key names to attempt to defrag one by one, gradually. */clusterSlotToKeyMapping *slots_to_keys; /* Array of slots to keys. Only used in cluster mode (db 0). */
} redisDb;

dict

struct dict {//dictType是一个struct里面存储了各种与hashtable相关的function pointer,详细的见下面dictType *type;/*正常情况下，使用ht_table[0]存储数据；发生扩容或者缩容时，用ht_table[1]。*/dictEntry **ht_table[2];/*对应着两个ht_table的元素个数;ht_used[0]表示ht_table[0]的对象总数;ht_used[1]表示ht_table[1]的对象总数.*/unsigned long ht_used[2];/*标记当前的hashtable是否处于rehash状态，如果rehashidx==-1则当前没有处于rehash状态，如果rehashidx>=0则表明当前处于rehash状态并且按照rehashidx指示的顺序进行迁移。*/long rehashidx; /* rehashing not in progress if rehashidx == -1 *//*该值大于0表示rehash终止，小于0表示编码错误*/int16_t pauserehash; /*通过ht_size_exp可以计算出两个表的一维长度也即是槽的个数。pow(2,ht_size_exp[0])表示ht_table[0]槽的个数；pow(2,ht_size_exp[1])表示ht_table[1]槽的个数；*/signed char ht_size_exp[2]; /*metadata是用于存储额外信息的字段，可以存储一些元数据*/void *metadata[];          
};

在这里插入图片描述

dictType

typedef struct dictType {uint64_t (*hashFunction)(const void *key);void *(*keyDup)(dict *d, const void *key);void *(*valDup)(dict *d, const void *obj);int (*keyCompare)(dict *d, const void *key1, const void *key2);void (*keyDestructor)(dict *d, void *key);void (*valDestructor)(dict *d, void *obj);int (*expandAllowed)(size_t moreMem, double usedRatio);/*如果设置了'no_value'标志，则表示没有使用值，即字典是一个集合。设置此标志时，无法访问dictEntry的值，也无法使用dicsetkey()。metadata也不能使用。*/unsigned int no_value:1;/*如果no_value =1并且所有的键都是奇数(LSB=1)，那么设置keys_are_odd =1可以实现另一个优化:在不分配dictEntry的情况下存储键。*/unsigned int keys_are_odd:1;size_t (*dictEntryMetadataBytes)(dict *d);size_t (*dictMetadataBytes)(void);void (*afterReplaceEntry)(dict *d, dictEntry *entry);
} dictType;

set是一个集合，它的底层实现也是dict，但是对于集合来说只有key值没有value值；所以为了兼容set的实现，dictType中有一个标志性的字段"no_value"，只要设置了该字段就表明这个dictEntry中只有key值没有value值，也就实现了set。

dictEntry

//dict中的entry
struct dictEntry {void *key;//指向key//union是指内存的同一个位置可以存储不同的数据类型，是为了兼容不同类型的value。//当value是uint64_t、int64_t、double的数据类型的时候，//可以直接内嵌在dictentry中，无需为此分配额外的内存，这样可以节省内存union {void *val;uint64_t u64;int64_t s64;double d;} v;struct dictEntry *next;     /* Next entry in the same hash bucket. 采用拉链法解决哈希冲突*/void *metadata[];           //存储额外的信息/*一个任意数量的字节（从指针对齐的地址开始），大小由dictType的dictEntryMetadataBytes()返回。*/
};

当no_value=1时对应的结构是

//只有key没有value相当于set
typedef struct {void *key;dictEntry *next;
} dictEntryNoValue;

宏定义

[redis-7.2.2\src\dict.h]

//根据ht_size_exp计算dictht_size
#define DICTHT_SIZE(exp) ((exp) == -1 ? 0 : (unsigned long)1<<(exp))
//获取sizemask
#define DICTHT_SIZE_MASK(exp) ((exp) == -1 ? 0 : (DICTHT_SIZE(exp))-1)

//每一个hashtable的初始化大小
#define DICT_HT_INITIAL_EXP      2
#define DICT_HT_INITIAL_SIZE     (1<<(DICT_HT_INITIAL_EXP))

#define dictFreeVal(d, entry) do {                     \if ((d)->type->valDestructor)                      \(d)->type->valDestructor((d), dictGetVal(entry)); \} while(0)#define dictFreeKey(d, entry) \if ((d)->type->keyDestructor) \(d)->type->keyDestructor((d), dictGetKey(entry))#define dictCompareKeys(d, key1, key2) \(((d)->type->keyCompare) ? \(d)->type->keyCompare((d), key1, key2) : \(key1) == (key2))#define dictEntryMetadataSize(d) ((d)->type->dictEntryMetadataBytes     \? (d)->type->dictEntryMetadataBytes(d) : 0)
#define dictMetadataSize(d) ((d)->type->dictMetadataBytes               \? (d)->type->dictMetadataBytes() : 0)

//获取key的哈希值
#define dictHashKey(d, key) ((d)->type->hashFunction(key))
//获取两个dictht的总slot个数
#define dictSlots(d) (DICTHT_SIZE((d)->ht_size_exp[0])+DICTHT_SIZE((d)->ht_size_exp[1]))
//获取两个dictht的总对象个数
#define dictSize(d) ((d)->ht_used[0]+(d)->ht_used[1])
//判断当前是否处在rehash阶段
#define dictIsRehashing(d) ((d)->rehashidx != -1)
//终止rehash
#define dictPauseRehashing(d) ((d)->pauserehash++)
//重新开始rehash
#define dictResumeRehashing(d) ((d)->pauserehash--)/* If our unsigned long type can store a 64 bit number, use a 64 bit PRNG. */
#if ULONG_MAX >= 0xffffffffffffffff
#define randomULong() ((unsigned long) genrand64_int64())
#else
#define randomULong() random()
#endif

散列函数

在这里插入图片描述

redis的字典默认的哈希函数是siphash，siphash算法即使在key很小的情况下，也可以产生随机性特别好的输出，性能非常突出。

散列冲突

通过dictEntry的结构中包含"struct entry *next 指向同一个slot的下一个next entry"可以得出，dict采用"拉链法"解决"散列冲突"。

在这里插入图片描述

dictEntry pointer bit tricks[指针位技巧]

/* 
指向dictEntry的指针中的最低3位决定了该指针实际指向的是什么。如果最小的位被设置，它就是一个键值。否则，最少的3位有效位标记条目的类型。
*/#define ENTRY_PTR_MASK     7 /* 111  与Mask相与获取数据的低三bit位*/
#define ENTRY_PTR_NORMAL   0 /* 000 已分配的entry并且带有value值*/
#define ENTRY_PTR_NO_VALUE 2 /* 010  已分配的entry但是不带有value值*/

/*返回1：entry pointer指向一个key值，而不是已经分配好的entry。其它情况返回0.
*/
static inline int entryIsKey(const dictEntry *de) {
//最低位设置了就是keyreturn (uintptr_t)(void *)de & 1;
}

/*entry pointer指向的是一个dictentry struct返回1否则返回0
*/
static inline int entryIsNormal(const dictEntry *de) {return ((uintptr_t)(void *)de & ENTRY_PTR_MASK) == ENTRY_PTR_NORMAL;
}

/*entry 指向的是一个不带value值得 dictentry struct返回1否则返回0*/
static inline int entryIsNoValue(const dictEntry *de) {return ((uintptr_t)(void *)de & ENTRY_PTR_MASK) == ENTRY_PTR_NO_VALUE;
}

/* Creates an entry without a value field. */
static inline dictEntry *createEntryNoValue(void *key, dictEntry *next) {dictEntryNoValue *entry = zmalloc(sizeof(*entry));entry->key = key;entry->next = next;//设置标记位ENTRY_PTR_NO_VALUE/*void*是普通指针相互转换的桥梁uintptr_t可以与void*相互转换uintptr_t可以参与指针计算    	*/return (dictEntry *)(void *)((uintptr_t)(void *)entry | ENTRY_PTR_NO_VALUE);
}

//编码，设置标志位
static inline dictEntry *encodeMaskedPtr(const void *ptr, unsigned int bits) {assert(((uintptr_t)ptr & ENTRY_PTR_MASK) == 0);return (dictEntry *)(void *)((uintptr_t)ptr | bits);
}
//解码，消除标志位
static inline void *decodeMaskedPtr(const dictEntry *de) {//非key才进行获取标志位操作assert(!entryIsKey(de));//"~"的优先级高于"&"，先进行取反操作后进行按位与操作//&~操作消除左操作数中与右操作数对应位置的1return (void *)((uintptr_t)(void *)de & ~ENTRY_PTR_MASK);
}//使用该函数之前确保dictEntry没有value,可以使用
//static inline int entryIsNoValue(const dictEntry *de) 进行判断
static inline dictEntryNoValue *decodeEntryNoValue(const dictEntry *de) {return decodeMaskedPtr(de);
}//如果entry有一个value值，也就是正常的ENTRY_PTR_NORMAL，返回1
static inline int entryHasValue(const dictEntry *de) {return entryIsNormal(de);
}

API implementation

_dictReset

/* Reset hash table parameters already initialized with _dictInit()*/
static void _dictReset(dict *d, int htidx)
{d->ht_table[htidx] = NULL;d->ht_size_exp[htidx] = -1;d->ht_used[htidx] = 0;
}

_dictInit

/* Initialize the hash table */
int _dictInit(dict *d, dictType *type)
{_dictReset(d, 0);_dictReset(d, 1);d->type = type;d->rehashidx = -1;d->pauserehash = 0;return DICT_OK;
}

dictCreate

//创建一个新的hashtable
dict *dictCreate(dictType *type)
{size_t metasize = type->dictMetadataBytes ? type->dictMetadataBytes() : 0;dict *d = zmalloc(sizeof(*d) + metasize);if (metasize) {memset(dictMetadata(d), 0, metasize);}_dictInit(d,type);return d;
}

dictGetHash

uint64_t dictGetHash(dict *d, const void *key) {return dictHashKey(d, key);
}

dictSetKey

void dictSetKey(dict *d, dictEntry* de, void *key) {//如果dictEntry设置了no_value标识，则不能使用该函数assert(!d->type->no_value);if (d->type->keyDup)de->key = d->type->keyDup(d, key);elsede->key = key;
}

dictSetVal

void dictSetVal(dict *d, dictEntry *de, void *val) {//entry有value值才可以设置assert(entryHasValue(de));//前面分析过，de->v是一个unionde->v.val = d->type->valDup ? d->type->valDup(d, val) : val;
}

dictSetNext

static void dictSetNext(dictEntry *de, dictEntry *next) {//分配好的entry struct才可以设置nextassert(!entryIsKey(de));if (entryIsNoValue(de)) {dictEntryNoValue *entry = decodeEntryNoValue(de);entry->next = next;} else {de->next = next;}
}

dictGetNext

/* Returns the 'next' field of the entry or 
NULL if the entry doesn't have a'next' field. 
*/
static dictEntry *dictGetNext(const dictEntry *de) {if (entryIsKey(de)) return NULL; /* there's no next */if (entryIsNoValue(de)) return decodeEntryNoValue(de)->next;return de->next;
}

dictGetVal

void *dictGetVal(const dictEntry *de) {assert(entryHasValue(de));return de->v.val;
}

dictGetKey

void *dictGetKey(const dictEntry *de) {if (entryIsKey(de)) return (void*)de;if (entryIsNoValue(de)) return decodeEntryNoValue(de)->key;return de->key;
}

_dictClear

/* Destroy an entire dictionary */
//销毁一个完整的字典
//callback回调函数，传入参数是dict*传出参数是void
int _dictClear(dict *d, int htidx, void(callback)(dict*)) {unsigned long i;//释放所有的元素for (i = 0; i < DICTHT_SIZE(d->ht_size_exp[htidx]) && d->ht_used[htidx] > 0; i++) {dictEntry *he, *nextHe;if (callback && (i & 65535) == 0) callback(d);if ((he = d->ht_table[htidx][i]) == NULL) continue;while(he) {nextHe = dictGetNext(he);//释放keydictFreeKey(d, he);//释放valdictFreeVal(d, he);//如果entry he不是一个key，释放entry structif (!entryIsKey(he)) zfree(decodeMaskedPtr(he));//元素个数减一d->ht_used[htidx]--;he = nextHe;}}/* Free the table and the allocated cache structure *///释放整个表zfree(d->ht_table[htidx]);/* Re-initialize the table *///初始化d[htidx]_dictReset(d, htidx);return DICT_OK; /* never fails */
}

dictEmpty

void dictEmpty(dict *d, void(callback)(dict*)) {
//清除第一个表dictht[0]_dictClear(d,0,callback);//清除第二个表dictht[1]_dictClear(d,1,callback);//重置rehashidx和pauserehashd->rehashidx = -1;d->pauserehash = 0;
}

dictRelease

/* Clear & Release the hash table */
void dictRelease(dict *d)
{
//清除第一个表dictht[0]_dictClear(d,0,NULL);//清除第二个表dictht[1]_dictClear(d,1,NULL);//释放字典zfree(d);
}

扩容

dictResize|dictExpand|_dictExpand|_dictNextExp

这个函数是用来重新设置dictht的大小。在达到扩容条件或者缩容条件的时候，进行内存重新分配的时候就会用到此函数计算出正确的内存大小。

typedef enum {DICT_RESIZE_ENABLE,DICT_RESIZE_AVOID,DICT_RESIZE_FORBID,
} dictResizeEnable;
static dictResizeEnable dict_can_resize = DICT_RESIZE_ENABLE;

/*
将表的大小调整为包含所有元素的最小大小,并且还要保证负载因子"used(表中的元素个数)/size(表的长度)"<=1;
*/
int dictResize(dict *d)
{unsigned long minimal;//如果当前的hashtable处于不能resize或者正在rehash的状态，则不能进行扩容或者缩容if (dict_can_resize != DICT_RESIZE_ENABLE || dictIsRehashing(d)) return DICT_ERR;//获取旧表的元素个数minimal = d->ht_used[0];//#define DICT_HT_INITIAL_EXP      2//#define DICT_HT_INITIAL_SIZE     (1<<(DICT_HT_INITIAL_EXP))if (minimal < DICT_HT_INITIAL_SIZE)minimal = DICT_HT_INITIAL_SIZE;return dictExpand(d, minimal);
}

第一步先矫正minimal。
之后调用dictExpand，先根据_dictNextExp计算新表的容量之后重新分配内存。

/* return DICT_ERR if expand was not performed */
int dictExpand(dict *d, unsigned long size) {return _dictExpand(d, size, NULL);
}

辅助函数dictNextExp

//返回大于等于size的第一个pow(2,exp)中的exp
static signed char _dictNextExp(unsigned long size)
{
//#define DICT_HT_INITIAL_EXP      2unsigned char e = DICT_HT_INITIAL_EXP;//2if (size >= LONG_MAX) return (8*sizeof(long)-1);while(1) {if (((unsigned long)1<<e) >= size)return e;e++;}
}

/* 成功分配返回DICT_OK，否则返回DICT_ERR*/
int _dictExpand(dict *d, unsigned long size, int* malloc_failed)
{//清空指针if (malloc_failed) *malloc_failed = 0;//正处于rehashing阶段或者申请内存小于当前元素个数[发生这种可能是刚刚迁移完数据，新表替代旧表]if (dictIsRehashing(d) || d->ht_used[0] > size)return DICT_ERR;// new hashtabledictEntry **new_ht_table;// the use of the new hashtableunsigned long new_ht_used;//根据size[旧表容量]计算出新表的容量//作用是返回第一次大于等于size的pow(2,exp)的expsigned char new_ht_size_exp = _dictNextExp(size);//检测是否溢出size_t newsize = 1ul<<new_ht_size_exp;if (newsize < size || newsize * sizeof(dictEntry*) < newsize)return DICT_ERR;//新表的大小等于旧表的大小if (new_ht_size_exp == d->ht_size_exp[0]) return DICT_ERR;/* Allocate the new hash table and initialize all pointers to NULL *///malloc_failed记录是否分配成功if (malloc_failed) {new_ht_table = ztrycalloc(newsize*sizeof(dictEntry*));*malloc_failed = new_ht_table == NULL;if (*malloc_failed)return DICT_ERR;} elsenew_ht_table = zcalloc(newsize*sizeof(dictEntry*));new_ht_used = 0;//重置新表的元素个数//d->ht_table[0]==NULL表明是第一次插入数据，此时d->ht_table被初始化默认的大小4if (d->ht_table[0] == NULL) {d->ht_size_exp[0] = new_ht_size_exp;d->ht_used[0] = new_ht_used;d->ht_table[0] = new_ht_table;return DICT_OK;}/* Prepare a second hash table for incremental rehashing *///为rehashing做准备，设置ht_table[1]d->ht_size_exp[1] = new_ht_size_exp;d->ht_used[1] = new_ht_used;d->ht_table[1] = new_ht_table;d->rehashidx = 0;//从0号索引开始迁移//此时只是为rehashing做了准备阶段，并没有真正的开启迁移数据return DICT_OK;
}

扩容触发条件

随着数据量的不断增大，哈希碰撞产生的可能性越来越大，同一个槽内的链表越来越长，为了保持查找，删除，添加的效率，需要进行扩容。所以我们从dictAdd函数下手。

dictAdd

/* Add an element to the target hash table */
int dictAdd(dict *d, void *key, void *val)
{//dictAddRaw找出key合适的插入位置并插入，如果已经存在返回NULLdictEntry *entry = dictAddRaw(d,key,NULL);//key已经存在if (!entry) return DICT_ERR;//没有设置no_value标识，设置相应的value值if (!d->type->no_value) dictSetVal(d, entry, val);return DICT_OK;
}

dictAddRaw

/**/
dictEntry *dictAddRaw(dict *d, void *key, dictEntry **existing)
{//寻找key的插入位置，如果key已经存在返回NULLvoid *position = dictFindPositionForInsert(d, key, existing);//key已经存在if (!position) return NULL;/* Dup the key if necessary. */if (d->type->keyDup) key = d->type->keyDup(d, key);//在合适的位置插入key，此时不设置对应的key，是为了满足用户根据自己的意愿设置或者不设置value值。return dictInsertAtPosition(d, key, position);
}

dictFindPositionForInsert

//寻找目标key的插入位置，如果key已经存在返回NULL
void *dictFindPositionForInsert(dict *d, const void *key, dictEntry **existing) {unsigned long idx, table;dictEntry *he;//获取key对应的hash值uint64_t hash = dictHashKey(d, key);if (existing) *existing = NULL;/*如果当前处于rehash的状态[rehashidx!=-1]，进行数据的迁移操作。这也是数据迁移触发的条件之一针对迁移的详细分析在下面。*/if (dictIsRehashing(d)) _dictRehashStep(d);/* Expand the hash table if needed */if (_dictExpandIfNeeded(d) == DICT_ERR)return NULL;//开始查找for (table = 0; table <= 1; table++) {//哈希值与MASK相与，得出寻找的目标key在dictht的位置下标idx = hash & DICTHT_SIZE_MASK(d->ht_size_exp[table]);//获取下标所在位置的第一个dictEntryhe = d->ht_table[table][idx];//像遍历链表那样，依次寻找目标keywhile(he) {//获取dictEntry的key值void *he_key = dictGetKey(he);if (key == he_key || dictCompareKeys(d, key, he_key)) {//key存在，返回NULL；并将目标key存储在existing中if (existing) *existing = he;return NULL;}//继续寻找下一个entryhe = dictGetNext(he);}//没有rehash,说明ht[1]没有，故不需要在ht[1]中寻找，直接退出外层循环。if (!dictIsRehashing(d)) break;}//走到这一步说明在ht中没有找到目标key，返回插入位置为插入操作做准备//如果正处于rehash,插入位置在ht[1]中，否则插入在ht[0]中。[头插法]dictEntry **bucket = &d->ht_table[dictIsRehashing(d) ? 1 : 0][idx];return bucket;
}

_dictExpandIfNeeded

/* Expand the hash table if needed */
static int _dictExpandIfNeeded(dict *d)
{//如果正在rehashing就直接返回//迁移数据的阶段不需要扩容if (dictIsRehashing(d)) return DICT_OK;//第一插入数据，将ht[0]扩大为初始的大小if (DICTHT_SIZE(d->ht_size_exp[0]) == 0) return dictExpand(d, DICT_HT_INITIAL_SIZE);/*检验是否允许expand,详细代码如下不允许的话，直接返回。*/if (!dictTypeExpandAllowed(d))return DICT_OK;//以下是扩容触发的条件if ((dict_can_resize == DICT_RESIZE_ENABLE &&d->ht_used[0] >= DICTHT_SIZE(d->ht_size_exp[0])) ||(dict_can_resize != DICT_RESIZE_FORBID &&d->ht_used[0] / DICTHT_SIZE(d->ht_size_exp[0]) > dict_force_resize_ratio)){return dictExpand(d, d->ht_used[0] + 1);}return DICT_OK;
}

/* Using dictEnableResize() / dictDisableResize() we make possible to* enable/disable resizing of the hash table as needed. This is very important* for Redis, as we use copy-on-write and don't want to move too much memory* around when there is a child performing saving operations.*  * Note that even when dict_can_resize is set to 0, not all resizes are* prevented: a hash table is still allowed to grow if the ratio between* the number of elements and the buckets > dict_force_resize_ratio. */
static unsigned int dict_force_resize_ratio = 5;

翻译一下上述的那段英文。在进行copy-on-write[写时复制，执行bgsave或者aofrewrite的时候会发生cop]，为了避免过多的内存从child中分离，此时不希望进行扩容操作。
如果装载因子超过安全值，不论当前有没有发生写时复制都会执行扩容操作。

dictTypeExpandAllowed

/*
扩容的时候，因为要一次性分配足够大的内存，所以需要根据成员函数"expandAlloewd"判断是否能够完成本次分配。
*/
static int dictTypeExpandAllowed(dict *d) {if (d->type->expandAllowed == NULL) return 1;return d->type->expandAllowed(DICTHT_SIZE(_dictNextExp(d->ht_used[0] + 1)) * sizeof(dictEntry*),(double)d->ht_used[0] / DICTHT_SIZE(d->ht_size_exp[0]));
}

expandAllowed的第一个参数是计算扩容之后新的容量，也即是第一次大于等于(d->ht_used[0]+1)的pow(2,exp)[这里的d->ht_used[0]加1是因为，需要先判断是否需要扩容，接着才会把新的key加入；所以计算的时候，新key还没有加入表中但是要计算的时候要将其包括在内。]
expandAllowed的第二个参数是，哈希表的装载因子

扩容策略

在这里插入图片描述

插入一个新的key之前，先判断是否需要扩容，如果需要扩容的话，先申请新的更大的空间，之后再将新的key插入新的表中。
扩容的原则就是"在满足能够包含所有元素[包括新插入的key]的基础上，保证新表的大小是最小的pow(2,exp)"。

扩容触发条件

在这里插入图片描述

扩容的触发条件1。装载因子大于等于1并且当前没有进行写时复制[bgsave，aofrewrite]
扩容的触发条件2。装载因子大于5.

dictInsertAtPosition

通过"dictFindPositionForInsert"找到目标key的插入位置，[key已经存在返回NULL此时不需要插入]。通过"dictInsertAtPosition"插入目标key。


dictEntry *dictInsertAtPosition(dict *d, void *key, void *position) {dictEntry **bucket = position; /* It's a bucket, but the API hides that. */dictEntry *entry;//判断插入位置position是否适当合理int htidx = dictIsRehashing(d) ? 1 : 0;assert(bucket >= &d->ht_table[htidx][0] &&bucket <= &d->ht_table[htidx][DICTHT_SIZE_MASK(d->ht_size_exp[htidx])]);size_t metasize = dictEntryMetadataSize(d);//如果设置了no_value标识if (d->type->no_value) {//不能使用metadataassert(!metasize); /* Entry metadata + no value not supported. */if (d->type->keys_are_odd && !*bucket) {/* We can store the key directly in the destination bucket without the* allocated entry.** TODO: Add a flag 'keys_are_even' and if set, we can use this* optimization for these dicts too. We can set the LSB bit when* stored as a dict entry and clear it again when we need the key* back. */entry = key;assert(entryIsKey(entry));} else {/* Allocate an entry without value. */entry = createEntryNoValue(key, *bucket);}} else {entry = zmalloc(sizeof(*entry) + metasize);assert(entryIsNormal(entry)); /* Check alignment of allocation */if (metasize > 0) {memset(dictEntryMetadata(entry), 0, metasize);}//link newentryentry->key = key;entry->next = *bucket;}*bucket = entry;d->ht_used[htidx]++;return entry;
}

通过代码可以发现，插入的操作很简单就是头插法

缩容

随着删除操作的不断执行，表中的数据越来越少，为了节约内存空间，需要把当前的表在满足装下所有元素的基础上进行缩小。所以从"Delete操作"入手。
[redis-7.2.2\src\t_hash.c]

dictDelete

//成功删除返回DICT_OK，否则返回DICT_ERR
int dictDelete(dict *ht, const void *key) {return dictGenericDelete(ht,key,0) ? DICT_OK : DICT_ERR;
}

//找到目标key并删除
static dictEntry *dictGenericDelete(dict *d, const void *key, int nofree) {uint64_t h, idx;dictEntry *he, *prevHe;int table;/* dict is empty */if (dictSize(d) == 0) return NULL;//此时正处于rehash阶段，先进行数据的迁移工作if (dictIsRehashing(d)) _dictRehashStep(d);//获取目标key的哈希值h = dictHashKey(d, key);for (table = 0; table <= 1; table++) {//获取目标key在ht中的位置下标idx = h & DICTHT_SIZE_MASK(d->ht_size_exp[table]);//获取下标所在的buckethe = d->ht_table[table][idx];prevHe = NULL;//遍历链表while(he) {//获取entry指向的keyvoid *he_key = dictGetKey(he);//找到目标keyif (key == he_key || dictCompareKeys(d, key, he_key)) {//目标key处在中间位置if (prevHe)dictSetNext(prevHe, dictGetNext(he));else//当前目标节点是bucket中的第一个节点d->ht_table[table][idx] = dictGetNext(he);if (!nofree) {//释放节点dictFreeUnlinkedEntry(d, he);}//元素个数减一d->ht_used[table]--;return he;}//保存prevhe,继续检测下一个entryprevHe = he;he = dictGetNext(he);}//没有rehash无需寻找ht[1]if (!dictIsRehashing(d)) break;}return NULL; /* not found */
}

htNeedsResize

int htNeedsResize(dict *dict) {long long size, used;//获取dict中两个ht的buckets长度之和size = dictSlots(dict);//获取dict中两个ht的元素总个数used = dictSize(dict);//#define HASHTABLE_MIN_FILL        10      /* Minimal hash table fill 10% */return (size > DICT_HT_INITIAL_SIZE &&(used*100/size < HASHTABLE_MIN_FILL));
}

缩容条件

在这里插入图片描述

缩容条件：装载因子小于0.1

缩容策略

if (htNeedsResize(o->ptr)) dictResize(o->ptr);

dictResize前面分析过：获取并修正旧表ht[0]的元素个数，以此为基础进行扩容，扩大[缩小为]为
大于等于used的第一个pow(2,exp)

迁移

迁移时机

扩容只是第一步，接下来需要逐步，以增量的方式迁移数据，将旧表中的数据迁移到新表，然后用新表替代旧表，将新表重置待下次扩容[缩容]时使用。

通过以上"扩容，缩容的分析"，我们可以发现，迁移触发的时机有以下两个
在这里插入图片描述

在hashtable中寻找新key的目标位置的时候，如果当前正处在rehash阶段，会先rehash进行数据的迁移，[如果不处于rehash阶段，会先判断是否需要扩容，先扩容]，然后会遍历key所在的槽判断key是否已经存在，不存在返回应该插入的位置，已经存在返回NULL。

在这里插入图片描述

删除一个key的时候，如果当前处于rehash阶段，会先进行rehash数据的迁移，之后遍历寻找目标key，找到之后删除key。

总结一下，就是在执行写操作的时候会触发数据的迁移rehash。可是也存在一个问题，如果线上客户端都不在执行删除，修改，插入这些写操作，那永远都不会触发迁移，那旧表中的数据该如何安置。其实redis服务器会有定时任务进行数据的迁移，即使线上没有写操作的执行也会进行数据的迁移。定时任务在后面介绍

接下俩看看，迁移的流程

迁移步骤

_dictRehashStep

/*
该函数由字典中的常见查找或更新操作调用，以便哈希表在活跃使用时自动从H1迁移到H2。也就是所查找和更新操作会触发rehash而且每次只rehash一个位置处[rehashidx指向的位置]的key链表
*/
static void _dictRehashStep(dict *d) {
//如果rehash没有被终止，就进行数据的迁移if (d->pauserehash == 0) dictRehash(d,1);
}

dictRehash

/*
执行N步增量散列。如果仍有键需要从old-hashtable迁移到new-hashtable则返回1，否则返回0；
一个rehash步骤在于移动一个bucket[包括产生hash冲突的key即一个槽内所有的key]从old-hashtable到new-hashtable；
由于hashtable的一部分可能由空白空间组成，因此不能保证此函数会rehash整个单个bucket，因为最多可以访问N*10个empty bucket，超过将会停止当前轮的rehash，该函数会阻塞很长时间
*/
int dictRehash(dict *d, int n) {int empty_visits = n*10; //最多能够访问N*10个empty bucket//hashatable[0]的sizeunsigned long s0 = DICTHT_SIZE(d->ht_size_exp[0]);//hashatable[1]的sizeunsigned long s1 = DICTHT_SIZE(d->ht_size_exp[1]);//如果当前的状态处于禁止rehash或者，没有设置rehashidx直接返回if (dict_can_resize == DICT_RESIZE_FORBID || !dictIsRehashing(d)) return 0;if (dict_can_resize == DICT_RESIZE_AVOID && ((s1 > s0 && s1 / s0 < dict_force_resize_ratio) ||(s1 < s0 && s0 / s1 < dict_force_resize_ratio))){return 0;}//开始进行迁移，n表示迁移的步数//如果过hashtable[0]没有元素则表示迁移结束while(n-- && d->ht_used[0] != 0) {dictEntry *de, *nextde;/*确保rehashidx没有超出范围 */assert(DICTHT_SIZE(d->ht_size_exp[0]) > (unsigned long)d->rehashidx);//从rehashidx开始，寻找一个非空的bucket，最多只能有n*10个empty bucketwhile(d->ht_table[0][d->rehashidx] == NULL) {d->rehashidx++;//遍历下一个bucketif (--empty_visits == 0) return 1;}//获取rehashidx指向槽的第一个Entryde = d->ht_table[0][d->rehashidx];//相当于遍历单链表while(de) {uint64_t h;//获取下一个dictentrynextde = dictGetNext(de);//从de中找出keyvoid *key = dictGetKey(de);//扩容状态，获取entry在新表中的位置if (d->ht_size_exp[1] > d->ht_size_exp[0]) {//重新计算哈希值h = dictHashKey(d, key) & DICTHT_SIZE_MASK(d->ht_size_exp[1]);} else {//处在缩容阶段h = d->rehashidx & DICTHT_SIZE_MASK(d->ht_size_exp[1]);}//设置了no_value标识if (d->type->no_value) {if (d->type->keys_are_odd && !d->ht_table[1][h]) {assert(entryIsKey(key));if (!entryIsKey(de)) zfree(decodeMaskedPtr(de));de = key;} else if (entryIsKey(de)) {/* We don't have an allocated entry but we need one. */de = createEntryNoValue(key, d->ht_table[1][h]);} else {/* Just move the existing entry to the destination table and* update the 'next' field. */assert(entryIsNoValue(de));dictSetNext(de, d->ht_table[1][h]);}} else {//将de插入newhashtable对应的位置处dictSetNext(de, d->ht_table[1][h]);}//修改槽的位置d->ht_table[1][h] = de;//ht[0]的元素个数减1d->ht_used[0]--;//ht[1]的元素个数加1d->ht_used[1]++;//继续迁移槽内的下一个entryde = nextde;}//ht[0]rehashidx指向的bucket已经全部迁移到ht[1]中，将其置为空d->ht_table[0][d->rehashidx] = NULL;d->rehashidx++;//为下一次rehash做准备}/* Check if we already rehashed the whole table... *///rehash完成，释放hashtable[0];//hashatable[1]成为hashtable[0]if (d->ht_used[0] == 0) {//释放ht[0]zfree(d->ht_table[0]);/* Copy the new ht onto the old one */d->ht_table[0] = d->ht_table[1];d->ht_used[0] = d->ht_used[1];d->ht_size_exp[0] = d->ht_size_exp[1];//重置ht1_dictReset(d, 1);//关闭rehash标识d->rehashidx = -1;//迁移全部完成返回0return 0;}/* More to rehash... */return 1;
}

迁移的顺序

通过源码分析，可以得出迁移的顺序是按照"rehashidx"进行的，并且每次只迁移一个非空的bucket，寻找非空的bucket时最多只能扫描到n*10个 empty bucket。[这里的n表示每次进行几次迁移操作，每次只迁移一次]

迁移何时停止，或者说如何判断迁移是否完成

分析源码可以发现，ht_used[0]==0表示数据迁移全部完成。即是否迁移完成是根据旧表是否还有元素来进行判断的。

redis服务器定时任务----迁移数据

为了防止，线上的客户端不再执行写操作(hset,hdel等指令)，导致迁移操作无法继续进行。redis会在定时任务对字典进行主动搬迁。
[redis-7.2.2\src\server.c]


void databasesCron(void) {//通过随机采样删除过期key，从节点不需要主动删除//通过主节点同步del语句即可if (server.active_expire_enabled) {if (iAmMaster()) {activeExpireCycle(ACTIVE_EXPIRE_CYCLE_SLOW);} else {expireSlaveKeys();}}/* Defrag keys gradually. */activeDefragCycle();/*如果需要，执行散列表重新散列，但只有在没有其他进程在磁盘上保存DB时才执行。否则，重新散列是不好的，因为会导致大量的写时复制内存页。*/if (!hasActiveChildProcess()) {static unsigned int resize_db = 0;static unsigned int rehash_db = 0;//#define CRON_DBS_PER_CALL 16int dbs_per_call = CRON_DBS_PER_CALL;int j;/* Don't test more DBs than we have. */if (dbs_per_call > server.dbnum) dbs_per_call = server.dbnum;/* Resize */for (j = 0; j < dbs_per_call; j++) {tryResizeHashTables(resize_db % server.dbnum);resize_db++;}/* Rehash */if (server.activerehashing) {for (j = 0; j < dbs_per_call; j++) {int work_done = incrementallyRehash(rehash_db);if (work_done) {/* If the function did some work, stop here, we'll do* more at the next cron loop. */break;} else {/* If this db didn't need rehash, we'll try the next one. */rehash_db++;rehash_db %= server.dbnum;}}}}
}

/* If the percentage of used slots in the HT reaches HASHTABLE_MIN_FILL* we resize the hash table to save memory */
void tryResizeHashTables(int dbid) {if (htNeedsResize(server.db[dbid].dict))dictResize(server.db[dbid].dict);if (htNeedsResize(server.db[dbid].expires))dictResize(server.db[dbid].expires);
}

/*
我们的哈希表实现在我们从哈希表中写入/读取时执行增量的重新哈希。但是，如果服务器空闲，哈希表将长时间使用两个表。因此，我们尝试在每次调用该函数时使用1毫秒的CPU时间来执行一些重新散列。
如果执行了一些散列，该函数返回1，否则返回0。
*/
int incrementallyRehash(int dbid) {/* Keys dictionary */if (dictIsRehashing(server.db[dbid].dict)) {dictRehashMilliseconds(server.db[dbid].dict,1);return 1; /* already used our millisecond for this loop... */}/* Expires */if (dictIsRehashing(server.db[dbid].expires)) {dictRehashMilliseconds(server.db[dbid].expires,1);return 1; /* already used our millisecond for this loop... */}return 0;
}

旧版本中dict的结构

typedef struct dict {dictType *type;void *privdata;dictht ht[2];long rehashidx; /* rehashing not in progress if rehashidx == -1 */unsigned long iterators; /* number of iterators currently running */
} dict;/* This is our hash table structure. Every dictionary has two of this as we* implement incremental rehashing, for the old to the new table. */
typedef struct dictht {dictEntry **table;unsigned long size;unsigned long sizemask;unsigned long used;
} dictht;typedef struct dictEntry {void *key;union {void *val;uint64_t u64;int64_t s64;double d;} v;struct dictEntry *next;
} dictEntry;//Union允许在同一内存位置存储不同的数据类型，而Enum用于定义一组相关常量并赋予它们有意义的名称。

在这里插入图片描述

总结

负载因子ratio=used/buckets[表中的元素数量/哈希表一维数组长度]

扩容时机

ratio>=1并且不发生aofwrite，bgsave，这样做是为了防止更多的内存分离
ratio>5，强制进行扩容

缩容时机

ratio<0.1强制缩容，为了节省内存空间

扩容策略

新表的大小为第一次大于原表uesd+1的2的次幂[redis3.2.100版本是原表used*2]

缩容策略

容纳所有元素的最小大小；新表的大小为第一次大于原表uesd的2的次幂[redis3.2.100版本是原表used]

迁移的实现

迁移的时机。在"dictFindPositionForInsert"和"dictGenericDelete"这两个函数中会发生数据的迁移dictRehash，也就是线上执行写操作的时候会触发rehash。为了防止客户端下线不再执行写操作，dict长时间占用着两个表，redis后台线程会专门维护一个定时任务用来进行数据的迁移。
迁移的顺序。按照rehashidx指向的顺序进行数据的迁移，而且每次只迁移一个bucket。
迁移完成。如果旧表中的元素个数变为0则表明迁移完成。(通过源码可以发现，最外层循环是通过判断旧表中的元素个数是否为0，不为0的话进入循环内会继续判断rehashidx是否超过旧表数组的一维长度，所以我认为判断迁移是否完成是通过used和rehashidx共同完成的。)