本篇内容介绍了“怎么理解PostgreSQL的后台进程autovacuum”的有关知识,在实际案例的操作过程中,不少人都会遇到这样的困境,接下来就让小编带领大家学习一下如何处理这些情况吧!希望大家仔细阅读,能够学有所成!
一、数据结构
AutoVacuumShmem
主要的autovacuum共享内存结构体,存储在shared memory中,同时WorkerInfo也会存储在其中.
typedef struct{ sig_atomic_t av_signal[AutoVacNumSignals]; pid_t av_launcherpid; dlist_head av_freeWorkers; dlist_head av_runningWorkers; WorkerInfo av_startingWorker; AutoVacuumWorkItem av_workItems[NUM_WORKITEMS];} AutoVacuumShmemStruct;static AutoVacuumShmemStruct *AutoVacuumShmem;
avw_dbase
用于跟踪worker中的数据库的结构体
//用于跟踪worker中的数据库的结构体typedef struct avw_dbase{ Oid adw_datid; char *adw_name; TransactionId adw_frozenxid; MultiXactId adw_minmulti; PgStat_StatDBEntry *adw_entry;} avw_dbase;
二、源码解读
rebuild_database_list用于构建出现变化后的DatabaseList,链表中的数据库应出现在pgstats中,在autovacuum_naptime所设定的时间间隔范围内均匀分布。
比如autovacuum_naptime = 60s,有4个数据库db1->db4,那么每隔60s/4就会有启动一个autovacuum worker对相应的DB进行处理。
可能的一个处理时间序列是:db1->XX(时):XX(分):18(秒),db4->XX:XX:33,db4->XX:XX:48,db4->XX:XX:03
后续如需要对db1->db4进行vacuum,那么db1->db4会在下一个18秒、33秒、48秒和03秒触发autovacuum。
static voidrebuild_database_list(Oid newdb){ List *dblist; ListCell *cell; MemoryContext newcxt; MemoryContext oldcxt; MemoryContext tmpcxt; HASHCTL hctl; int score; int nelems; HTAB *dbhash; dlist_iter iter; autovac_refresh_stats(); newcxt = AllocSetContextCreate(AutovacMemCxt, "AV dblist", ALLOCSET_DEFAULT_SIZES); tmpcxt = AllocSetContextCreate(newcxt, "tmp AV dblist", ALLOCSET_DEFAULT_SIZES); oldcxt = MemoryContextSwitchTo(tmpcxt); hctl.keysize = sizeof(Oid); hctl.entrysize = sizeof(avl_dbase); hctl.hcxt = tmpcxt; dbhash = hash_create("db hash", 20, &hctl, HASH_ELEM | HASH_BLOBS | HASH_CONTEXT); score = 0;//分值从0开始 if (OidIsValid(newdb)) { avl_dbase *db; PgStat_StatDBEntry *entry; //只关注存在pgstat条目的数据库 entry = pgstat_fetch_stat_dbentry(newdb); if (entry != NULL) { db = hash_search(dbhash, &newdb, HASH_ENTER, NULL); db->adl_score = score++; } } //从现存链表中插入到数据库中 dlist_foreach(iter, &DatabaseList) { avl_dbase *avdb = dlist_container(avl_dbase, adl_node, iter.cur); avl_dbase *db; bool found; PgStat_StatDBEntry *entry; entry = pgstat_fetch_stat_dbentry(avdb->adl_datid); if (entry == NULL) continue; db = hash_search(dbhash, &(avdb->adl_datid), HASH_ENTER, &found); if (!found) { db->adl_score = score++; } } //插入先前没有处理过的数据库 dblist = get_database_list(); foreach(cell, dblist) { avw_dbase *avdb = lfirst(cell); avl_dbase *db; bool found; PgStat_StatDBEntry *entry; //只考虑存在pgstat的数据库 entry = pgstat_fetch_stat_dbentry(avdb->adw_datid); if (entry == NULL) continue; db = hash_search(dbhash, &(avdb->adw_datid), HASH_ENTER, &found); if (!found) { db->adl_score = score++; } } nelems = score; MemoryContextSwitchTo(newcxt); dlist_init(&DatabaseList); if (nelems > 0) { TimestampTz current_time; int millis_increment; avl_dbase *dbary; avl_dbase *db; HASH_SEQ_STATUS seq; int i; //放到数组中 dbary = palloc(nelems * sizeof(avl_dbase)); i = 0; hash_seq_init(&seq, dbhash); while ((db = hash_seq_search(&seq)) != NULL) memcpy(&(dbary[i++]), db, sizeof(avl_dbase)); //排序 qsort(dbary, nelems, sizeof(avl_dbase), db_comparator); //确定数据库之间的调度间隔:autovacuum_naptime/数据库个数 millis_increment = 1000.0 * autovacuum_naptime / nelems; if (millis_increment <= MIN_AUTOVAC_SLEEPTIME) millis_increment = MIN_AUTOVAC_SLEEPTIME * 1.1; current_time = GetCurrentTimestamp(); for (i = 0; i < nelems; i++) { avl_dbase *db = &(dbary[i]); current_time = TimestampTzPlusMilliseconds(current_time, millis_increment); db->adl_next_worker = current_time; dlist_push_head(&DatabaseList, &db->adl_node); } } if (DatabaseListCxt != NULL) MemoryContextDelete(DatabaseListCxt); MemoryContextDelete(tmpcxt); DatabaseListCxt = newcxt; MemoryContextSwitchTo(oldcxt);}
三、跟踪分析
启动gdb,设置信号处理,设置断点
(gdb) b rebuild_database_listBreakpoint 1 at 0x82eb2a: file autovacuum.c, line 931.(gdb) handle SIGINT print nostop passSIGINT is used by the debugger.Are you sure you want to change it? (y or n) ySignal Stop Print Pass to program DescriptionSIGINT No Yes Yes Interrupt(gdb) cContinuing.^CProgram received signal SIGINT, Interrupt.
进入断点
Breakpoint 1, rebuild_database_list (newdb=0) at autovacuum.c:931931 autovac_refresh_stats();(gdb) n933 newcxt = AllocSetContextCreate(AutovacMemCxt,(gdb) 936 tmpcxt = AllocSetContextCreate(newcxt,(gdb) 939 oldcxt = MemoryContextSwitchTo(tmpcxt);(gdb) 957 hctl.keysize = sizeof(Oid);(gdb) 958 hctl.entrysize = sizeof(avl_dbase);(gdb) 959 hctl.hcxt = tmpcxt;
查看统计信息文件:pg_stat_tmp/global.stat
(gdb) p *pgstat_stat_filename$1 = 112 'p'(gdb) p pgstat_stat_filename$2 = 0x203d7e0 "pg_stat_tmp/global.stat"(gdb) n960 dbhash = hash_create("db hash", 20, &hctl, (gdb) ###[pg12@localhost pg_stat_tmp]$ pwd/data/pgsql/pg121db/pg_stat_tmp[pg12@localhost pg_stat_tmp]$ lltotal 4-rw------- 1 pg12 pg12 237 Dec 11 16:40 global.stat[pg12@localhost pg_stat_tmp]$
构建需处理的数据库链表
964 score = 0;(gdb) 965 if (OidIsValid(newdb))(gdb) p *hctlStructure has no component named operator*.(gdb) p hctl$3 = {num_partitions = 140725872814104, ssize = 34131296, dsize = 32, max_dsize = 0, ffactor = 257, keysize = 4, entrysize = 40, hash = 0xc6afd3, match = 0x208cd60, keycopy = 0x0, alloc = 0x1, hcxt = 0x2090d80, hctl = 0xfe3a00 <ConfigureNamesString+4864>}(gdb) n984 dlist_foreach(iter, &DatabaseList)(gdb) p *DatabaseListStructure has no component named operator*.(gdb) p DatabaseList$4 = {head = {prev = 0xfd9880 <DatabaseList>, next = 0xfd9880 <DatabaseList>}}(gdb) n1010 dblist = get_database_list();(gdb) 1011 foreach(cell, dblist)(gdb) p *dblist$5 = {type = T_List, length = 7, head = 0x2090ef8, tail = 0x2091240}(gdb) p *dblist->head$6 = {data = {ptr_value = 0x2090e98, int_value = 34147992, oid_value = 34147992}, next = 0x2090fb0}(gdb) p *(Node *)dblist->head->data.ptr_value$7 = {type = 13591}(gdb) p *dblist->head->data.ptr_valueAttempt to dereference a generic pointer.(gdb) n1013 avw_dbase *avdb = lfirst(cell);(gdb)
如没有统计信息,则不予处理
1019 entry = pgstat_fetch_stat_dbentry(avdb->adw_datid);(gdb) p *avdb$8 = {adw_datid = 13591, adw_name = 0x2090ed0 "postgres", adw_frozenxid = 479, adw_minmulti = 1, adw_entry = 0x0}(gdb) n1020 if (entry == NULL)(gdb) 1011 foreach(cell, dblist)(gdb) 1013 avw_dbase *avdb = lfirst(cell);(gdb) 1019 entry = pgstat_fetch_stat_dbentry(avdb->adw_datid);(gdb) p *avdb$9 = {adw_datid = 16384, adw_name = 0x2090f90 "testdb", adw_frozenxid = 2921, adw_minmulti = 1, adw_entry = 0x0}(gdb) steppgstat_fetch_stat_dbentry (dbid=16384) at pgstat.c:24382438 backend_read_statsfile();(gdb) stepbackend_read_statsfile () at pgstat.c:56445644 TimestampTz min_ts = 0;(gdb) n5645 TimestampTz ref_ts = 0;(gdb) 5650 if (pgStatDBHash)(gdb) 5651 return;(gdb) 5766 }(gdb) pgstat_fetch_stat_dbentry (dbid=16384) at pgstat.c:24432443 return (PgStat_StatDBEntry *) hash_search(pgStatDBHash,(gdb) 2446 }(gdb) rebuild_database_list (newdb=0) at autovacuum.c:10201020 if (entry == NULL)(gdb) n1011 foreach(cell, dblist)(gdb) 1013 avw_dbase *avdb = lfirst(cell);(gdb) 1019 entry = pgstat_fetch_stat_dbentry(avdb->adw_datid);(gdb) 1020 if (entry == NULL)(gdb) 1011 foreach(cell, dblist)(gdb) 1013 avw_dbase *avdb = lfirst(cell);(gdb) 1019 entry = pgstat_fetch_stat_dbentry(avdb->adw_datid);(gdb) 1020 if (entry == NULL)(gdb) 1011 foreach(cell, dblist)(gdb) 1013 avw_dbase *avdb = lfirst(cell);(gdb) 1019 entry = pgstat_fetch_stat_dbentry(avdb->adw_datid);(gdb) 1020 if (entry == NULL)(gdb) 1011 foreach(cell, dblist)(gdb) 1013 avw_dbase *avdb = lfirst(cell);(gdb) 1019 entry = pgstat_fetch_stat_dbentry(avdb->adw_datid);(gdb) 1020 if (entry == NULL)(gdb) 1011 foreach(cell, dblist)(gdb) 1013 avw_dbase *avdb = lfirst(cell);(gdb) 1019 entry = pgstat_fetch_stat_dbentry(avdb->adw_datid);(gdb) 1020 if (entry == NULL)(gdb) 1011 foreach(cell, dblist)(gdb) 1032 nelems = score;(gdb) 1035 MemoryContextSwitchTo(newcxt);(gdb) n1036 dlist_init(&DatabaseList);(gdb)
所有数据库都不需要处理,返回
1038 if (nelems > 0)(gdb) p nelems$10 = 0(gdb) n1089 if (DatabaseListCxt != NULL)(gdb) 1091 MemoryContextDelete(tmpcxt);(gdb) 1092 DatabaseListCxt = newcxt;(gdb) 1093 MemoryContextSwitchTo(oldcxt);(gdb) 1094 }(gdb) AutoVacLauncherMain (argc=0, argv=0x0) at autovacuum.c:625625 while (!got_SIGTERM)(gdb)
“怎么理解PostgreSQL的后台进程autovacuum”的内容就介绍到这里了,感谢大家的阅读。如果想了解更多行业相关的知识可以关注编程网网站,小编将为大家输出更多高质量的实用文章!