PostgreSQL์—์„œ ์ž ๊ธˆ ๊ธฐ๋ก์„ ๊ฐ€์ ธ์˜ค๋Š” ๋ฐฉ๋ฒ• ์ค‘ ํ•˜๋‚˜

๊ธฐ์‚ฌ ๊ณ„์† โ€œPostgreSQL์šฉ ASH ์•„๋‚ ๋กœ๊ทธ๋ฅผ ์ƒ์„ฑํ•˜๋ ค๋Š” ์‹œ๋„ ".

이 기사에서는 구체적인 쿼리와 예제를 통해 pg_locks 뷰의 기록에서 어떤 유용한 정보를 얻을 수 있는지 살펴보고 보여드립니다.

경고
주제의 참신함과 아직 완료되지 않은 테스트 기간으로 인해 기사에 오류가 있을 수 있습니다. 비판과 논평은 적극 환영하고 기대합니다.

입력 데이터

pg_locks 뷰의 이력

archive_locking

-- Archive of sampled lock rows; per the surrounding article this is the
-- history of the pg_locks view, one row per lock entry per sample.
-- NOTE(review): the report queries in this article read
-- activity_hist.archive_locking, while this DDL is schema-unqualified, so the
-- table is created in the first schema on search_path — confirm that is
-- activity_hist.
CREATE TABLE archive_locking
(
	timepoint      timestamp ,  -- sample time (timestamp without time zone)
	locktype       text ,       -- lock type name, used as a grouping key by the reports
	relation       oid ,        -- presumably pg_locks.relation — TODO confirm
	mode           text ,       -- lock mode name, used as a grouping key by the reports
	tid            xid ,        -- presumably pg_locks.transactionid — TODO confirm
	vtid           text ,       -- presumably a virtual transaction id — TODO confirm
	pid            int4 ,       -- backend process id
	blocking_pids  int4[] ,     -- presumably the pids blocking this backend — TODO confirm
	granted        bool ,       -- reports treat TRUE as "lock held", FALSE as "waiting"
	queryid        int8         -- statement id; reports skip rows where this is NULL
);

๊ธฐ๋ณธ์ ์œผ๋กœ ํ…Œ์ด๋ธ”์€ ํ…Œ์ด๋ธ”๊ณผ ์œ ์‚ฌํ•ฉ๋‹ˆ๋‹ค. archive_pg_stat_activity, ์—ฌ๊ธฐ์— ๋” ์ž์„ธํžˆ ์„ค๋ช…๋˜์–ด ์žˆ์Šต๋‹ˆ๋‹ค. pg_stat_statements + pg_stat_activity + loq_query = pg_ash? ๊ทธ๋ฆฌ๊ณ  ์—ฌ๊ธฐ - PostgreSQL์šฉ ASH ์œ ์‚ฌ์ฒด๋ฅผ ์ƒ์„ฑํ•˜๋ ค๋Š” ์‹œ๋„์ž…๋‹ˆ๋‹ค.

queryid 열을 채우는 데에는 다음 함수가 사용됩니다.

update_history_locking_by_queryid

--update_history_locking_by_queryid.sql
--
-- Back-fills activity_hist.history_locking.queryid for the most recently
-- completed 5-minute window.
--
-- A lock series is the set of samples sharing (pid, locktype, mode) inside the
-- window. Its first sample time is matched against the statements the same pid
-- was seen running in activity_hist.history_pg_stat_activity: the statement
-- whose [query_start, last observed timepoint] interval contains that first
-- sample supplies the queryid for every row of the series.
--
-- Returns: always TRUE.
CREATE OR REPLACE FUNCTION update_history_locking_by_queryid() RETURNS boolean AS $$
DECLARE
  current_minute integer ;
  window_index integer ;            -- index of the 5-minute slot that contains now()

  current_hour_diff double precision ;

  start_period timestamp without time zone ;
  finish_period timestamp without time zone ;
BEGIN
  RAISE NOTICE '***update_history_locking_by_queryid';

  current_minute = floor( extract ( minute from now() ) )::integer ;

  -- Integer division on purpose: assigning a fractional minute/5 to an integer
  -- rounds to nearest (8/5 -> 2) and would pick a window that is still open.
  window_index = current_minute / 5 ;

  -- NOTE(review): hour_diff is presumably the hour offset between this server
  -- and the monitored endpoint — confirm. If no endpoint row matches, the
  -- offset stays NULL, both bounds become NULL and nothing is updated.
  SELECT hour_diff
  INTO current_hour_diff
  FROM endpoint
  WHERE is_need_monitoring ;

  IF current_minute < 5
  THEN
	RAISE NOTICE 'Current time is less than 5 minute.';
  END IF ;

  -- The window is always [slot start - 5 min, slot start]. In the first five
  -- minutes of an hour window_index is 0, so the window is the last five
  -- minutes of the previous hour (start before finish, never inverted).
  finish_period = date_trunc('hour',now()) + interval '5 minute' * window_index + (current_hour_diff * interval '1 hour') ;
  start_period = date_trunc('hour',now()) + interval '5 minute' * ( window_index - 1 ) + (current_hour_diff * interval '1 hour') ;

  RAISE NOTICE 'start_period = %', start_period;
  RAISE NOTICE 'finish_period = %', finish_period;

  -- Single set-based UPDATE instead of a per-row loop.
  WITH act_queryid AS
  (
	-- One row per statement seen in the window. "finished" is the last sample
	-- at which the (pid, query_start) pair was observed, taken over all of its
	-- rows, including rows whose queryid is NULL.
	SELECT
		pid ,
		query_start AS started ,
		queryid ,
		MAX ( MAX ( timepoint ) ) OVER ( PARTITION BY pid , query_start ) AS finished
	FROM
		activity_hist.history_pg_stat_activity
	WHERE
		timepoint BETWEEN start_period AND finish_period
	GROUP BY
		pid ,
		query_start ,
		queryid
  ),
  lock_pids AS
  (
	-- One row per sampled lock key, with the first sample time of its series.
	SELECT
		hl.pid ,
		hl.locktype ,
		hl.mode ,
		hl.timepoint ,
		MIN ( hl.timepoint ) OVER ( PARTITION BY hl.pid , hl.locktype , hl.mode ) AS started
	FROM
		activity_hist.history_locking hl
	WHERE
		hl.timepoint BETWEEN start_period AND finish_period
	GROUP BY
		hl.pid ,
		hl.locktype ,
		hl.mode ,
		hl.timepoint
  ),
  matched AS
  (
	-- Exactly one queryid per lock key. If several statements qualify, the one
	-- that started last wins, so repeated runs give the same result.
	SELECT DISTINCT ON ( lp.pid , lp.locktype , lp.mode , lp.timepoint )
		lp.pid ,
		lp.locktype ,
		lp.mode ,
		lp.timepoint ,
		aq.queryid
	FROM
		lock_pids lp
		INNER JOIN act_queryid aq
			ON lp.pid = aq.pid
			AND lp.started BETWEEN aq.started AND aq.finished
	WHERE
		aq.queryid IS NOT NULL
	ORDER BY
		lp.pid ,
		lp.locktype ,
		lp.mode ,
		lp.timepoint ,
		aq.started DESC ,
		aq.queryid
  )
  UPDATE activity_hist.history_locking AS target
  SET queryid = matched.queryid
  FROM matched
  WHERE
	target.pid = matched.pid AND
	target.locktype = matched.locktype AND
	target.mode = matched.mode AND
	target.timepoint = matched.timepoint ;

  RETURN TRUE ;
END
$$ LANGUAGE plpgsql;

설명: queryid 컬럼의 값은 history_locking 테이블에서 업데이트되며, 이후 archive_locking 테이블에 새 파티션이 생성될 때 해당 값이 이력 데이터에 저장됩니다.

출력

프로세스 전반에 대한 일반 정보입니다.

잠금 유형별 잠금 대기

쿼리

-- Total time spent waiting for locks, per lock type and mode.
-- Every non-granted sample row counts as one second.
-- NOTE(review): that assumes one sample per second — confirm the sampling period.
-- pg_stat_history_begin, pg_stat_history_end and current_hour_diff are not
-- defined in this snippet; the caller has to supply them.
SELECT
	al.locktype ,
	al.mode ,
	count(*) * interval '1 second' AS duration
FROM
	activity_hist.archive_locking AS al
WHERE
	al.timepoint BETWEEN pg_stat_history_begin + (current_hour_diff * interval '1 hour')
	                 AND pg_stat_history_end + (current_hour_diff * interval '1 hour')
	AND NOT al.granted
GROUP BY
	al.locktype ,
	al.mode
ORDER BY
	duration DESC

예

| 잠금 유형별 잠금 대기
+---------------+---------------------+----------
| locktype      | mode                | duration
+---------------+---------------------+----------
| transactionid | ShareLock           | 19:39:26
| tuple         | AccessExclusiveLock | 00:03:35
+---------------+---------------------+----------

์ž๋ฌผ์‡  ์ข…๋ฅ˜์— ๋”ฐ๋ฅธ ์ž๋ฌผ์‡  ์‚ฌ์šฉ

쿼리

-- Total time locks were held, per lock type and mode.
-- Every granted sample row counts as one second.
-- NOTE(review): that assumes one sample per second — confirm the sampling period.
-- pg_stat_history_begin, pg_stat_history_end and current_hour_diff are not
-- defined in this snippet; the caller has to supply them.
SELECT
	al.locktype ,
	al.mode ,
	count(*) * interval '1 second' AS duration
FROM
	activity_hist.archive_locking AS al
WHERE
	al.timepoint BETWEEN pg_stat_history_begin + (current_hour_diff * interval '1 hour')
	                 AND pg_stat_history_end + (current_hour_diff * interval '1 hour')
	AND al.granted
GROUP BY
	al.locktype ,
	al.mode
ORDER BY
	duration DESC

예

| 잠금 유형별 잠금 보유
+---------------+--------------------------+----------
| locktype      | mode                     | duration
+---------------+--------------------------+----------
| relation      | RowExclusiveLock         | 51:11:10
| virtualxid    | ExclusiveLock            | 48:10:43
| transactionid | ExclusiveLock            | 44:24:53
| relation      | AccessShareLock          | 20:06:13
| tuple         | AccessExclusiveLock      | 17:58:47
| tuple         | ExclusiveLock            | 01:40:41
| relation      | ShareUpdateExclusiveLock | 00:26:41
| object        | RowExclusiveLock         | 00:00:01
| transactionid | ShareLock                | 00:00:01
| extend        | ExclusiveLock            | 00:00:01
+---------------+--------------------------+----------

특정 queryid 요청에 대한 자세한 정보

QUERYID๋ณ„ ์ž ๊ธˆ ์œ ํ˜•๋ณ„ ์ž ๊ธˆ ๋Œ€๊ธฐ ์ค‘

쿼리

-- Lock waits broken down by backend, lock type/mode, statement and blockers.
-- "started" is the first sample of the (pid, locktype, mode) series inside the
-- reporting window; "duration" counts the distinct sample times of each output
-- group at one second per sample.
-- NOTE(review): that assumes one sample per second — confirm the sampling period.
-- pg_stat_history_begin, pg_stat_history_end and current_hour_diff are not
-- defined in this snippet; the caller has to supply them.
WITH
samples AS
(
	-- DISTINCT collapses rows that differ only in columns not selected here,
	-- so a sample time is counted once per output group.
	SELECT DISTINCT
		al.pid ,
		al.locktype ,
		al.mode ,
		al.timepoint ,
		al.queryid ,
		al.blocking_pids ,
		MIN ( al.timepoint ) OVER series AS started
	FROM
		activity_hist.archive_locking AS al
	WHERE
		al.timepoint BETWEEN pg_stat_history_begin + (current_hour_diff * interval '1 hour')
		                 AND pg_stat_history_end + (current_hour_diff * interval '1 hour')
		AND NOT al.granted
		AND al.queryid IS NOT NULL
	WINDOW series AS ( PARTITION BY al.pid , al.locktype , al.mode )
)
SELECT
	s.pid ,
	s.locktype ,
	s.mode ,
	s.started ,
	s.queryid ,
	s.blocking_pids ,
	COUNT(*) * interval '1 second' AS duration
FROM
	samples AS s
GROUP BY
	s.pid ,
	s.locktype ,
	s.mode ,
	s.started ,
	s.queryid ,
	s.blocking_pids
ORDER BY
	s.started

예

| QUERYID์˜ ์ž ๊ธˆ ์œ ํ˜•๋ณ„ ์ž ๊ธˆ ๋Œ€๊ธฐ ์ค‘ +----------+------------+------ --------------- +---------------+--- ---- -+---------+------------ --------- | PID| ์ž ๊ธˆ ์œ ํ˜•| ๋ชจ๋“œ| ์‹œ์ž‘๋จ| ์ฟผ๋ฆฌID| Blocking_pids| ๊ธฐ๊ฐ„ +------------+------------+----------- ---------+---------------+--------- -- --------+---------+------ -- - | 11288| ๊ฑฐ๋ž˜ID| ๊ณต์œ ์ž ๊ธˆ| 2019-09-17 10:00:00.302936| 389015618226997618| {11092}| 00:03:34 | 11626| ๊ฑฐ๋ž˜ID| ๊ณต์œ ์ž ๊ธˆ| 2019-09-17 10:00:21.380921| 389015618226997618| {12380}| 00:00:29 | 11626| ๊ฑฐ๋ž˜ID| ๊ณต์œ ์ž ๊ธˆ| 2019-09-17 10:00:21.380921| 389015618226997618| {11092}| 00:03:25 | 11626| ๊ฑฐ๋ž˜ID| ๊ณต์œ ์ž ๊ธˆ| 2019-09-17 10:00:21.380921| 389015618226997618| {12213}| 00:01:55 | 11626| ๊ฑฐ๋ž˜ID| ๊ณต์œ ์ž ๊ธˆ| 2019-09-17 10:00:21.380921| 389015618226997618| {12751}| 00:00:01 | 11629| ๊ฑฐ๋ž˜ID| ๊ณต์œ ์ž ๊ธˆ| 2019-09-17 10:00:24.331935| 389015618226997618| {11092}| 00:03:22 | 11629| ๊ฑฐ๋ž˜ID| ๊ณต์œ ์ž ๊ธˆ| 2019-09-17 10:00:24.331935| 389015618226997618| {12007}| 00:00:01 | 12007| ๊ฑฐ๋ž˜ID| ๊ณต์œ ์ž ๊ธˆ| 2019-09-17 10:05:03.327933| 389015618226997618| {11629}| 00:00:13 | 12007| ๊ฑฐ๋ž˜ID| ๊ณต์œ ์ž ๊ธˆ| 2019-09-17 10:05:03.327933| 389015618226997618| {11092}| 00:01:10 | 12007| ๊ฑฐ๋ž˜ID| ๊ณต์œ ์ž ๊ธˆ| 2019-09-17 10:05:03.327933| 389015618226997618| {11288}| 00:00:05 | 12213| ๊ฑฐ๋ž˜ID| ๊ณต์œ ์ž ๊ธˆ| 2019-09-17 10:06:07.328019| 389015618226997618| {12007}| 00:00:10

QUERYID๋ฅผ ํ†ตํ•œ ์ž ๊ธˆ ์œ ํ˜•๋ณ„ ์ž ๊ธˆ ์ˆ˜ํ–‰

쿼리

-- Held (granted) locks broken down by backend, lock type/mode, statement and
-- blockers. "started" is the first sample of the (pid, locktype, mode) series
-- inside the reporting window; "duration" counts the distinct sample times of
-- each output group at one second per sample.
-- NOTE(review): that assumes one sample per second — confirm the sampling period.
-- pg_stat_history_begin, pg_stat_history_end and current_hour_diff are not
-- defined in this snippet; the caller has to supply them.
WITH
samples AS
(
	-- DISTINCT collapses rows that differ only in columns not selected here,
	-- so a sample time is counted once per output group.
	SELECT DISTINCT
		al.pid ,
		al.locktype ,
		al.mode ,
		al.timepoint ,
		al.queryid ,
		al.blocking_pids ,
		MIN ( al.timepoint ) OVER series AS started
	FROM
		activity_hist.archive_locking AS al
	WHERE
		al.timepoint BETWEEN pg_stat_history_begin + (current_hour_diff * interval '1 hour')
		                 AND pg_stat_history_end + (current_hour_diff * interval '1 hour')
		AND al.granted
		AND al.queryid IS NOT NULL
	WINDOW series AS ( PARTITION BY al.pid , al.locktype , al.mode )
)
SELECT
	s.pid ,
	s.locktype ,
	s.mode ,
	s.started ,
	s.queryid ,
	s.blocking_pids ,
	COUNT(*) * interval '1 second' AS duration
FROM
	samples AS s
GROUP BY
	s.pid ,
	s.locktype ,
	s.mode ,
	s.started ,
	s.queryid ,
	s.blocking_pids
ORDER BY
	s.started

예

| QUERYID๋กœ ์ž ๊ธˆ ์œ ํ˜•๋ณ„๋กœ ์ž ๊ธˆ ์„ค์ • +----------+----------+------ --------------+ ---------------+------ ---+ -------+------------ -------- | PID| ์ž ๊ธˆ ์œ ํ˜•| ๋ชจ๋“œ| ์‹œ์ž‘๋จ| ์ฟผ๋ฆฌID| Blocking_pids| ๊ธฐ๊ฐ„ +------------+------------+----------- ---------+---------------+--------- -- --------+---------+------ -- - | 11288| ๊ด€๊ณ„| ํ–‰๋…์ ์ž ๊ธˆ| 2019-09-17 10:00:00.302936| 389015618226997618| {11092}| 00:03:34 | 11092| ๊ฑฐ๋ž˜ID| ๋…์ ์ž ๊ธˆ| 2019-09-17 10:00:00.302936| 389015618226997618| {}| 00:03:34 | 11288| ๊ด€๊ณ„| ํ–‰๋…์ ์ž ๊ธˆ| 2019-09-17 10:00:00.302936| 389015618226997618| {}| 00:00:10 | 11092| ๊ด€๊ณ„| ํ–‰๋…์ ์ž ๊ธˆ| 2019-09-17 10:00:00.302936| 389015618226997618| {}| 00:03:34 | 11092| ๊ฐ€์ƒID| ๋…์ ์ž ๊ธˆ| 2019-09-17 10:00:00.302936| 389015618226997618| {}| 00:03:34 | 11288| ๊ฐ€์ƒID| ๋…์ ์ž ๊ธˆ| 2019-09-17 10:00:00.302936| 389015618226997618| {11092}| 00:03:34 | 11288| ๊ฑฐ๋ž˜ID| ๋…์ ์ž ๊ธˆ| 2019-09-17 10:00:00.302936| 389015618226997618| {11092}| 00:03:34 | 11288| ํŠœํ”Œ| ์ ‘๊ทผ๋…์ ์ž ๊ธˆ| 2019-09-17 10:00:00.302936| 389015618226997618| {11092}| 00:03:34

잠금 기록을 사용하여 성능 사고를 분석합니다.

  1. pid=11288인 프로세스에 의해 실행된 queryid=389015618226997618인 요청이 2019-09-17 10:00:00부터 3분간 잠금을 기다리고 있었습니다.
  2. 잠금은 pid=11092인 프로세스에 의해 유지되었습니다.
  3. pid=11092인 프로세스가 queryid=389015618226997618인 요청을 실행하면서 2019-09-17 10:00:00부터 3분 동안 잠금을 유지했습니다.

결론

이제 가장 흥미롭고 유용한 부분, 즉 대기 및 잠금 이력에 대한 통계 수집과 사례 분석이 시작되기를 바랍니다.

์•ž์œผ๋กœ๋Š” ๋ช‡ ๊ฐ€์ง€ ๋ฉ”๋ชจ(์˜ค๋ผํด์˜ metalink์™€ ์œ ์‚ฌ)๋ฅผ ์–ป๊ฒŒ ๋  ๊ฒƒ์ด๋ผ๊ณ  ๋ฏฟ๊ณ  ์‹ถ์Šต๋‹ˆ๋‹ค.

바로 이러한 이유로, 사용된 방법론을 가능한 한 빨리 모든 사람에게 공개합니다.

๊ฐ€๊นŒ์šด ์‹œ์ผ ๋‚ด์— ํ”„๋กœ์ ํŠธ๋ฅผ github์— ๊ฒŒ์‹œํ•˜๋ ค๊ณ  ํ•ฉ๋‹ˆ๋‹ค.

출처 : habr.com

코멘트를 추가