Skip to content

1.现象

sql
han=# select max(create_time) from public.tbl_index_table where create_time>='2010-10-08';
han=# select max(create_time) from public.tbl_index_table where create_time>='2010-10-08';

ERROR: could not read block 41381 of relation 16779/24769/24938: read only 0 of 8192 bytes

看到这个错误信息,首先想到的是表 tbl_index_table 上有坏块,估计需要重建这张表。

2.查看表结构

sql
--查看表结构及表上的索引
han=# \d tbl_index_table;
         Table "public.tbl_index_table"
   Column   |      Type       |    Modifiers    
----------------+-----------------------------+------------------------
 total     | integer           |
 logined    | integer           |
 logining    | integer           |
 http      | integer           |
 rawtcp     | integer           |
 create_time  | timestamp without time zone | not null default now()
 logincountdesc | character varying      |
 logincountaddr | character varying      | not null
Indexes:
  "tbl_index_table_pkey" PRIMARY KEY, btree (create_time, logincountaddr)
  "index_tbl_index_table_create_time" btree (create_time)
--查看表结构及表上的索引
han=# \d tbl_index_table;
         Table "public.tbl_index_table"
   Column   |      Type       |    Modifiers    
----------------+-----------------------------+------------------------
 total     | integer           |
 logined    | integer           |
 logining    | integer           |
 http      | integer           |
 rawtcp     | integer           |
 create_time  | timestamp without time zone | not null default now()
 logincountdesc | character varying      |
 logincountaddr | character varying      | not null
Indexes:
  "tbl_index_table_pkey" PRIMARY KEY, btree (create_time, logincountaddr)
  "index_tbl_index_table_create_time" btree (create_time)

3.explain

sql
han=# explain  select max(create_time) from public.tbl_index_table where create_time>='2010-10-08';
                                                                   QUERY PLAN                                                                  
------------------------------------------------------------------------------------------------------------------------------------------------
 Result  (cost=0.04..0.05 rows=1 width=0)
   InitPlan
     ->  Limit  (cost=0.00..0.04 rows=1 width=8)
           ->  Index Scan Backward using index_tbl_index_table_create_time on tbl_index_table  (cost=0.00..66.28 rows=1507 width=8)
                 Index Cond: (create_time >= '2010-10-08 00:00:00'::timestamp without time zone)
                 Filter: (create_time IS NOT NULL)
(6 rows)

   -- 发现上面的查询走的是索引 index_tbl_index_table_create_time(Index Scan Backward),报错很可能发生在读取该索引的数据块时,猜测是索引有问题,而不是表本身有坏块。
han=# explain  select max(create_time) from public.tbl_index_table where create_time>='2010-10-08';
                                                                   QUERY PLAN                                                                  
------------------------------------------------------------------------------------------------------------------------------------------------
 Result  (cost=0.04..0.05 rows=1 width=0)
   InitPlan
     ->  Limit  (cost=0.00..0.04 rows=1 width=8)
           ->  Index Scan Backward using index_tbl_index_table_create_time on tbl_index_table  (cost=0.00..66.28 rows=1507 width=8)
                 Index Cond: (create_time >= '2010-10-08 00:00:00'::timestamp without time zone)
                 Filter: (create_time IS NOT NULL)
(6 rows)

   -- 发现上面的查询走的是索引 index_tbl_index_table_create_time(Index Scan Backward),报错很可能发生在读取该索引的数据块时,猜测是索引有问题,而不是表本身有坏块。

4.relation分析

sql
--根据报错信息,分析 relation 后面的三个数字 16779/24769/24938(依次为 表空间OID/数据库OID/relfilenode)
han=# select oid,relname from pg_class where oid=24938;
  oid  |                 relname                
-------+-----------------------------------------
 24938 | index_tbl_index_table_create_time
(1 row)

Time: 0.596 ms
han=# select oid,relname from pg_class where oid=24769;
 oid | relname
-----+---------
(0 rows)

Time: 0.369 ms
han=# select oid,relname from pg_class where oid=16779;
 oid | relname
-----+---------
(0 rows)

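   发现 24938 正好是表上的索引 index_tbl_index_table_create_time。前两个数字 16779 和 24769 分别是表空间 OID 和数据库 OID,应到 pg_tablespace 和 pg_database 中查询,所以在 pg_class 中查不到。另外,第三个数字严格来说是 relfilenode 而不是 oid,更准确的查法是 where relfilenode=24938(这里两者恰好一致)。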

--查看索引状态
han=# select * from pg_index where indexrelid=24938;
 indexrelid | indrelid | indnatts | indisunique | indisprimary | indisclustered | indisvalid | indcheckxmin | indisready | indkey | indclass | indoption | indexprs | indpred
------------+----------+----------+-------------+--------------+----------------+------------+--------------+------------+--------+----------+-----------+----------+---------
      24938 |    24823 |        1 | f           | f            | f              | t          | f            | t          | 6      | 10053    | 0         |          |
(1 row)

indisvalid=t 只表示索引在系统表中被标记为有效(可以被查询使用),并不能说明索引文件本身没有物理损坏。
--根据报错信息,分析 relation 后面的三个数字 16779/24769/24938(依次为 表空间OID/数据库OID/relfilenode)
han=# select oid,relname from pg_class where oid=24938;
  oid  |                 relname                
-------+-----------------------------------------
 24938 | index_tbl_index_table_create_time
(1 row)

Time: 0.596 ms
han=# select oid,relname from pg_class where oid=24769;
 oid | relname
-----+---------
(0 rows)

Time: 0.369 ms
han=# select oid,relname from pg_class where oid=16779;
 oid | relname
-----+---------
(0 rows)

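   发现 24938 正好是表上的索引 index_tbl_index_table_create_time。前两个数字 16779 和 24769 分别是表空间 OID 和数据库 OID,应到 pg_tablespace 和 pg_database 中查询,所以在 pg_class 中查不到。另外,第三个数字严格来说是 relfilenode 而不是 oid,更准确的查法是 where relfilenode=24938(这里两者恰好一致)。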

--查看索引状态
han=# select * from pg_index where indexrelid=24938;
 indexrelid | indrelid | indnatts | indisunique | indisprimary | indisclustered | indisvalid | indcheckxmin | indisready | indkey | indclass | indoption | indexprs | indpred
------------+----------+----------+-------------+--------------+----------------+------------+--------------+------------+--------+----------+-----------+----------+---------
      24938 |    24823 |        1 | f           | f            | f              | t          | f            | t          | 6      | 10053    | 0         |          |
(1 row)

indisvalid=t 只表示索引在系统表中被标记为有效(可以被查询使用),并不能说明索引文件本身没有物理损坏。

5.重建索引

sql
--尝试下重建索引

han=# select query from pg_stat_activity;

han=# \timing
Timing is on.

han=# reindex index index_tbl_index_table_create_time;
REINDEX
Time: 107796.232 ms

--索引重建后,查询恢复正常
han=# select max(create_time) from public.tbl_index_table where create_time>='2010-10-08';
 max
-----
 
(1 row)

Time: 73.600 ms

han=# select pg_size_pretty(pg_relation_size('index_tbl_index_table_create_time'));
 pg_size_pretty
----------------
 327 MB
(1 row)
--尝试下重建索引

han=# select query from pg_stat_activity;

han=# \timing
Timing is on.

han=# reindex index index_tbl_index_table_create_time;
REINDEX
Time: 107796.232 ms

--索引重建后,查询恢复正常
han=# select max(create_time) from public.tbl_index_table where create_time>='2010-10-08';
 max
-----
 
(1 row)

Time: 73.600 ms

han=# select pg_size_pretty(pg_relation_size('index_tbl_index_table_create_time'));
 pg_size_pretty
----------------
 327 MB
(1 row)