文章详情

短信预约-IT技能 免费直播动态提醒

请输入下面的图形验证码

提交验证

短信预约提醒成功

PostgreSQL 源码解读(202)- 查询#115(类型转换)

2024-04-02 19:55

关注

本节简单介绍了PostgreSQL中的类型转换实现.
首先来看看几个示例SQL:



testdb=# 
testdb=# drop table if exists t_conv;
om t_conv where id = '1'::text;
explain verbose select * from t_conv where id > '13'::text;
DROP TABLE
testdb=# create table t_conv(id int);
CREATE TABLE
testdb=# 
testdb=# insert into t_conv values(1);
INSERT 0 1
testdb=# insert into t_conv values(2);
INSERT 0 1
testdb=#

查询条件为id = ‘1’,’1’转换为int进行比较.



testdb=# explain verbose select * from t_conv where id = '1';
                          QUERY PLAN                           
---------------------------------------------------------------
 Seq Scan on public.t_conv  (cost=0.00..41.88 rows=13 width=4)
   Output: id
   Filter: (t_conv.id = 1)
(3 rows)

查询条件为id = ‘1.1’,出错(1.1无法转换为整型)



testdb=# explain verbose select * from t_conv where id = '1.1';
psql: ERROR:  invalid input syntax for type integer: "1.1"
LINE 1: explain verbose select * from t_conv where id = '1.1';
                                                        ^

查询条件为id = ‘1’::text,出错(text和int4没有转换规则)



testdb=# explain verbose select * from t_conv where id = '1'::text;
psql: ERROR:  operator does not exist: integer = text
LINE 1: explain verbose select * from t_conv where id = '1'::text;
                                                      ^
HINT:  No operator matches the given name and argument types. You might need to add explicit type casts.
testdb=#

查询条件为id > ‘13’::text,转换为numeric进行比较



testdb=# explain verbose select * from t_conv where id > '13'::text;
                           QUERY PLAN                           
----------------------------------------------------------------
 Seq Scan on public.t_conv  (cost=0.00..48.25 rows=850 width=4)
   Output: id
   Filter: ((t_conv.id)::numeric > '13'::numeric)
(3 rows)
testdb=#

系统转换规则定义,”>”操作符有定义text&int的比较,而”=”操作符没有定义,因此”select * from t_conv where id = ‘1’::text”语句会出错.



testdb=# select oid,typname from pg_type where typname in ('int4','text');
 oid | typname 
-----+---------
  23 | int4
  25 | text
(2 rows)
testdb=# select oid,oprname,oprleft,oprright,oprresult,oprcode from pg_operator where oprname = '>' and oprleft = 23 and oprright = 25;
  oid  | oprname | oprleft | oprright | oprresult |     oprcode      
-------+---------+---------+----------+-----------+------------------
 16407 | >       |      23 |       25 |        16 | int_greater_text
(1 row)
testdb=# select oid,oprname,oprleft,oprright,oprresult,oprcode from pg_operator where oprname = '=' and oprleft = 23 and oprright = 25;
 oid | oprname | oprleft | oprright | oprresult | oprcode 
-----+---------+---------+----------+-----------+---------
(0 rows)

总结一下:
解析表达式,涉及不同数据类型时:
1.如有相应类型的Operator定义(pg_operator),则尝试进行类型转换,否则报错;
2.如有相应类型的转换规则,转换为目标类型后解析,否则报错.

一、数据结构

Form_pg_operator
pg_operator中的定义,代码会其中的定义转换为FormData_pg_operator结构体




CATALOG(pg_operator,2617,OperatorRelationId)
{
  Oid     oid;      
  
  NameData  oprname;
  
  Oid     oprnamespace BKI_DEFAULT(PGNSP);
  
  Oid     oprowner BKI_DEFAULT(PGUID);
  
  char    oprkind BKI_DEFAULT(b);
  
  bool    oprcanmerge BKI_DEFAULT(f);
  
  bool    oprcanhash BKI_DEFAULT(f);
  
  Oid     oprleft BKI_LOOKUP(pg_type);
  
  Oid     oprright BKI_LOOKUP(pg_type);
  
  Oid     oprresult BKI_LOOKUP(pg_type);
  
  Oid     oprcom BKI_DEFAULT(0) BKI_LOOKUP(pg_operator);
  
  Oid     oprnegate BKI_DEFAULT(0) BKI_LOOKUP(pg_operator);
  
  regproc   oprcode BKI_LOOKUP(pg_proc);
  
  regproc   oprrest BKI_DEFAULT(-) BKI_LOOKUP(pg_proc);
  
  regproc   oprjoin BKI_DEFAULT(-) BKI_LOOKUP(pg_proc);
} FormData_pg_operator;

typedef FormData_pg_operator *Form_pg_operator;

二、源码解读

make_op
变换操作符表达式以确保类型兼容,会存在某些类型转换.




Expr *
make_op(ParseState *pstate, List *opname, Node *ltree, Node *rtree,
    Node *last_srf, int location)
{
  Oid     ltypeId,//左算子类型OID
        rtypeId;//右算子类型OID
  Operator  tup;//操作符tuple
  Form_pg_operator opform;//操作符form(参照pg_operator)
  Oid     actual_arg_types[2];//实际参数类型
  Oid     declared_arg_types[2];//操作符声明的参数类型
  int     nargs;//参数格式
  List     *args;//参数链表
  Oid     rettype;//返回结果类型
  OpExpr     *result;//结果
  
  //选择操作符
  if (rtree == NULL)
  {
    
    //右树为NULL,则为右操作符,如阶乘运算符"!" : 10!
    ltypeId = exprType(ltree);
    rtypeId = InvalidOid;
    tup = right_oper(pstate, opname, ltypeId, false, location);
  }
  else if (ltree == NULL)
  {
    
    //左树为空,则为左操作符,如按位NOT运算符 : "~21"
    rtypeId = exprType(rtree);
    ltypeId = InvalidOid;
    tup = left_oper(pstate, opname, rtypeId, false, location);
  }
  else
  {
    
    //二元操作符
    ltypeId = exprType(ltree);
    rtypeId = exprType(rtree);
    tup = oper(pstate, opname, ltypeId, rtypeId, false, location);
  }
  //获取操作符
  opform = (Form_pg_operator) GETSTRUCT(tup);
  
  if (!RegProcedureIsValid(opform->oprcode))
    ereport(ERROR,
        (errcode(ERRCODE_UNDEFINED_FUNCTION),
         errmsg("operator is only a shell: %s",
            op_signature_string(opname,
                      opform->oprkind,
                      opform->oprleft,
                      opform->oprright)),
         parser_errposition(pstate, location)));
  
  //执行类型转换并构建表达式树
  if (rtree == NULL)
  {
    
    args = list_make1(ltree);//参数
    actual_arg_types[0] = ltypeId;//左实际参数类型
    declared_arg_types[0] = opform->oprleft;//声明类型
    nargs = 1;//参数个数
  }
  else if (ltree == NULL)
  {
    
    args = list_make1(rtree);
    actual_arg_types[0] = rtypeId;
    declared_arg_types[0] = opform->oprright;
    nargs = 1;
  }
  else
  {
    
    args = list_make2(ltree, rtree);
    actual_arg_types[0] = ltypeId;
    actual_arg_types[1] = rtypeId;
    declared_arg_types[0] = opform->oprleft;
    declared_arg_types[1] = opform->oprright;
    nargs = 2;
  }
  
  rettype = enforce_generic_type_consistency(actual_arg_types,
                         declared_arg_types,
                         nargs,
                         opform->oprresult,
                         false);
  
  //参数类型转换
  make_fn_arguments(pstate, args, actual_arg_types, declared_arg_types);
  
  //构建表达式节点
  result = makeNode(OpExpr);
  result->opno = oprid(tup);
  result->opfuncid = opform->oprcode;
  result->opresulttype = rettype;
  result->opretset = get_func_retset(opform->oprcode);
  
  result->args = args;
  result->location = location;
  
  if (result->opretset)
  {
    check_srf_call_placement(pstate, last_srf, location);
    
    pstate->p_last_srf = (Node *) result;
  }
  ReleaseSysCache(tup);
  return (Expr *) result;
}

make_fn_arguments
给定实际的参数表达式和期望的输入类型,为表达式树执行有需要的类型转换.




void
make_fn_arguments(ParseState *pstate,
          List *fargs,
          Oid *actual_arg_types,
          Oid *declared_arg_types)
{
  ListCell   *current_fargs;
  int     i = 0;
  foreach(current_fargs, fargs)
  {
    
    //类型不匹配?
    if (actual_arg_types[i] != declared_arg_types[i])
    {
      //获取节点
      Node     *node = (Node *) lfirst(current_fargs);
      
      if (IsA(node, NamedArgExpr))
      {
        NamedArgExpr *na = (NamedArgExpr *) node;
        node = coerce_type(pstate,
                   (Node *) na->arg,
                   actual_arg_types[i],
                   declared_arg_types[i], -1,
                   COERCION_IMPLICIT,
                   COERCE_IMPLICIT_CAST,
                   -1);
        na->arg = (Expr *) node;
      }
      else
      {
        //执行转换
        node = coerce_type(pstate,
                   node,
                   actual_arg_types[i],
                   declared_arg_types[i], -1,
                   COERCION_IMPLICIT,
                   COERCE_IMPLICIT_CAST,
                   -1);
        lfirst(current_fargs) = node;
      }
    }
    i++;
  }
}

三、跟踪分析

SQL脚本



testdb=# select * from t_conv where id = '1';

跟踪分析



(gdb) b make_op
Breakpoint 2 at 0x619cdb: file parse_oper.c, line 762.
(gdb) c
Continuing.
Breakpoint 2, make_op (pstate=0x22d6e30, opname=0x22d6c48, ltree=0x22d7620, rtree=0x22d7678, last_srf=0x0, location=30)
    at parse_oper.c:762
762   if (rtree == NULL)
(gdb)

调用栈信息



(gdb) bt
#0  make_op (pstate=0x22d6e30, opname=0x22d6c48, ltree=0x22d7620, rtree=0x22d7678, last_srf=0x0, location=30)
    at parse_oper.c:859
#1  0x000000000060df9c in transformAExprOp (pstate=0x22d6e30, a=0x22d6ba0) at parse_expr.c:1010
#2  0x000000000060c55b in transformExprRecurse (pstate=0x22d6e30, expr=0x22d6ba0) at parse_expr.c:216
#3  0x000000000060c298 in transformExpr (pstate=0x22d6e30, expr=0x22d6ba0, exprKind=EXPR_KIND_WHERE) at parse_expr.c:155
#4  0x0000000000602164 in transformWhereClause (pstate=0x22d6e30, clause=0x22d6ba0, exprKind=EXPR_KIND_WHERE, 
    constructName=0xb458a7 "WHERE") at parse_clause.c:1691
#5  0x00000000005c7eb5 in transformSelectStmt (pstate=0x22d6e30, stmt=0x22d6c80) at analyze.c:1239
#6  0x00000000005c6392 in transformStmt (pstate=0x22d6e30, parseTree=0x22d6c80) at analyze.c:301
#7  0x00000000005c626d in transformOptionalSelectInto (pstate=0x22d6e30, parseTree=0x22d6c80) at analyze.c:246
#8  0x00000000005c612b in transformTopLevelStmt (pstate=0x22d6e30, parseTree=0x22d6d98) at analyze.c:196
#9  0x00000000005c5f83 in parse_analyze (parseTree=0x22d6d98, sourceText=0x22d5e08 "select * from t_conv where id = '1';", 
    paramTypes=0x0, numParams=0, queryEnv=0x0) at analyze.c:116
#10 0x00000000008e78d9 in pg_analyze_and_rewrite (parsetree=0x22d6d98, 
    query_string=0x22d5e08 "select * from t_conv where id = '1';", paramTypes=0x0, numParams=0, queryEnv=0x0)
    at postgres.c:695
#11 0x00000000008e7f23 in exec_simple_query (query_string=0x22d5e08 "select * from t_conv where id = '1';")
    at postgres.c:1140
#12 0x00000000008ec3a0 in PostgresMain (argc=1, argv=0x22ffdb8, dbname=0x22ffc00 "testdb", username=0x22d2a68 "pg12")
    at postgres.c:4249
#13 0x0000000000843650 in BackendRun (port=0x22f7be0) at postmaster.c:4431
#14 0x0000000000842e2e in BackendStartup (port=0x22f7be0) at postmaster.c:4122
#15 0x000000000083f06a in ServerLoop () at postmaster.c:1704
#16 0x000000000083e920 in PostmasterMain (argc=1, argv=0x22d0a20) at postmaster.c:1377
#17 0x000000000075f834 in main (argc=1, argv=0x22d0a20) at main.c:228

输入参数
操作符为”=”;ltree为字段列,类型为int4(vartype = 23);rtree为常量,类型为unknown(consttype = 705);last_srf为NULL;该操作符在字符串中的偏移为30.



(gdb) p *pstate
$7 = {parentParseState = 0x0, p_sourcetext = 0x22d5e08 "select * from t_conv where id = '1';", p_rtable = 0x22d72a0, 
  p_joinexprs = 0x0, p_joinlist = 0x22d73a8, p_namespace = 0x22d7328, p_lateral_active = false, p_ctenamespace = 0x0, 
  p_future_ctes = 0x0, p_parent_cte = 0x0, p_target_relation = 0x0, p_target_rangetblentry = 0x0, p_is_insert = false, 
  p_windowdefs = 0x0, p_expr_kind = EXPR_KIND_WHERE, p_next_resno = 2, p_multiassign_exprs = 0x0, p_locking_clause = 0x0, 
  p_locked_from_parent = false, p_resolve_unknowns = true, p_queryEnv = 0x0, p_hasAggs = false, p_hasWindowFuncs = false, 
  p_hasTargetSRFs = false, p_hasSubLinks = false, p_hasModifyingCTE = false, p_last_srf = 0x0, p_pre_columnref_hook = 0x0, 
  p_post_columnref_hook = 0x0, p_paramref_hook = 0x0, p_coerce_param_hook = 0x0, p_ref_hook_state = 0x0}
(gdb) p *opname
$8 = {type = T_List, length = 1, head = 0x22d6c20, tail = 0x22d6c20}
(gdb) p *(Node *)opname->head->data.ptr_value
$9 = {type = T_String}
(gdb) p *(Value *)opname->head->data.ptr_value
$14 = {type = T_String, val = {ival = 12298942, str = 0xbbaabe "="}}
(gdb) p *ltree
$15 = {type = T_Var}
(gdb) p *(Var *)ltree
$16 = {xpr = {type = T_Var}, varno = 1, varattno = 1, vartype = 23, vartypmod = -1, varcollid = 0, varlevelsup = 0, 
  varnoold = 1, varoattno = 1, location = 27}
(gdb) p *(Const *)rtree
$18 = {xpr = {type = T_Const}, consttype = 705, consttypmod = -1, constcollid = 0, constlen = -2, constvalue = 36531016, 
  constisnull = false, constbyval = false, location = 32}  
###
testdb=# select typname from pg_type where oid in (23,705);
 typname 
---------
 int4
 unknown
(2 rows)
###

确定操作符(二元操作符)



(gdb) n
769   else if (ltree == NULL)
(gdb) 
779     ltypeId = exprType(ltree);
(gdb) 
780     rtypeId = exprType(rtree);
(gdb) 
781     tup = oper(pstate, opname, ltypeId, rtypeId, false, location);
(gdb) p ltypeId
$19 = 23
(gdb) p rtypeId
$20 = 705
(gdb)

获取操作符(对应pg_operator)



(gdb) n
784   opform = (Form_pg_operator) GETSTRUCT(tup);
(gdb) 
787   if (!RegProcedureIsValid(opform->oprcode))
(gdb) p *opform
$21 = {oid = 96, oprname = {data = "=", '\000' <repeats 62 times>}, oprnamespace = 11, oprowner = 10, oprkind = 98 'b', 
  oprcanmerge = true, oprcanhash = true, oprleft = 23, oprright = 23, oprresult = 16, oprcom = 96, oprnegate = 518, 
  oprcode = 65, oprrest = 101, oprjoin = 105}
(gdb)

执行类型转换并构建表达式树.
实际类型为23&705,操作符声明操作类型为23&23



(gdb) n
798   if (rtree == NULL)
(gdb) 
806   else if (ltree == NULL)
(gdb) 
817     args = list_make2(ltree, rtree);
(gdb) 
818     actual_arg_types[0] = ltypeId;
(gdb) 
819     actual_arg_types[1] = rtypeId;
(gdb) 
820     declared_arg_types[0] = opform->oprleft;
(gdb) 
821     declared_arg_types[1] = opform->oprright;
(gdb) 
822     nargs = 2;
(gdb) p opform->oprleft
$22 = 23
(gdb) p opform->oprright
$23 = 23
(gdb) n
830   rettype = enforce_generic_type_consistency(actual_arg_types,
(gdb)

进入函数make_fn_arguments



(gdb) 
837   make_fn_arguments(pstate, args, actual_arg_types, declared_arg_types);
(gdb) n
Breakpoint 1, make_fn_arguments (pstate=0x22d6e30, fargs=0x22d76f8, actual_arg_types=0x7ffda1b2af80, 
    declared_arg_types=0x7ffda1b2af70) at parse_func.c:1835
1835    int     i = 0;
(gdb)

调用coerce_type函数执行转换,unknown -> int4



(gdb) n
1837    foreach(current_fargs, fargs)
(gdb) 
1840      if (actual_arg_types[i] != declared_arg_types[i])
(gdb) 
1873      i++;
(gdb) 
1837    foreach(current_fargs, fargs)
(gdb) 
1840      if (actual_arg_types[i] != declared_arg_types[i])
(gdb) p actual_arg_types[i]
$24 = 705
(gdb) p declared_arg_types[i]
$25 = 23
(gdb) n
1842        Node     *node = (Node *) lfirst(current_fargs);
(gdb) n
1848        if (IsA(node, NamedArgExpr))
(gdb) 
1866                     declared_arg_types[i], -1,
(gdb) 
1863          node = coerce_type(pstate,
(gdb) 
1865                     actual_arg_types[i],
(gdb) 
1863          node = coerce_type(pstate,
(gdb) 
1870          lfirst(current_fargs) = node;
(gdb) p *node
$26 = {type = T_Const}
(gdb) p *(Const *)node
$27 = {xpr = {type = T_Const}, consttype = 23, consttypmod = -1, constcollid = 0, constlen = 4, constvalue = 1, 
  constisnull = false, constbyval = true, location = 32}
(gdb)

完成调用



(gdb) n
1873      i++;
(gdb) 
1837    foreach(current_fargs, fargs)
(gdb) 
1875  }
(gdb) 
make_op (pstate=0x22d6e30, opname=0x22d6c48, ltree=0x22d7620, rtree=0x22d7678, last_srf=0x0, location=30)
    at parse_oper.c:840
840   result = makeNode(OpExpr);

回到make_op,构造结果result结构体



(gdb) 
841   result->opno = oprid(tup);
(gdb) 
842   result->opfuncid = opform->oprcode;
(gdb) 
843   result->opresulttype = rettype;
(gdb) 
844   result->opretset = get_func_retset(opform->oprcode);
(gdb) 
846   result->args = args;
(gdb) 
847   result->location = location;
(gdb) 
850   if (result->opretset)
(gdb) 
857   ReleaseSysCache(tup);
(gdb) 
859   return (Expr *) result;
(gdb) p *(Expr *) result
$28 = {type = T_OpExpr}
(gdb) p *(OpExpr *) result
$29 = {xpr = {type = T_OpExpr}, opno = 96, opfuncid = 65, opresulttype = 16, opretset = false, opcollid = 0, 
  inputcollid = 0, args = 0x22d76f8, location = 30}
(gdb)

DONE!

实现函数coerce_type下节再行介绍

四、参考资料

PostgreSQL Type Conversion
PostgreSQL数据类型转换规则#1
PostgreSQL数据类型转换规则#2
PostgreSQL数据类型转换规则#3

免责声明:

① 本站未注明“稿件来源”的信息均来自网络整理。其文字、图片和音视频稿件的所属权归原作者所有。本站收集整理出于非商业性的教育和科研之目的,并不意味着本站赞同其观点或证实其内容的真实性。仅作为临时的测试数据,供内部测试之用。本站并未授权任何人以任何方式主动获取本站任何信息。

② 本站未注明“稿件来源”的临时测试数据将在测试完成后最终做删除处理。有问题或投稿请发送至: 邮箱/279061341@qq.com QQ/279061341

软考中级精品资料免费领

  • 历年真题答案解析
  • 备考技巧名师总结
  • 高频考点精准押题
  • 资料下载
  • 历年真题
  • 2024年上半年信息系统项目管理师第二批次真题及答案解析(完整版)

    难度     813人已做
    查看
  • 【考后总结】2024年5月26日信息系统项目管理师第2批次考情分析

    难度     354人已做
    查看
  • 【考后总结】2024年5月25日信息系统项目管理师第1批次考情分析

    难度     318人已做
    查看
  • 2024年上半年软考高项第一、二批次真题考点汇总(完整版)

    难度     435人已做
    查看
  • 2024年上半年系统架构设计师考试综合知识真题

    难度     224人已做
    查看

相关文章

发现更多好内容

猜你喜欢

AI推送时光机
咦!没有更多了?去看看其它编程学习网 内容吧
首页课程
资料下载
问答资讯