From: Mergen Imeev via Tarantool-patches <tarantool-patches@dev.tarantool.org> To: Vladislav Shpilevoy <v.shpilevoy@tarantool.org> Cc: tarantool-patches@dev.tarantool.org Subject: Re: [Tarantool-patches] [PATCH v2 12/15] sql: rework GROUP_CONCAT() Date: Sat, 25 Sep 2021 14:42:36 +0300 [thread overview] Message-ID: <20210925114236.GI290467@tarantool.org> (raw) In-Reply-To: <527aac58-f3f4-bae9-3057-187edee7d8d4@tarantool.org> Thank you for the review! My answers, diff and new patch below. On Thu, Sep 23, 2021 at 12:49:52AM +0200, Vladislav Shpilevoy wrote: > Thanks for the patch! > > > diff --git a/src/box/sql/func.c b/src/box/sql/func.c > > index f699aa927..001a8641c 100644 > > --- a/src/box/sql/func.c > > +++ b/src/box/sql/func.c > > @@ -213,6 +213,52 @@ fin_minmax(struct sql_context *ctx) > > mem_copy(ctx->pOut, ctx->pMem); > > } > > > > +/** Implementation of the GROUP_CONCAT() function. */ > > +static void > > +step_group_concat(struct sql_context *ctx, int argc, struct Mem **argv) > > +{ > > + assert(argc == 1 || argc == 2); > > + (void)argc; > > + if (argv[0]->type == MEM_TYPE_NULL) > > + return; > > + assert(mem_is_str(argv[0]) || mem_is_bin(argv[0])); > > + if (ctx->pMem->type == MEM_TYPE_NULL) { > > + if (mem_copy_str(ctx->pMem, argv[0]->z, argv[0]->n) != 0) > > 1. What if the argument is zeroblob with no actual memory allocated yet? > There will be '', which is wrong. I fixed this and added a test. > > + ctx->is_aborted = true; > > + return; > > + } > > + const char *sep = NULL; > > + int sep_len = 0; > > + if (argc == 1) { > > + sep = ","; > > + sep_len = 1; > > + } else if (argv[1]->type == MEM_TYPE_NULL) { > > + sep = ""; > > + sep_len = 0; > > + } else { > > + assert(mem_is_same_type(argv[0], argv[0])); > > + sep = argv[1]->z; > > + sep_len = argv[1]->n; > > + } > > + if (sep_len > 0) { > > + if (mem_append(ctx->pMem, sep, sep_len) != 0) { > > 2. Will it work if sep_len == 0? 
If yes, then I would propose to > drop the len check here and call the append always. > Fixed. I moved this check to mem_append(). > > + ctx->is_aborted = true; > > + return; > > + } Diff: diff --git a/src/box/sql/func.c b/src/box/sql/func.c index 182fb85be..28094e258 100644 --- a/src/box/sql/func.c +++ b/src/box/sql/func.c @@ -223,34 +223,43 @@ step_group_concat(struct sql_context *ctx, int argc, struct Mem **argv) { assert(argc == 1 || argc == 2); (void)argc; - if (argv[0]->type == MEM_TYPE_NULL) + if (mem_is_null(argv[0])) return; assert(mem_is_str(argv[0]) || mem_is_bin(argv[0])); - if (ctx->pMem->type == MEM_TYPE_NULL) { - if (mem_copy_str(ctx->pMem, argv[0]->z, argv[0]->n) != 0) + if (mem_is_null(ctx->pMem)) { + if (mem_copy(ctx->pMem, argv[0]) != 0) ctx->is_aborted = true; return; } + assert(!mem_is_zerobin(ctx->pMem)); const char *sep = NULL; int sep_len = 0; if (argc == 1) { sep = ","; sep_len = 1; - } else if (argv[1]->type == MEM_TYPE_NULL) { + } else if (mem_is_null(argv[1])) { sep = ""; sep_len = 0; } else { - assert(mem_is_same_type(argv[0], argv[0])); + assert(mem_is_same_type(argv[0], argv[1])); sep = argv[1]->z; sep_len = argv[1]->n; } - if (sep_len > 0) { - if (mem_append(ctx->pMem, sep, sep_len) != 0) { - ctx->is_aborted = true; - return; - } + if (mem_append(ctx->pMem, sep, sep_len) != 0) { + ctx->is_aborted = true; + return; + } + uint32_t size; + char *str; + if (mem_is_zerobin(argv[0])) { + size = argv[0]->u.nZero; + str = sqlDbMallocRawNN(sql_get(), size); + memset(str, 0, size); + } else { + size = argv[0]->n; + str = argv[0]->z; } - if (mem_append(ctx->pMem, argv[0]->z, argv[0]->n) != 0) { + if (mem_append(ctx->pMem, str, size) != 0) { ctx->is_aborted = true; return; } diff --git a/test/sql-tap/func.test.lua b/test/sql-tap/func.test.lua index 416f27d69..bd8a8fe78 100755 --- a/test/sql-tap/func.test.lua +++ b/test/sql-tap/func.test.lua @@ -1,6 +1,6 @@ #!/usr/bin/env tarantool local test = require("sqltester") -test:plan(14680) 
+test:plan(14681) --!./tcltestrunner.lua -- 2001 September 15 @@ -2142,11 +2142,14 @@ test:do_execsql_test( -- </func-24.2> }) --- do_test func-24.3 { --- execsql { --- SELECT group_concat(t1,' ' || rowid || ' ') FROM tbl1 --- } --- } {{this 2 program 3 is 4 free 5 software}} +test:do_execsql_test( + "func-24.3", + [[ + SELECT group_concat(zeroblob(10)); + ]], { + '\0\0\0\0\0\0\0\0\0\0' + }) + test:do_execsql_test( "func-24.4", [[ New patch: commit 5b8563e9b884c86885a3a91fc608fb144afb69a0 Author: Mergen Imeev <imeevma@gmail.com> Date: Thu Sep 9 18:37:00 2021 +0300 sql: rework GROUP_CONCAT() This patch simplifies SQL built-in aggregate function GROUP_CONCAT(). Part of #4145 diff --git a/src/box/sql/func.c b/src/box/sql/func.c index 3708440e3..28094e258 100644 --- a/src/box/sql/func.c +++ b/src/box/sql/func.c @@ -217,6 +217,61 @@ fin_minmax(struct sql_context *ctx) mem_copy(ctx->pOut, ctx->pMem); } +/** Implementation of the GROUP_CONCAT() function. */ +static void +step_group_concat(struct sql_context *ctx, int argc, struct Mem **argv) +{ + assert(argc == 1 || argc == 2); + (void)argc; + if (mem_is_null(argv[0])) + return; + assert(mem_is_str(argv[0]) || mem_is_bin(argv[0])); + if (mem_is_null(ctx->pMem)) { + if (mem_copy(ctx->pMem, argv[0]) != 0) + ctx->is_aborted = true; + return; + } + assert(!mem_is_zerobin(ctx->pMem)); + const char *sep = NULL; + int sep_len = 0; + if (argc == 1) { + sep = ","; + sep_len = 1; + } else if (mem_is_null(argv[1])) { + sep = ""; + sep_len = 0; + } else { + assert(mem_is_same_type(argv[0], argv[1])); + sep = argv[1]->z; + sep_len = argv[1]->n; + } + if (mem_append(ctx->pMem, sep, sep_len) != 0) { + ctx->is_aborted = true; + return; + } + uint32_t size; + char *str; + if (mem_is_zerobin(argv[0])) { + size = argv[0]->u.nZero; + str = sqlDbMallocRawNN(sql_get(), size); + memset(str, 0, size); + } else { + size = argv[0]->n; + str = argv[0]->z; + } + if (mem_append(ctx->pMem, str, size) != 0) { + ctx->is_aborted = true; + return; + } +} 
+ +/** Finalizer for the GROUP_CONCAT() function. */ +static void +fin_group_concat(struct sql_context *ctx) +{ + mem_copy(ctx->pOut, ctx->pMem); +} + static const unsigned char * mem_as_ustr(struct Mem *mem) { @@ -1761,73 +1816,6 @@ soundexFunc(sql_context * context, int argc, sql_value ** argv) } } -/* - * group_concat(EXPR, ?SEPARATOR?) - */ -static void -groupConcatStep(sql_context * context, int argc, sql_value ** argv) -{ - const char *zVal; - StrAccum *pAccum; - const char *zSep; - int nVal, nSep; - if (argc != 1 && argc != 2) { - diag_set(ClientError, ER_FUNC_WRONG_ARG_COUNT, - "GROUP_CONCAT", "1 or 2", argc); - context->is_aborted = true; - return; - } - if (mem_is_null(argv[0])) - return; - pAccum = - (StrAccum *) sql_aggregate_context(context, sizeof(*pAccum)); - - if (pAccum) { - sql *db = sql_context_db_handle(context); - int firstTerm = pAccum->mxAlloc == 0; - pAccum->mxAlloc = db->aLimit[SQL_LIMIT_LENGTH]; - if (!firstTerm) { - if (argc == 2) { - zSep = mem_as_str0(argv[1]); - nSep = mem_len_unsafe(argv[1]); - } else { - zSep = ","; - nSep = 1; - } - if (zSep) - sqlStrAccumAppend(pAccum, zSep, nSep); - } - zVal = mem_as_str0(argv[0]); - nVal = mem_len_unsafe(argv[0]); - if (zVal) - sqlStrAccumAppend(pAccum, zVal, nVal); - } -} - -static void -groupConcatFinalize(sql_context * context) -{ - StrAccum *pAccum; - pAccum = sql_aggregate_context(context, 0); - if (pAccum) { - if (pAccum->accError == STRACCUM_TOOBIG) { - diag_set(ClientError, ER_SQL_EXECUTE, "string or binary"\ - "string is too big"); - context->is_aborted = true; - } else if (pAccum->accError == STRACCUM_NOMEM) { - context->is_aborted = true; - } else { - char *str = sqlStrAccumFinish(pAccum); - int len = pAccum->nChar; - assert(len >= 0); - if (context->func->def->returns == FIELD_TYPE_STRING) - mem_set_str_dynamic(context->pOut, str, len); - else - mem_set_bin_dynamic(context->pOut, str, len); - } - } -} - int sql_is_like_func(struct Expr *expr) { @@ -1995,13 +1983,13 @@ static struct 
sql_func_definition definitions[] = { NULL}, {"GROUP_CONCAT", 1, {FIELD_TYPE_STRING}, FIELD_TYPE_STRING, - groupConcatStep, groupConcatFinalize}, + step_group_concat, fin_group_concat}, {"GROUP_CONCAT", 2, {FIELD_TYPE_STRING, FIELD_TYPE_STRING}, - FIELD_TYPE_STRING, groupConcatStep, groupConcatFinalize}, + FIELD_TYPE_STRING, step_group_concat, fin_group_concat}, {"GROUP_CONCAT", 1, {FIELD_TYPE_VARBINARY}, FIELD_TYPE_VARBINARY, - groupConcatStep, groupConcatFinalize}, + step_group_concat, fin_group_concat}, {"GROUP_CONCAT", 2, {FIELD_TYPE_VARBINARY, FIELD_TYPE_VARBINARY}, - FIELD_TYPE_VARBINARY, groupConcatStep, groupConcatFinalize}, + FIELD_TYPE_VARBINARY, step_group_concat, fin_group_concat}, {"HEX", 1, {FIELD_TYPE_VARBINARY}, FIELD_TYPE_STRING, hexFunc, NULL}, {"IFNULL", 2, {FIELD_TYPE_ANY, FIELD_TYPE_ANY}, FIELD_TYPE_SCALAR, diff --git a/test/sql-tap/func.test.lua b/test/sql-tap/func.test.lua index 416f27d69..bd8a8fe78 100755 --- a/test/sql-tap/func.test.lua +++ b/test/sql-tap/func.test.lua @@ -1,6 +1,6 @@ #!/usr/bin/env tarantool local test = require("sqltester") -test:plan(14680) +test:plan(14681) --!./tcltestrunner.lua -- 2001 September 15 @@ -2142,11 +2142,14 @@ test:do_execsql_test( -- </func-24.2> }) --- do_test func-24.3 { --- execsql { --- SELECT group_concat(t1,' ' || rowid || ' ') FROM tbl1 --- } --- } {{this 2 program 3 is 4 free 5 software}} +test:do_execsql_test( + "func-24.3", + [[ + SELECT group_concat(zeroblob(10)); + ]], { + '\0\0\0\0\0\0\0\0\0\0' + }) + test:do_execsql_test( "func-24.4", [[
next prev parent reply other threads:[~2021-09-25 11:42 UTC|newest] Thread overview: 31+ messages / expand[flat|nested] mbox.gz Atom feed top [not found] <cover.1632220375.git.imeevma@gmail.com> 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 01/15] sql: fix possible undefined behavior during cast Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 02/15] sql: use register P1 for number of arguments Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 04/15] sql: move collation to struct sql_context Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 05/15] sql: introduce mem_append() Mergen Imeev via Tarantool-patches 2021-09-25 11:06 ` Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 06/15] sql: remove sql_vdbemem_finalize() Mergen Imeev via Tarantool-patches 2021-09-22 22:47 ` Vladislav Shpilevoy via Tarantool-patches 2021-09-25 11:13 ` Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 07/15] sql: rework SUM() Mergen Imeev via Tarantool-patches 2021-09-22 22:48 ` Vladislav Shpilevoy via Tarantool-patches 2021-09-25 11:17 ` Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 08/15] sql: rework TOTAL() Mergen Imeev via Tarantool-patches 2021-09-25 11:20 ` Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 09/15] sql: rework AVG() Mergen Imeev via Tarantool-patches 2021-09-22 22:48 ` Vladislav Shpilevoy via Tarantool-patches 2021-09-25 11:32 ` Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 10/15] sql: rework COUNT() Mergen Imeev via Tarantool-patches 2021-09-25 11:34 ` Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 11/15] sql: rework MIN() and MAX() Mergen Imeev via Tarantool-patches 2021-09-25 11:36 ` Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` 
[Tarantool-patches] [PATCH v2 12/15] sql: rework GROUP_CONCAT() Mergen Imeev via Tarantool-patches 2021-09-22 22:49 ` Vladislav Shpilevoy via Tarantool-patches 2021-09-25 11:42 ` Mergen Imeev via Tarantool-patches [this message] 2021-09-29 7:03 ` Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 13/15] sql: remove copying of result in finalizers Mergen Imeev via Tarantool-patches 2021-09-22 22:50 ` Vladislav Shpilevoy via Tarantool-patches 2021-09-25 11:47 ` Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 14/15] sql: remove MEM_TYPE_AGG Mergen Imeev via Tarantool-patches 2021-09-21 10:59 ` [Tarantool-patches] [PATCH v2 15/15] sql: remove field argv from struct sql_context Mergen Imeev via Tarantool-patches 2021-09-22 22:51 ` Vladislav Shpilevoy via Tarantool-patches 2021-09-25 12:03 ` Mergen Imeev via Tarantool-patches
Reply instructions: You may reply publicly to this message via plain-text email using any one of the following methods: * Save the following mbox file, import it into your mail client, and reply-to-all from there: mbox Avoid top-posting and favor interleaved quoting: https://en.wikipedia.org/wiki/Posting_style#Interleaved_style * Reply using the --to, --cc, and --in-reply-to switches of git-send-email(1): git send-email \ --in-reply-to=20210925114236.GI290467@tarantool.org \ --to=tarantool-patches@dev.tarantool.org \ --cc=imeevma@tarantool.org \ --cc=v.shpilevoy@tarantool.org \ --subject='Re: [Tarantool-patches] [PATCH v2 12/15] sql: rework GROUP_CONCAT()' \ /path/to/YOUR_REPLY https://kernel.org/pub/software/scm/git/docs/git-send-email.html * If your mail client supports setting the In-Reply-To header via mailto: links, try the mailto: link
This is a public inbox; see the mirroring instructions for how to clone and mirror all data and code used for this inbox.