Дерево: 5157271f8f

24-1-mkql-runtime

24.3.14.stream-nb-24-3.fullflash-exp1

add-upcoming-event-1

alexv-smirnov-patch-1

alexv-smirnov-patch-2

alexv-smirnov-patch-3

alexv-smirnov-patch-4

blinkov-patch-1

blinkov-patch-2

bs/vdisk/split-synclog-processing

cmake-actions-1

cmake2

cmake3

cmakebuild

dev-dirty_fix_clang14

dev-iddqd

dev-jinja-html

dev-jinja-html2

dev-night

dev-nightly

dev-remove_clang14_from_pr

dev-sammy-optimization

dev-stable-24-3

dev-test-policy

dev-test-wf

dev-upload-tests

dev-warmup

dev-wf-run

dev-whole-analytics

dev-whole-analytics-sammy

dev_dirty_fix_clang14

docker-connect-doc-up

docs-3-nodes-mirror-3-dc

docs-371-tmp

docs-633-review-follow-up

docs-add-coscup

docs-add-database-node-synonym

docs-add-gitignore

docs-add_translation_for_terraform_ydb_doc

docs-ansible-add-extra-note

docs-ansible-installation-options

docs-ansible-mistype-restart

docs-ansible-ydb-archive

docs-bugfix

docs-build-fixes

docs-change-storage-bucket

docs-changelog-cli-mistype

docs-clear-field

docs-cli-recipes

docs-cli-restore-import-data

docs-cli-win-change-url

docs-codowners-root-md

docs-columnar-pk

docs-concepts-cluster

docs-contents-snippet

docs-coordination

docs-create-table-ident

docs-dark-theme

docs-data-at-rest-improvement

docs-default-sql-version

docs-dev-getting-started-mistype

docs-diplodoc-workaround

docs-distconf-tmp

docs-docker-old-version-note

docs-dont-link-to-archived-go-sdk

docs-drop-old-public-talks

docs-drop-old-public-talks-1

docs-drop-unused-files

docs-drop-wip

docs-edit-ru-ansible-articles

docs-enable-feature-codegen

docs-example-app-en-fixes

docs-fix-ansible-repo-name

docs-fix-column-table-redirect

docs-fix-concat-md

docs-fix-internal-build

docs-fix-internal-build-1

docs-fix-oauth2-link

docs-fix-pg-create-include

docs-fix-rendering

docs-fix-ru-text-in-en

docs-fix-test-commit-ui

docs-fq-postgresql-fix-link

docs-grafana-columnar

docs-gtm

docs-hotfix-config-examples

docs-hotfix-public-talks-redirect

docs-increase-disabled-nodes-ratio-limit

docs-indiafoss-2024

docs-insert-into-hotfix

docs-kikimr-20945-pin-configs

docs-kubecon-hongkong

docs-localhost-broken-link

docs-manual-deployment-refactoring

docs-md-fix-cast-examples

docs-more-internal-fixes

docs-mute

docs-old-docker

docs-pause-autodeploy

docs-pg-redirect-hotfix

docs-postgresql-docker-connect-minor-fix

docs-preview-in-pr

docs-quickstart-add-mkdir

docs-quickstart-apple-silicon-note

docs-quickstart-docker-arm

docs-refactor-build-sh

docs-refactoring-ydbdocs-633

docs-release-workflow-add-paths

docs-remove-setup-playbook-mention

docs-rm-mirror-3dc-3-nodes

docs-ru-glossary-terminology-fixes

docs-ru-index-yaml

docs-security-encryption

docs-simplify-sidebar

docs-single-page

docs-stackonf-fix-url

docs-test-codeowners

docs-test-if-oss

docs-tls-mistype

docs-tmp-alter-table

docs-topic-workload-fix-option-name

docs-topology-md-improvements

docs-translate-9019

docs-translate-connections-string

docs-translate-tracing

docs-translation-debts

docs-trigger-ci

docs-try-lunr

docs-unpause-deploy

docs-unrestrict-revision-access

docs-update-decimal-note

docs-update-diplodoc-actions

docs-update-favicon

docs-update-gitignore

docs-update-license-year

docs-update-query-limits

docs-update-readme

docs-update-redirects

docs-update-workflow-type

docs-use-ansible-collections-playbook

docs-version-builtin

docs-workflow-on-create

docs-ya-make-yql

docs-ydb-go-sdk-prometheus

docs-ydb-var

docs-ydbdocs-1020

docs-ydbdocs-119-glossary-revamp

docs-ydbdocs-191-translate-fq

docs-ydbdocs-519-translate-config-related

docs-ydbdocs-596

docs-ydbdocs-633-continue

docs-ydbdocs-633-continue-2

docs-ydbdocs-633-continue-3

docs-ydbdocs-633-continue-4

docs-ydbdocs-633-refactoring

docs-ydbdocs-653-restore-minikube-quickstart

docs-ydbdocs-668-add-ansible-logging

docs-ydbdocs-668-playbook-name

docs-ydbdocs-690-ansible-restart

docs-ydbdocs-691-introduce-recipes-section

docs-ydbdocs-692-update-config

docs-ydbdocs-696-fix-yql-build

docs-ydbdocs-760-analytics-faq

docs-ydbdocs-804-ansible-fq-connector

docs-ydbdocs-909

docs-ydbdocs-917

docs-ydbdocs-935

docs-ydbops-9957-updating-executables-ansible

docs-yfm-link

docs-yfm-warnings

docs-yfmlint

docs-yfmlint-2

docs-yfmlint-3

docstools-update-build-workflow

dstool/pypi

embedded-ui-refresh-v4.31.0

embedded-ui-refresh-v4.31.1

embedded-ui-v4.33.0

embedded-ui-v5.5.0

embedded-ui-v6.10.2

embedded-ui-v6.16.0

embedded-ui-v6.17.2

embedded-ui-v6.28.0

embedded-ui-v6.4.0

embedded-ui-v6.8.0

embedded-ui-v7.2.0

embedded-ui-v8.6.0

embedded-ui-v8.7.0

feature/KIKIMR-20843/fix-reserve

feature/backups/pre-6

feature/integrations_and_ide

fix-header-ident-bloom

license-year-2023

main

merge-libs-241224-1545

merge-libs-241224-2313

merge-libs-241225-1905

merge-libs-241227-0020

merge-libs-241227-1333

merge-libs-241228-0020

merge-libs-241228-1728

merge-libs-241229-0022

merge-libs-241230-0021

merge-libs-250109-1621

merge-libs-250110-0021

merge-libs-250111-0020

merge-libs-250112-0023

merge-libs-250113-0022

merge-libs-250114-0501

merge-libs-250114-1110

merge-libs-250115-0020

merge-libs-250116-0020

merge-libs-250117-0020

merge-libs-250117-1049

merge-libs-250118-0019

merge-libs-250119-0022

merge-libs-250120-0020

merge-libs-250121-0019

merge-libs-250122-0020

merge-libs-250122-1156

merge-libs-250123-0020

merge-libs-250124-0020

merge-libs-250125-0019

merge-libs-250126-0020

merge-libs-250127-0020

merge-libs-250128-0050

merge-libs-250129-0050

merge-libs-250129-1040

merge-libs-250130-0050

merge-libs-250130-1607

merge-libs-250131-0050

merge-libs-250201-0050

merge-libs-250202-0050

merge-libs-250203-0050

merge-libs-250204-0050

merge-libs-250205-0050

merge-libs-250206-0050

merge-libs-250207-0050

merge-libs-250207-1355

mergelibs-240308-1527

mergelibs-240312-1040

mergelibs-240313-1032

mergelibs-240313-1536

mergelibs-240318-0944

mergelibs-240325-1123

mergelibs-240326-1411

mergelibs-240326-1608

mergelibs-240327-1029

mergelibs-240403-0851

mergelibs-240404-1137

mergelibs-240408-0819

mergelibs-240416-0910

mergelibs-240417-0847

mergelibs-240423-0906

mergelibs-240425-1630

mergelibs-240506-1255

mergelibs-240507-1023

mergelibs-240508-0817

mergelibs-240510-1206

mergelibs-240514-0848

mergelibs-240603-0842

mergelibs-240606-1312

mergelibs-240610-0905

mergelibs-240611-1110

mergelibs-240618-0830

mergelibs-240621-1318

mergelibs-240626-2018

mergelibs-240708-1553

mergelibs-240719-0942

mergelibs-240730-1922

mergelibs-240803-2327

mergelibs-240807-0824

mergelibs-240807-1211

mergelibs-240807-1311

mergelibs-240814-1820

mergelibs-240814-2205

mergelibs-240815-1025

mergelibs-240816-1413

mergelibs-240819-0942

mergelibs-240819-1422

mergelibs-240819-2038

mergelibs-240820-1626

mergelibs-240820-2236

mergelibs-240821-1409

mergelibs-240823-1155

mergelibs-240830-1442

mergelibs-240903-1104

mergelibs-240905-0836

mergelibs-240906-1233

mergelibs-240911-0600

mergelibs-240913-0843

mergelibs-240916-1031

mergelibs-240918-0758

mergelibs-240924-0826

mergelibs-240926-1443

mergelibs-240930-1059

mergelibs-241002-1139

mergelibs-241002-1721

mergelibs-241003-0910

mergelibs-241003-1145

mergelibs-241003-1407

mergelibs-241004-1110

mergelibs-241004-1426

mergelibs-241007-1548

mergelibs-241008-2121

mergelibs-241009-1030

mergelibs-241011-1107

mergelibs-241015-1526

mergelibs-241016-1210

mergelibs-241019-1758

mergelibs-241021-1020

mergelibs-241028-1143

mergelibs-241028-2033

mergelibs-241031-1710

mergelibs-241101-0908

mergelibs-241102-0844

mergelibs-241106-0903

mergelibs-241108-0852

mergelibs-241115-0911

mergelibs-241120-1113

mergelibs-241122-0919

mergelibs-241123-1930

mergelibs-241123-2111

mergelibs-241126-1510

mergelibs-241127-0941

mergelibs-241128-1021

mergelibs-241128-1502

mergelibs-241129-1330

mergelibs-241130-1815

mergelibs-241202-1134

mergelibs-241202-1453

mergelibs-241203-0816

mergelibs-241203-1217

mergelibs-241204-1715

mergelibs-241204-2036

mergelibs-241205-0959

mergelibs-241210-0813

mergelibs-241210-1057

mergelibs-241210-1802

mergelibs-241213-1023

mergelibs-241216-0851

mergelibs-241216-1701

mergelibs-241218-0753

mergelibs-241219-0815

mergelibs-241225-1031

mergelibs-yql

mergelibs-yurchuk-manual

mute/ManyColumnShardsWithRestarts

mute/naspirato-7

mute/ydb/core/blobstorage/ut_vdisk2_VDiskTest.HugeBlobWrite

mute/ydb/core/kqp/workload_service/ut

mute/ydb/core/mind/hive/ut/THiveTest.DrainWithHiveRestart

mute/ydb/core/tablet_flat/ut_TSharedPageCache.Compaction_BTreeIndex

mute/ydb/core/viewer/tests-test.py.test_storage_groups

mute/ydb/library/yql/providers/generic/connector/tests/datasource/clickhouse-test.py.test_select_datetime

mute/ydb/library/yql/providers/generic/connector/tests/datasource/ms_sql_server-test.py.test_select_positive

mute/ydb/tests/fq/yds-test_row_dispatcher.py.TestPqRowDispatcher.test_restart_compute_node

mute/ydb/tests/olap/ttl_tiering-ttl_delete_s3.py.TestDeleteS3Ttl.test_data_unchanged_after_ttl_change

mute/ydb/tests/stress/kv/tests-test_workload.py.TestYdbKvWorkload.testcolumn]

mute/yurchuk/kqp

mute/yurchuk/kqp2

mute/yurchuk/viewer

mute/zverevgeny

naspirato/asan-retry

naspirato/coverage_2

naspirato/mute

naspirato/mute-1

naspirato/mute-10

naspirato/mute-2

naspirato/mute-3

naspirato/mute-4

naspirato/mute-5

naspirato/mute-6

naspirato/mute-7

naspirato/mute-8

naspirato/mute-9

naspirato/mute1

naspirato/muted

naspirato/muted-1

naspirato/muted-2

naspirato/muted-3

naspirato/muted-4

naspirato/muted-5

naspirato/muted-6

naspirato/muted_resolve

naspirato/test-asan-mod

naspirato/test_asan_mod

naspirato/test_coverage_over_nr

naspirato/testowners

naspirato/unmute

naspirato/update_regression_wf

oidc-proxy-stable-2024-09

oleshiy-fix-yc-terraform

password_in_file

prestable-24-4

prestable-24-4-del-me

q-stable-2023-11-22

q-stable-2024-01-09

q-stable-2024-03-21

q-stable-2024-07-08

q-stable-2024-12-05

q-stable-ydb-24-1

q-stable-ydb-24-2

q-stable-ydb-24-3

readme-linkedin-link

readme-links-update

readme-social-update

revert-10009-dev/check_thread_in_blockdevice

revert-10337-fix_includes_3

revert-11474-mvcc-snapshot-evwrite

revert-11605-YQL-19292

revert-12084-harmonizer/split_to_files

revert-12824-VIEW.s3_backup.1

revert-3499-main

revert-4919-olap-buffer

revert-4924-fix-joins

revert-5604-memory-free-fix

revert-5852-marat_nurgaleev_moi_drug

revert-6270-stats-24-1/change_as_usage

revert-6271-stats-24-2/change_as_usage

revert-6286-add-enable-impl-params-to-table-service-config

revert-7492-drop_old_json

revert-750-revert-634-kqp-computation-pattern-cache-serialized-program

revert-7994-mergelibs-240819-0942

revert-8164-ci-remove-warnings

revert-8269-patch/24-3/revert-as

revert-8383-legacy_kv_api_remove

revert-9886-libpq17-compat

revert-9998-mute/naspirato-17

revert-dffc12acf95248fe644c7a64a71abcd5467b4bf8

rightlib

roadmap

sammyvimes/experiments

spuchin-patch-1

stable-22-2

stable-22-4

stable-22-5

stable-23-1

stable-23-2

stable-23-3

stable-23-3-33-hotfix

stable-23-4

stable-23-4-11-normalizer-fix

stable-24-1

stable-24-1-10-hotfix

stable-24-1-14-analytics

stable-24-1-14-hotfix

stable-24-1-14-roaring

stable-24-1-16-analytics

stable-24-1-18-analytics

stable-24-1-8

stable-24-1-CS-patch

stable-24-1-CS-patch-2

stable-24-1-CS-patch-3

stable-24-1-CS-patch-3-att-2

stable-24-1-async-replication

stable-24-1-bump-workflows1

stable-24-1-bumpci2

stable-24-1-cbo

stable-24-1-iddqd

stable-24-1-iddqd-2

stable-24-1-iddqd-3

stable-24-2

stable-24-2-1-hotfix

stable-24-2-4-analytics

stable-24-2-4-hotfix

stable-24-2-6-hotfix

stable-24-2-7-hotfix

stable-24-2-fix-lwtrace

stable-24-3

stable-24-3-10-analytics

stable-24-3-10-hotfix

stable-24-3-11-hotfix

stable-24-3-13-hotfix

stable-24-3-13-hotfix-yasubd

stable-24-3-14-cs

stable-24-3-15-hotfix

stable-24-3-6-logbroker

stable-24-3-7-hotfix

stable-24-3-8-analytics

stable-24-3-8-analytics-misha

stable-24-3-9-cs

stable-24-3-9-hotfix

stream-nb-1

stream-nb-1-tracing

stream-nb-1.put-lwtrack

stream-nb-2

stream-nb-2.put-lwtrack

stream-nb-24-3

stream-nb-24.3.11.1-hotfix.7-hf.1

update-readme-docs-link

workflow-check-1

ydbdocs-557

yql-stable-2024-03-14

yql-stable-2024-05-07

yql-stable-2024-07-01

yql-stable-2024-09-03

yql-stable-2024-12-23

yql-stable-test1

yql-temp-table

REDUCE

Groups the input by the specified key columns, then passes the current keys and a lazy iterator over their corresponding values from the remaining columns to the specified UDF for processing. Similarly to PROCESS, the UDF can return an arbitrary number of result rows per call and also return Variants to create multiple outputs. In terms of MapReduce, it's very similar to Reduce.

Keywords that can follow:

PRESORT (optional): Specifies the order within each group; the syntax is similar to ORDER BY.
ON (required): Specifies the key columns.
USING or USING ALL (required): A UDF call; see the rules below.

Rules for passing UDF arguments:

If TableRows() is specified as a UDF argument, then the UDF must accept one argument: a lazy iterator over rows, with the type Stream<Struct<...>>. In this case, the output type of the function can only be Stream<OutputType> or List<OutputType>. It's guaranteed that the data in the input iterator is grouped by the key and, if necessary, sorted according to the PRESORT section. With TableRows(), you can only use USING ALL.
With USING:
- The UDF must accept two arguments: the current key is passed to the first argument, and a lazy iterator with values corresponding to this key is passed to the second argument.
With USING ALL:
- The UDF must accept one argument: a lazy iterator over Tuples, where the first item in the tuple is a key, and the second item is a lazy iterator with values corresponding to this key.
The key to be passed to the UDF follows the rule below. If there is only one key column, then only its value is used in the key. If there are multiple columns (columns are listed similarly to GROUP BY separated by commas), then the key is a Tuple with values from the listed columns in the specified order.
When you call REDUCE from a query, only the expression whose values will be passed as iterator items follows the UDF name in parentheses (the second UDF argument for USING or the second item of the tuple for USING ALL).

The result is built in the same way as for PROCESS. You can also use the TableRow() keyword to get the whole row as a structure.

In REDUCE, you can pass multiple inputs (an input here means a table, a range of tables, a subquery, or a named expression), separated by commas. All inputs must contain the key columns specified in ON, with matching types. In this case, the only expression you can pass to the function from USING is the special named expression TableRow(). The second argument (or the second element of the tuple for USING ALL) will be a lazy iterator over Variants, where the populated alternative corresponds to the index of the input that the current row came from.

After USING, in REDUCE you can optionally specify ASSUME ORDER BY with a list of columns. The result of such a REDUCE statement is treated as sorted, but without actually running a sort. The sort order is checked at the query execution stage. You can set the sort direction using the keywords ASC (ascending order) and DESC (descending order). Expressions are not supported in ASSUME ORDER BY.

Examples

REDUCE my_table
ON key, subkey
USING MyUdf::MyReducer(TableRow());

REDUCE my_table
ON key, subkey
USING ALL MyUDF::MyStreamReducer(TableRow()); -- MyUDF::MyStreamReducer accepts a lazy list of tuples (key, list of entries for the key) as its input

REDUCE my_table
PRESORT LENGTH(subkey) DESC
ON key
USING MyUdf::MyReducer(
    AsTuple(subkey, value)
);

REDUCE my_table
ON key
USING ALL MyUDF::MyFlatStreamReducer(TableRows()); -- MyUDF::MyFlatStreamReducer accepts a single lazy list of entries as its input

-- The function returns Variants
$udf = Python::MyReducer(Callable<(String, Stream<Struct<...>>) -> Variant<Struct<...>, Struct<...>>>,
    $udfScript
);

-- The output of REDUCE produces a tuple of lists
$i, $j = (REDUCE my_table ON key USING $udf(TableRow()));

SELECT * FROM $i;
SELECT * FROM $j;

$script = @@
def MyReducer(key, values):
    state = None, 0
    for name, last_visit_time in values:
        if state[1] < last_visit_time:
            state = name, last_visit_time
    return {
        'region':key,
        'last_visitor':state[0],
    }
@@;

$udf = Python::MyReducer(Callable<(
    Int64?,
    Stream<Tuple<String?, Uint64?>>
) -> Struct<
    region:Int64?,
    last_visitor:String?
>>,
    $script
);

REDUCE my_table
ON region USING $udf((name, last_visit_time));

-- The function accepts a key and iterator of Variants as input
$udf = Python::MyReducer(Callable<(String, Stream<Variant<Struct<...>,Struct<...>>>) -> Struct<...>>,
    $udfScript
);

REDUCE my_table1, my_table2 ON key USING $udf(TableRow());

reduce.md 4.9 KB История Исходник

REDUCE

Examples

reduce.md 4.9 KB

История Исходник