digraph G {
0 [labelType="html" label="<br><b>AdaptiveSparkPlan</b><br><br>"];
1 [labelType="html" label="<b>Execute InsertIntoHadoopFsRelationCommand</b><br><br>task commit time total (min, med, max (stageId: taskId))<br>2 ms (0 ms, 1 ms, 1 ms (stage 15275.0: task 21196))<br>number of written files: 3<br>job commit time: 7 ms<br>number of output rows: 377,497<br>number of dynamic part: 0<br>written output: 968.3 KiB"];
2 [labelType="html" label="<br><b>WriteFiles</b><br><br>"];
subgraph cluster3 {
isCluster="true";
label="WholeStageCodegen (7)\n \nduration: total (min, med, max (stageId: taskId))\n758 ms (218 ms, 258 ms, 282 ms (stage 15275.0: task 21197))";
4 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>41 ms (12 ms, 13 ms, 16 ms (stage 15275.0: task 21197))<br>peak memory total (min, med, max (stageId: taskId))<br>60.0 MiB (20.0 MiB, 20.0 MiB, 20.0 MiB (stage 15275.0: task 21196))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 15275.0: task 21196))"];
}
5 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 3<br>partition data size total (min, med, max (stageId: taskId))<br>3.7 MiB (1117.5 KiB, 1126.3 KiB, 1537.1 KiB (driver))<br>number of coalesced partitions: 3"];
6 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 377,497<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>16 ms (3 ms, 4 ms, 5 ms (stage 15270.0: task 21191))<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 377,497<br>local bytes read total (min, med, max (stageId: taskId))<br>3.5 MiB (1054.1 KiB, 1084.4 KiB, 1445.0 KiB (stage 15275.0: task 21197))<br>fetch wait time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 15275.0: task 21196))<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 8<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size total (min, med, max (stageId: taskId))<br>25.2 MiB (5.0 MiB, 6.4 MiB, 8.7 MiB (stage 15270.0: task 21191))<br>local merged bytes read: 0.0 B<br>number of partitions: 10<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>3.5 MiB (687.3 KiB, 886.7 KiB, 1306.3 KiB (stage 15270.0: task 21191))"];
7 [labelType="html" label="<br><b>Union</b><br><br>"];
subgraph cluster8 {
isCluster="true";
label="WholeStageCodegen (5)\n \nduration: total (min, med, max (stageId: taskId))\n244 ms (80 ms, 164 ms, 164 ms (stage 15270.0: task 21191))";
9 [labelType="html" label="<br><b>Project</b><br><br>"];
10 [labelType="html" label="<b>Generate</b><br><br>number of output rows: 275,604"];
11 [labelType="html" label="<br><b>Project</b><br><br>"];
12 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 91,868"];
}
13 [labelType="html" label="<b>Window</b><br><br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 15266.0: task 21187))"];
subgraph cluster14 {
isCluster="true";
label="WholeStageCodegen (4)\n \nduration: total (min, med, max (stageId: taskId))\n338 ms (138 ms, 200 ms, 200 ms (stage 15270.0: task 21191))";
15 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>23 ms (11 ms, 12 ms, 12 ms (stage 15266.0: task 21187))<br>peak memory total (min, med, max (stageId: taskId))<br>36.0 MiB (18.0 MiB, 18.0 MiB, 18.0 MiB (stage 15266.0: task 21187))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 15266.0: task 21187))"];
}
16 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 1<br>partition data size: 693.8 KiB<br>number of coalesced partitions: 1"];
17 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 45,934<br>local merged chunks fetched: 0<br>shuffle write time: 4 ms<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 91,868<br>local bytes read total (min, med, max (stageId: taskId))<br>1346.6 KiB (673.3 KiB, 673.3 KiB, 673.3 KiB (stage 15266.0: task 21187))<br>fetch wait time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 15266.0: task 21187))<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 2<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size: 3.5 MiB<br>local merged bytes read: 0.0 B<br>number of partitions: 10<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written: 673.3 KiB"];
subgraph cluster18 {
isCluster="true";
label="WholeStageCodegen (1)\n \nduration: 372 ms";
19 [labelType="html" label="<br><b>Project</b><br><br>"];
20 [labelType="html" label="<b>Filter</b><br><br>number of output rows: 45,934"];
}
21 [labelType="html" label="<b>Scan csv </b><br><br>number of output rows: 45,934<br>number of files read: 1<br>metadata time: 0 ms<br>size of files read: 2.7 MiB"];
subgraph cluster22 {
isCluster="true";
label="WholeStageCodegen (6)\n \nduration: total (min, med, max (stageId: taskId))\n794 ms (112 ms, 138 ms, 156 ms (stage 15270.0: task 21194))";
23 [labelType="html" label="<b>Sort</b><br><br>sort time total (min, med, max (stageId: taskId))<br>228 ms (34 ms, 35 ms, 45 ms (stage 15266.0: task 21190))<br>peak memory total (min, med, max (stageId: taskId))<br>112.0 MiB (18.0 MiB, 18.0 MiB, 20.0 MiB (stage 15266.0: task 21190))<br>spill size total (min, med, max (stageId: taskId))<br>0.0 B (0.0 B, 0.0 B, 0.0 B (stage 15266.0: task 21189))"];
}
24 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 3<br>partition data size total (min, med, max (stageId: taskId))<br>3.7 MiB (1156.7 KiB, 1171.3 KiB, 1484.8 KiB (driver))<br>number of coalesced partitions: 3"];
25 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 239,695<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>15 ms (4 ms, 4 ms, 5 ms (stage 15262.0: task 21186))<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 479,390<br>local bytes read total (min, med, max (stageId: taskId))<br>7.2 MiB (1102.9 KiB, 1135.0 KiB, 1434.6 KiB (stage 15266.0: task 21190))<br>fetch wait time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 15266.0: task 21189))<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 18<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size total (min, med, max (stageId: taskId))<br>16.5 MiB (4.9 MiB, 4.9 MiB, 6.6 MiB (stage 15262.0: task 21186))<br>local merged bytes read: 0.0 B<br>number of partitions: 10<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>3.6 MiB (1103.2 KiB, 1104.3 KiB, 1465.1 KiB (stage 15262.0: task 21186))"];
subgraph cluster26 {
isCluster="true";
label="WholeStageCodegen (3)\n \nduration: total (min, med, max (stageId: taskId))\n807 ms (113 ms, 131 ms, 170 ms (stage 15262.0: task 21186))";
27 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build total (min, med, max (stageId: taskId))<br>434 ms (58 ms, 68 ms, 95 ms (stage 15262.0: task 21186))<br>peak memory total (min, med, max (stageId: taskId))<br>99.0 MiB (16.3 MiB, 16.3 MiB, 17.0 MiB (stage 15260.0: task 21183))<br>number of output rows: 479,390<br>number of sort fallback tasks: 0<br>avg hash probes per key (min, med, max (stageId: taskId)):<br>(1.3, 1.3, 1.6 (stage 15260.0: task 21183))"];
}
28 [labelType="html" label="<b>AQEShuffleRead</b><br><br>number of partitions: 3<br>partition data size total (min, med, max (stageId: taskId))<br>3.8 MiB (1151.9 KiB, 1167.2 KiB, 1539.7 KiB (driver))<br>number of coalesced partitions: 3"];
29 [labelType="html" label="<b>Exchange</b><br><br>shuffle records written: 239,813<br>local merged chunks fetched: 0<br>shuffle write time total (min, med, max (stageId: taskId))<br>33 ms (2 ms, 3 ms, 4 ms (stage 15258.0: task 21171))<br>remote merged bytes read: 0.0 B<br>local merged blocks fetched: 0<br>corrupt merged block chunks: 0<br>remote merged reqs duration: 0 ms<br>remote merged blocks fetched: 0<br>records read: 479,626<br>local bytes read total (min, med, max (stageId: taskId))<br>7.2 MiB (1111.9 KiB, 1113.0 KiB, 1486.4 KiB (stage 15260.0: task 21183))<br>fetch wait time total (min, med, max (stageId: taskId))<br>0 ms (0 ms, 0 ms, 0 ms (stage 15260.0: task 21182))<br>remote bytes read: 0.0 B<br>merged fetch fallback count: 0<br>local blocks read: 60<br>remote merged chunks fetched: 0<br>remote blocks read: 0<br>data size total (min, med, max (stageId: taskId))<br>16.5 MiB (1650.3 KiB, 1704.0 KiB, 1710.8 KiB (stage 15258.0: task 21171))<br>local merged bytes read: 0.0 B<br>number of partitions: 10<br>remote reqs duration: 0 ms<br>remote bytes read to disk: 0.0 B<br>shuffle bytes written total (min, med, max (stageId: taskId))<br>3.6 MiB (363.5 KiB, 374.7 KiB, 375.9 KiB (stage 15258.0: task 21171))"];
subgraph cluster30 {
isCluster="true";
label="WholeStageCodegen (2)\n \nduration: total (min, med, max (stageId: taskId))\n2.2 s (154 ms, 229 ms, 232 ms (stage 15258.0: task 21172))";
31 [labelType="html" label="<b>HashAggregate</b><br><br>spill size: 0.0 B<br>time in aggregation build total (min, med, max (stageId: taskId))<br>1.7 s (135 ms, 172 ms, 176 ms (stage 15258.0: task 21174))<br>peak memory total (min, med, max (stageId: taskId))<br>162.5 MiB (16.3 MiB, 16.3 MiB, 16.3 MiB (stage 15258.0: task 21173))<br>number of output rows: 239,813<br>number of sort fallback tasks: 0<br>avg hash probes per key (min, med, max (stageId: taskId)):<br>(1, 1, 1 (stage 15258.0: task 21173))"];
32 [labelType="html" label="<br><b>Project</b><br><br>"];
33 [labelType="html" label="<b>Generate</b><br><br>number of output rows: 1,186,836"];
34 [labelType="html" label="<br><b>Project</b><br><br>"];
35 [labelType="html" label="<b>ColumnarToRow</b><br><br>number of output rows: 169,548<br>number of input batches: 50"];
}
36 [labelType="html" label="<b>Scan parquet </b><br><br>number of files read: 10<br>scan time total (min, med, max (stageId: taskId))<br>77 ms (3 ms, 9 ms, 10 ms (stage 15258.0: task 21171))<br>metadata time: 0 ms<br>size of files read: 11.5 MiB<br>number of output rows: 169,548"];
1->0;
2->1;
4->2;
5->4;
6->5;
7->6;
9->7;
10->9;
11->10;
12->11;
13->12;
15->13;
16->15;
17->16;
19->17;
20->19;
21->20;
23->7;
24->23;
25->24;
27->25;
28->27;
29->28;
31->29;
32->31;
33->32;
34->33;
35->34;
36->35;
}
37
AdaptiveSparkPlan isFinalPlan=true
Execute InsertIntoHadoopFsRelationCommand file:/data/output/cache/parquet/datablock/14_B_PASSAGE_PA_176405, false, Parquet, [path=file:///data/output/cache/parquet/datablock/14_B_PASSAGE_PA_176405], Overwrite, [COL_E5ADB260_1BF6_449C_8439_0A94CEE6956C, COL_59774853_4110_4672_B6E2_C0D5DE930914, COL_E58DD17C_E55F_4036_9FA9_A5365B045A1A]
WriteFiles
Sort [COL_E5ADB260_1BF6_449C_8439_0A94CEE6956C#1187468 ASC NULLS FIRST, COL_59774853_4110_4672_B6E2_C0D5DE930914#1187469 ASC NULLS FIRST], true, 0
WholeStageCodegen (7)
AQEShuffleRead coalesced
Exchange rangepartitioning(COL_E5ADB260_1BF6_449C_8439_0A94CEE6956C#1187468 ASC NULLS FIRST, COL_59774853_4110_4672_B6E2_C0D5DE930914#1187469 ASC NULLS FIRST, 10), ENSURE_REQUIREMENTS, [plan_id=619755]
Union
Project [COL_DEB05435_3A84_4F8F_8CD2_6BE209A14FA8#1187428 AS COL_E5ADB260_1BF6_449C_8439_0A94CEE6956C#1187468, col0#1187437 AS COL_59774853_4110_4672_B6E2_C0D5DE930914#1187469, col1#1187438 AS COL_E58DD17C_E55F_4036_9FA9_A5365B045A1A#1187470]
Generate stack(3, 01-UF, COL_48FD2AAE_6F4D_4D43_BEE7_8A161203783C#1187429, 02-Transport, COL_E0699193_FC70_4F64_BAE6_B2F241857F3B#1187430, 03-CCMU, COL_630C2F1A_DB89_4A08_A2D2_179A10CC9FD2#1187431), [COL_DEB05435_3A84_4F8F_8CD2_6BE209A14FA8#1187428], false, [col0#1187437, col1#1187438]
Project [COL_2AF4FE05_74B1_4A24_9BC1_7612D6ED731D#1186936 AS COL_DEB05435_3A84_4F8F_8CD2_6BE209A14FA8#1187428, COL_E82CFB57_01EB_4E90_836D_4D6F4CA131FE#1186937 AS COL_48FD2AAE_6F4D_4D43_BEE7_8A161203783C#1187429, COL_E1010A22_775B_43B4_B8CA_4603C0801D28#1186938 AS COL_E0699193_FC70_4F64_BAE6_B2F241857F3B#1187430, COL_6A6D32F5_2B4E_4DF6_A459_B248882F909D#1186939 AS COL_630C2F1A_DB89_4A08_A2D2_179A10CC9FD2#1187431]
Filter (COL_6B340AEB_6908_4A50_8AD6_FE561D33FBE0#1186952 <=> 1)
WholeStageCodegen (5)
Window [row_number() windowspecdefinition(COL_2AF4FE05_74B1_4A24_9BC1_7612D6ED731D#1186936, 1 DESC NULLS LAST, specifiedwindowframe(RowFrame, unboundedpreceding$(), currentrow$())) AS COL_6B340AEB_6908_4A50_8AD6_FE561D33FBE0#1186952], [COL_2AF4FE05_74B1_4A24_9BC1_7612D6ED731D#1186936], [1 DESC NULLS LAST]
Sort [COL_2AF4FE05_74B1_4A24_9BC1_7612D6ED731D#1186936 ASC NULLS FIRST, 1 DESC NULLS LAST], false, 0
WholeStageCodegen (4)
AQEShuffleRead coalesced
Exchange hashpartitioning(COL_2AF4FE05_74B1_4A24_9BC1_7612D6ED731D#1186936, 10), ENSURE_REQUIREMENTS, [plan_id=619482]
Project [Numéro Séjour#1186820 AS COL_2AF4FE05_74B1_4A24_9BC1_7612D6ED731D#1186936, UF#1186821 AS COL_E82CFB57_01EB_4E90_836D_4D6F4CA131FE#1186937, str_remove_space(Transport admission#1186824, ONLY_ONE) AS COL_E1010A22_775B_43B4_B8CA_4603C0801D28#1186938, str_remove_space(str_list_get(str_extract_by_regex(Niveau CCMU#1186825, [+\d]+), 0), ALL) AS COL_6A6D32F5_2B4E_4DF6_A459_B248882F909D#1186939]
Filter NOT CASE WHEN isnull(StartsWith(Numéro Séjour#1186820, #)) THEN false ELSE StartsWith(Numéro Séjour#1186820, #) END
WholeStageCodegen (1)
FileScan csv [Numéro Séjour#1186820,UF#1186821,Transport admission#1186824,Niveau CCMU#1186825] Batched: false, DataFilters: [NOT CASE WHEN isnull(StartsWith(Numéro Séjour#1186820, #)) THEN false ELSE StartsWith(Numéro Séj..., Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/data/input/depot/csv/tmp/02_PASSAGE_PATI_175675/passage_patient_..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<Numéro Séjour:string,UF:string,Transport admission:string,Niveau CCMU:string>
Sort [COL_DC1A3ABF_ADFC_4208_8B24_35ED54CC87DF#1187368 ASC NULLS FIRST, COL_EA9AE57C_DE84_4BBE_9131_053814B337F4#1187369 ASC NULLS FIRST], true, 0
WholeStageCodegen (6)
AQEShuffleRead coalesced
Exchange rangepartitioning(COL_DC1A3ABF_ADFC_4208_8B24_35ED54CC87DF#1187368 ASC NULLS FIRST, COL_EA9AE57C_DE84_4BBE_9131_053814B337F4#1187369 ASC NULLS FIRST, 10), ENSURE_REQUIREMENTS, [plan_id=619608]
HashAggregate(keys=[COL_8D7490B1_ED4B_4A07_9680_ECC66DF49E37#1187362, COL_7F6B8B23_E564_4B4E_8794_0FC7CE59D60B#1187363, COL_B6440F86_8BD4_4AFD_8640_45556688ABB9#1187364], functions=[])
WholeStageCodegen (3)
AQEShuffleRead coalesced
Exchange hashpartitioning(COL_8D7490B1_ED4B_4A07_9680_ECC66DF49E37#1187362, COL_7F6B8B23_E564_4B4E_8794_0FC7CE59D60B#1187363, COL_B6440F86_8BD4_4AFD_8640_45556688ABB9#1187364, 10), ENSURE_REQUIREMENTS, [plan_id=619511]
HashAggregate(keys=[COL_8D7490B1_ED4B_4A07_9680_ECC66DF49E37#1187362, COL_7F6B8B23_E564_4B4E_8794_0FC7CE59D60B#1187363, COL_B6440F86_8BD4_4AFD_8640_45556688ABB9#1187364], functions=[])
Project [COL_BC7CB40E_B2CA_42C4_94A5_B6AA996E14DC#1187323 AS COL_8D7490B1_ED4B_4A07_9680_ECC66DF49E37#1187362, col0#1187340 AS COL_7F6B8B23_E564_4B4E_8794_0FC7CE59D60B#1187363, col1#1187341 AS COL_B6440F86_8BD4_4AFD_8640_45556688ABB9#1187364]
Generate stack(7, 04-Date Naissance, COL_95E23023_63AA_4AB8_A60F_50D45234CFDD#1187324, 05-Date Entree, COL_78B23D10_75E8_415E_A3C0_8AB5C826A837#1187325, 06-Date Sortie, COL_885784F8_1772_40E3_89B6_6ACE1FAB6407#1187326, 07-Fides, COL_32AA235F_1BB1_4047_B8BA_AD2E9197AD1F#1187327, 08-Facturable AM, COL_3BBA8558_C3D5_4921_93AE_D7C9E273B39D#1187328, 09-Justif Exo, COL_35788C71_38EE_4A08_B685_AAC68457246A#1187329, 10-Nature Ass, COL_6EC95BD9_A121_4728_BE4A_49B7EA2976F2#1187330), [COL_BC7CB40E_B2CA_42C4_94A5_B6AA996E14DC#1187323], false, [col0#1187340, col1#1187341]
Project [COL_F76265AB_8748_4114_92B4_00E37DE25D34#1187001 AS COL_BC7CB40E_B2CA_42C4_94A5_B6AA996E14DC#1187323, COL_9262BBED_C393_416D_B38C_8F1458965BA7#1187000 AS COL_95E23023_63AA_4AB8_A60F_50D45234CFDD#1187324, COL_96E2282E_0771_460E_8BDB_D11261BD9020#1187002 AS COL_78B23D10_75E8_415E_A3C0_8AB5C826A837#1187325, COL_12028397_66B1_4E3C_BBDB_64537606E7DE#1187003 AS COL_885784F8_1772_40E3_89B6_6ACE1FAB6407#1187326, COL_0521CAB9_7617_4F31_948E_95DCA16387D7#1186998 AS COL_32AA235F_1BB1_4047_B8BA_AD2E9197AD1F#1187327, COL_1DACB81E_AFA5_4BB8_83D7_57DE8B8062B7#1186999 AS COL_3BBA8558_C3D5_4921_93AE_D7C9E273B39D#1187328, COL_4473F770_A575_4100_97F6_8190F900749A#1187007 AS COL_35788C71_38EE_4A08_B685_AAC68457246A#1187329, COL_715B3479_EAD2_422C_BF5C_7B020197D946#1187008 AS COL_6EC95BD9_A121_4728_BE4A_49B7EA2976F2#1187330]
ColumnarToRow
WholeStageCodegen (2)
FileScan parquet [COL_0521CAB9_7617_4F31_948E_95DCA16387D7#1186998,COL_1DACB81E_AFA5_4BB8_83D7_57DE8B8062B7#1186999,COL_9262BBED_C393_416D_B38C_8F1458965BA7#1187000,COL_F76265AB_8748_4114_92B4_00E37DE25D34#1187001,COL_96E2282E_0771_460E_8BDB_D11261BD9020#1187002,COL_12028397_66B1_4E3C_BBDB_64537606E7DE#1187003,COL_4473F770_A575_4100_97F6_8190F900749A#1187007,COL_715B3479_EAD2_422C_BF5C_7B020197D946#1187008] Batched: true, DataFilters: [], Format: Parquet, Location: InMemoryFileIndex(1 paths)[file:/data/output/cache/parquet/datablock/02_A_ELIGIBLE_176076], PartitionFilters: [], PushedFilters: [], ReadSchema: struct<COL_0521CAB9_7617_4F31_948E_95DCA16387D7:string,COL_1DACB81E_AFA5_4BB8_83D7_57DE8B8062B7:s...