Project [CASE WHEN ((fractile#94019614 = NA) OR (fractile#94019614 = null)) THEN null ELSE cast(fractile#94019614 as float) END AS fractile#94019634, CASE WHEN ((overall#94019615 = NA) OR (overall#94019615 = null)) THEN null ELSE cast(overall#94019615 as int) END AS overall#94019635, CASE WHEN ((annual_ret#94019616 = NA) OR (annual_ret#94019616 = null)) THEN null ELSE cast(annual_ret#94019616 as float) END AS annual_ret#94019636, CASE WHEN ((annual_resret#94019617 = NA) OR (annual_resret#94019617 = null)) THEN null ELSE cast(annual_resret#94019617 as float) END AS annual_resret#94019637, CASE WHEN ((numcos#94019618 = NA) OR (numcos#94019618 = null)) THEN null ELSE cast(numcos#94019618 as float) END AS numcos#94019638]
Project [CASE WHEN ((fractile#94019731 = NA) OR (fractile#94019731 = null)) THEN null ELSE cast(fractile#94019731 as float) END AS fractile#94019797, CASE WHEN ((cap#94019732 = NA) OR (cap#94019732 = null)) THEN null ELSE cast(cap#94019732 as float) END AS cap#94019799, CASE WHEN ((annual_ret#94019733 = NA) OR (annual_ret#94019733 = null)) THEN null ELSE cast(annual_ret#94019733 as float) END AS annual_ret#94019823, CASE WHEN ((annual_resret#94019734 = NA) OR (annual_resret#94019734 = null)) THEN null ELSE cast(annual_resret#94019734 as float) END AS annual_resret#94019848, CASE WHEN ((numcos#94019735 = NA) OR (numcos#94019735 = null)) THEN null ELSE cast(numcos#94019735 as float) END AS numcos#94019872]
== Physical Plan ==
CollectLimit (17)
+- * ColumnarToRow (16)
+- InMemoryTableScan (1)
+- InMemoryRelation (2)
+- Union (15)
:- * ColumnarToRow (7)
: +- InMemoryTableScan (3)
: +- InMemoryRelation (4)
: +- * Project (6)
: +- Scan csv (5)
+- * Project (14)
+- * Filter (13)
+- * ColumnarToRow (12)
+- InMemoryTableScan (8)
+- InMemoryRelation (9)
+- * Project (11)
+- Scan csv (10)
(1) InMemoryTableScan
Output [4]: [fractile#94019634, annual_ret#94019636, annual_resret#94019637, numcos#94019638]
Arguments: [fractile#94019634, annual_ret#94019636, annual_resret#94019637, numcos#94019638]
(2) InMemoryRelation
Arguments: [fractile#94019634, annual_ret#94019636, annual_resret#94019637, numcos#94019638], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),Union
:- *(1) ColumnarToRow
: +- InMemoryTableScan [fractile#94019634, annual_ret#94019636, annual_resret#94019637, numcos#94019638]
: +- InMemoryRelation [fractile#94019634, overall#94019635, annual_ret#94019636, annual_resret#94019637, numcos#94019638], StorageLevel(disk, memory, deserialized, 1 replicas)
: +- *(1) Project [CASE WHEN ((fractile#94019614 = NA) OR (fractile#94019614 = null)) THEN null ELSE cast(fractile#94019614 as float) END AS fractile#94019634, CASE WHEN ((overall#94019615 = NA) OR (overall#94019615 = null)) THEN null ELSE cast(overall#94019615 as int) END AS overall#94019635, CASE WHEN ((annual_ret#94019616 = NA) OR (annual_ret#94019616 = null)) THEN null ELSE cast(annual_ret#94019616 as float) END AS annual_ret#94019636, CASE WHEN ((annual_resret#94019617 = NA) OR (annual_resret#94019617 = null)) THEN null ELSE cast(annual_resret#94019617 as float) END AS annual_resret#94019637, CASE WHEN ((numcos#94019618 = NA) OR (numcos#94019618 = null)) THEN null ELSE cast(numcos#94019618 as float) END AS numcos#94019638]
: +- FileScan csv [fractile#94019614,overall#94019615,annual_ret#94019616,annual_resret#94019617,numcos#94019618] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/growth/fr..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<fractile:string,overall:string,annual_ret:string,annual_resret:string,numcos:string>
+- *(2) Project [fractile#94019797, annual_ret#94019823, annual_resret#94019848, numcos#94019872]
+- *(2) Filter (isnotnull(cap#94019799) AND (cast(cap#94019799 as string) = 0))
+- *(2) ColumnarToRow
+- InMemoryTableScan [annual_resret#94019848, annual_ret#94019823, cap#94019799, fractile#94019797, numcos#94019872], [isnotnull(cap#94019799), (cast(cap#94019799 as string) = 0)]
+- InMemoryRelation [fractile#94019797, cap#94019799, annual_ret#94019823, annual_resret#94019848, numcos#94019872], StorageLevel(disk, memory, deserialized, 1 replicas)
+- *(1) Project [CASE WHEN ((fractile#94019731 = NA) OR (fractile#94019731 = null)) THEN null ELSE cast(fractile#94019731 as float) END AS fractile#94019797, CASE WHEN ((cap#94019732 = NA) OR (cap#94019732 = null)) THEN null ELSE cast(cap#94019732 as float) END AS cap#94019799, CASE WHEN ((annual_ret#94019733 = NA) OR (annual_ret#94019733 = null)) THEN null ELSE cast(annual_ret#94019733 as float) END AS annual_ret#94019823, CASE WHEN ((annual_resret#94019734 = NA) OR (annual_resret#94019734 = null)) THEN null ELSE cast(annual_resret#94019734 as float) END AS annual_resret#94019848, CASE WHEN ((numcos#94019735 = NA) OR (numcos#94019735 = null)) THEN null ELSE cast(numcos#94019735 as float) END AS numcos#94019872]
+- FileScan csv [fractile#94019731,cap#94019732,annual_ret#94019733,annual_resret#94019734,numcos#94019735] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/growth/fr..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<fractile:string,cap:string,annual_ret:string,annual_resret:string,numcos:string>
,None)
(3) InMemoryTableScan
Output [4]: [fractile#94019634, annual_ret#94019636, annual_resret#94019637, numcos#94019638]
Arguments: [fractile#94019634, annual_ret#94019636, annual_resret#94019637, numcos#94019638]
(4) InMemoryRelation
Arguments: [fractile#94019634, overall#94019635, annual_ret#94019636, annual_resret#94019637, numcos#94019638], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((fractile#94019614 = NA) OR (fractile#94019614 = null)) THEN null ELSE cast(fractile#94019614 as float) END AS fractile#94019634, CASE WHEN ((overall#94019615 = NA) OR (overall#94019615 = null)) THEN null ELSE cast(overall#94019615 as int) END AS overall#94019635, CASE WHEN ((annual_ret#94019616 = NA) OR (annual_ret#94019616 = null)) THEN null ELSE cast(annual_ret#94019616 as float) END AS annual_ret#94019636, CASE WHEN ((annual_resret#94019617 = NA) OR (annual_resret#94019617 = null)) THEN null ELSE cast(annual_resret#94019617 as float) END AS annual_resret#94019637, CASE WHEN ((numcos#94019618 = NA) OR (numcos#94019618 = null)) THEN null ELSE cast(numcos#94019618 as float) END AS numcos#94019638]
+- FileScan csv [fractile#94019614,overall#94019615,annual_ret#94019616,annual_resret#94019617,numcos#94019618] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/growth/fr..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<fractile:string,overall:string,annual_ret:string,annual_resret:string,numcos:string>
,None)
(5) Scan csv
Output [5]: [fractile#94019614, overall#94019615, annual_ret#94019616, annual_resret#94019617, numcos#94019618]
Batched: false
Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/risk_factors/growth/fractiles_individually_overall.csv]
ReadSchema: struct<fractile:string,overall:string,annual_ret:string,annual_resret:string,numcos:string>
(6) Project [codegen id : 1]
Output [5]: [CASE WHEN ((fractile#94019614 = NA) OR (fractile#94019614 = null)) THEN null ELSE cast(fractile#94019614 as float) END AS fractile#94019634, CASE WHEN ((overall#94019615 = NA) OR (overall#94019615 = null)) THEN null ELSE cast(overall#94019615 as int) END AS overall#94019635, CASE WHEN ((annual_ret#94019616 = NA) OR (annual_ret#94019616 = null)) THEN null ELSE cast(annual_ret#94019616 as float) END AS annual_ret#94019636, CASE WHEN ((annual_resret#94019617 = NA) OR (annual_resret#94019617 = null)) THEN null ELSE cast(annual_resret#94019617 as float) END AS annual_resret#94019637, CASE WHEN ((numcos#94019618 = NA) OR (numcos#94019618 = null)) THEN null ELSE cast(numcos#94019618 as float) END AS numcos#94019638]
Input [5]: [fractile#94019614, overall#94019615, annual_ret#94019616, annual_resret#94019617, numcos#94019618]
(7) ColumnarToRow [codegen id : 1]
Input [4]: [fractile#94019634, annual_ret#94019636, annual_resret#94019637, numcos#94019638]
(8) InMemoryTableScan
Output [5]: [annual_resret#94019848, annual_ret#94019823, cap#94019799, fractile#94019797, numcos#94019872]
Arguments: [annual_resret#94019848, annual_ret#94019823, cap#94019799, fractile#94019797, numcos#94019872], [isnotnull(cap#94019799), (cast(cap#94019799 as string) = 0)]
(9) InMemoryRelation
Arguments: [fractile#94019797, cap#94019799, annual_ret#94019823, annual_resret#94019848, numcos#94019872], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((fractile#94019731 = NA) OR (fractile#94019731 = null)) THEN null ELSE cast(fractile#94019731 as float) END AS fractile#94019797, CASE WHEN ((cap#94019732 = NA) OR (cap#94019732 = null)) THEN null ELSE cast(cap#94019732 as float) END AS cap#94019799, CASE WHEN ((annual_ret#94019733 = NA) OR (annual_ret#94019733 = null)) THEN null ELSE cast(annual_ret#94019733 as float) END AS annual_ret#94019823, CASE WHEN ((annual_resret#94019734 = NA) OR (annual_resret#94019734 = null)) THEN null ELSE cast(annual_resret#94019734 as float) END AS annual_resret#94019848, CASE WHEN ((numcos#94019735 = NA) OR (numcos#94019735 = null)) THEN null ELSE cast(numcos#94019735 as float) END AS numcos#94019872]
+- FileScan csv [fractile#94019731,cap#94019732,annual_ret#94019733,annual_resret#94019734,numcos#94019735] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/growth/fr..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<fractile:string,cap:string,annual_ret:string,annual_resret:string,numcos:string>
,None)
(10) Scan csv
Output [5]: [fractile#94019731, cap#94019732, annual_ret#94019733, annual_resret#94019734, numcos#94019735]
Batched: false
Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/risk_factors/growth/fractiles_individually_cap.csv]
ReadSchema: struct<fractile:string,cap:string,annual_ret:string,annual_resret:string,numcos:string>
(11) Project [codegen id : 1]
Output [5]: [CASE WHEN ((fractile#94019731 = NA) OR (fractile#94019731 = null)) THEN null ELSE cast(fractile#94019731 as float) END AS fractile#94019797, CASE WHEN ((cap#94019732 = NA) OR (cap#94019732 = null)) THEN null ELSE cast(cap#94019732 as float) END AS cap#94019799, CASE WHEN ((annual_ret#94019733 = NA) OR (annual_ret#94019733 = null)) THEN null ELSE cast(annual_ret#94019733 as float) END AS annual_ret#94019823, CASE WHEN ((annual_resret#94019734 = NA) OR (annual_resret#94019734 = null)) THEN null ELSE cast(annual_resret#94019734 as float) END AS annual_resret#94019848, CASE WHEN ((numcos#94019735 = NA) OR (numcos#94019735 = null)) THEN null ELSE cast(numcos#94019735 as float) END AS numcos#94019872]
Input [5]: [fractile#94019731, cap#94019732, annual_ret#94019733, annual_resret#94019734, numcos#94019735]
(12) ColumnarToRow [codegen id : 2]
Input [5]: [annual_resret#94019848, annual_ret#94019823, cap#94019799, fractile#94019797, numcos#94019872]
(13) Filter [codegen id : 2]
Input [5]: [annual_resret#94019848, annual_ret#94019823, cap#94019799, fractile#94019797, numcos#94019872]
Condition : (isnotnull(cap#94019799) AND (cast(cap#94019799 as string) = 0))
(14) Project [codegen id : 2]
Output [4]: [fractile#94019797, annual_ret#94019823, annual_resret#94019848, numcos#94019872]
Input [5]: [annual_resret#94019848, annual_ret#94019823, cap#94019799, fractile#94019797, numcos#94019872]
(15) Union
(16) ColumnarToRow [codegen id : 1]
Input [4]: [fractile#94019634, annual_ret#94019636, annual_resret#94019637, numcos#94019638]
(17) CollectLimit
Input [4]: [fractile#94019634, annual_ret#94019636, annual_resret#94019637, numcos#94019638]
Arguments: 1000000