Project [CASE WHEN ((fractile#94076962 = NA) OR (fractile#94076962 = null)) THEN null ELSE cast(fractile#94076962 as float) END AS fractile#94076996, CASE WHEN ((overall#94076963 = NA) OR (overall#94076963 = null)) THEN null ELSE cast(overall#94076963 as int) END AS overall#94076997, CASE WHEN ((annual_ret#94076964 = NA) OR (annual_ret#94076964 = null)) THEN null ELSE cast(annual_ret#94076964 as float) END AS annual_ret#94076998, CASE WHEN ((annual_resret#94076965 = NA) OR (annual_resret#94076965 = null)) THEN null ELSE cast(annual_resret#94076965 as float) END AS annual_resret#94077004, CASE WHEN ((numcos#94076966 = NA) OR (numcos#94076966 = null)) THEN null ELSE cast(numcos#94076966 as float) END AS numcos#94077009]
Project [CASE WHEN ((fractile#94076941 = NA) OR (fractile#94076941 = null)) THEN null ELSE cast(fractile#94076941 as float) END AS fractile#94076991, CASE WHEN ((cap#94076942 = NA) OR (cap#94076942 = null)) THEN null ELSE cast(cap#94076942 as float) END AS cap#94076992, CASE WHEN ((annual_ret#94076943 = NA) OR (annual_ret#94076943 = null)) THEN null ELSE cast(annual_ret#94076943 as float) END AS annual_ret#94076993, CASE WHEN ((annual_resret#94076944 = NA) OR (annual_resret#94076944 = null)) THEN null ELSE cast(annual_resret#94076944 as float) END AS annual_resret#94076994, CASE WHEN ((numcos#94076945 = NA) OR (numcos#94076945 = null)) THEN null ELSE cast(numcos#94076945 as float) END AS numcos#94076995]
== Physical Plan ==
CollectLimit (17)
+- * ColumnarToRow (16)
+- InMemoryTableScan (1)
+- InMemoryRelation (2)
+- Union (15)
:- * ColumnarToRow (7)
: +- InMemoryTableScan (3)
: +- InMemoryRelation (4)
: +- * Project (6)
: +- Scan csv (5)
+- * Project (14)
+- * Filter (13)
+- * ColumnarToRow (12)
+- InMemoryTableScan (8)
+- InMemoryRelation (9)
+- * Project (11)
+- Scan csv (10)
(1) InMemoryTableScan
Output [4]: [fractile#94076996, annual_ret#94076998, annual_resret#94077004, numcos#94077009]
Arguments: [fractile#94076996, annual_ret#94076998, annual_resret#94077004, numcos#94077009]
(2) InMemoryRelation
Arguments: [fractile#94076996, annual_ret#94076998, annual_resret#94077004, numcos#94077009], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),Union
:- *(1) ColumnarToRow
: +- InMemoryTableScan [fractile#94076996, annual_ret#94076998, annual_resret#94077004, numcos#94077009]
: +- InMemoryRelation [fractile#94076996, overall#94076997, annual_ret#94076998, annual_resret#94077004, numcos#94077009], StorageLevel(disk, memory, deserialized, 1 replicas)
: +- *(1) Project [CASE WHEN ((fractile#94076962 = NA) OR (fractile#94076962 = null)) THEN null ELSE cast(fractile#94076962 as float) END AS fractile#94076996, CASE WHEN ((overall#94076963 = NA) OR (overall#94076963 = null)) THEN null ELSE cast(overall#94076963 as int) END AS overall#94076997, CASE WHEN ((annual_ret#94076964 = NA) OR (annual_ret#94076964 = null)) THEN null ELSE cast(annual_ret#94076964 as float) END AS annual_ret#94076998, CASE WHEN ((annual_resret#94076965 = NA) OR (annual_resret#94076965 = null)) THEN null ELSE cast(annual_resret#94076965 as float) END AS annual_resret#94077004, CASE WHEN ((numcos#94076966 = NA) OR (numcos#94076966 = null)) THEN null ELSE cast(numcos#94076966 as float) END AS numcos#94077009]
: +- FileScan csv [fractile#94076962,overall#94076963,annual_ret#94076964,annual_resret#94076965,numcos#94076966] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/volatilit..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<fractile:string,overall:string,annual_ret:string,annual_resret:string,numcos:string>
+- *(2) Project [fractile#94076991, annual_ret#94076993, annual_resret#94076994, numcos#94076995]
+- *(2) Filter (isnotnull(cap#94076992) AND (cast(cap#94076992 as string) = 0))
+- *(2) ColumnarToRow
+- InMemoryTableScan [annual_resret#94076994, annual_ret#94076993, cap#94076992, fractile#94076991, numcos#94076995], [isnotnull(cap#94076992), (cast(cap#94076992 as string) = 0)]
+- InMemoryRelation [fractile#94076991, cap#94076992, annual_ret#94076993, annual_resret#94076994, numcos#94076995], StorageLevel(disk, memory, deserialized, 1 replicas)
+- *(1) Project [CASE WHEN ((fractile#94076941 = NA) OR (fractile#94076941 = null)) THEN null ELSE cast(fractile#94076941 as float) END AS fractile#94076991, CASE WHEN ((cap#94076942 = NA) OR (cap#94076942 = null)) THEN null ELSE cast(cap#94076942 as float) END AS cap#94076992, CASE WHEN ((annual_ret#94076943 = NA) OR (annual_ret#94076943 = null)) THEN null ELSE cast(annual_ret#94076943 as float) END AS annual_ret#94076993, CASE WHEN ((annual_resret#94076944 = NA) OR (annual_resret#94076944 = null)) THEN null ELSE cast(annual_resret#94076944 as float) END AS annual_resret#94076994, CASE WHEN ((numcos#94076945 = NA) OR (numcos#94076945 = null)) THEN null ELSE cast(numcos#94076945 as float) END AS numcos#94076995]
+- FileScan csv [fractile#94076941,cap#94076942,annual_ret#94076943,annual_resret#94076944,numcos#94076945] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/volatilit..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<fractile:string,cap:string,annual_ret:string,annual_resret:string,numcos:string>
,None)
(3) InMemoryTableScan
Output [4]: [fractile#94076996, annual_ret#94076998, annual_resret#94077004, numcos#94077009]
Arguments: [fractile#94076996, annual_ret#94076998, annual_resret#94077004, numcos#94077009]
(4) InMemoryRelation
Arguments: [fractile#94076996, overall#94076997, annual_ret#94076998, annual_resret#94077004, numcos#94077009], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((fractile#94076962 = NA) OR (fractile#94076962 = null)) THEN null ELSE cast(fractile#94076962 as float) END AS fractile#94076996, CASE WHEN ((overall#94076963 = NA) OR (overall#94076963 = null)) THEN null ELSE cast(overall#94076963 as int) END AS overall#94076997, CASE WHEN ((annual_ret#94076964 = NA) OR (annual_ret#94076964 = null)) THEN null ELSE cast(annual_ret#94076964 as float) END AS annual_ret#94076998, CASE WHEN ((annual_resret#94076965 = NA) OR (annual_resret#94076965 = null)) THEN null ELSE cast(annual_resret#94076965 as float) END AS annual_resret#94077004, CASE WHEN ((numcos#94076966 = NA) OR (numcos#94076966 = null)) THEN null ELSE cast(numcos#94076966 as float) END AS numcos#94077009]
+- FileScan csv [fractile#94076962,overall#94076963,annual_ret#94076964,annual_resret#94076965,numcos#94076966] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/volatilit..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<fractile:string,overall:string,annual_ret:string,annual_resret:string,numcos:string>
,None)
(5) Scan csv
Output [5]: [fractile#94076962, overall#94076963, annual_ret#94076964, annual_resret#94076965, numcos#94076966]
Batched: false
Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/risk_factors/volatility/fractiles_individually_overall.csv]
ReadSchema: struct<fractile:string,overall:string,annual_ret:string,annual_resret:string,numcos:string>
(6) Project [codegen id : 1]
Output [5]: [CASE WHEN ((fractile#94076962 = NA) OR (fractile#94076962 = null)) THEN null ELSE cast(fractile#94076962 as float) END AS fractile#94076996, CASE WHEN ((overall#94076963 = NA) OR (overall#94076963 = null)) THEN null ELSE cast(overall#94076963 as int) END AS overall#94076997, CASE WHEN ((annual_ret#94076964 = NA) OR (annual_ret#94076964 = null)) THEN null ELSE cast(annual_ret#94076964 as float) END AS annual_ret#94076998, CASE WHEN ((annual_resret#94076965 = NA) OR (annual_resret#94076965 = null)) THEN null ELSE cast(annual_resret#94076965 as float) END AS annual_resret#94077004, CASE WHEN ((numcos#94076966 = NA) OR (numcos#94076966 = null)) THEN null ELSE cast(numcos#94076966 as float) END AS numcos#94077009]
Input [5]: [fractile#94076962, overall#94076963, annual_ret#94076964, annual_resret#94076965, numcos#94076966]
(7) ColumnarToRow [codegen id : 1]
Input [4]: [fractile#94076996, annual_ret#94076998, annual_resret#94077004, numcos#94077009]
(8) InMemoryTableScan
Output [5]: [annual_resret#94076994, annual_ret#94076993, cap#94076992, fractile#94076991, numcos#94076995]
Arguments: [annual_resret#94076994, annual_ret#94076993, cap#94076992, fractile#94076991, numcos#94076995], [isnotnull(cap#94076992), (cast(cap#94076992 as string) = 0)]
(9) InMemoryRelation
Arguments: [fractile#94076991, cap#94076992, annual_ret#94076993, annual_resret#94076994, numcos#94076995], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((fractile#94076941 = NA) OR (fractile#94076941 = null)) THEN null ELSE cast(fractile#94076941 as float) END AS fractile#94076991, CASE WHEN ((cap#94076942 = NA) OR (cap#94076942 = null)) THEN null ELSE cast(cap#94076942 as float) END AS cap#94076992, CASE WHEN ((annual_ret#94076943 = NA) OR (annual_ret#94076943 = null)) THEN null ELSE cast(annual_ret#94076943 as float) END AS annual_ret#94076993, CASE WHEN ((annual_resret#94076944 = NA) OR (annual_resret#94076944 = null)) THEN null ELSE cast(annual_resret#94076944 as float) END AS annual_resret#94076994, CASE WHEN ((numcos#94076945 = NA) OR (numcos#94076945 = null)) THEN null ELSE cast(numcos#94076945 as float) END AS numcos#94076995]
+- FileScan csv [fractile#94076941,cap#94076942,annual_ret#94076943,annual_resret#94076944,numcos#94076945] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/volatilit..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<fractile:string,cap:string,annual_ret:string,annual_resret:string,numcos:string>
,None)
(10) Scan csv
Output [5]: [fractile#94076941, cap#94076942, annual_ret#94076943, annual_resret#94076944, numcos#94076945]
Batched: false
Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/risk_factors/volatility/fractiles_individually_cap.csv]
ReadSchema: struct<fractile:string,cap:string,annual_ret:string,annual_resret:string,numcos:string>
(11) Project [codegen id : 1]
Output [5]: [CASE WHEN ((fractile#94076941 = NA) OR (fractile#94076941 = null)) THEN null ELSE cast(fractile#94076941 as float) END AS fractile#94076991, CASE WHEN ((cap#94076942 = NA) OR (cap#94076942 = null)) THEN null ELSE cast(cap#94076942 as float) END AS cap#94076992, CASE WHEN ((annual_ret#94076943 = NA) OR (annual_ret#94076943 = null)) THEN null ELSE cast(annual_ret#94076943 as float) END AS annual_ret#94076993, CASE WHEN ((annual_resret#94076944 = NA) OR (annual_resret#94076944 = null)) THEN null ELSE cast(annual_resret#94076944 as float) END AS annual_resret#94076994, CASE WHEN ((numcos#94076945 = NA) OR (numcos#94076945 = null)) THEN null ELSE cast(numcos#94076945 as float) END AS numcos#94076995]
Input [5]: [fractile#94076941, cap#94076942, annual_ret#94076943, annual_resret#94076944, numcos#94076945]
(12) ColumnarToRow [codegen id : 2]
Input [5]: [annual_resret#94076994, annual_ret#94076993, cap#94076992, fractile#94076991, numcos#94076995]
(13) Filter [codegen id : 2]
Input [5]: [annual_resret#94076994, annual_ret#94076993, cap#94076992, fractile#94076991, numcos#94076995]
Condition : (isnotnull(cap#94076992) AND (cast(cap#94076992 as string) = 0))
(14) Project [codegen id : 2]
Output [4]: [fractile#94076991, annual_ret#94076993, annual_resret#94076994, numcos#94076995]
Input [5]: [annual_resret#94076994, annual_ret#94076993, cap#94076992, fractile#94076991, numcos#94076995]
(15) Union
(16) ColumnarToRow [codegen id : 1]
Input [4]: [fractile#94076996, annual_ret#94076998, annual_resret#94077004, numcos#94077009]
(17) CollectLimit
Input [4]: [fractile#94076996, annual_ret#94076998, annual_resret#94077004, numcos#94077009]
Arguments: 1000000