== Physical Plan == CollectLimit (11) +- * ColumnarToRow (10) +- InMemoryTableScan (1) +- InMemoryRelation (2) +- * Project (9) +- * Filter (8) +- * ColumnarToRow (7) +- InMemoryTableScan (3) +- InMemoryRelation (4) +- * Project (6) +- Scan csv (5) (1) InMemoryTableScan Output [7]: [yield#94114023, volatility#94114019, momentum#94114021, size#94114012, value#94114014, growth#94114016, leverage#94114017] Arguments: [yield#94114023, volatility#94114019, momentum#94114021, size#94114012, value#94114014, growth#94114016, leverage#94114017] (2) InMemoryRelation Arguments: [yield#94114023, volatility#94114019, momentum#94114021, size#94114012, value#94114014, growth#94114016, leverage#94114017], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [yield#94114023, volatility#94114019, momentum#94114021, size#94114012, value#94114014, growth#94114016, leverage#94114017] +- *(1) Filter (isnotnull(cap#94114006) AND (cap#94114006 = 0.0)) +- *(1) ColumnarToRow +- InMemoryTableScan [cap#94114006, growth#94114016, leverage#94114017, momentum#94114021, size#94114012, value#94114014, volatility#94114019, yield#94114023], [isnotnull(cap#94114006), (cap#94114006 = 0.0)] +- InMemoryRelation [overall#94114005, cap#94114006, retIC#94114008, resretIC#94114010, size#94114012, value#94114014, growth#94114016, leverage#94114017, volatility#94114019, momentum#94114021, yield#94114023, numcos#94114025, numdates#94114026, annual_bmret#94114028, annual_ret#94114030, std_ret#94114032, Sharpe_ret#94114033, PctPos_ret#94114035, TR_ret#94114037, IR_ret#94114039, annual_resret#94114040, std_resret#94114042, Sharpe_resret#94114044, PctPos_resret#94114046, ... 9 more fields], StorageLevel(disk, memory, deserialized, 1 replicas) +- *(1) Project [CASE WHEN ((overall#94113773 = NA) OR (overall#94113773 = null)) THEN null ELSE cast(overall#94113773 as int) END AS overall#94114005, CASE WHEN ((cap#94113774 = NA) OR (cap#94113774 = null)) THEN null ELSE cast(cap#94113774 as float) END AS cap#94114006, CASE WHEN ((retIC#94113775 = NA) OR (retIC#94113775 = null)) THEN null ELSE cast(retIC#94113775 as float) END AS retIC#94114008, CASE WHEN ((resretIC#94113776 = NA) OR (resretIC#94113776 = null)) THEN null ELSE cast(resretIC#94113776 as float) END AS resretIC#94114010, CASE WHEN ((size#94113777 = NA) OR (size#94113777 = null)) THEN null ELSE cast(size#94113777 as float) END AS size#94114012, CASE WHEN ((value#94113778 = NA) OR (value#94113778 = null)) THEN null ELSE cast(value#94113778 as float) END AS value#94114014, CASE WHEN ((growth#94113779 = NA) OR (growth#94113779 = null)) THEN null ELSE cast(growth#94113779 as float) END AS growth#94114016, CASE WHEN ((leverage#94113780 = NA) OR (leverage#94113780 = null)) THEN null ELSE cast(leverage#94113780 as float) END AS leverage#94114017, CASE WHEN ((volatility#94113781 = NA) OR (volatility#94113781 = null)) THEN null ELSE cast(volatility#94113781 as float) END AS volatility#94114019, CASE WHEN ((momentum#94113782 = NA) OR (momentum#94113782 = null)) THEN null ELSE cast(momentum#94113782 as float) END AS momentum#94114021, CASE WHEN ((yield#94113783 = NA) OR (yield#94113783 = null)) THEN null ELSE cast(yield#94113783 as float) END AS yield#94114023, CASE WHEN ((numcos#94113784 = NA) OR (numcos#94113784 = null)) THEN null ELSE cast(numcos#94113784 as float) END AS numcos#94114025, CASE WHEN ((numdates#94113785 = NA) OR (numdates#94113785 = null)) THEN null ELSE cast(numdates#94113785 as float) END AS numdates#94114026, CASE WHEN ((annual_bmret#94113786 = NA) OR (annual_bmret#94113786 = null)) THEN null ELSE cast(annual_bmret#94113786 as float) END AS annual_bmret#94114028, CASE WHEN ((annual_ret#94113787 = NA) OR (annual_ret#94113787 = null)) THEN null ELSE cast(annual_ret#94113787 as float) END AS annual_ret#94114030, CASE WHEN ((std_ret#94113788 = NA) OR (std_ret#94113788 = null)) THEN null ELSE cast(std_ret#94113788 as float) END AS std_ret#94114032, CASE WHEN ((Sharpe_ret#94113789 = NA) OR (Sharpe_ret#94113789 = null)) THEN null ELSE cast(Sharpe_ret#94113789 as float) END AS Sharpe_ret#94114033, CASE WHEN ((PctPos_ret#94113790 = NA) OR (PctPos_ret#94113790 = null)) THEN null ELSE cast(PctPos_ret#94113790 as float) END AS PctPos_ret#94114035, CASE WHEN ((TR_ret#94113791 = NA) OR (TR_ret#94113791 = null)) THEN null ELSE cast(TR_ret#94113791 as float) END AS TR_ret#94114037, CASE WHEN ((IR_ret#94113792 = NA) OR (IR_ret#94113792 = null)) THEN null ELSE cast(IR_ret#94113792 as float) END AS IR_ret#94114039, CASE WHEN ((annual_resret#94113793 = NA) OR (annual_resret#94113793 = null)) THEN null ELSE cast(annual_resret#94113793 as float) END AS annual_resret#94114040, CASE WHEN ((std_resret#94113794 = NA) OR (std_resret#94113794 = null)) THEN null ELSE cast(std_resret#94113794 as float) END AS std_resret#94114042, CASE WHEN ((Sharpe_resret#94113795 = NA) OR (Sharpe_resret#94113795 = null)) THEN null ELSE cast(Sharpe_resret#94113795 as float) END AS Sharpe_resret#94114044, CASE WHEN ((PctPos_resret#94113796 = NA) OR (PctPos_resret#94113796 = null)) THEN null ELSE cast(PctPos_resret#94113796 as float) END AS PctPos_resret#94114046, ... 9 more fields] +- FileScan csv [overall#94113773,cap#94113774,retIC#94113775,resretIC#94113776,size#94113777,value#94113778,growth#94113779,leverage#94113780,volatility#94113781,momentum#94113782,yield#94113783,numcos#94113784,numdates#94113785,annual_bmret#94113786,annual_ret#94113787,std_ret#94113788,Sharpe_ret#94113789,PctPos_ret#94113790,TR_ret#94113791,IR_ret#94113792,annual_resret#94113793,std_resret#94113794,Sharpe_resret#94113795,PctPos_resret#94113796,... 9 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/tm1/eatm1_score/stats_..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:str... ,None) (3) InMemoryTableScan Output [8]: [cap#94114006, growth#94114016, leverage#94114017, momentum#94114021, size#94114012, value#94114014, volatility#94114019, yield#94114023] Arguments: [cap#94114006, growth#94114016, leverage#94114017, momentum#94114021, size#94114012, value#94114014, volatility#94114019, yield#94114023], [isnotnull(cap#94114006), (cap#94114006 = 0.0)] (4) InMemoryRelation Arguments: [overall#94114005, cap#94114006, retIC#94114008, resretIC#94114010, size#94114012, value#94114014, growth#94114016, leverage#94114017, volatility#94114019, momentum#94114021, yield#94114023, numcos#94114025, numdates#94114026, annual_bmret#94114028, annual_ret#94114030, std_ret#94114032, Sharpe_ret#94114033, PctPos_ret#94114035, TR_ret#94114037, IR_ret#94114039, annual_resret#94114040, std_resret#94114042, Sharpe_resret#94114044, PctPos_resret#94114046, ... 9 more fields], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((overall#94113773 = NA) OR (overall#94113773 = null)) THEN null ELSE cast(overall#94113773 as int) END AS overall#94114005, CASE WHEN ((cap#94113774 = NA) OR (cap#94113774 = null)) THEN null ELSE cast(cap#94113774 as float) END AS cap#94114006, CASE WHEN ((retIC#94113775 = NA) OR (retIC#94113775 = null)) THEN null ELSE cast(retIC#94113775 as float) END AS retIC#94114008, CASE WHEN ((resretIC#94113776 = NA) OR (resretIC#94113776 = null)) THEN null ELSE cast(resretIC#94113776 as float) END AS resretIC#94114010, CASE WHEN ((size#94113777 = NA) OR (size#94113777 = null)) THEN null ELSE cast(size#94113777 as float) END AS size#94114012, CASE WHEN ((value#94113778 = NA) OR (value#94113778 = null)) THEN null ELSE cast(value#94113778 as float) END AS value#94114014, CASE WHEN ((growth#94113779 = NA) OR (growth#94113779 = null)) THEN null ELSE cast(growth#94113779 as float) END AS growth#94114016, CASE WHEN ((leverage#94113780 = NA) OR (leverage#94113780 = null)) THEN null ELSE cast(leverage#94113780 as float) END AS leverage#94114017, CASE WHEN ((volatility#94113781 = NA) OR (volatility#94113781 = null)) THEN null ELSE cast(volatility#94113781 as float) END AS volatility#94114019, CASE WHEN ((momentum#94113782 = NA) OR (momentum#94113782 = null)) THEN null ELSE cast(momentum#94113782 as float) END AS momentum#94114021, CASE WHEN ((yield#94113783 = NA) OR (yield#94113783 = null)) THEN null ELSE cast(yield#94113783 as float) END AS yield#94114023, CASE WHEN ((numcos#94113784 = NA) OR (numcos#94113784 = null)) THEN null ELSE cast(numcos#94113784 as float) END AS numcos#94114025, CASE WHEN ((numdates#94113785 = NA) OR (numdates#94113785 = null)) THEN null ELSE cast(numdates#94113785 as float) END AS numdates#94114026, CASE WHEN ((annual_bmret#94113786 = NA) OR (annual_bmret#94113786 = null)) THEN null ELSE cast(annual_bmret#94113786 as float) END AS annual_bmret#94114028, CASE WHEN ((annual_ret#94113787 = NA) OR (annual_ret#94113787 = null)) THEN null ELSE cast(annual_ret#94113787 as float) END AS annual_ret#94114030, CASE WHEN ((std_ret#94113788 = NA) OR (std_ret#94113788 = null)) THEN null ELSE cast(std_ret#94113788 as float) END AS std_ret#94114032, CASE WHEN ((Sharpe_ret#94113789 = NA) OR (Sharpe_ret#94113789 = null)) THEN null ELSE cast(Sharpe_ret#94113789 as float) END AS Sharpe_ret#94114033, CASE WHEN ((PctPos_ret#94113790 = NA) OR (PctPos_ret#94113790 = null)) THEN null ELSE cast(PctPos_ret#94113790 as float) END AS PctPos_ret#94114035, CASE WHEN ((TR_ret#94113791 = NA) OR (TR_ret#94113791 = null)) THEN null ELSE cast(TR_ret#94113791 as float) END AS TR_ret#94114037, CASE WHEN ((IR_ret#94113792 = NA) OR (IR_ret#94113792 = null)) THEN null ELSE cast(IR_ret#94113792 as float) END AS IR_ret#94114039, CASE WHEN ((annual_resret#94113793 = NA) OR (annual_resret#94113793 = null)) THEN null ELSE cast(annual_resret#94113793 as float) END AS annual_resret#94114040, CASE WHEN ((std_resret#94113794 = NA) OR (std_resret#94113794 = null)) THEN null ELSE cast(std_resret#94113794 as float) END AS std_resret#94114042, CASE WHEN ((Sharpe_resret#94113795 = NA) OR (Sharpe_resret#94113795 = null)) THEN null ELSE cast(Sharpe_resret#94113795 as float) END AS Sharpe_resret#94114044, CASE WHEN ((PctPos_resret#94113796 = NA) OR (PctPos_resret#94113796 = null)) THEN null ELSE cast(PctPos_resret#94113796 as float) END AS PctPos_resret#94114046, ... 9 more fields] +- FileScan csv [overall#94113773,cap#94113774,retIC#94113775,resretIC#94113776,size#94113777,value#94113778,growth#94113779,leverage#94113780,volatility#94113781,momentum#94113782,yield#94113783,numcos#94113784,numdates#94113785,annual_bmret#94113786,annual_ret#94113787,std_ret#94113788,Sharpe_ret#94113789,PctPos_ret#94113790,TR_ret#94113791,IR_ret#94113792,annual_resret#94113793,std_resret#94113794,Sharpe_resret#94113795,PctPos_resret#94113796,... 9 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/tm1/eatm1_score/stats_..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:str... ,None) (5) Scan csv Output [33]: [overall#94113773, cap#94113774, retIC#94113775, resretIC#94113776, size#94113777, value#94113778, growth#94113779, leverage#94113780, volatility#94113781, momentum#94113782, yield#94113783, numcos#94113784, numdates#94113785, annual_bmret#94113786, annual_ret#94113787, std_ret#94113788, Sharpe_ret#94113789, PctPos_ret#94113790, TR_ret#94113791, IR_ret#94113792, annual_resret#94113793, std_resret#94113794, Sharpe_resret#94113795, PctPos_resret#94113796, TR_resret#94113797, IR_resret#94113798, annual_retnet#94113799, std_retnet#94113800, Sharpe_retnet#94113801, PctPos_retnet#94113802, TR_retnet#94113803, IR_retnet#94113804, turnover#94113805] Batched: false Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/tm1/eatm1_score/stats_overall.csv] ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:string,leverage:string,volatility:string,momentum:string,yield:string,numcos:string,numdates:string,annual_bmret:string,annual_ret:string,std_ret:string,Sharpe_ret:string,PctPos_ret:string,TR_ret:string,IR_ret:string,annual_resret:string,std_resret:string,Sharpe_resret:string,PctPos_resret:string,TR_resret:string,IR_resret:string,annual_retnet:string,std_retnet:string,Sharpe_retnet:string,PctPos_retnet:string,TR_retnet:string,IR_retnet:string,turnover:string> (6) Project [codegen id : 1] Output [33]: [CASE WHEN ((overall#94113773 = NA) OR (overall#94113773 = null)) THEN null ELSE cast(overall#94113773 as int) END AS overall#94114005, CASE WHEN ((cap#94113774 = NA) OR (cap#94113774 = null)) THEN null ELSE cast(cap#94113774 as float) END AS cap#94114006, CASE WHEN ((retIC#94113775 = NA) OR (retIC#94113775 = null)) THEN null ELSE cast(retIC#94113775 as float) END AS retIC#94114008, CASE WHEN ((resretIC#94113776 = NA) OR (resretIC#94113776 = null)) THEN null ELSE cast(resretIC#94113776 as float) END AS resretIC#94114010, CASE WHEN ((size#94113777 = NA) OR (size#94113777 = null)) THEN null ELSE cast(size#94113777 as float) END AS size#94114012, CASE WHEN ((value#94113778 = NA) OR (value#94113778 = null)) THEN null ELSE cast(value#94113778 as float) END AS value#94114014, CASE WHEN ((growth#94113779 = NA) OR (growth#94113779 = null)) THEN null ELSE cast(growth#94113779 as float) END AS growth#94114016, CASE WHEN ((leverage#94113780 = NA) OR (leverage#94113780 = null)) THEN null ELSE cast(leverage#94113780 as float) END AS leverage#94114017, CASE WHEN ((volatility#94113781 = NA) OR (volatility#94113781 = null)) THEN null ELSE cast(volatility#94113781 as float) END AS volatility#94114019, CASE WHEN ((momentum#94113782 = NA) OR (momentum#94113782 = null)) THEN null ELSE cast(momentum#94113782 as float) END AS momentum#94114021, CASE WHEN ((yield#94113783 = NA) OR (yield#94113783 = null)) THEN null ELSE cast(yield#94113783 as float) END AS yield#94114023, CASE WHEN ((numcos#94113784 = NA) OR (numcos#94113784 = null)) THEN null ELSE cast(numcos#94113784 as float) END AS numcos#94114025, CASE WHEN ((numdates#94113785 = NA) OR (numdates#94113785 = null)) THEN null ELSE cast(numdates#94113785 as float) END AS numdates#94114026, CASE WHEN ((annual_bmret#94113786 = NA) OR (annual_bmret#94113786 = null)) THEN null ELSE cast(annual_bmret#94113786 as float) END AS annual_bmret#94114028, CASE WHEN ((annual_ret#94113787 = NA) OR (annual_ret#94113787 = null)) THEN null ELSE cast(annual_ret#94113787 as float) END AS annual_ret#94114030, CASE WHEN ((std_ret#94113788 = NA) OR (std_ret#94113788 = null)) THEN null ELSE cast(std_ret#94113788 as float) END AS std_ret#94114032, CASE WHEN ((Sharpe_ret#94113789 = NA) OR (Sharpe_ret#94113789 = null)) THEN null ELSE cast(Sharpe_ret#94113789 as float) END AS Sharpe_ret#94114033, CASE WHEN ((PctPos_ret#94113790 = NA) OR (PctPos_ret#94113790 = null)) THEN null ELSE cast(PctPos_ret#94113790 as float) END AS PctPos_ret#94114035, CASE WHEN ((TR_ret#94113791 = NA) OR (TR_ret#94113791 = null)) THEN null ELSE cast(TR_ret#94113791 as float) END AS TR_ret#94114037, CASE WHEN ((IR_ret#94113792 = NA) OR (IR_ret#94113792 = null)) THEN null ELSE cast(IR_ret#94113792 as float) END AS IR_ret#94114039, CASE WHEN ((annual_resret#94113793 = NA) OR (annual_resret#94113793 = null)) THEN null ELSE cast(annual_resret#94113793 as float) END AS annual_resret#94114040, CASE WHEN ((std_resret#94113794 = NA) OR (std_resret#94113794 = null)) THEN null ELSE cast(std_resret#94113794 as float) END AS std_resret#94114042, CASE WHEN ((Sharpe_resret#94113795 = NA) OR (Sharpe_resret#94113795 = null)) THEN null ELSE cast(Sharpe_resret#94113795 as float) END AS Sharpe_resret#94114044, CASE WHEN ((PctPos_resret#94113796 = NA) OR (PctPos_resret#94113796 = null)) THEN null ELSE cast(PctPos_resret#94113796 as float) END AS PctPos_resret#94114046, CASE WHEN ((TR_resret#94113797 = NA) OR (TR_resret#94113797 = null)) THEN null ELSE cast(TR_resret#94113797 as float) END AS TR_resret#94114047, CASE WHEN ((IR_resret#94113798 = NA) OR (IR_resret#94113798 = null)) THEN null ELSE cast(IR_resret#94113798 as float) END AS IR_resret#94114049, CASE WHEN ((annual_retnet#94113799 = NA) OR (annual_retnet#94113799 = null)) THEN null ELSE cast(annual_retnet#94113799 as float) END AS annual_retnet#94114051, CASE WHEN ((std_retnet#94113800 = NA) OR (std_retnet#94113800 = null)) THEN null ELSE cast(std_retnet#94113800 as float) END AS std_retnet#94114053, CASE WHEN ((Sharpe_retnet#94113801 = NA) OR (Sharpe_retnet#94113801 = null)) THEN null ELSE cast(Sharpe_retnet#94113801 as float) END AS Sharpe_retnet#94114054, CASE WHEN ((PctPos_retnet#94113802 = NA) OR (PctPos_retnet#94113802 = null)) THEN null ELSE cast(PctPos_retnet#94113802 as float) END AS PctPos_retnet#94114056, CASE WHEN ((TR_retnet#94113803 = NA) OR (TR_retnet#94113803 = null)) THEN null ELSE cast(TR_retnet#94113803 as float) END AS TR_retnet#94114058, CASE WHEN ((IR_retnet#94113804 = NA) OR (IR_retnet#94113804 = null)) THEN null ELSE cast(IR_retnet#94113804 as float) END AS IR_retnet#94114060, CASE WHEN ((turnover#94113805 = NA) OR (turnover#94113805 = null)) THEN null ELSE cast(turnover#94113805 as float) END AS turnover#94114062] Input [33]: [overall#94113773, cap#94113774, retIC#94113775, resretIC#94113776, size#94113777, value#94113778, growth#94113779, leverage#94113780, volatility#94113781, momentum#94113782, yield#94113783, numcos#94113784, numdates#94113785, annual_bmret#94113786, annual_ret#94113787, std_ret#94113788, Sharpe_ret#94113789, PctPos_ret#94113790, TR_ret#94113791, IR_ret#94113792, annual_resret#94113793, std_resret#94113794, Sharpe_resret#94113795, PctPos_resret#94113796, TR_resret#94113797, IR_resret#94113798, annual_retnet#94113799, std_retnet#94113800, Sharpe_retnet#94113801, PctPos_retnet#94113802, TR_retnet#94113803, IR_retnet#94113804, turnover#94113805] (7) ColumnarToRow [codegen id : 1] Input [8]: [cap#94114006, growth#94114016, leverage#94114017, momentum#94114021, size#94114012, value#94114014, volatility#94114019, yield#94114023] (8) Filter [codegen id : 1] Input [8]: [cap#94114006, growth#94114016, leverage#94114017, momentum#94114021, size#94114012, value#94114014, volatility#94114019, yield#94114023] Condition : (isnotnull(cap#94114006) AND (cap#94114006 = 0.0)) (9) Project [codegen id : 1] Output [7]: [yield#94114023, volatility#94114019, momentum#94114021, size#94114012, value#94114014, growth#94114016, leverage#94114017] Input [8]: [cap#94114006, growth#94114016, leverage#94114017, momentum#94114021, size#94114012, value#94114014, volatility#94114019, yield#94114023] (10) ColumnarToRow [codegen id : 1] Input [7]: [yield#94114023, volatility#94114019, momentum#94114021, size#94114012, value#94114014, growth#94114016, leverage#94114017] (11) CollectLimit Input [7]: [yield#94114023, volatility#94114019, momentum#94114021, size#94114012, value#94114014, growth#94114016, leverage#94114017] Arguments: 1000000