== Physical Plan == CollectLimit (11) +- * ColumnarToRow (10) +- InMemoryTableScan (1) +- InMemoryRelation (2) +- * Project (9) +- * Filter (8) +- * ColumnarToRow (7) +- InMemoryTableScan (3) +- InMemoryRelation (4) +- * Project (6) +- Scan csv (5) (1) InMemoryTableScan Output [7]: [yield#94129030, volatility#94129027, momentum#94129028, size#94129019, value#94129021, growth#94129023, leverage#94129025] Arguments: [yield#94129030, volatility#94129027, momentum#94129028, size#94129019, value#94129021, growth#94129023, leverage#94129025] (2) InMemoryRelation Arguments: [yield#94129030, volatility#94129027, momentum#94129028, size#94129019, value#94129021, growth#94129023, leverage#94129025], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [yield#94129030, volatility#94129027, momentum#94129028, size#94129019, value#94129021, growth#94129023, leverage#94129025] +- *(1) Filter (isnotnull(cap#94129014) AND (cap#94129014 = 0.0)) +- *(1) ColumnarToRow +- InMemoryTableScan [cap#94129014, growth#94129023, leverage#94129025, momentum#94129028, size#94129019, value#94129021, volatility#94129027, yield#94129030], [isnotnull(cap#94129014), (cap#94129014 = 0.0)] +- InMemoryRelation [overall#94129012, cap#94129014, retIC#94129016, resretIC#94129018, size#94129019, value#94129021, growth#94129023, leverage#94129025, volatility#94129027, momentum#94129028, yield#94129030, numcos#94129032, numdates#94129034, annual_bmret#94129036, annual_ret#94129037, std_ret#94129039, Sharpe_ret#94129041, PctPos_ret#94129042, TR_ret#94129044, IR_ret#94129046, annual_resret#94129048, std_resret#94129049, Sharpe_resret#94129051, PctPos_resret#94129053, ... 9 more fields], StorageLevel(disk, memory, deserialized, 1 replicas) +- *(1) Project [CASE WHEN ((overall#94128830 = NA) OR (overall#94128830 = null)) THEN null ELSE cast(overall#94128830 as int) END AS overall#94129012, CASE WHEN ((cap#94128831 = NA) OR (cap#94128831 = null)) THEN null ELSE cast(cap#94128831 as float) END AS cap#94129014, CASE WHEN ((retIC#94128832 = NA) OR (retIC#94128832 = null)) THEN null ELSE cast(retIC#94128832 as float) END AS retIC#94129016, CASE WHEN ((resretIC#94128833 = NA) OR (resretIC#94128833 = null)) THEN null ELSE cast(resretIC#94128833 as float) END AS resretIC#94129018, CASE WHEN ((size#94128834 = NA) OR (size#94128834 = null)) THEN null ELSE cast(size#94128834 as float) END AS size#94129019, CASE WHEN ((value#94128835 = NA) OR (value#94128835 = null)) THEN null ELSE cast(value#94128835 as float) END AS value#94129021, CASE WHEN ((growth#94128836 = NA) OR (growth#94128836 = null)) THEN null ELSE cast(growth#94128836 as float) END AS growth#94129023, CASE WHEN ((leverage#94128837 = NA) OR (leverage#94128837 = null)) THEN null ELSE cast(leverage#94128837 as float) END AS leverage#94129025, CASE WHEN ((volatility#94128838 = NA) OR (volatility#94128838 = null)) THEN null ELSE cast(volatility#94128838 as float) END AS volatility#94129027, CASE WHEN ((momentum#94128839 = NA) OR (momentum#94128839 = null)) THEN null ELSE cast(momentum#94128839 as float) END AS momentum#94129028, CASE WHEN ((yield#94128840 = NA) OR (yield#94128840 = null)) THEN null ELSE cast(yield#94128840 as float) END AS yield#94129030, CASE WHEN ((numcos#94128841 = NA) OR (numcos#94128841 = null)) THEN null ELSE cast(numcos#94128841 as float) END AS numcos#94129032, CASE WHEN ((numdates#94128842 = NA) OR (numdates#94128842 = null)) THEN null ELSE cast(numdates#94128842 as float) END AS numdates#94129034, CASE WHEN ((annual_bmret#94128843 = NA) OR (annual_bmret#94128843 = null)) THEN null ELSE cast(annual_bmret#94128843 as float) END AS annual_bmret#94129036, CASE WHEN ((annual_ret#94128844 = NA) OR (annual_ret#94128844 = null)) THEN null ELSE cast(annual_ret#94128844 as float) END AS annual_ret#94129037, CASE WHEN ((std_ret#94128845 = NA) OR (std_ret#94128845 = null)) THEN null ELSE cast(std_ret#94128845 as float) END AS std_ret#94129039, CASE WHEN ((Sharpe_ret#94128846 = NA) OR (Sharpe_ret#94128846 = null)) THEN null ELSE cast(Sharpe_ret#94128846 as float) END AS Sharpe_ret#94129041, CASE WHEN ((PctPos_ret#94128847 = NA) OR (PctPos_ret#94128847 = null)) THEN null ELSE cast(PctPos_ret#94128847 as float) END AS PctPos_ret#94129042, CASE WHEN ((TR_ret#94128848 = NA) OR (TR_ret#94128848 = null)) THEN null ELSE cast(TR_ret#94128848 as float) END AS TR_ret#94129044, CASE WHEN ((IR_ret#94128849 = NA) OR (IR_ret#94128849 = null)) THEN null ELSE cast(IR_ret#94128849 as float) END AS IR_ret#94129046, CASE WHEN ((annual_resret#94128850 = NA) OR (annual_resret#94128850 = null)) THEN null ELSE cast(annual_resret#94128850 as float) END AS annual_resret#94129048, CASE WHEN ((std_resret#94128851 = NA) OR (std_resret#94128851 = null)) THEN null ELSE cast(std_resret#94128851 as float) END AS std_resret#94129049, CASE WHEN ((Sharpe_resret#94128852 = NA) OR (Sharpe_resret#94128852 = null)) THEN null ELSE cast(Sharpe_resret#94128852 as float) END AS Sharpe_resret#94129051, CASE WHEN ((PctPos_resret#94128853 = NA) OR (PctPos_resret#94128853 = null)) THEN null ELSE cast(PctPos_resret#94128853 as float) END AS PctPos_resret#94129053, ... 9 more fields] +- FileScan csv [overall#94128830,cap#94128831,retIC#94128832,resretIC#94128833,size#94128834,value#94128835,growth#94128836,leverage#94128837,volatility#94128838,momentum#94128839,yield#94128840,numcos#94128841,numdates#94128842,annual_bmret#94128843,annual_ret#94128844,std_ret#94128845,Sharpe_ret#94128846,PctPos_ret#94128847,TR_ret#94128848,IR_ret#94128849,annual_resret#94128850,std_resret#94128851,Sharpe_resret#94128852,PctPos_resret#94128853,... 9 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/transcripts/transcript..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:str... ,None) (3) InMemoryTableScan Output [8]: [cap#94129014, growth#94129023, leverage#94129025, momentum#94129028, size#94129019, value#94129021, volatility#94129027, yield#94129030] Arguments: [cap#94129014, growth#94129023, leverage#94129025, momentum#94129028, size#94129019, value#94129021, volatility#94129027, yield#94129030], [isnotnull(cap#94129014), (cap#94129014 = 0.0)] (4) InMemoryRelation Arguments: [overall#94129012, cap#94129014, retIC#94129016, resretIC#94129018, size#94129019, value#94129021, growth#94129023, leverage#94129025, volatility#94129027, momentum#94129028, yield#94129030, numcos#94129032, numdates#94129034, annual_bmret#94129036, annual_ret#94129037, std_ret#94129039, Sharpe_ret#94129041, PctPos_ret#94129042, TR_ret#94129044, IR_ret#94129046, annual_resret#94129048, std_resret#94129049, Sharpe_resret#94129051, PctPos_resret#94129053, ... 9 more fields], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((overall#94128830 = NA) OR (overall#94128830 = null)) THEN null ELSE cast(overall#94128830 as int) END AS overall#94129012, CASE WHEN ((cap#94128831 = NA) OR (cap#94128831 = null)) THEN null ELSE cast(cap#94128831 as float) END AS cap#94129014, CASE WHEN ((retIC#94128832 = NA) OR (retIC#94128832 = null)) THEN null ELSE cast(retIC#94128832 as float) END AS retIC#94129016, CASE WHEN ((resretIC#94128833 = NA) OR (resretIC#94128833 = null)) THEN null ELSE cast(resretIC#94128833 as float) END AS resretIC#94129018, CASE WHEN ((size#94128834 = NA) OR (size#94128834 = null)) THEN null ELSE cast(size#94128834 as float) END AS size#94129019, CASE WHEN ((value#94128835 = NA) OR (value#94128835 = null)) THEN null ELSE cast(value#94128835 as float) END AS value#94129021, CASE WHEN ((growth#94128836 = NA) OR (growth#94128836 = null)) THEN null ELSE cast(growth#94128836 as float) END AS growth#94129023, CASE WHEN ((leverage#94128837 = NA) OR (leverage#94128837 = null)) THEN null ELSE cast(leverage#94128837 as float) END AS leverage#94129025, CASE WHEN ((volatility#94128838 = NA) OR (volatility#94128838 = null)) THEN null ELSE cast(volatility#94128838 as float) END AS volatility#94129027, CASE WHEN ((momentum#94128839 = NA) OR (momentum#94128839 = null)) THEN null ELSE cast(momentum#94128839 as float) END AS momentum#94129028, CASE WHEN ((yield#94128840 = NA) OR (yield#94128840 = null)) THEN null ELSE cast(yield#94128840 as float) END AS yield#94129030, CASE WHEN ((numcos#94128841 = NA) OR (numcos#94128841 = null)) THEN null ELSE cast(numcos#94128841 as float) END AS numcos#94129032, CASE WHEN ((numdates#94128842 = NA) OR (numdates#94128842 = null)) THEN null ELSE cast(numdates#94128842 as float) END AS numdates#94129034, CASE WHEN ((annual_bmret#94128843 = NA) OR (annual_bmret#94128843 = null)) THEN null ELSE cast(annual_bmret#94128843 as float) END AS annual_bmret#94129036, CASE WHEN ((annual_ret#94128844 = NA) OR (annual_ret#94128844 = null)) THEN null ELSE cast(annual_ret#94128844 as float) END AS annual_ret#94129037, CASE WHEN ((std_ret#94128845 = NA) OR (std_ret#94128845 = null)) THEN null ELSE cast(std_ret#94128845 as float) END AS std_ret#94129039, CASE WHEN ((Sharpe_ret#94128846 = NA) OR (Sharpe_ret#94128846 = null)) THEN null ELSE cast(Sharpe_ret#94128846 as float) END AS Sharpe_ret#94129041, CASE WHEN ((PctPos_ret#94128847 = NA) OR (PctPos_ret#94128847 = null)) THEN null ELSE cast(PctPos_ret#94128847 as float) END AS PctPos_ret#94129042, CASE WHEN ((TR_ret#94128848 = NA) OR (TR_ret#94128848 = null)) THEN null ELSE cast(TR_ret#94128848 as float) END AS TR_ret#94129044, CASE WHEN ((IR_ret#94128849 = NA) OR (IR_ret#94128849 = null)) THEN null ELSE cast(IR_ret#94128849 as float) END AS IR_ret#94129046, CASE WHEN ((annual_resret#94128850 = NA) OR (annual_resret#94128850 = null)) THEN null ELSE cast(annual_resret#94128850 as float) END AS annual_resret#94129048, CASE WHEN ((std_resret#94128851 = NA) OR (std_resret#94128851 = null)) THEN null ELSE cast(std_resret#94128851 as float) END AS std_resret#94129049, CASE WHEN ((Sharpe_resret#94128852 = NA) OR (Sharpe_resret#94128852 = null)) THEN null ELSE cast(Sharpe_resret#94128852 as float) END AS Sharpe_resret#94129051, CASE WHEN ((PctPos_resret#94128853 = NA) OR (PctPos_resret#94128853 = null)) THEN null ELSE cast(PctPos_resret#94128853 as float) END AS PctPos_resret#94129053, ... 9 more fields] +- FileScan csv [overall#94128830,cap#94128831,retIC#94128832,resretIC#94128833,size#94128834,value#94128835,growth#94128836,leverage#94128837,volatility#94128838,momentum#94128839,yield#94128840,numcos#94128841,numdates#94128842,annual_bmret#94128843,annual_ret#94128844,std_ret#94128845,Sharpe_ret#94128846,PctPos_ret#94128847,TR_ret#94128848,IR_ret#94128849,annual_resret#94128850,std_resret#94128851,Sharpe_resret#94128852,PctPos_resret#94128853,... 9 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/transcripts/transcript..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:str... ,None) (5) Scan csv Output [33]: [overall#94128830, cap#94128831, retIC#94128832, resretIC#94128833, size#94128834, value#94128835, growth#94128836, leverage#94128837, volatility#94128838, momentum#94128839, yield#94128840, numcos#94128841, numdates#94128842, annual_bmret#94128843, annual_ret#94128844, std_ret#94128845, Sharpe_ret#94128846, PctPos_ret#94128847, TR_ret#94128848, IR_ret#94128849, annual_resret#94128850, std_resret#94128851, Sharpe_resret#94128852, PctPos_resret#94128853, TR_resret#94128854, IR_resret#94128855, annual_retnet#94128856, std_retnet#94128857, Sharpe_retnet#94128858, PctPos_retnet#94128859, TR_retnet#94128860, IR_retnet#94128861, turnover#94128862] Batched: false Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/transcripts/transcript_model_residualized/stats_overall.csv] ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:string,leverage:string,volatility:string,momentum:string,yield:string,numcos:string,numdates:string,annual_bmret:string,annual_ret:string,std_ret:string,Sharpe_ret:string,PctPos_ret:string,TR_ret:string,IR_ret:string,annual_resret:string,std_resret:string,Sharpe_resret:string,PctPos_resret:string,TR_resret:string,IR_resret:string,annual_retnet:string,std_retnet:string,Sharpe_retnet:string,PctPos_retnet:string,TR_retnet:string,IR_retnet:string,turnover:string> (6) Project [codegen id : 1] Output [33]: [CASE WHEN ((overall#94128830 = NA) OR (overall#94128830 = null)) THEN null ELSE cast(overall#94128830 as int) END AS overall#94129012, CASE WHEN ((cap#94128831 = NA) OR (cap#94128831 = null)) THEN null ELSE cast(cap#94128831 as float) END AS cap#94129014, CASE WHEN ((retIC#94128832 = NA) OR (retIC#94128832 = null)) THEN null ELSE cast(retIC#94128832 as float) END AS retIC#94129016, CASE WHEN ((resretIC#94128833 = NA) OR (resretIC#94128833 = null)) THEN null ELSE cast(resretIC#94128833 as float) END AS resretIC#94129018, CASE WHEN ((size#94128834 = NA) OR (size#94128834 = null)) THEN null ELSE cast(size#94128834 as float) END AS size#94129019, CASE WHEN ((value#94128835 = NA) OR (value#94128835 = null)) THEN null ELSE cast(value#94128835 as float) END AS value#94129021, CASE WHEN ((growth#94128836 = NA) OR (growth#94128836 = null)) THEN null ELSE cast(growth#94128836 as float) END AS growth#94129023, CASE WHEN ((leverage#94128837 = NA) OR (leverage#94128837 = null)) THEN null ELSE cast(leverage#94128837 as float) END AS leverage#94129025, CASE WHEN ((volatility#94128838 = NA) OR (volatility#94128838 = null)) THEN null ELSE cast(volatility#94128838 as float) END AS volatility#94129027, CASE WHEN ((momentum#94128839 = NA) OR (momentum#94128839 = null)) THEN null ELSE cast(momentum#94128839 as float) END AS momentum#94129028, CASE WHEN ((yield#94128840 = NA) OR (yield#94128840 = null)) THEN null ELSE cast(yield#94128840 as float) END AS yield#94129030, CASE WHEN ((numcos#94128841 = NA) OR (numcos#94128841 = null)) THEN null ELSE cast(numcos#94128841 as float) END AS numcos#94129032, CASE WHEN ((numdates#94128842 = NA) OR (numdates#94128842 = null)) THEN null ELSE cast(numdates#94128842 as float) END AS numdates#94129034, CASE WHEN ((annual_bmret#94128843 = NA) OR (annual_bmret#94128843 = null)) THEN null ELSE cast(annual_bmret#94128843 as float) END AS annual_bmret#94129036, CASE WHEN ((annual_ret#94128844 = NA) OR (annual_ret#94128844 = null)) THEN null ELSE cast(annual_ret#94128844 as float) END AS annual_ret#94129037, CASE WHEN ((std_ret#94128845 = NA) OR (std_ret#94128845 = null)) THEN null ELSE cast(std_ret#94128845 as float) END AS std_ret#94129039, CASE WHEN ((Sharpe_ret#94128846 = NA) OR (Sharpe_ret#94128846 = null)) THEN null ELSE cast(Sharpe_ret#94128846 as float) END AS Sharpe_ret#94129041, CASE WHEN ((PctPos_ret#94128847 = NA) OR (PctPos_ret#94128847 = null)) THEN null ELSE cast(PctPos_ret#94128847 as float) END AS PctPos_ret#94129042, CASE WHEN ((TR_ret#94128848 = NA) OR (TR_ret#94128848 = null)) THEN null ELSE cast(TR_ret#94128848 as float) END AS TR_ret#94129044, CASE WHEN ((IR_ret#94128849 = NA) OR (IR_ret#94128849 = null)) THEN null ELSE cast(IR_ret#94128849 as float) END AS IR_ret#94129046, CASE WHEN ((annual_resret#94128850 = NA) OR (annual_resret#94128850 = null)) THEN null ELSE cast(annual_resret#94128850 as float) END AS annual_resret#94129048, CASE WHEN ((std_resret#94128851 = NA) OR (std_resret#94128851 = null)) THEN null ELSE cast(std_resret#94128851 as float) END AS std_resret#94129049, CASE WHEN ((Sharpe_resret#94128852 = NA) OR (Sharpe_resret#94128852 = null)) THEN null ELSE cast(Sharpe_resret#94128852 as float) END AS Sharpe_resret#94129051, CASE WHEN ((PctPos_resret#94128853 = NA) OR (PctPos_resret#94128853 = null)) THEN null ELSE cast(PctPos_resret#94128853 as float) END AS PctPos_resret#94129053, CASE WHEN ((TR_resret#94128854 = NA) OR (TR_resret#94128854 = null)) THEN null ELSE cast(TR_resret#94128854 as float) END AS TR_resret#94129055, CASE WHEN ((IR_resret#94128855 = NA) OR (IR_resret#94128855 = null)) THEN null ELSE cast(IR_resret#94128855 as float) END AS IR_resret#94129056, CASE WHEN ((annual_retnet#94128856 = NA) OR (annual_retnet#94128856 = null)) THEN null ELSE cast(annual_retnet#94128856 as float) END AS annual_retnet#94129058, CASE WHEN ((std_retnet#94128857 = NA) OR (std_retnet#94128857 = null)) THEN null ELSE cast(std_retnet#94128857 as float) END AS std_retnet#94129060, CASE WHEN ((Sharpe_retnet#94128858 = NA) OR (Sharpe_retnet#94128858 = null)) THEN null ELSE cast(Sharpe_retnet#94128858 as float) END AS Sharpe_retnet#94129062, CASE WHEN ((PctPos_retnet#94128859 = NA) OR (PctPos_retnet#94128859 = null)) THEN null ELSE cast(PctPos_retnet#94128859 as float) END AS PctPos_retnet#94129063, CASE WHEN ((TR_retnet#94128860 = NA) OR (TR_retnet#94128860 = null)) THEN null ELSE cast(TR_retnet#94128860 as float) END AS TR_retnet#94129065, CASE WHEN ((IR_retnet#94128861 = NA) OR (IR_retnet#94128861 = null)) THEN null ELSE cast(IR_retnet#94128861 as float) END AS IR_retnet#94129067, CASE WHEN ((turnover#94128862 = NA) OR (turnover#94128862 = null)) THEN null ELSE cast(turnover#94128862 as float) END AS turnover#94129068] Input [33]: [overall#94128830, cap#94128831, retIC#94128832, resretIC#94128833, size#94128834, value#94128835, growth#94128836, leverage#94128837, volatility#94128838, momentum#94128839, yield#94128840, numcos#94128841, numdates#94128842, annual_bmret#94128843, annual_ret#94128844, std_ret#94128845, Sharpe_ret#94128846, PctPos_ret#94128847, TR_ret#94128848, IR_ret#94128849, annual_resret#94128850, std_resret#94128851, Sharpe_resret#94128852, PctPos_resret#94128853, TR_resret#94128854, IR_resret#94128855, annual_retnet#94128856, std_retnet#94128857, Sharpe_retnet#94128858, PctPos_retnet#94128859, TR_retnet#94128860, IR_retnet#94128861, turnover#94128862] (7) ColumnarToRow [codegen id : 1] Input [8]: [cap#94129014, growth#94129023, leverage#94129025, momentum#94129028, size#94129019, value#94129021, volatility#94129027, yield#94129030] (8) Filter [codegen id : 1] Input [8]: [cap#94129014, growth#94129023, leverage#94129025, momentum#94129028, size#94129019, value#94129021, volatility#94129027, yield#94129030] Condition : (isnotnull(cap#94129014) AND (cap#94129014 = 0.0)) (9) Project [codegen id : 1] Output [7]: [yield#94129030, volatility#94129027, momentum#94129028, size#94129019, value#94129021, growth#94129023, leverage#94129025] Input [8]: [cap#94129014, growth#94129023, leverage#94129025, momentum#94129028, size#94129019, value#94129021, volatility#94129027, yield#94129030] (10) ColumnarToRow [codegen id : 1] Input [7]: [yield#94129030, volatility#94129027, momentum#94129028, size#94129019, value#94129021, growth#94129023, leverage#94129025] (11) CollectLimit Input [7]: [yield#94129030, volatility#94129027, momentum#94129028, size#94129019, value#94129021, growth#94129023, leverage#94129025] Arguments: 1000000