== Physical Plan == CollectLimit (11) +- * ColumnarToRow (10) +- InMemoryTableScan (1) +- InMemoryRelation (2) +- * Project (9) +- * Filter (8) +- * ColumnarToRow (7) +- InMemoryTableScan (3) +- InMemoryRelation (4) +- * Project (6) +- Scan csv (5) (1) InMemoryTableScan Output [7]: [yield#93984822, volatility#93984819, momentum#93984821, size#93984812, value#93984813, growth#93984815, leverage#93984817] Arguments: [yield#93984822, volatility#93984819, momentum#93984821, size#93984812, value#93984813, growth#93984815, leverage#93984817] (2) InMemoryRelation Arguments: [yield#93984822, volatility#93984819, momentum#93984821, size#93984812, value#93984813, growth#93984815, leverage#93984817], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [yield#93984822, volatility#93984819, momentum#93984821, size#93984812, value#93984813, growth#93984815, leverage#93984817] +- *(1) Filter (isnotnull(cap#93984806) AND (cap#93984806 = 0.0)) +- *(1) ColumnarToRow +- InMemoryTableScan [cap#93984806, growth#93984815, leverage#93984817, momentum#93984821, size#93984812, value#93984813, volatility#93984819, yield#93984822], [isnotnull(cap#93984806), (cap#93984806 = 0.0)] +- InMemoryRelation [overall#93984804, cap#93984806, retIC#93984808, resretIC#93984810, size#93984812, value#93984813, growth#93984815, leverage#93984817, volatility#93984819, momentum#93984821, yield#93984822, numcos#93984824, numdates#93984826, annual_bmret#93984828, annual_ret#93984830, std_ret#93984832, Sharpe_ret#93984834, PctPos_ret#93984836, TR_ret#93984837, IR_ret#93984838, annual_resret#93984839, std_resret#93984840, Sharpe_resret#93984841, PctPos_resret#93984842, ... 9 more fields], StorageLevel(disk, memory, deserialized, 1 replicas) +- *(1) Project [CASE WHEN ((overall#93984612 = NA) OR (overall#93984612 = null)) THEN null ELSE cast(overall#93984612 as float) END AS overall#93984804, CASE WHEN ((cap#93984613 = NA) OR (cap#93984613 = null)) THEN null ELSE cast(cap#93984613 as float) END AS cap#93984806, CASE WHEN ((retIC#93984614 = NA) OR (retIC#93984614 = null)) THEN null ELSE cast(retIC#93984614 as float) END AS retIC#93984808, CASE WHEN ((resretIC#93984615 = NA) OR (resretIC#93984615 = null)) THEN null ELSE cast(resretIC#93984615 as float) END AS resretIC#93984810, CASE WHEN ((size#93984616 = NA) OR (size#93984616 = null)) THEN null ELSE cast(size#93984616 as float) END AS size#93984812, CASE WHEN ((value#93984617 = NA) OR (value#93984617 = null)) THEN null ELSE cast(value#93984617 as float) END AS value#93984813, CASE WHEN ((growth#93984618 = NA) OR (growth#93984618 = null)) THEN null ELSE cast(growth#93984618 as float) END AS growth#93984815, CASE WHEN ((leverage#93984619 = NA) OR (leverage#93984619 = null)) THEN null ELSE cast(leverage#93984619 as float) END AS leverage#93984817, CASE WHEN ((volatility#93984620 = NA) OR (volatility#93984620 = null)) THEN null ELSE cast(volatility#93984620 as float) END AS volatility#93984819, CASE WHEN ((momentum#93984621 = NA) OR (momentum#93984621 = null)) THEN null ELSE cast(momentum#93984621 as float) END AS momentum#93984821, CASE WHEN ((yield#93984622 = NA) OR (yield#93984622 = null)) THEN null ELSE cast(yield#93984622 as float) END AS yield#93984822, CASE WHEN ((numcos#93984623 = NA) OR (numcos#93984623 = null)) THEN null ELSE cast(numcos#93984623 as float) END AS numcos#93984824, CASE WHEN ((numdates#93984624 = NA) OR (numdates#93984624 = null)) THEN null ELSE cast(numdates#93984624 as float) END AS numdates#93984826, CASE WHEN ((annual_bmret#93984625 = NA) OR (annual_bmret#93984625 = null)) THEN null ELSE cast(annual_bmret#93984625 as float) END AS annual_bmret#93984828, CASE WHEN ((annual_ret#93984626 = NA) OR (annual_ret#93984626 = null)) THEN null ELSE cast(annual_ret#93984626 as float) END AS annual_ret#93984830, CASE WHEN ((std_ret#93984627 = NA) OR (std_ret#93984627 = null)) THEN null ELSE cast(std_ret#93984627 as float) END AS std_ret#93984832, CASE WHEN ((Sharpe_ret#93984628 = NA) OR (Sharpe_ret#93984628 = null)) THEN null ELSE cast(Sharpe_ret#93984628 as float) END AS Sharpe_ret#93984834, CASE WHEN ((PctPos_ret#93984629 = NA) OR (PctPos_ret#93984629 = null)) THEN null ELSE cast(PctPos_ret#93984629 as float) END AS PctPos_ret#93984836, CASE WHEN ((TR_ret#93984630 = NA) OR (TR_ret#93984630 = null)) THEN null ELSE cast(TR_ret#93984630 as float) END AS TR_ret#93984837, CASE WHEN ((IR_ret#93984631 = NA) OR (IR_ret#93984631 = null)) THEN null ELSE cast(IR_ret#93984631 as float) END AS IR_ret#93984838, CASE WHEN ((annual_resret#93984632 = NA) OR (annual_resret#93984632 = null)) THEN null ELSE cast(annual_resret#93984632 as float) END AS annual_resret#93984839, CASE WHEN ((std_resret#93984633 = NA) OR (std_resret#93984633 = null)) THEN null ELSE cast(std_resret#93984633 as float) END AS std_resret#93984840, CASE WHEN ((Sharpe_resret#93984634 = NA) OR (Sharpe_resret#93984634 = null)) THEN null ELSE cast(Sharpe_resret#93984634 as float) END AS Sharpe_resret#93984841, CASE WHEN ((PctPos_resret#93984635 = NA) OR (PctPos_resret#93984635 = null)) THEN null ELSE cast(PctPos_resret#93984635 as float) END AS PctPos_resret#93984842, ... 9 more fields] +- FileScan csv [overall#93984612,cap#93984613,retIC#93984614,resretIC#93984615,size#93984616,value#93984617,growth#93984618,leverage#93984619,volatility#93984620,momentum#93984621,yield#93984622,numcos#93984623,numdates#93984624,annual_bmret#93984625,annual_ret#93984626,std_ret#93984627,Sharpe_ret#93984628,PctPos_ret#93984629,TR_ret#93984630,IR_ret#93984631,annual_resret#93984632,std_resret#93984633,Sharpe_resret#93984634,PctPos_resret#93984635,... 9 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/estimize_signal_histor..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:str... ,None) (3) InMemoryTableScan Output [8]: [cap#93984806, growth#93984815, leverage#93984817, momentum#93984821, size#93984812, value#93984813, volatility#93984819, yield#93984822] Arguments: [cap#93984806, growth#93984815, leverage#93984817, momentum#93984821, size#93984812, value#93984813, volatility#93984819, yield#93984822], [isnotnull(cap#93984806), (cap#93984806 = 0.0)] (4) InMemoryRelation Arguments: [overall#93984804, cap#93984806, retIC#93984808, resretIC#93984810, size#93984812, value#93984813, growth#93984815, leverage#93984817, volatility#93984819, momentum#93984821, yield#93984822, numcos#93984824, numdates#93984826, annual_bmret#93984828, annual_ret#93984830, std_ret#93984832, Sharpe_ret#93984834, PctPos_ret#93984836, TR_ret#93984837, IR_ret#93984838, annual_resret#93984839, std_resret#93984840, Sharpe_resret#93984841, PctPos_resret#93984842, ... 9 more fields], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((overall#93984612 = NA) OR (overall#93984612 = null)) THEN null ELSE cast(overall#93984612 as float) END AS overall#93984804, CASE WHEN ((cap#93984613 = NA) OR (cap#93984613 = null)) THEN null ELSE cast(cap#93984613 as float) END AS cap#93984806, CASE WHEN ((retIC#93984614 = NA) OR (retIC#93984614 = null)) THEN null ELSE cast(retIC#93984614 as float) END AS retIC#93984808, CASE WHEN ((resretIC#93984615 = NA) OR (resretIC#93984615 = null)) THEN null ELSE cast(resretIC#93984615 as float) END AS resretIC#93984810, CASE WHEN ((size#93984616 = NA) OR (size#93984616 = null)) THEN null ELSE cast(size#93984616 as float) END AS size#93984812, CASE WHEN ((value#93984617 = NA) OR (value#93984617 = null)) THEN null ELSE cast(value#93984617 as float) END AS value#93984813, CASE WHEN ((growth#93984618 = NA) OR (growth#93984618 = null)) THEN null ELSE cast(growth#93984618 as float) END AS growth#93984815, CASE WHEN ((leverage#93984619 = NA) OR (leverage#93984619 = null)) THEN null ELSE cast(leverage#93984619 as float) END AS leverage#93984817, CASE WHEN ((volatility#93984620 = NA) OR (volatility#93984620 = null)) THEN null ELSE cast(volatility#93984620 as float) END AS volatility#93984819, CASE WHEN ((momentum#93984621 = NA) OR (momentum#93984621 = null)) THEN null ELSE cast(momentum#93984621 as float) END AS momentum#93984821, CASE WHEN ((yield#93984622 = NA) OR (yield#93984622 = null)) THEN null ELSE cast(yield#93984622 as float) END AS yield#93984822, CASE WHEN ((numcos#93984623 = NA) OR (numcos#93984623 = null)) THEN null ELSE cast(numcos#93984623 as float) END AS numcos#93984824, CASE WHEN ((numdates#93984624 = NA) OR (numdates#93984624 = null)) THEN null ELSE cast(numdates#93984624 as float) END AS numdates#93984826, CASE WHEN ((annual_bmret#93984625 = NA) OR (annual_bmret#93984625 = null)) THEN null ELSE cast(annual_bmret#93984625 as float) END AS annual_bmret#93984828, CASE WHEN ((annual_ret#93984626 = NA) OR (annual_ret#93984626 = null)) THEN null ELSE cast(annual_ret#93984626 as float) END AS annual_ret#93984830, CASE WHEN ((std_ret#93984627 = NA) OR (std_ret#93984627 = null)) THEN null ELSE cast(std_ret#93984627 as float) END AS std_ret#93984832, CASE WHEN ((Sharpe_ret#93984628 = NA) OR (Sharpe_ret#93984628 = null)) THEN null ELSE cast(Sharpe_ret#93984628 as float) END AS Sharpe_ret#93984834, CASE WHEN ((PctPos_ret#93984629 = NA) OR (PctPos_ret#93984629 = null)) THEN null ELSE cast(PctPos_ret#93984629 as float) END AS PctPos_ret#93984836, CASE WHEN ((TR_ret#93984630 = NA) OR (TR_ret#93984630 = null)) THEN null ELSE cast(TR_ret#93984630 as float) END AS TR_ret#93984837, CASE WHEN ((IR_ret#93984631 = NA) OR (IR_ret#93984631 = null)) THEN null ELSE cast(IR_ret#93984631 as float) END AS IR_ret#93984838, CASE WHEN ((annual_resret#93984632 = NA) OR (annual_resret#93984632 = null)) THEN null ELSE cast(annual_resret#93984632 as float) END AS annual_resret#93984839, CASE WHEN ((std_resret#93984633 = NA) OR (std_resret#93984633 = null)) THEN null ELSE cast(std_resret#93984633 as float) END AS std_resret#93984840, CASE WHEN ((Sharpe_resret#93984634 = NA) OR (Sharpe_resret#93984634 = null)) THEN null ELSE cast(Sharpe_resret#93984634 as float) END AS Sharpe_resret#93984841, CASE WHEN ((PctPos_resret#93984635 = NA) OR (PctPos_resret#93984635 = null)) THEN null ELSE cast(PctPos_resret#93984635 as float) END AS PctPos_resret#93984842, ... 9 more fields] +- FileScan csv [overall#93984612,cap#93984613,retIC#93984614,resretIC#93984615,size#93984616,value#93984617,growth#93984618,leverage#93984619,volatility#93984620,momentum#93984621,yield#93984622,numcos#93984623,numdates#93984624,annual_bmret#93984625,annual_ret#93984626,std_ret#93984627,Sharpe_ret#93984628,PctPos_ret#93984629,TR_ret#93984630,IR_ret#93984631,annual_resret#93984632,std_resret#93984633,Sharpe_resret#93984634,PctPos_resret#93984635,... 9 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/estimize_signal_histor..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:str... ,None) (5) Scan csv Output [33]: [overall#93984612, cap#93984613, retIC#93984614, resretIC#93984615, size#93984616, value#93984617, growth#93984618, leverage#93984619, volatility#93984620, momentum#93984621, yield#93984622, numcos#93984623, numdates#93984624, annual_bmret#93984625, annual_ret#93984626, std_ret#93984627, Sharpe_ret#93984628, PctPos_ret#93984629, TR_ret#93984630, IR_ret#93984631, annual_resret#93984632, std_resret#93984633, Sharpe_resret#93984634, PctPos_resret#93984635, TR_resret#93984636, IR_resret#93984637, annual_retnet#93984638, std_retnet#93984639, Sharpe_retnet#93984640, PctPos_retnet#93984641, TR_retnet#93984642, IR_retnet#93984643, turnover#93984644] Batched: false Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/estimize_signal_history/estimizesignal_postearnings/stats_overall.csv] ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:string,leverage:string,volatility:string,momentum:string,yield:string,numcos:string,numdates:string,annual_bmret:string,annual_ret:string,std_ret:string,Sharpe_ret:string,PctPos_ret:string,TR_ret:string,IR_ret:string,annual_resret:string,std_resret:string,Sharpe_resret:string,PctPos_resret:string,TR_resret:string,IR_resret:string,annual_retnet:string,std_retnet:string,Sharpe_retnet:string,PctPos_retnet:string,TR_retnet:string,IR_retnet:string,turnover:string> (6) Project [codegen id : 1] Output [33]: [CASE WHEN ((overall#93984612 = NA) OR (overall#93984612 = null)) THEN null ELSE cast(overall#93984612 as float) END AS overall#93984804, CASE WHEN ((cap#93984613 = NA) OR (cap#93984613 = null)) THEN null ELSE cast(cap#93984613 as float) END AS cap#93984806, CASE WHEN ((retIC#93984614 = NA) OR (retIC#93984614 = null)) THEN null ELSE cast(retIC#93984614 as float) END AS retIC#93984808, CASE WHEN ((resretIC#93984615 = NA) OR (resretIC#93984615 = null)) THEN null ELSE cast(resretIC#93984615 as float) END AS resretIC#93984810, CASE WHEN ((size#93984616 = NA) OR (size#93984616 = null)) THEN null ELSE cast(size#93984616 as float) END AS size#93984812, CASE WHEN ((value#93984617 = NA) OR (value#93984617 = null)) THEN null ELSE cast(value#93984617 as float) END AS value#93984813, CASE WHEN ((growth#93984618 = NA) OR (growth#93984618 = null)) THEN null ELSE cast(growth#93984618 as float) END AS growth#93984815, CASE WHEN ((leverage#93984619 = NA) OR (leverage#93984619 = null)) THEN null ELSE cast(leverage#93984619 as float) END AS leverage#93984817, CASE WHEN ((volatility#93984620 = NA) OR (volatility#93984620 = null)) THEN null ELSE cast(volatility#93984620 as float) END AS volatility#93984819, CASE WHEN ((momentum#93984621 = NA) OR (momentum#93984621 = null)) THEN null ELSE cast(momentum#93984621 as float) END AS momentum#93984821, CASE WHEN ((yield#93984622 = NA) OR (yield#93984622 = null)) THEN null ELSE cast(yield#93984622 as float) END AS yield#93984822, CASE WHEN ((numcos#93984623 = NA) OR (numcos#93984623 = null)) THEN null ELSE cast(numcos#93984623 as float) END AS numcos#93984824, CASE WHEN ((numdates#93984624 = NA) OR (numdates#93984624 = null)) THEN null ELSE cast(numdates#93984624 as float) END AS numdates#93984826, CASE WHEN ((annual_bmret#93984625 = NA) OR (annual_bmret#93984625 = null)) THEN null ELSE cast(annual_bmret#93984625 as float) END AS annual_bmret#93984828, CASE WHEN ((annual_ret#93984626 = NA) OR (annual_ret#93984626 = null)) THEN null ELSE cast(annual_ret#93984626 as float) END AS annual_ret#93984830, CASE WHEN ((std_ret#93984627 = NA) OR (std_ret#93984627 = null)) THEN null ELSE cast(std_ret#93984627 as float) END AS std_ret#93984832, CASE WHEN ((Sharpe_ret#93984628 = NA) OR (Sharpe_ret#93984628 = null)) THEN null ELSE cast(Sharpe_ret#93984628 as float) END AS Sharpe_ret#93984834, CASE WHEN ((PctPos_ret#93984629 = NA) OR (PctPos_ret#93984629 = null)) THEN null ELSE cast(PctPos_ret#93984629 as float) END AS PctPos_ret#93984836, CASE WHEN ((TR_ret#93984630 = NA) OR (TR_ret#93984630 = null)) THEN null ELSE cast(TR_ret#93984630 as float) END AS TR_ret#93984837, CASE WHEN ((IR_ret#93984631 = NA) OR (IR_ret#93984631 = null)) THEN null ELSE cast(IR_ret#93984631 as float) END AS IR_ret#93984838, CASE WHEN ((annual_resret#93984632 = NA) OR (annual_resret#93984632 = null)) THEN null ELSE cast(annual_resret#93984632 as float) END AS annual_resret#93984839, CASE WHEN ((std_resret#93984633 = NA) OR (std_resret#93984633 = null)) THEN null ELSE cast(std_resret#93984633 as float) END AS std_resret#93984840, CASE WHEN ((Sharpe_resret#93984634 = NA) OR (Sharpe_resret#93984634 = null)) THEN null ELSE cast(Sharpe_resret#93984634 as float) END AS Sharpe_resret#93984841, CASE WHEN ((PctPos_resret#93984635 = NA) OR (PctPos_resret#93984635 = null)) THEN null ELSE cast(PctPos_resret#93984635 as float) END AS PctPos_resret#93984842, CASE WHEN ((TR_resret#93984636 = NA) OR (TR_resret#93984636 = null)) THEN null ELSE cast(TR_resret#93984636 as float) END AS TR_resret#93984843, CASE WHEN ((IR_resret#93984637 = NA) OR (IR_resret#93984637 = null)) THEN null ELSE cast(IR_resret#93984637 as float) END AS IR_resret#93984844, CASE WHEN ((annual_retnet#93984638 = NA) OR (annual_retnet#93984638 = null)) THEN null ELSE cast(annual_retnet#93984638 as float) END AS annual_retnet#93984845, CASE WHEN ((std_retnet#93984639 = NA) OR (std_retnet#93984639 = null)) THEN null ELSE cast(std_retnet#93984639 as float) END AS std_retnet#93984846, CASE WHEN ((Sharpe_retnet#93984640 = NA) OR (Sharpe_retnet#93984640 = null)) THEN null ELSE cast(Sharpe_retnet#93984640 as float) END AS Sharpe_retnet#93984847, CASE WHEN ((PctPos_retnet#93984641 = NA) OR (PctPos_retnet#93984641 = null)) THEN null ELSE cast(PctPos_retnet#93984641 as float) END AS PctPos_retnet#93984848, CASE WHEN ((TR_retnet#93984642 = NA) OR (TR_retnet#93984642 = null)) THEN null ELSE cast(TR_retnet#93984642 as float) END AS TR_retnet#93984849, CASE WHEN ((IR_retnet#93984643 = NA) OR (IR_retnet#93984643 = null)) THEN null ELSE cast(IR_retnet#93984643 as float) END AS IR_retnet#93984850, CASE WHEN ((turnover#93984644 = NA) OR (turnover#93984644 = null)) THEN null ELSE cast(turnover#93984644 as float) END AS turnover#93984851] Input [33]: [overall#93984612, cap#93984613, retIC#93984614, resretIC#93984615, size#93984616, value#93984617, growth#93984618, leverage#93984619, volatility#93984620, momentum#93984621, yield#93984622, numcos#93984623, numdates#93984624, annual_bmret#93984625, annual_ret#93984626, std_ret#93984627, Sharpe_ret#93984628, PctPos_ret#93984629, TR_ret#93984630, IR_ret#93984631, annual_resret#93984632, std_resret#93984633, Sharpe_resret#93984634, PctPos_resret#93984635, TR_resret#93984636, IR_resret#93984637, annual_retnet#93984638, std_retnet#93984639, Sharpe_retnet#93984640, PctPos_retnet#93984641, TR_retnet#93984642, IR_retnet#93984643, turnover#93984644] (7) ColumnarToRow [codegen id : 1] Input [8]: [cap#93984806, growth#93984815, leverage#93984817, momentum#93984821, size#93984812, value#93984813, volatility#93984819, yield#93984822] (8) Filter [codegen id : 1] Input [8]: [cap#93984806, growth#93984815, leverage#93984817, momentum#93984821, size#93984812, value#93984813, volatility#93984819, yield#93984822] Condition : (isnotnull(cap#93984806) AND (cap#93984806 = 0.0)) (9) Project [codegen id : 1] Output [7]: [yield#93984822, volatility#93984819, momentum#93984821, size#93984812, value#93984813, growth#93984815, leverage#93984817] Input [8]: [cap#93984806, growth#93984815, leverage#93984817, momentum#93984821, size#93984812, value#93984813, volatility#93984819, yield#93984822] (10) ColumnarToRow [codegen id : 1] Input [7]: [yield#93984822, volatility#93984819, momentum#93984821, size#93984812, value#93984813, growth#93984815, leverage#93984817] (11) CollectLimit Input [7]: [yield#93984822, volatility#93984819, momentum#93984821, size#93984812, value#93984813, growth#93984815, leverage#93984817] Arguments: 1000000