== Physical Plan == CollectLimit (11) +- * ColumnarToRow (10) +- InMemoryTableScan (1) +- InMemoryRelation (2) +- * Project (9) +- * Filter (8) +- * ColumnarToRow (7) +- InMemoryTableScan (3) +- InMemoryRelation (4) +- * Project (6) +- Scan csv (5) (1) InMemoryTableScan Output [7]: [yield#93999711, volatility#93999707, momentum#93999709, size#93999699, value#93999701, growth#93999703, leverage#93999705] Arguments: [yield#93999711, volatility#93999707, momentum#93999709, size#93999699, value#93999701, growth#93999703, leverage#93999705] (2) InMemoryRelation Arguments: [yield#93999711, volatility#93999707, momentum#93999709, size#93999699, value#93999701, growth#93999703, leverage#93999705], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [yield#93999711, volatility#93999707, momentum#93999709, size#93999699, value#93999701, growth#93999703, leverage#93999705] +- *(1) Filter (isnotnull(cap#93999693) AND (cap#93999693 = 0.0)) +- *(1) ColumnarToRow +- InMemoryTableScan [cap#93999693, growth#93999703, leverage#93999705, momentum#93999709, size#93999699, value#93999701, volatility#93999707, yield#93999711], [isnotnull(cap#93999693), (cap#93999693 = 0.0)] +- InMemoryRelation [overall#93999691, cap#93999693, retIC#93999695, resretIC#93999697, size#93999699, value#93999701, growth#93999703, leverage#93999705, volatility#93999707, momentum#93999709, yield#93999711, numcos#93999713, numdates#93999715, annual_bmret#93999717, annual_ret#93999719, std_ret#93999721, Sharpe_ret#93999723, PctPos_ret#93999725, TR_ret#93999727, IR_ret#93999729, annual_resret#93999731, std_resret#93999733, Sharpe_resret#93999735, PctPos_resret#93999737, ... 9 more fields], StorageLevel(disk, memory, deserialized, 1 replicas) +- *(1) Project [CASE WHEN ((overall#93999484 = NA) OR (overall#93999484 = null)) THEN null ELSE cast(overall#93999484 as int) END AS overall#93999691, CASE WHEN ((cap#93999485 = NA) OR (cap#93999485 = null)) THEN null ELSE cast(cap#93999485 as float) END AS cap#93999693, CASE WHEN ((retIC#93999486 = NA) OR (retIC#93999486 = null)) THEN null ELSE cast(retIC#93999486 as float) END AS retIC#93999695, CASE WHEN ((resretIC#93999487 = NA) OR (resretIC#93999487 = null)) THEN null ELSE cast(resretIC#93999487 as float) END AS resretIC#93999697, CASE WHEN ((size#93999488 = NA) OR (size#93999488 = null)) THEN null ELSE cast(size#93999488 as float) END AS size#93999699, CASE WHEN ((value#93999489 = NA) OR (value#93999489 = null)) THEN null ELSE cast(value#93999489 as float) END AS value#93999701, CASE WHEN ((growth#93999490 = NA) OR (growth#93999490 = null)) THEN null ELSE cast(growth#93999490 as float) END AS growth#93999703, CASE WHEN ((leverage#93999491 = NA) OR (leverage#93999491 = null)) THEN null ELSE cast(leverage#93999491 as float) END AS leverage#93999705, CASE WHEN ((volatility#93999492 = NA) OR (volatility#93999492 = null)) THEN null ELSE cast(volatility#93999492 as float) END AS volatility#93999707, CASE WHEN ((momentum#93999493 = NA) OR (momentum#93999493 = null)) THEN null ELSE cast(momentum#93999493 as float) END AS momentum#93999709, CASE WHEN ((yield#93999494 = NA) OR (yield#93999494 = null)) THEN null ELSE cast(yield#93999494 as float) END AS yield#93999711, CASE WHEN ((numcos#93999495 = NA) OR (numcos#93999495 = null)) THEN null ELSE cast(numcos#93999495 as float) END AS numcos#93999713, CASE WHEN ((numdates#93999496 = NA) OR (numdates#93999496 = null)) THEN null ELSE cast(numdates#93999496 as float) END AS numdates#93999715, CASE WHEN ((annual_bmret#93999497 = NA) OR (annual_bmret#93999497 = null)) THEN null ELSE cast(annual_bmret#93999497 as float) END AS annual_bmret#93999717, CASE WHEN ((annual_ret#93999498 = NA) OR (annual_ret#93999498 = null)) THEN null ELSE cast(annual_ret#93999498 as float) END AS annual_ret#93999719, CASE WHEN ((std_ret#93999499 = NA) OR (std_ret#93999499 = null)) THEN null ELSE cast(std_ret#93999499 as float) END AS std_ret#93999721, CASE WHEN ((Sharpe_ret#93999500 = NA) OR (Sharpe_ret#93999500 = null)) THEN null ELSE cast(Sharpe_ret#93999500 as float) END AS Sharpe_ret#93999723, CASE WHEN ((PctPos_ret#93999501 = NA) OR (PctPos_ret#93999501 = null)) THEN null ELSE cast(PctPos_ret#93999501 as float) END AS PctPos_ret#93999725, CASE WHEN ((TR_ret#93999502 = NA) OR (TR_ret#93999502 = null)) THEN null ELSE cast(TR_ret#93999502 as float) END AS TR_ret#93999727, CASE WHEN ((IR_ret#93999503 = NA) OR (IR_ret#93999503 = null)) THEN null ELSE cast(IR_ret#93999503 as float) END AS IR_ret#93999729, CASE WHEN ((annual_resret#93999504 = NA) OR (annual_resret#93999504 = null)) THEN null ELSE cast(annual_resret#93999504 as float) END AS annual_resret#93999731, CASE WHEN ((std_resret#93999505 = NA) OR (std_resret#93999505 = null)) THEN null ELSE cast(std_resret#93999505 as float) END AS std_resret#93999733, CASE WHEN ((Sharpe_resret#93999506 = NA) OR (Sharpe_resret#93999506 = null)) THEN null ELSE cast(Sharpe_resret#93999506 as float) END AS Sharpe_resret#93999735, CASE WHEN ((PctPos_resret#93999507 = NA) OR (PctPos_resret#93999507 = null)) THEN null ELSE cast(PctPos_resret#93999507 as float) END AS PctPos_resret#93999737, ... 9 more fields] +- FileScan csv [overall#93999484,cap#93999485,retIC#93999486,resretIC#93999487,size#93999488,value#93999489,growth#93999490,leverage#93999491,volatility#93999492,momentum#93999493,yield#93999494,numcos#93999495,numdates#93999496,annual_bmret#93999497,annual_ret#93999498,std_ret#93999499,Sharpe_ret#93999500,PctPos_ret#93999501,TR_ret#93999502,IR_ret#93999503,annual_resret#93999504,std_resret#93999505,Sharpe_resret#93999506,PctPos_resret#93999507,... 9 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/estimize_signal_histor..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:str... ,None) (3) InMemoryTableScan Output [8]: [cap#93999693, growth#93999703, leverage#93999705, momentum#93999709, size#93999699, value#93999701, volatility#93999707, yield#93999711] Arguments: [cap#93999693, growth#93999703, leverage#93999705, momentum#93999709, size#93999699, value#93999701, volatility#93999707, yield#93999711], [isnotnull(cap#93999693), (cap#93999693 = 0.0)] (4) InMemoryRelation Arguments: [overall#93999691, cap#93999693, retIC#93999695, resretIC#93999697, size#93999699, value#93999701, growth#93999703, leverage#93999705, volatility#93999707, momentum#93999709, yield#93999711, numcos#93999713, numdates#93999715, annual_bmret#93999717, annual_ret#93999719, std_ret#93999721, Sharpe_ret#93999723, PctPos_ret#93999725, TR_ret#93999727, IR_ret#93999729, annual_resret#93999731, std_resret#93999733, Sharpe_resret#93999735, PctPos_resret#93999737, ... 9 more fields], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((overall#93999484 = NA) OR (overall#93999484 = null)) THEN null ELSE cast(overall#93999484 as int) END AS overall#93999691, CASE WHEN ((cap#93999485 = NA) OR (cap#93999485 = null)) THEN null ELSE cast(cap#93999485 as float) END AS cap#93999693, CASE WHEN ((retIC#93999486 = NA) OR (retIC#93999486 = null)) THEN null ELSE cast(retIC#93999486 as float) END AS retIC#93999695, CASE WHEN ((resretIC#93999487 = NA) OR (resretIC#93999487 = null)) THEN null ELSE cast(resretIC#93999487 as float) END AS resretIC#93999697, CASE WHEN ((size#93999488 = NA) OR (size#93999488 = null)) THEN null ELSE cast(size#93999488 as float) END AS size#93999699, CASE WHEN ((value#93999489 = NA) OR (value#93999489 = null)) THEN null ELSE cast(value#93999489 as float) END AS value#93999701, CASE WHEN ((growth#93999490 = NA) OR (growth#93999490 = null)) THEN null ELSE cast(growth#93999490 as float) END AS growth#93999703, CASE WHEN ((leverage#93999491 = NA) OR (leverage#93999491 = null)) THEN null ELSE cast(leverage#93999491 as float) END AS leverage#93999705, CASE WHEN ((volatility#93999492 = NA) OR (volatility#93999492 = null)) THEN null ELSE cast(volatility#93999492 as float) END AS volatility#93999707, CASE WHEN ((momentum#93999493 = NA) OR (momentum#93999493 = null)) THEN null ELSE cast(momentum#93999493 as float) END AS momentum#93999709, CASE WHEN ((yield#93999494 = NA) OR (yield#93999494 = null)) THEN null ELSE cast(yield#93999494 as float) END AS yield#93999711, CASE WHEN ((numcos#93999495 = NA) OR (numcos#93999495 = null)) THEN null ELSE cast(numcos#93999495 as float) END AS numcos#93999713, CASE WHEN ((numdates#93999496 = NA) OR (numdates#93999496 = null)) THEN null ELSE cast(numdates#93999496 as float) END AS numdates#93999715, CASE WHEN ((annual_bmret#93999497 = NA) OR (annual_bmret#93999497 = null)) THEN null ELSE cast(annual_bmret#93999497 as float) END AS annual_bmret#93999717, CASE WHEN ((annual_ret#93999498 = NA) OR (annual_ret#93999498 = null)) THEN null ELSE cast(annual_ret#93999498 as float) END AS annual_ret#93999719, CASE WHEN ((std_ret#93999499 = NA) OR (std_ret#93999499 = null)) THEN null ELSE cast(std_ret#93999499 as float) END AS std_ret#93999721, CASE WHEN ((Sharpe_ret#93999500 = NA) OR (Sharpe_ret#93999500 = null)) THEN null ELSE cast(Sharpe_ret#93999500 as float) END AS Sharpe_ret#93999723, CASE WHEN ((PctPos_ret#93999501 = NA) OR (PctPos_ret#93999501 = null)) THEN null ELSE cast(PctPos_ret#93999501 as float) END AS PctPos_ret#93999725, CASE WHEN ((TR_ret#93999502 = NA) OR (TR_ret#93999502 = null)) THEN null ELSE cast(TR_ret#93999502 as float) END AS TR_ret#93999727, CASE WHEN ((IR_ret#93999503 = NA) OR (IR_ret#93999503 = null)) THEN null ELSE cast(IR_ret#93999503 as float) END AS IR_ret#93999729, CASE WHEN ((annual_resret#93999504 = NA) OR (annual_resret#93999504 = null)) THEN null ELSE cast(annual_resret#93999504 as float) END AS annual_resret#93999731, CASE WHEN ((std_resret#93999505 = NA) OR (std_resret#93999505 = null)) THEN null ELSE cast(std_resret#93999505 as float) END AS std_resret#93999733, CASE WHEN ((Sharpe_resret#93999506 = NA) OR (Sharpe_resret#93999506 = null)) THEN null ELSE cast(Sharpe_resret#93999506 as float) END AS Sharpe_resret#93999735, CASE WHEN ((PctPos_resret#93999507 = NA) OR (PctPos_resret#93999507 = null)) THEN null ELSE cast(PctPos_resret#93999507 as float) END AS PctPos_resret#93999737, ... 9 more fields] +- FileScan csv [overall#93999484,cap#93999485,retIC#93999486,resretIC#93999487,size#93999488,value#93999489,growth#93999490,leverage#93999491,volatility#93999492,momentum#93999493,yield#93999494,numcos#93999495,numdates#93999496,annual_bmret#93999497,annual_ret#93999498,std_ret#93999499,Sharpe_ret#93999500,PctPos_ret#93999501,TR_ret#93999502,IR_ret#93999503,annual_resret#93999504,std_resret#93999505,Sharpe_resret#93999506,PctPos_resret#93999507,... 9 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/estimize_signal_histor..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:str... ,None) (5) Scan csv Output [33]: [overall#93999484, cap#93999485, retIC#93999486, resretIC#93999487, size#93999488, value#93999489, growth#93999490, leverage#93999491, volatility#93999492, momentum#93999493, yield#93999494, numcos#93999495, numdates#93999496, annual_bmret#93999497, annual_ret#93999498, std_ret#93999499, Sharpe_ret#93999500, PctPos_ret#93999501, TR_ret#93999502, IR_ret#93999503, annual_resret#93999504, std_resret#93999505, Sharpe_resret#93999506, PctPos_resret#93999507, TR_resret#93999508, IR_resret#93999509, annual_retnet#93999510, std_retnet#93999511, Sharpe_retnet#93999512, PctPos_retnet#93999513, TR_retnet#93999514, IR_retnet#93999515, turnover#93999516] Batched: false Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/estimize_signal_history/estimizesignal_preearnings/stats_overall.csv] ReadSchema: struct<overall:string,cap:string,retIC:string,resretIC:string,size:string,value:string,growth:string,leverage:string,volatility:string,momentum:string,yield:string,numcos:string,numdates:string,annual_bmret:string,annual_ret:string,std_ret:string,Sharpe_ret:string,PctPos_ret:string,TR_ret:string,IR_ret:string,annual_resret:string,std_resret:string,Sharpe_resret:string,PctPos_resret:string,TR_resret:string,IR_resret:string,annual_retnet:string,std_retnet:string,Sharpe_retnet:string,PctPos_retnet:string,TR_retnet:string,IR_retnet:string,turnover:string> (6) Project [codegen id : 1] Output [33]: [CASE WHEN ((overall#93999484 = NA) OR (overall#93999484 = null)) THEN null ELSE cast(overall#93999484 as int) END AS overall#93999691, CASE WHEN ((cap#93999485 = NA) OR (cap#93999485 = null)) THEN null ELSE cast(cap#93999485 as float) END AS cap#93999693, CASE WHEN ((retIC#93999486 = NA) OR (retIC#93999486 = null)) THEN null ELSE cast(retIC#93999486 as float) END AS retIC#93999695, CASE WHEN ((resretIC#93999487 = NA) OR (resretIC#93999487 = null)) THEN null ELSE cast(resretIC#93999487 as float) END AS resretIC#93999697, CASE WHEN ((size#93999488 = NA) OR (size#93999488 = null)) THEN null ELSE cast(size#93999488 as float) END AS size#93999699, CASE WHEN ((value#93999489 = NA) OR (value#93999489 = null)) THEN null ELSE cast(value#93999489 as float) END AS value#93999701, CASE WHEN ((growth#93999490 = NA) OR (growth#93999490 = null)) THEN null ELSE cast(growth#93999490 as float) END AS growth#93999703, CASE WHEN ((leverage#93999491 = NA) OR (leverage#93999491 = null)) THEN null ELSE cast(leverage#93999491 as float) END AS leverage#93999705, CASE WHEN ((volatility#93999492 = NA) OR (volatility#93999492 = null)) THEN null ELSE cast(volatility#93999492 as float) END AS volatility#93999707, CASE WHEN ((momentum#93999493 = NA) OR (momentum#93999493 = null)) THEN null ELSE cast(momentum#93999493 as float) END AS momentum#93999709, CASE WHEN ((yield#93999494 = NA) OR (yield#93999494 = null)) THEN null ELSE cast(yield#93999494 as float) END AS yield#93999711, CASE WHEN ((numcos#93999495 = NA) OR (numcos#93999495 = null)) THEN null ELSE cast(numcos#93999495 as float) END AS numcos#93999713, CASE WHEN ((numdates#93999496 = NA) OR (numdates#93999496 = null)) THEN null ELSE cast(numdates#93999496 as float) END AS numdates#93999715, CASE WHEN ((annual_bmret#93999497 = NA) OR (annual_bmret#93999497 = null)) THEN null ELSE cast(annual_bmret#93999497 as float) END AS annual_bmret#93999717, CASE WHEN ((annual_ret#93999498 = NA) OR (annual_ret#93999498 = null)) THEN null ELSE cast(annual_ret#93999498 as float) END AS annual_ret#93999719, CASE WHEN ((std_ret#93999499 = NA) OR (std_ret#93999499 = null)) THEN null ELSE cast(std_ret#93999499 as float) END AS std_ret#93999721, CASE WHEN ((Sharpe_ret#93999500 = NA) OR (Sharpe_ret#93999500 = null)) THEN null ELSE cast(Sharpe_ret#93999500 as float) END AS Sharpe_ret#93999723, CASE WHEN ((PctPos_ret#93999501 = NA) OR (PctPos_ret#93999501 = null)) THEN null ELSE cast(PctPos_ret#93999501 as float) END AS PctPos_ret#93999725, CASE WHEN ((TR_ret#93999502 = NA) OR (TR_ret#93999502 = null)) THEN null ELSE cast(TR_ret#93999502 as float) END AS TR_ret#93999727, CASE WHEN ((IR_ret#93999503 = NA) OR (IR_ret#93999503 = null)) THEN null ELSE cast(IR_ret#93999503 as float) END AS IR_ret#93999729, CASE WHEN ((annual_resret#93999504 = NA) OR (annual_resret#93999504 = null)) THEN null ELSE cast(annual_resret#93999504 as float) END AS annual_resret#93999731, CASE WHEN ((std_resret#93999505 = NA) OR (std_resret#93999505 = null)) THEN null ELSE cast(std_resret#93999505 as float) END AS std_resret#93999733, CASE WHEN ((Sharpe_resret#93999506 = NA) OR (Sharpe_resret#93999506 = null)) THEN null ELSE cast(Sharpe_resret#93999506 as float) END AS Sharpe_resret#93999735, CASE WHEN ((PctPos_resret#93999507 = NA) OR (PctPos_resret#93999507 = null)) THEN null ELSE cast(PctPos_resret#93999507 as float) END AS PctPos_resret#93999737, CASE WHEN ((TR_resret#93999508 = NA) OR (TR_resret#93999508 = null)) THEN null ELSE cast(TR_resret#93999508 as float) END AS TR_resret#93999739, CASE WHEN ((IR_resret#93999509 = NA) OR (IR_resret#93999509 = null)) THEN null ELSE cast(IR_resret#93999509 as float) END AS IR_resret#93999741, CASE WHEN ((annual_retnet#93999510 = NA) OR (annual_retnet#93999510 = null)) THEN null ELSE cast(annual_retnet#93999510 as float) END AS annual_retnet#93999742, CASE WHEN ((std_retnet#93999511 = NA) OR (std_retnet#93999511 = null)) THEN null ELSE cast(std_retnet#93999511 as float) END AS std_retnet#93999743, CASE WHEN ((Sharpe_retnet#93999512 = NA) OR (Sharpe_retnet#93999512 = null)) THEN null ELSE cast(Sharpe_retnet#93999512 as float) END AS Sharpe_retnet#93999744, CASE WHEN ((PctPos_retnet#93999513 = NA) OR (PctPos_retnet#93999513 = null)) THEN null ELSE cast(PctPos_retnet#93999513 as float) END AS PctPos_retnet#93999745, CASE WHEN ((TR_retnet#93999514 = NA) OR (TR_retnet#93999514 = null)) THEN null ELSE cast(TR_retnet#93999514 as float) END AS TR_retnet#93999746, CASE WHEN ((IR_retnet#93999515 = NA) OR (IR_retnet#93999515 = null)) THEN null ELSE cast(IR_retnet#93999515 as float) END AS IR_retnet#93999747, CASE WHEN ((turnover#93999516 = NA) OR (turnover#93999516 = null)) THEN null ELSE cast(turnover#93999516 as float) END AS turnover#93999748] Input [33]: [overall#93999484, cap#93999485, retIC#93999486, resretIC#93999487, size#93999488, value#93999489, growth#93999490, leverage#93999491, volatility#93999492, momentum#93999493, yield#93999494, numcos#93999495, numdates#93999496, annual_bmret#93999497, annual_ret#93999498, std_ret#93999499, Sharpe_ret#93999500, PctPos_ret#93999501, TR_ret#93999502, IR_ret#93999503, annual_resret#93999504, std_resret#93999505, Sharpe_resret#93999506, PctPos_resret#93999507, TR_resret#93999508, IR_resret#93999509, annual_retnet#93999510, std_retnet#93999511, Sharpe_retnet#93999512, PctPos_retnet#93999513, TR_retnet#93999514, IR_retnet#93999515, turnover#93999516] (7) ColumnarToRow [codegen id : 1] Input [8]: [cap#93999693, growth#93999703, leverage#93999705, momentum#93999709, size#93999699, value#93999701, volatility#93999707, yield#93999711] (8) Filter [codegen id : 1] Input [8]: [cap#93999693, growth#93999703, leverage#93999705, momentum#93999709, size#93999699, value#93999701, volatility#93999707, yield#93999711] Condition : (isnotnull(cap#93999693) AND (cap#93999693 = 0.0)) (9) Project [codegen id : 1] Output [7]: [yield#93999711, volatility#93999707, momentum#93999709, size#93999699, value#93999701, growth#93999703, leverage#93999705] Input [8]: [cap#93999693, growth#93999703, leverage#93999705, momentum#93999709, size#93999699, value#93999701, volatility#93999707, yield#93999711] (10) ColumnarToRow [codegen id : 1] Input [7]: [yield#93999711, volatility#93999707, momentum#93999709, size#93999699, value#93999701, growth#93999703, leverage#93999705] (11) CollectLimit Input [7]: [yield#93999711, volatility#93999707, momentum#93999709, size#93999699, value#93999701, growth#93999703, leverage#93999705] Arguments: 1000000