== Physical Plan == CollectLimit (17) +- * ColumnarToRow (16) +- InMemoryTableScan (1) +- InMemoryRelation (2) +- * Project (15) +- * BroadcastNestedLoopJoin Cross BuildRight (14) :- * Project (7) : +- * Filter (6) : +- * ColumnarToRow (5) : +- InMemoryTableScan (3) : +- InMemoryRelation (4) : +- * Project (6) : +- Scan csv (5) +- BroadcastExchange (13) +- * Project (12) +- * Filter (11) +- * ColumnarToRow (10) +- InMemoryTableScan (8) +- InMemoryRelation (9) +- * Project (6) +- Scan csv (5) (1) InMemoryTableScan Output [3]: [ret_large#94285196, ret_small#94285198, differential#94285311] Arguments: [ret_large#94285196, ret_small#94285198, differential#94285311] (2) InMemoryRelation Arguments: [ret_large#94285196, ret_small#94285198, differential#94285311], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(2) Project [ret_large#94285196, ret_small#94285198, (ret_large#94285196 - ret_small#94285198) AS differential#94285311] +- *(2) BroadcastNestedLoopJoin BuildRight, Cross :- *(2) Project [annual_ret#94282676 AS ret_large#94285196] : +- *(2) Filter (isnotnull(cap#94282654) AND (cap#94282654 = 1.0)) : +- *(2) ColumnarToRow : +- InMemoryTableScan [annual_ret#94282676, cap#94282654], [isnotnull(cap#94282654), (cap#94282654 = 1.0)] : +- InMemoryRelation [cap#94282654, retIC#94282658, resretIC#94282659, numcos#94282663, numdates#94282669, annual_bmret#94282673, annual_ret#94282676, std_ret#94282681, Sharpe_ret#94282684, PctPos_ret#94282709, TR_ret#94282773, IR_ret#94282775, annual_resret#94282777, std_resret#94282790, Sharpe_resret#94282792, PctPos_resret#94282806, TR_resret#94282820, IR_resret#94282822, annual_retnet#94282823, std_retnet#94282836, Sharpe_retnet#94282837, PctPos_retnet#94282838, TR_retnet#94282851, IR_retnet#94282852, ... 2 more fields], StorageLevel(disk, memory, deserialized, 1 replicas) : +- *(1) Project [CASE WHEN ((cap#94282446 = NA) OR (cap#94282446 = null)) THEN null ELSE cast(cap#94282446 as float) END AS cap#94282654, CASE WHEN ((retIC#94282447 = NA) OR (retIC#94282447 = null)) THEN null ELSE cast(retIC#94282447 as float) END AS retIC#94282658, CASE WHEN ((resretIC#94282448 = NA) OR (resretIC#94282448 = null)) THEN null ELSE cast(resretIC#94282448 as float) END AS resretIC#94282659, CASE WHEN ((numcos#94282449 = NA) OR (numcos#94282449 = null)) THEN null ELSE cast(numcos#94282449 as float) END AS numcos#94282663, CASE WHEN ((numdates#94282450 = NA) OR (numdates#94282450 = null)) THEN null ELSE cast(numdates#94282450 as int) END AS numdates#94282669, CASE WHEN ((annual_bmret#94282451 = NA) OR (annual_bmret#94282451 = null)) THEN null ELSE cast(annual_bmret#94282451 as float) END AS annual_bmret#94282673, CASE WHEN ((annual_ret#94282452 = NA) OR (annual_ret#94282452 = null)) THEN null ELSE cast(annual_ret#94282452 as float) END AS annual_ret#94282676, CASE WHEN ((std_ret#94282453 = NA) OR (std_ret#94282453 = null)) THEN null ELSE cast(std_ret#94282453 as float) END AS std_ret#94282681, CASE WHEN ((Sharpe_ret#94282454 = NA) OR (Sharpe_ret#94282454 = null)) THEN null ELSE cast(Sharpe_ret#94282454 as float) END AS Sharpe_ret#94282684, CASE WHEN ((PctPos_ret#94282455 = NA) OR (PctPos_ret#94282455 = null)) THEN null ELSE cast(PctPos_ret#94282455 as float) END AS PctPos_ret#94282709, CASE WHEN ((TR_ret#94282456 = NA) OR (TR_ret#94282456 = null)) THEN null ELSE cast(TR_ret#94282456 as float) END AS TR_ret#94282773, CASE WHEN ((IR_ret#94282457 = NA) OR (IR_ret#94282457 = null)) THEN null ELSE cast(IR_ret#94282457 as float) END AS IR_ret#94282775, CASE WHEN ((annual_resret#94282458 = NA) OR (annual_resret#94282458 = null)) THEN null ELSE cast(annual_resret#94282458 as float) END AS annual_resret#94282777, CASE WHEN ((std_resret#94282459 = NA) OR (std_resret#94282459 = null)) THEN null ELSE cast(std_resret#94282459 as float) END AS std_resret#94282790, CASE WHEN ((Sharpe_resret#94282460 = NA) OR (Sharpe_resret#94282460 = null)) THEN null ELSE cast(Sharpe_resret#94282460 as float) END AS Sharpe_resret#94282792, CASE WHEN ((PctPos_resret#94282461 = NA) OR (PctPos_resret#94282461 = null)) THEN null ELSE cast(PctPos_resret#94282461 as float) END AS PctPos_resret#94282806, CASE WHEN ((TR_resret#94282462 = NA) OR (TR_resret#94282462 = null)) THEN null ELSE cast(TR_resret#94282462 as float) END AS TR_resret#94282820, CASE WHEN ((IR_resret#94282463 = NA) OR (IR_resret#94282463 = null)) THEN null ELSE cast(IR_resret#94282463 as float) END AS IR_resret#94282822, CASE WHEN ((annual_retnet#94282464 = NA) OR (annual_retnet#94282464 = null)) THEN null ELSE cast(annual_retnet#94282464 as float) END AS annual_retnet#94282823, CASE WHEN ((std_retnet#94282465 = NA) OR (std_retnet#94282465 = null)) THEN null ELSE cast(std_retnet#94282465 as float) END AS std_retnet#94282836, CASE WHEN ((Sharpe_retnet#94282466 = NA) OR (Sharpe_retnet#94282466 = null)) THEN null ELSE cast(Sharpe_retnet#94282466 as float) END AS Sharpe_retnet#94282837, CASE WHEN ((PctPos_retnet#94282467 = NA) OR (PctPos_retnet#94282467 = null)) THEN null ELSE cast(PctPos_retnet#94282467 as float) END AS PctPos_retnet#94282838, CASE WHEN ((TR_retnet#94282468 = NA) OR (TR_retnet#94282468 = null)) THEN null ELSE cast(TR_retnet#94282468 as float) END AS TR_retnet#94282851, CASE WHEN ((IR_retnet#94282469 = NA) OR (IR_retnet#94282469 = null)) THEN null ELSE cast(IR_retnet#94282469 as float) END AS IR_retnet#94282852, ... 2 more fields] : +- FileScan csv [cap#94282446,retIC#94282447,resretIC#94282448,numcos#94282449,numdates#94282450,annual_bmret#94282451,annual_ret#94282452,std_ret#94282453,Sharpe_ret#94282454,PctPos_ret#94282455,TR_ret#94282456,IR_ret#94282457,annual_resret#94282458,std_resret#94282459,Sharpe_resret#94282460,PctPos_resret#94282461,TR_resret#94282462,IR_resret#94282463,annual_retnet#94282464,std_retnet#94282465,Sharpe_retnet#94282466,PctPos_retnet#94282467,TR_retnet#94282468,IR_retnet#94282469,... 2 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/eps_truebeat/surprise_..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,retIC:string,resretIC:string,numcos:string,numdates:string,annual_bmret:string,... +- BroadcastExchange IdentityBroadcastMode, [id=#7528033] +- *(1) Project [annual_ret#94282676 AS ret_small#94285198] +- *(1) Filter (isnotnull(cap#94282654) AND (cap#94282654 = 3.0)) +- *(1) ColumnarToRow +- InMemoryTableScan [annual_ret#94282676, cap#94282654], [isnotnull(cap#94282654), (cap#94282654 = 3.0)] +- InMemoryRelation [cap#94282654, retIC#94282658, resretIC#94282659, numcos#94282663, numdates#94282669, annual_bmret#94282673, annual_ret#94282676, std_ret#94282681, Sharpe_ret#94282684, PctPos_ret#94282709, TR_ret#94282773, IR_ret#94282775, annual_resret#94282777, std_resret#94282790, Sharpe_resret#94282792, PctPos_resret#94282806, TR_resret#94282820, IR_resret#94282822, annual_retnet#94282823, std_retnet#94282836, Sharpe_retnet#94282837, PctPos_retnet#94282838, TR_retnet#94282851, IR_retnet#94282852, ... 2 more fields], StorageLevel(disk, memory, deserialized, 1 replicas) +- *(1) Project [CASE WHEN ((cap#94282446 = NA) OR (cap#94282446 = null)) THEN null ELSE cast(cap#94282446 as float) END AS cap#94282654, CASE WHEN ((retIC#94282447 = NA) OR (retIC#94282447 = null)) THEN null ELSE cast(retIC#94282447 as float) END AS retIC#94282658, CASE WHEN ((resretIC#94282448 = NA) OR (resretIC#94282448 = null)) THEN null ELSE cast(resretIC#94282448 as float) END AS resretIC#94282659, CASE WHEN ((numcos#94282449 = NA) OR (numcos#94282449 = null)) THEN null ELSE cast(numcos#94282449 as float) END AS numcos#94282663, CASE WHEN ((numdates#94282450 = NA) OR (numdates#94282450 = null)) THEN null ELSE cast(numdates#94282450 as int) END AS numdates#94282669, CASE WHEN ((annual_bmret#94282451 = NA) OR (annual_bmret#94282451 = null)) THEN null ELSE cast(annual_bmret#94282451 as float) END AS annual_bmret#94282673, CASE WHEN ((annual_ret#94282452 = NA) OR (annual_ret#94282452 = null)) THEN null ELSE cast(annual_ret#94282452 as float) END AS annual_ret#94282676, CASE WHEN ((std_ret#94282453 = NA) OR (std_ret#94282453 = null)) THEN null ELSE cast(std_ret#94282453 as float) END AS std_ret#94282681, CASE WHEN ((Sharpe_ret#94282454 = NA) OR (Sharpe_ret#94282454 = null)) THEN null ELSE cast(Sharpe_ret#94282454 as float) END AS Sharpe_ret#94282684, CASE WHEN ((PctPos_ret#94282455 = NA) OR (PctPos_ret#94282455 = null)) THEN null ELSE cast(PctPos_ret#94282455 as float) END AS PctPos_ret#94282709, CASE WHEN ((TR_ret#94282456 = NA) OR (TR_ret#94282456 = null)) THEN null ELSE cast(TR_ret#94282456 as float) END AS TR_ret#94282773, CASE WHEN ((IR_ret#94282457 = NA) OR (IR_ret#94282457 = null)) THEN null ELSE cast(IR_ret#94282457 as float) END AS IR_ret#94282775, CASE WHEN ((annual_resret#94282458 = NA) OR (annual_resret#94282458 = null)) THEN null ELSE cast(annual_resret#94282458 as float) END AS annual_resret#94282777, CASE WHEN ((std_resret#94282459 = NA) OR (std_resret#94282459 = null)) THEN null ELSE cast(std_resret#94282459 as float) END AS std_resret#94282790, CASE WHEN ((Sharpe_resret#94282460 = NA) OR (Sharpe_resret#94282460 = null)) THEN null ELSE cast(Sharpe_resret#94282460 as float) END AS Sharpe_resret#94282792, CASE WHEN ((PctPos_resret#94282461 = NA) OR (PctPos_resret#94282461 = null)) THEN null ELSE cast(PctPos_resret#94282461 as float) END AS PctPos_resret#94282806, CASE WHEN ((TR_resret#94282462 = NA) OR (TR_resret#94282462 = null)) THEN null ELSE cast(TR_resret#94282462 as float) END AS TR_resret#94282820, CASE WHEN ((IR_resret#94282463 = NA) OR (IR_resret#94282463 = null)) THEN null ELSE cast(IR_resret#94282463 as float) END AS IR_resret#94282822, CASE WHEN ((annual_retnet#94282464 = NA) OR (annual_retnet#94282464 = null)) THEN null ELSE cast(annual_retnet#94282464 as float) END AS annual_retnet#94282823, CASE WHEN ((std_retnet#94282465 = NA) OR (std_retnet#94282465 = null)) THEN null ELSE cast(std_retnet#94282465 as float) END AS std_retnet#94282836, CASE WHEN ((Sharpe_retnet#94282466 = NA) OR (Sharpe_retnet#94282466 = null)) THEN null ELSE cast(Sharpe_retnet#94282466 as float) END AS Sharpe_retnet#94282837, CASE WHEN ((PctPos_retnet#94282467 = NA) OR (PctPos_retnet#94282467 = null)) THEN null ELSE cast(PctPos_retnet#94282467 as float) END AS PctPos_retnet#94282838, CASE WHEN ((TR_retnet#94282468 = NA) OR (TR_retnet#94282468 = null)) THEN null ELSE cast(TR_retnet#94282468 as float) END AS TR_retnet#94282851, CASE WHEN ((IR_retnet#94282469 = NA) OR (IR_retnet#94282469 = null)) THEN null ELSE cast(IR_retnet#94282469 as float) END AS IR_retnet#94282852, ... 2 more fields] +- FileScan csv [cap#94282446,retIC#94282447,resretIC#94282448,numcos#94282449,numdates#94282450,annual_bmret#94282451,annual_ret#94282452,std_ret#94282453,Sharpe_ret#94282454,PctPos_ret#94282455,TR_ret#94282456,IR_ret#94282457,annual_resret#94282458,std_resret#94282459,Sharpe_resret#94282460,PctPos_resret#94282461,TR_resret#94282462,IR_resret#94282463,annual_retnet#94282464,std_retnet#94282465,Sharpe_retnet#94282466,PctPos_retnet#94282467,TR_retnet#94282468,IR_retnet#94282469,... 2 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/eps_truebeat/surprise_..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,retIC:string,resretIC:string,numcos:string,numdates:string,annual_bmret:string,... ,None) (3) InMemoryTableScan Output [2]: [annual_ret#94282676, cap#94282654] Arguments: [annual_ret#94282676, cap#94282654], [isnotnull(cap#94282654), (cap#94282654 = 1.0)] (4) InMemoryRelation Arguments: [cap#94282654, retIC#94282658, resretIC#94282659, numcos#94282663, numdates#94282669, annual_bmret#94282673, annual_ret#94282676, std_ret#94282681, Sharpe_ret#94282684, PctPos_ret#94282709, TR_ret#94282773, IR_ret#94282775, annual_resret#94282777, std_resret#94282790, Sharpe_resret#94282792, PctPos_resret#94282806, TR_resret#94282820, IR_resret#94282822, annual_retnet#94282823, std_retnet#94282836, Sharpe_retnet#94282837, PctPos_retnet#94282838, TR_retnet#94282851, IR_retnet#94282852, ... 2 more fields], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((cap#94282446 = NA) OR (cap#94282446 = null)) THEN null ELSE cast(cap#94282446 as float) END AS cap#94282654, CASE WHEN ((retIC#94282447 = NA) OR (retIC#94282447 = null)) THEN null ELSE cast(retIC#94282447 as float) END AS retIC#94282658, CASE WHEN ((resretIC#94282448 = NA) OR (resretIC#94282448 = null)) THEN null ELSE cast(resretIC#94282448 as float) END AS resretIC#94282659, CASE WHEN ((numcos#94282449 = NA) OR (numcos#94282449 = null)) THEN null ELSE cast(numcos#94282449 as float) END AS numcos#94282663, CASE WHEN ((numdates#94282450 = NA) OR (numdates#94282450 = null)) THEN null ELSE cast(numdates#94282450 as int) END AS numdates#94282669, CASE WHEN ((annual_bmret#94282451 = NA) OR (annual_bmret#94282451 = null)) THEN null ELSE cast(annual_bmret#94282451 as float) END AS annual_bmret#94282673, CASE WHEN ((annual_ret#94282452 = NA) OR (annual_ret#94282452 = null)) THEN null ELSE cast(annual_ret#94282452 as float) END AS annual_ret#94282676, CASE WHEN ((std_ret#94282453 = NA) OR (std_ret#94282453 = null)) THEN null ELSE cast(std_ret#94282453 as float) END AS std_ret#94282681, CASE WHEN ((Sharpe_ret#94282454 = NA) OR (Sharpe_ret#94282454 = null)) THEN null ELSE cast(Sharpe_ret#94282454 as float) END AS Sharpe_ret#94282684, CASE WHEN ((PctPos_ret#94282455 = NA) OR (PctPos_ret#94282455 = null)) THEN null ELSE cast(PctPos_ret#94282455 as float) END AS PctPos_ret#94282709, CASE WHEN ((TR_ret#94282456 = NA) OR (TR_ret#94282456 = null)) THEN null ELSE cast(TR_ret#94282456 as float) END AS TR_ret#94282773, CASE WHEN ((IR_ret#94282457 = NA) OR (IR_ret#94282457 = null)) THEN null ELSE cast(IR_ret#94282457 as float) END AS IR_ret#94282775, CASE WHEN ((annual_resret#94282458 = NA) OR (annual_resret#94282458 = null)) THEN null ELSE cast(annual_resret#94282458 as float) END AS annual_resret#94282777, CASE WHEN ((std_resret#94282459 = NA) OR (std_resret#94282459 = null)) THEN null ELSE cast(std_resret#94282459 as float) END AS std_resret#94282790, CASE WHEN ((Sharpe_resret#94282460 = NA) OR (Sharpe_resret#94282460 = null)) THEN null ELSE cast(Sharpe_resret#94282460 as float) END AS Sharpe_resret#94282792, CASE WHEN ((PctPos_resret#94282461 = NA) OR (PctPos_resret#94282461 = null)) THEN null ELSE cast(PctPos_resret#94282461 as float) END AS PctPos_resret#94282806, CASE WHEN ((TR_resret#94282462 = NA) OR (TR_resret#94282462 = null)) THEN null ELSE cast(TR_resret#94282462 as float) END AS TR_resret#94282820, CASE WHEN ((IR_resret#94282463 = NA) OR (IR_resret#94282463 = null)) THEN null ELSE cast(IR_resret#94282463 as float) END AS IR_resret#94282822, CASE WHEN ((annual_retnet#94282464 = NA) OR (annual_retnet#94282464 = null)) THEN null ELSE cast(annual_retnet#94282464 as float) END AS annual_retnet#94282823, CASE WHEN ((std_retnet#94282465 = NA) OR (std_retnet#94282465 = null)) THEN null ELSE cast(std_retnet#94282465 as float) END AS std_retnet#94282836, CASE WHEN ((Sharpe_retnet#94282466 = NA) OR (Sharpe_retnet#94282466 = null)) THEN null ELSE cast(Sharpe_retnet#94282466 as float) END AS Sharpe_retnet#94282837, CASE WHEN ((PctPos_retnet#94282467 = NA) OR (PctPos_retnet#94282467 = null)) THEN null ELSE cast(PctPos_retnet#94282467 as float) END AS PctPos_retnet#94282838, CASE WHEN ((TR_retnet#94282468 = NA) OR (TR_retnet#94282468 = null)) THEN null ELSE cast(TR_retnet#94282468 as float) END AS TR_retnet#94282851, CASE WHEN ((IR_retnet#94282469 = NA) OR (IR_retnet#94282469 = null)) THEN null ELSE cast(IR_retnet#94282469 as float) END AS IR_retnet#94282852, ... 2 more fields] +- FileScan csv [cap#94282446,retIC#94282447,resretIC#94282448,numcos#94282449,numdates#94282450,annual_bmret#94282451,annual_ret#94282452,std_ret#94282453,Sharpe_ret#94282454,PctPos_ret#94282455,TR_ret#94282456,IR_ret#94282457,annual_resret#94282458,std_resret#94282459,Sharpe_resret#94282460,PctPos_resret#94282461,TR_resret#94282462,IR_resret#94282463,annual_retnet#94282464,std_retnet#94282465,Sharpe_retnet#94282466,PctPos_retnet#94282467,TR_retnet#94282468,IR_retnet#94282469,... 2 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/eps_truebeat/surprise_..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,retIC:string,resretIC:string,numcos:string,numdates:string,annual_bmret:string,... ,None) (unknown) Scan csv Output [26]: [cap#94282446, retIC#94282447, resretIC#94282448, numcos#94282449, numdates#94282450, annual_bmret#94282451, annual_ret#94282452, std_ret#94282453, Sharpe_ret#94282454, PctPos_ret#94282455, TR_ret#94282456, IR_ret#94282457, annual_resret#94282458, std_resret#94282459, Sharpe_resret#94282460, PctPos_resret#94282461, TR_resret#94282462, IR_resret#94282463, annual_retnet#94282464, std_retnet#94282465, Sharpe_retnet#94282466, PctPos_retnet#94282467, TR_retnet#94282468, IR_retnet#94282469, turnover#94282470, coverage#94282471] Batched: false Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/eps_truebeat/surprise_prediction_eps_trunc/stats_cap.csv] ReadSchema: struct<cap:string,retIC:string,resretIC:string,numcos:string,numdates:string,annual_bmret:string,annual_ret:string,std_ret:string,Sharpe_ret:string,PctPos_ret:string,TR_ret:string,IR_ret:string,annual_resret:string,std_resret:string,Sharpe_resret:string,PctPos_resret:string,TR_resret:string,IR_resret:string,annual_retnet:string,std_retnet:string,Sharpe_retnet:string,PctPos_retnet:string,TR_retnet:string,IR_retnet:string,turnover:string,coverage:string> (unknown) Project Output [26]: [CASE WHEN ((cap#94282446 = NA) OR (cap#94282446 = null)) THEN null ELSE cast(cap#94282446 as float) END AS cap#94282654, CASE WHEN ((retIC#94282447 = NA) OR (retIC#94282447 = null)) THEN null ELSE cast(retIC#94282447 as float) END AS retIC#94282658, CASE WHEN ((resretIC#94282448 = NA) OR (resretIC#94282448 = null)) THEN null ELSE cast(resretIC#94282448 as float) END AS resretIC#94282659, CASE WHEN ((numcos#94282449 = NA) OR (numcos#94282449 = null)) THEN null ELSE cast(numcos#94282449 as float) END AS numcos#94282663, CASE WHEN ((numdates#94282450 = NA) OR (numdates#94282450 = null)) THEN null ELSE cast(numdates#94282450 as int) END AS numdates#94282669, CASE WHEN ((annual_bmret#94282451 = NA) OR (annual_bmret#94282451 = null)) THEN null ELSE cast(annual_bmret#94282451 as float) END AS annual_bmret#94282673, CASE WHEN ((annual_ret#94282452 = NA) OR (annual_ret#94282452 = null)) THEN null ELSE cast(annual_ret#94282452 as float) END AS annual_ret#94282676, CASE WHEN ((std_ret#94282453 = NA) OR (std_ret#94282453 = null)) THEN null ELSE cast(std_ret#94282453 as float) END AS std_ret#94282681, CASE WHEN ((Sharpe_ret#94282454 = NA) OR (Sharpe_ret#94282454 = null)) THEN null ELSE cast(Sharpe_ret#94282454 as float) END AS Sharpe_ret#94282684, CASE WHEN ((PctPos_ret#94282455 = NA) OR (PctPos_ret#94282455 = null)) THEN null ELSE cast(PctPos_ret#94282455 as float) END AS PctPos_ret#94282709, CASE WHEN ((TR_ret#94282456 = NA) OR (TR_ret#94282456 = null)) THEN null ELSE cast(TR_ret#94282456 as float) END AS TR_ret#94282773, CASE WHEN ((IR_ret#94282457 = NA) OR (IR_ret#94282457 = null)) THEN null ELSE cast(IR_ret#94282457 as float) END AS IR_ret#94282775, CASE WHEN ((annual_resret#94282458 = NA) OR (annual_resret#94282458 = null)) THEN null ELSE cast(annual_resret#94282458 as float) END AS annual_resret#94282777, CASE WHEN ((std_resret#94282459 = NA) OR (std_resret#94282459 = null)) THEN null ELSE cast(std_resret#94282459 as float) END AS std_resret#94282790, CASE WHEN ((Sharpe_resret#94282460 = NA) OR (Sharpe_resret#94282460 = null)) THEN null ELSE cast(Sharpe_resret#94282460 as float) END AS Sharpe_resret#94282792, CASE WHEN ((PctPos_resret#94282461 = NA) OR (PctPos_resret#94282461 = null)) THEN null ELSE cast(PctPos_resret#94282461 as float) END AS PctPos_resret#94282806, CASE WHEN ((TR_resret#94282462 = NA) OR (TR_resret#94282462 = null)) THEN null ELSE cast(TR_resret#94282462 as float) END AS TR_resret#94282820, CASE WHEN ((IR_resret#94282463 = NA) OR (IR_resret#94282463 = null)) THEN null ELSE cast(IR_resret#94282463 as float) END AS IR_resret#94282822, CASE WHEN ((annual_retnet#94282464 = NA) OR (annual_retnet#94282464 = null)) THEN null ELSE cast(annual_retnet#94282464 as float) END AS annual_retnet#94282823, CASE WHEN ((std_retnet#94282465 = NA) OR (std_retnet#94282465 = null)) THEN null ELSE cast(std_retnet#94282465 as float) END AS std_retnet#94282836, CASE WHEN ((Sharpe_retnet#94282466 = NA) OR (Sharpe_retnet#94282466 = null)) THEN null ELSE cast(Sharpe_retnet#94282466 as float) END AS Sharpe_retnet#94282837, CASE WHEN ((PctPos_retnet#94282467 = NA) OR (PctPos_retnet#94282467 = null)) THEN null ELSE cast(PctPos_retnet#94282467 as float) END AS PctPos_retnet#94282838, CASE WHEN ((TR_retnet#94282468 = NA) OR (TR_retnet#94282468 = null)) THEN null ELSE cast(TR_retnet#94282468 as float) END AS TR_retnet#94282851, CASE WHEN ((IR_retnet#94282469 = NA) OR (IR_retnet#94282469 = null)) THEN null ELSE cast(IR_retnet#94282469 as float) END AS IR_retnet#94282852, CASE WHEN ((turnover#94282470 = NA) OR (turnover#94282470 = null)) THEN null ELSE cast(turnover#94282470 as float) END AS turnover#94282853, CASE WHEN ((coverage#94282471 = NA) OR (coverage#94282471 = null)) THEN null ELSE cast(coverage#94282471 as float) END AS coverage#94282921] Input [26]: [cap#94282446, retIC#94282447, resretIC#94282448, numcos#94282449, numdates#94282450, annual_bmret#94282451, annual_ret#94282452, std_ret#94282453, Sharpe_ret#94282454, PctPos_ret#94282455, TR_ret#94282456, IR_ret#94282457, annual_resret#94282458, std_resret#94282459, Sharpe_resret#94282460, PctPos_resret#94282461, TR_resret#94282462, IR_resret#94282463, annual_retnet#94282464, std_retnet#94282465, Sharpe_retnet#94282466, PctPos_retnet#94282467, TR_retnet#94282468, IR_retnet#94282469, turnover#94282470, coverage#94282471] (7) Project [codegen id : 2] Output [1]: [annual_ret#94282676 AS ret_large#94285196] Input [2]: [annual_ret#94282676, cap#94282654] (8) InMemoryTableScan Output [2]: [annual_ret#94282676, cap#94282654] Arguments: [annual_ret#94282676, cap#94282654], [isnotnull(cap#94282654), (cap#94282654 = 3.0)] (9) InMemoryRelation Arguments: [cap#94282654, retIC#94282658, resretIC#94282659, numcos#94282663, numdates#94282669, annual_bmret#94282673, annual_ret#94282676, std_ret#94282681, Sharpe_ret#94282684, PctPos_ret#94282709, TR_ret#94282773, IR_ret#94282775, annual_resret#94282777, std_resret#94282790, Sharpe_resret#94282792, PctPos_resret#94282806, TR_resret#94282820, IR_resret#94282822, annual_retnet#94282823, std_retnet#94282836, Sharpe_retnet#94282837, PctPos_retnet#94282838, TR_retnet#94282851, IR_retnet#94282852, ... 2 more fields], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((cap#94282446 = NA) OR (cap#94282446 = null)) THEN null ELSE cast(cap#94282446 as float) END AS cap#94282654, CASE WHEN ((retIC#94282447 = NA) OR (retIC#94282447 = null)) THEN null ELSE cast(retIC#94282447 as float) END AS retIC#94282658, CASE WHEN ((resretIC#94282448 = NA) OR (resretIC#94282448 = null)) THEN null ELSE cast(resretIC#94282448 as float) END AS resretIC#94282659, CASE WHEN ((numcos#94282449 = NA) OR (numcos#94282449 = null)) THEN null ELSE cast(numcos#94282449 as float) END AS numcos#94282663, CASE WHEN ((numdates#94282450 = NA) OR (numdates#94282450 = null)) THEN null ELSE cast(numdates#94282450 as int) END AS numdates#94282669, CASE WHEN ((annual_bmret#94282451 = NA) OR (annual_bmret#94282451 = null)) THEN null ELSE cast(annual_bmret#94282451 as float) END AS annual_bmret#94282673, CASE WHEN ((annual_ret#94282452 = NA) OR (annual_ret#94282452 = null)) THEN null ELSE cast(annual_ret#94282452 as float) END AS annual_ret#94282676, CASE WHEN ((std_ret#94282453 = NA) OR (std_ret#94282453 = null)) THEN null ELSE cast(std_ret#94282453 as float) END AS std_ret#94282681, CASE WHEN ((Sharpe_ret#94282454 = NA) OR (Sharpe_ret#94282454 = null)) THEN null ELSE cast(Sharpe_ret#94282454 as float) END AS Sharpe_ret#94282684, CASE WHEN ((PctPos_ret#94282455 = NA) OR (PctPos_ret#94282455 = null)) THEN null ELSE cast(PctPos_ret#94282455 as float) END AS PctPos_ret#94282709, CASE WHEN ((TR_ret#94282456 = NA) OR (TR_ret#94282456 = null)) THEN null ELSE cast(TR_ret#94282456 as float) END AS TR_ret#94282773, CASE WHEN ((IR_ret#94282457 = NA) OR (IR_ret#94282457 = null)) THEN null ELSE cast(IR_ret#94282457 as float) END AS IR_ret#94282775, CASE WHEN ((annual_resret#94282458 = NA) OR (annual_resret#94282458 = null)) THEN null ELSE cast(annual_resret#94282458 as float) END AS annual_resret#94282777, CASE WHEN ((std_resret#94282459 = NA) OR (std_resret#94282459 = null)) THEN null ELSE cast(std_resret#94282459 as float) END AS std_resret#94282790, CASE WHEN ((Sharpe_resret#94282460 = NA) OR (Sharpe_resret#94282460 = null)) THEN null ELSE cast(Sharpe_resret#94282460 as float) END AS Sharpe_resret#94282792, CASE WHEN ((PctPos_resret#94282461 = NA) OR (PctPos_resret#94282461 = null)) THEN null ELSE cast(PctPos_resret#94282461 as float) END AS PctPos_resret#94282806, CASE WHEN ((TR_resret#94282462 = NA) OR (TR_resret#94282462 = null)) THEN null ELSE cast(TR_resret#94282462 as float) END AS TR_resret#94282820, CASE WHEN ((IR_resret#94282463 = NA) OR (IR_resret#94282463 = null)) THEN null ELSE cast(IR_resret#94282463 as float) END AS IR_resret#94282822, CASE WHEN ((annual_retnet#94282464 = NA) OR (annual_retnet#94282464 = null)) THEN null ELSE cast(annual_retnet#94282464 as float) END AS annual_retnet#94282823, CASE WHEN ((std_retnet#94282465 = NA) OR (std_retnet#94282465 = null)) THEN null ELSE cast(std_retnet#94282465 as float) END AS std_retnet#94282836, CASE WHEN ((Sharpe_retnet#94282466 = NA) OR (Sharpe_retnet#94282466 = null)) THEN null ELSE cast(Sharpe_retnet#94282466 as float) END AS Sharpe_retnet#94282837, CASE WHEN ((PctPos_retnet#94282467 = NA) OR (PctPos_retnet#94282467 = null)) THEN null ELSE cast(PctPos_retnet#94282467 as float) END AS PctPos_retnet#94282838, CASE WHEN ((TR_retnet#94282468 = NA) OR (TR_retnet#94282468 = null)) THEN null ELSE cast(TR_retnet#94282468 as float) END AS TR_retnet#94282851, CASE WHEN ((IR_retnet#94282469 = NA) OR (IR_retnet#94282469 = null)) THEN null ELSE cast(IR_retnet#94282469 as float) END AS IR_retnet#94282852, ... 2 more fields] +- FileScan csv [cap#94282446,retIC#94282447,resretIC#94282448,numcos#94282449,numdates#94282450,annual_bmret#94282451,annual_ret#94282452,std_ret#94282453,Sharpe_ret#94282454,PctPos_ret#94282455,TR_ret#94282456,IR_ret#94282457,annual_resret#94282458,std_resret#94282459,Sharpe_resret#94282460,PctPos_resret#94282461,TR_resret#94282462,IR_resret#94282463,annual_retnet#94282464,std_retnet#94282465,Sharpe_retnet#94282466,PctPos_retnet#94282467,TR_retnet#94282468,IR_retnet#94282469,... 2 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/eps_truebeat/surprise_..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,retIC:string,resretIC:string,numcos:string,numdates:string,annual_bmret:string,... ,None) (10) ColumnarToRow [codegen id : 1] Input [2]: [annual_ret#94282676, cap#94282654] (11) Filter [codegen id : 1] Input [2]: [annual_ret#94282676, cap#94282654] Condition : (isnotnull(cap#94282654) AND (cap#94282654 = 3.0)) (12) Project [codegen id : 1] Output [1]: [annual_ret#94282676 AS ret_small#94285198] Input [2]: [annual_ret#94282676, cap#94282654] (13) BroadcastExchange Input [1]: [ret_small#94285198] Arguments: IdentityBroadcastMode, [id=#7528033] (14) BroadcastNestedLoopJoin [codegen id : 2] Join condition: None (15) Project [codegen id : 2] Output [3]: [ret_large#94285196, ret_small#94285198, (ret_large#94285196 - ret_small#94285198) AS differential#94285311] Input [2]: [ret_large#94285196, ret_small#94285198] (16) ColumnarToRow [codegen id : 1] Input [3]: [ret_large#94285196, ret_small#94285198, differential#94285311] (17) CollectLimit Input [3]: [ret_large#94285196, ret_small#94285198, differential#94285311] Arguments: 10000