== Physical Plan == CollectLimit (21) +- InMemoryTableScan (1) +- InMemoryRelation (2) +- * Project (20) +- * Sort (19) +- Exchange (18) +- * Project (17) +- * BroadcastHashJoin Inner BuildLeft (16) :- BroadcastExchange (9) : +- * Filter (8) : +- * ColumnarToRow (7) : +- InMemoryTableScan (3) : +- InMemoryRelation (4) : +- * Project (6) : +- Scan csv (5) +- * Project (15) +- * Filter (14) +- InMemoryTableScan (10) +- InMemoryRelation (11) +- * Project (13) +- Scan csv (12) (1) InMemoryTableScan Output [3]: [cap#94085547, turnover#94082713, days_hold#94085575] Arguments: [cap#94085547, turnover#94082713, days_hold#94085575] (2) InMemoryRelation Arguments: [cap#94085547, turnover#94082713, days_hold#94085575], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(3) Project [cap#94085547, turnover#94082713, (1.0 / cast(turnover#94082713 as double)) AS days_hold#94085575] +- *(3) Sort [cap_sort#94085458 ASC NULLS FIRST], true, 0 +- Exchange rangepartitioning(cap_sort#94085458 ASC NULLS FIRST, 200), ENSURE_REQUIREMENTS, [id=#7512025] +- *(2) Project [turnover#94082713, cap_description#94085457 AS cap#94085547, cap_sort#94085458] +- *(2) BroadcastHashJoin [knownfloatingpointnormalized(normalizenanandzero(cap#94082258))], [knownfloatingpointnormalized(normalizenanandzero(cast(cap#93880528 as float)))], Inner, BuildLeft, false :- BroadcastExchange HashedRelationBroadcastMode(List(knownfloatingpointnormalized(normalizenanandzero(input[0, float, false]))),false), [id=#7512017] : +- *(1) Filter isnotnull(cap#94082258) : +- *(1) ColumnarToRow : +- InMemoryTableScan [cap#94082258, turnover#94082713], [isnotnull(cap#94082258)] : +- InMemoryRelation [cap#94082258, retIC#94082265, resretIC#94082268, numcos#94082304, numdates#94082307, annual_bmret#94082308, annual_ret#94082309, std_ret#94082310, Sharpe_ret#94082311, PctPos_ret#94082312, TR_ret#94082313, IR_ret#94082314, annual_resret#94082315, std_resret#94082517, Sharpe_resret#94082703, PctPos_resret#94082704, TR_resret#94082705, IR_resret#94082706, annual_retnet#94082707, std_retnet#94082708, Sharpe_retnet#94082709, PctPos_retnet#94082710, TR_retnet#94082711, IR_retnet#94082712, ... 2 more fields], StorageLevel(disk, memory, deserialized, 1 replicas) : +- *(1) Project [CASE WHEN ((cap#94081987 = NA) OR (cap#94081987 = null)) THEN null ELSE cast(cap#94081987 as float) END AS cap#94082258, CASE WHEN ((retIC#94081988 = NA) OR (retIC#94081988 = null)) THEN null ELSE cast(retIC#94081988 as float) END AS retIC#94082265, CASE WHEN ((resretIC#94081989 = NA) OR (resretIC#94081989 = null)) THEN null ELSE cast(resretIC#94081989 as float) END AS resretIC#94082268, CASE WHEN ((numcos#94081990 = NA) OR (numcos#94081990 = null)) THEN null ELSE cast(numcos#94081990 as float) END AS numcos#94082304, CASE WHEN ((numdates#94081991 = NA) OR (numdates#94081991 = null)) THEN null ELSE cast(numdates#94081991 as int) END AS numdates#94082307, CASE WHEN ((annual_bmret#94081992 = NA) OR (annual_bmret#94081992 = null)) THEN null ELSE cast(annual_bmret#94081992 as float) END AS annual_bmret#94082308, CASE WHEN ((annual_ret#94081993 = NA) OR (annual_ret#94081993 = null)) THEN null ELSE cast(annual_ret#94081993 as float) END AS annual_ret#94082309, CASE WHEN ((std_ret#94081994 = NA) OR (std_ret#94081994 = null)) THEN null ELSE cast(std_ret#94081994 as float) END AS std_ret#94082310, CASE WHEN ((Sharpe_ret#94081995 = NA) OR (Sharpe_ret#94081995 = null)) THEN null ELSE cast(Sharpe_ret#94081995 as float) END AS Sharpe_ret#94082311, CASE WHEN ((PctPos_ret#94081996 = NA) OR (PctPos_ret#94081996 = null)) THEN null ELSE cast(PctPos_ret#94081996 as float) END AS PctPos_ret#94082312, CASE WHEN ((TR_ret#94081997 = NA) OR (TR_ret#94081997 = null)) THEN null ELSE cast(TR_ret#94081997 as float) END AS TR_ret#94082313, CASE WHEN ((IR_ret#94081998 = NA) OR (IR_ret#94081998 = null)) THEN null ELSE cast(IR_ret#94081998 as float) END AS IR_ret#94082314, CASE WHEN ((annual_resret#94081999 = NA) OR (annual_resret#94081999 = null)) THEN null ELSE cast(annual_resret#94081999 as float) END AS annual_resret#94082315, CASE WHEN ((std_resret#94082000 = NA) OR (std_resret#94082000 = null)) THEN null ELSE cast(std_resret#94082000 as float) END AS std_resret#94082517, CASE WHEN ((Sharpe_resret#94082001 = NA) OR (Sharpe_resret#94082001 = null)) THEN null ELSE cast(Sharpe_resret#94082001 as float) END AS Sharpe_resret#94082703, CASE WHEN ((PctPos_resret#94082002 = NA) OR (PctPos_resret#94082002 = null)) THEN null ELSE cast(PctPos_resret#94082002 as float) END AS PctPos_resret#94082704, CASE WHEN ((TR_resret#94082003 = NA) OR (TR_resret#94082003 = null)) THEN null ELSE cast(TR_resret#94082003 as float) END AS TR_resret#94082705, CASE WHEN ((IR_resret#94082004 = NA) OR (IR_resret#94082004 = null)) THEN null ELSE cast(IR_resret#94082004 as float) END AS IR_resret#94082706, CASE WHEN ((annual_retnet#94082005 = NA) OR (annual_retnet#94082005 = null)) THEN null ELSE cast(annual_retnet#94082005 as float) END AS annual_retnet#94082707, CASE WHEN ((std_retnet#94082006 = NA) OR (std_retnet#94082006 = null)) THEN null ELSE cast(std_retnet#94082006 as float) END AS std_retnet#94082708, CASE WHEN ((Sharpe_retnet#94082007 = NA) OR (Sharpe_retnet#94082007 = null)) THEN null ELSE cast(Sharpe_retnet#94082007 as float) END AS Sharpe_retnet#94082709, CASE WHEN ((PctPos_retnet#94082008 = NA) OR (PctPos_retnet#94082008 = null)) THEN null ELSE cast(PctPos_retnet#94082008 as float) END AS PctPos_retnet#94082710, CASE WHEN ((TR_retnet#94082009 = NA) OR (TR_retnet#94082009 = null)) THEN null ELSE cast(TR_retnet#94082009 as float) END AS TR_retnet#94082711, CASE WHEN ((IR_retnet#94082010 = NA) OR (IR_retnet#94082010 = null)) THEN null ELSE cast(IR_retnet#94082010 as float) END AS IR_retnet#94082712, ... 2 more fields] : +- FileScan csv [cap#94081987,retIC#94081988,resretIC#94081989,numcos#94081990,numdates#94081991,annual_bmret#94081992,annual_ret#94081993,std_ret#94081994,Sharpe_ret#94081995,PctPos_ret#94081996,TR_ret#94081997,IR_ret#94081998,annual_resret#94081999,std_resret#94082000,Sharpe_resret#94082001,PctPos_resret#94082002,TR_resret#94082003,IR_resret#94082004,annual_retnet#94082005,std_retnet#94082006,Sharpe_retnet#94082007,PctPos_retnet#94082008,TR_retnet#94082009,IR_retnet#94082010,... 2 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/volatilit..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,retIC:string,resretIC:string,numcos:string,numdates:string,annual_bmret:string,... +- *(2) Project [cap#93880528, description#93880533 AS cap_description#94085457, sort#93880531 AS cap_sort#94085458] +- *(2) Filter isnotnull(cap#93880528) +- InMemoryTableScan [cap#93880528, description#93880533, sort#93880531], [isnotnull(cap#93880528)] +- InMemoryRelation [cap#93880528, sort#93880531, description#93880533, universe#93880535], StorageLevel(disk, memory, deserialized, 1 replicas) +- *(1) Project [CASE WHEN ((cap#93880496 = NA) OR (cap#93880496 = null)) THEN null ELSE cast(cap#93880496 as int) END AS cap#93880528, CASE WHEN (sort#93880498 = null) THEN null ELSE sort#93880498 END AS sort#93880531, CASE WHEN (description#93880500 = null) THEN null ELSE description#93880500 END AS description#93880533, CASE WHEN ((universe#93880502 = NA) OR (universe#93880502 = null)) THEN null ELSE cast(universe#93880502 as int) END AS universe#93880535] +- FileScan csv [cap#93880496,sort#93880498,description#93880500,universe#93880502] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/curate/curate_cap.csv], PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,sort:string,description:string,universe:string> ,None), [cap_sort#94085458 ASC NULLS FIRST] (3) InMemoryTableScan Output [2]: [cap#94082258, turnover#94082713] Arguments: [cap#94082258, turnover#94082713], [isnotnull(cap#94082258)] (4) InMemoryRelation Arguments: [cap#94082258, retIC#94082265, resretIC#94082268, numcos#94082304, numdates#94082307, annual_bmret#94082308, annual_ret#94082309, std_ret#94082310, Sharpe_ret#94082311, PctPos_ret#94082312, TR_ret#94082313, IR_ret#94082314, annual_resret#94082315, std_resret#94082517, Sharpe_resret#94082703, PctPos_resret#94082704, TR_resret#94082705, IR_resret#94082706, annual_retnet#94082707, std_retnet#94082708, Sharpe_retnet#94082709, PctPos_retnet#94082710, TR_retnet#94082711, IR_retnet#94082712, ... 2 more fields], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((cap#94081987 = NA) OR (cap#94081987 = null)) THEN null ELSE cast(cap#94081987 as float) END AS cap#94082258, CASE WHEN ((retIC#94081988 = NA) OR (retIC#94081988 = null)) THEN null ELSE cast(retIC#94081988 as float) END AS retIC#94082265, CASE WHEN ((resretIC#94081989 = NA) OR (resretIC#94081989 = null)) THEN null ELSE cast(resretIC#94081989 as float) END AS resretIC#94082268, CASE WHEN ((numcos#94081990 = NA) OR (numcos#94081990 = null)) THEN null ELSE cast(numcos#94081990 as float) END AS numcos#94082304, CASE WHEN ((numdates#94081991 = NA) OR (numdates#94081991 = null)) THEN null ELSE cast(numdates#94081991 as int) END AS numdates#94082307, CASE WHEN ((annual_bmret#94081992 = NA) OR (annual_bmret#94081992 = null)) THEN null ELSE cast(annual_bmret#94081992 as float) END AS annual_bmret#94082308, CASE WHEN ((annual_ret#94081993 = NA) OR (annual_ret#94081993 = null)) THEN null ELSE cast(annual_ret#94081993 as float) END AS annual_ret#94082309, CASE WHEN ((std_ret#94081994 = NA) OR (std_ret#94081994 = null)) THEN null ELSE cast(std_ret#94081994 as float) END AS std_ret#94082310, CASE WHEN ((Sharpe_ret#94081995 = NA) OR (Sharpe_ret#94081995 = null)) THEN null ELSE cast(Sharpe_ret#94081995 as float) END AS Sharpe_ret#94082311, CASE WHEN ((PctPos_ret#94081996 = NA) OR (PctPos_ret#94081996 = null)) THEN null ELSE cast(PctPos_ret#94081996 as float) END AS PctPos_ret#94082312, CASE WHEN ((TR_ret#94081997 = NA) OR (TR_ret#94081997 = null)) THEN null ELSE cast(TR_ret#94081997 as float) END AS TR_ret#94082313, CASE WHEN ((IR_ret#94081998 = NA) OR (IR_ret#94081998 = null)) THEN null ELSE cast(IR_ret#94081998 as float) END AS IR_ret#94082314, CASE WHEN ((annual_resret#94081999 = NA) OR (annual_resret#94081999 = null)) THEN null ELSE cast(annual_resret#94081999 as float) END AS annual_resret#94082315, CASE WHEN ((std_resret#94082000 = NA) OR (std_resret#94082000 = null)) THEN null ELSE cast(std_resret#94082000 as float) END AS std_resret#94082517, CASE WHEN ((Sharpe_resret#94082001 = NA) OR (Sharpe_resret#94082001 = null)) THEN null ELSE cast(Sharpe_resret#94082001 as float) END AS Sharpe_resret#94082703, CASE WHEN ((PctPos_resret#94082002 = NA) OR (PctPos_resret#94082002 = null)) THEN null ELSE cast(PctPos_resret#94082002 as float) END AS PctPos_resret#94082704, CASE WHEN ((TR_resret#94082003 = NA) OR (TR_resret#94082003 = null)) THEN null ELSE cast(TR_resret#94082003 as float) END AS TR_resret#94082705, CASE WHEN ((IR_resret#94082004 = NA) OR (IR_resret#94082004 = null)) THEN null ELSE cast(IR_resret#94082004 as float) END AS IR_resret#94082706, CASE WHEN ((annual_retnet#94082005 = NA) OR (annual_retnet#94082005 = null)) THEN null ELSE cast(annual_retnet#94082005 as float) END AS annual_retnet#94082707, CASE WHEN ((std_retnet#94082006 = NA) OR (std_retnet#94082006 = null)) THEN null ELSE cast(std_retnet#94082006 as float) END AS std_retnet#94082708, CASE WHEN ((Sharpe_retnet#94082007 = NA) OR (Sharpe_retnet#94082007 = null)) THEN null ELSE cast(Sharpe_retnet#94082007 as float) END AS Sharpe_retnet#94082709, CASE WHEN ((PctPos_retnet#94082008 = NA) OR (PctPos_retnet#94082008 = null)) THEN null ELSE cast(PctPos_retnet#94082008 as float) END AS PctPos_retnet#94082710, CASE WHEN ((TR_retnet#94082009 = NA) OR (TR_retnet#94082009 = null)) THEN null ELSE cast(TR_retnet#94082009 as float) END AS TR_retnet#94082711, CASE WHEN ((IR_retnet#94082010 = NA) OR (IR_retnet#94082010 = null)) THEN null ELSE cast(IR_retnet#94082010 as float) END AS IR_retnet#94082712, ... 2 more fields] +- FileScan csv [cap#94081987,retIC#94081988,resretIC#94081989,numcos#94081990,numdates#94081991,annual_bmret#94081992,annual_ret#94081993,std_ret#94081994,Sharpe_ret#94081995,PctPos_ret#94081996,TR_ret#94081997,IR_ret#94081998,annual_resret#94081999,std_resret#94082000,Sharpe_resret#94082001,PctPos_resret#94082002,TR_resret#94082003,IR_resret#94082004,annual_retnet#94082005,std_retnet#94082006,Sharpe_retnet#94082007,PctPos_retnet#94082008,TR_retnet#94082009,IR_retnet#94082010,... 2 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/volatilit..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,retIC:string,resretIC:string,numcos:string,numdates:string,annual_bmret:string,... ,None) (5) Scan csv Output [26]: [cap#94081987, retIC#94081988, resretIC#94081989, numcos#94081990, numdates#94081991, annual_bmret#94081992, annual_ret#94081993, std_ret#94081994, Sharpe_ret#94081995, PctPos_ret#94081996, TR_ret#94081997, IR_ret#94081998, annual_resret#94081999, std_resret#94082000, Sharpe_resret#94082001, PctPos_resret#94082002, TR_resret#94082003, IR_resret#94082004, annual_retnet#94082005, std_retnet#94082006, Sharpe_retnet#94082007, PctPos_retnet#94082008, TR_retnet#94082009, IR_retnet#94082010, turnover#94082011, coverage#94082012] Batched: false Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/risk_factors/volatility/stats_cap.csv] ReadSchema: struct<cap:string,retIC:string,resretIC:string,numcos:string,numdates:string,annual_bmret:string,annual_ret:string,std_ret:string,Sharpe_ret:string,PctPos_ret:string,TR_ret:string,IR_ret:string,annual_resret:string,std_resret:string,Sharpe_resret:string,PctPos_resret:string,TR_resret:string,IR_resret:string,annual_retnet:string,std_retnet:string,Sharpe_retnet:string,PctPos_retnet:string,TR_retnet:string,IR_retnet:string,turnover:string,coverage:string> (6) Project [codegen id : 1] Output [26]: [CASE WHEN ((cap#94081987 = NA) OR (cap#94081987 = null)) THEN null ELSE cast(cap#94081987 as float) END AS cap#94082258, CASE WHEN ((retIC#94081988 = NA) OR (retIC#94081988 = null)) THEN null ELSE cast(retIC#94081988 as float) END AS retIC#94082265, CASE WHEN ((resretIC#94081989 = NA) OR (resretIC#94081989 = null)) THEN null ELSE cast(resretIC#94081989 as float) END AS resretIC#94082268, CASE WHEN ((numcos#94081990 = NA) OR (numcos#94081990 = null)) THEN null ELSE cast(numcos#94081990 as float) END AS numcos#94082304, CASE WHEN ((numdates#94081991 = NA) OR (numdates#94081991 = null)) THEN null ELSE cast(numdates#94081991 as int) END AS numdates#94082307, CASE WHEN ((annual_bmret#94081992 = NA) OR (annual_bmret#94081992 = null)) THEN null ELSE cast(annual_bmret#94081992 as float) END AS annual_bmret#94082308, CASE WHEN ((annual_ret#94081993 = NA) OR (annual_ret#94081993 = null)) THEN null ELSE cast(annual_ret#94081993 as float) END AS annual_ret#94082309, CASE WHEN ((std_ret#94081994 = NA) OR (std_ret#94081994 = null)) THEN null ELSE cast(std_ret#94081994 as float) END AS std_ret#94082310, CASE WHEN ((Sharpe_ret#94081995 = NA) OR (Sharpe_ret#94081995 = null)) THEN null ELSE cast(Sharpe_ret#94081995 as float) END AS Sharpe_ret#94082311, CASE WHEN ((PctPos_ret#94081996 = NA) OR (PctPos_ret#94081996 = null)) THEN null ELSE cast(PctPos_ret#94081996 as float) END AS PctPos_ret#94082312, CASE WHEN ((TR_ret#94081997 = NA) OR (TR_ret#94081997 = null)) THEN null ELSE cast(TR_ret#94081997 as float) END AS TR_ret#94082313, CASE WHEN ((IR_ret#94081998 = NA) OR (IR_ret#94081998 = null)) THEN null ELSE cast(IR_ret#94081998 as float) END AS IR_ret#94082314, CASE WHEN ((annual_resret#94081999 = NA) OR (annual_resret#94081999 = null)) THEN null ELSE cast(annual_resret#94081999 as float) END AS annual_resret#94082315, CASE WHEN ((std_resret#94082000 = NA) OR (std_resret#94082000 = null)) THEN null ELSE cast(std_resret#94082000 as float) END AS std_resret#94082517, CASE WHEN ((Sharpe_resret#94082001 = NA) OR (Sharpe_resret#94082001 = null)) THEN null ELSE cast(Sharpe_resret#94082001 as float) END AS Sharpe_resret#94082703, CASE WHEN ((PctPos_resret#94082002 = NA) OR (PctPos_resret#94082002 = null)) THEN null ELSE cast(PctPos_resret#94082002 as float) END AS PctPos_resret#94082704, CASE WHEN ((TR_resret#94082003 = NA) OR (TR_resret#94082003 = null)) THEN null ELSE cast(TR_resret#94082003 as float) END AS TR_resret#94082705, CASE WHEN ((IR_resret#94082004 = NA) OR (IR_resret#94082004 = null)) THEN null ELSE cast(IR_resret#94082004 as float) END AS IR_resret#94082706, CASE WHEN ((annual_retnet#94082005 = NA) OR (annual_retnet#94082005 = null)) THEN null ELSE cast(annual_retnet#94082005 as float) END AS annual_retnet#94082707, CASE WHEN ((std_retnet#94082006 = NA) OR (std_retnet#94082006 = null)) THEN null ELSE cast(std_retnet#94082006 as float) END AS std_retnet#94082708, CASE WHEN ((Sharpe_retnet#94082007 = NA) OR (Sharpe_retnet#94082007 = null)) THEN null ELSE cast(Sharpe_retnet#94082007 as float) END AS Sharpe_retnet#94082709, CASE WHEN ((PctPos_retnet#94082008 = NA) OR (PctPos_retnet#94082008 = null)) THEN null ELSE cast(PctPos_retnet#94082008 as float) END AS PctPos_retnet#94082710, CASE WHEN ((TR_retnet#94082009 = NA) OR (TR_retnet#94082009 = null)) THEN null ELSE cast(TR_retnet#94082009 as float) END AS TR_retnet#94082711, CASE WHEN ((IR_retnet#94082010 = NA) OR (IR_retnet#94082010 = null)) THEN null ELSE cast(IR_retnet#94082010 as float) END AS IR_retnet#94082712, CASE WHEN ((turnover#94082011 = NA) OR (turnover#94082011 = null)) THEN null ELSE cast(turnover#94082011 as float) END AS turnover#94082713, CASE WHEN ((coverage#94082012 = NA) OR (coverage#94082012 = null)) THEN null ELSE cast(coverage#94082012 as float) END AS coverage#94082714] Input [26]: [cap#94081987, retIC#94081988, resretIC#94081989, numcos#94081990, numdates#94081991, annual_bmret#94081992, annual_ret#94081993, std_ret#94081994, Sharpe_ret#94081995, PctPos_ret#94081996, TR_ret#94081997, IR_ret#94081998, annual_resret#94081999, std_resret#94082000, Sharpe_resret#94082001, PctPos_resret#94082002, TR_resret#94082003, IR_resret#94082004, annual_retnet#94082005, std_retnet#94082006, Sharpe_retnet#94082007, PctPos_retnet#94082008, TR_retnet#94082009, IR_retnet#94082010, turnover#94082011, coverage#94082012] (7) ColumnarToRow [codegen id : 1] Input [2]: [cap#94082258, turnover#94082713] (8) Filter [codegen id : 1] Input [2]: [cap#94082258, turnover#94082713] Condition : isnotnull(cap#94082258) (9) BroadcastExchange Input [2]: [cap#94082258, turnover#94082713] Arguments: HashedRelationBroadcastMode(List(knownfloatingpointnormalized(normalizenanandzero(input[0, float, false]))),false), [id=#7512017] (10) InMemoryTableScan Output [3]: [cap#93880528, description#93880533, sort#93880531] Arguments: [cap#93880528, description#93880533, sort#93880531], [isnotnull(cap#93880528)] (11) InMemoryRelation Arguments: [cap#93880528, sort#93880531, description#93880533, universe#93880535], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((cap#93880496 = NA) OR (cap#93880496 = null)) THEN null ELSE cast(cap#93880496 as int) END AS cap#93880528, CASE WHEN (sort#93880498 = null) THEN null ELSE sort#93880498 END AS sort#93880531, CASE WHEN (description#93880500 = null) THEN null ELSE description#93880500 END AS description#93880533, CASE WHEN ((universe#93880502 = NA) OR (universe#93880502 = null)) THEN null ELSE cast(universe#93880502 as int) END AS universe#93880535] +- FileScan csv [cap#93880496,sort#93880498,description#93880500,universe#93880502] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/curate/curate_cap.csv], PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,sort:string,description:string,universe:string> ,None) (12) Scan csv Output [4]: [cap#93880496, sort#93880498, description#93880500, universe#93880502] Batched: false Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/curate/curate_cap.csv] ReadSchema: struct<cap:string,sort:string,description:string,universe:string> (13) Project [codegen id : 1] Output [4]: [CASE WHEN ((cap#93880496 = NA) OR (cap#93880496 = null)) THEN null ELSE cast(cap#93880496 as int) END AS cap#93880528, CASE WHEN (sort#93880498 = null) THEN null ELSE sort#93880498 END AS sort#93880531, CASE WHEN (description#93880500 = null) THEN null ELSE description#93880500 END AS description#93880533, CASE WHEN ((universe#93880502 = NA) OR (universe#93880502 = null)) THEN null ELSE cast(universe#93880502 as int) END AS universe#93880535] Input [4]: [cap#93880496, sort#93880498, description#93880500, universe#93880502] (14) Filter Input [3]: [cap#93880528, description#93880533, sort#93880531] Condition : isnotnull(cap#93880528) (15) Project Output [3]: [cap#93880528, description#93880533 AS cap_description#94085457, sort#93880531 AS cap_sort#94085458] Input [3]: [cap#93880528, description#93880533, sort#93880531] (16) BroadcastHashJoin [codegen id : 2] Left keys [1]: [knownfloatingpointnormalized(normalizenanandzero(cap#94082258))] Right keys [1]: [knownfloatingpointnormalized(normalizenanandzero(cast(cap#93880528 as float)))] Join condition: None (17) Project [codegen id : 2] Output [3]: [turnover#94082713, cap_description#94085457 AS cap#94085547, cap_sort#94085458] Input [5]: [cap#94082258, turnover#94082713, cap#93880528, cap_description#94085457, cap_sort#94085458] (18) Exchange Input [3]: [turnover#94082713, cap#94085547, cap_sort#94085458] Arguments: rangepartitioning(cap_sort#94085458 ASC NULLS FIRST, 200), ENSURE_REQUIREMENTS, [id=#7512025] (19) Sort [codegen id : 3] Input [3]: [turnover#94082713, cap#94085547, cap_sort#94085458] Arguments: [cap_sort#94085458 ASC NULLS FIRST], true, 0 (20) Project [codegen id : 3] Output [3]: [cap#94085547, turnover#94082713, (1.0 / cast(turnover#94082713 as double)) AS days_hold#94085575] Input [3]: [turnover#94082713, cap#94085547, cap_sort#94085458] (21) CollectLimit Input [3]: [cap#94085547, turnover#94082713, days_hold#94085575] Arguments: 1000000