Project [CASE WHEN ((cap#94125227 = NA) OR (cap#94125227 = null)) THEN null ELSE cast(cap#94125227 as float) END AS cap#94125439, CASE WHEN ((retIC#94125228 = NA) OR (retIC#94125228 = null)) THEN null ELSE cast(retIC#94125228 as float) END AS retIC#94125440, CASE WHEN ((resretIC#94125229 = NA) OR (resretIC#94125229 = null)) THEN null ELSE cast(resretIC#94125229 as float) END AS resretIC#94125441, CASE WHEN ((numcos#94125230 = NA) OR (numcos#94125230 = null)) THEN null ELSE cast(numcos#94125230 as float) END AS numcos#94125442, CASE WHEN ((numdates#94125231 = NA) OR (numdates#94125231 = null)) THEN null ELSE cast(numdates#94125231 as int) END AS numdates#94125443, CASE WHEN ((annual_bmret#94125232 = NA) OR (annual_bmret#94125232 = null)) THEN null ELSE cast(annual_bmret#94125232 as float) END AS annual_bmret#94125456, CASE WHEN ((annual_ret#94125233 = NA) OR (annual_ret#94125233 = null)) THEN null ELSE cast(annual_ret#94125233 as float) END AS annual_ret#94125545, CASE WHEN ((std_ret#94125234 = NA) OR (std_ret#94125234 = null)) THEN null ELSE cast(std_ret#94125234 as float) END AS std_ret#94125546, CASE WHEN ((Sharpe_ret#94125235 = NA) OR (Sharpe_ret#94125235 = null)) THEN null ELSE cast(Sharpe_ret#94125235 as float) END AS Sharpe_ret#94125559, CASE WHEN ((PctPos_ret#94125236 = NA) OR (PctPos_ret#94125236 = null)) THEN null ELSE cast(PctPos_ret#94125236 as float) END AS PctPos_ret#94125560, CASE WHEN ((TR_ret#94125237 = NA) OR (TR_ret#94125237 = null)) THEN null ELSE cast(TR_ret#94125237 as float) END AS TR_ret#94125561, CASE WHEN ((IR_ret#94125238 = NA) OR (IR_ret#94125238 = null)) THEN null ELSE cast(IR_ret#94125238 as float) END AS IR_ret#94125574, CASE WHEN ((annual_resret#94125239 = NA) OR (annual_resret#94125239 = null)) THEN null ELSE cast(annual_resret#94125239 as float) END AS annual_resret#94125575, CASE WHEN ((std_resret#94125240 = NA) OR (std_resret#94125240 = null)) THEN null ELSE cast(std_resret#94125240 as float) END AS std_resret#94125636, CASE WHEN ((Sharpe_resret#94125241 = NA) OR (Sharpe_resret#94125241 = null)) THEN null ELSE cast(Sharpe_resret#94125241 as float) END AS Sharpe_resret#94125637, CASE WHEN ((PctPos_resret#94125242 = NA) OR (PctPos_resret#94125242 = null)) THEN null ELSE cast(PctPos_resret#94125242 as float) END AS PctPos_resret#94125650, CASE WHEN ((TR_resret#94125243 = NA) OR (TR_resret#94125243 = null)) THEN null ELSE cast(TR_resret#94125243 as float) END AS TR_resret#94125654, CASE WHEN ((IR_resret#94125244 = NA) OR (IR_resret#94125244 = null)) THEN null ELSE cast(IR_resret#94125244 as float) END AS IR_resret#94125668, CASE WHEN ((annual_retnet#94125245 = NA) OR (annual_retnet#94125245 = null)) THEN null ELSE cast(annual_retnet#94125245 as float) END AS annual_retnet#94125672, CASE WHEN ((std_retnet#94125246 = NA) OR (std_retnet#94125246 = null)) THEN null ELSE cast(std_retnet#94125246 as float) END AS std_retnet#94125674, CASE WHEN ((Sharpe_retnet#94125247 = NA) OR (Sharpe_retnet#94125247 = null)) THEN null ELSE cast(Sharpe_retnet#94125247 as float) END AS Sharpe_retnet#94125676, CASE WHEN ((PctPos_retnet#94125248 = NA) OR (PctPos_retnet#94125248 = null)) THEN null ELSE cast(PctPos_retnet#94125248 as float) END AS PctPos_retnet#94125678, CASE WHEN ((TR_retnet#94125249 = NA) OR (TR_retnet#94125249 = null)) THEN null ELSE cast(TR_retnet#94125249 as float) END AS TR_retnet#94125680, CASE WHEN ((IR_retnet#94125250 = NA) OR (IR_retnet#94125250 = null)) THEN null ELSE cast(IR_retnet#94125250 as float) END AS IR_retnet#94125682, ... 2 more fields]
Project [CASE WHEN ((cap#93880496 = NA) OR (cap#93880496 = null)) THEN null ELSE cast(cap#93880496 as int) END AS cap#93880528, CASE WHEN (sort#93880498 = null) THEN null ELSE sort#93880498 END AS sort#93880531, CASE WHEN (description#93880500 = null) THEN null ELSE description#93880500 END AS description#93880533, CASE WHEN ((universe#93880502 = NA) OR (universe#93880502 = null)) THEN null ELSE cast(universe#93880502 as int) END AS universe#93880535]
== Physical Plan ==
CollectLimit (19)
+- InMemoryTableScan (1)
+- InMemoryRelation (2)
+- * Project (18)
+- * Sort (17)
+- Exchange (16)
+- * Project (15)
+- * BroadcastHashJoin Inner BuildLeft (14)
:- BroadcastExchange (7)
: +- * Filter (6)
: +- * ColumnarToRow (5)
: +- InMemoryTableScan (3)
: +- InMemoryRelation (4)
: +- * Project (6)
: +- Scan csv (5)
+- * Project (13)
+- * Filter (12)
+- InMemoryTableScan (8)
+- InMemoryRelation (9)
+- * Project (11)
+- Scan csv (10)
(1) InMemoryTableScan
Output [3]: [cap#94128683, turnover#94125684, days_hold#94128738]
Arguments: [cap#94128683, turnover#94125684, days_hold#94128738]
(2) InMemoryRelation
Arguments: [cap#94128683, turnover#94125684, days_hold#94128738], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(3) Project [cap#94128683, turnover#94125684, (1.0 / cast(turnover#94125684 as double)) AS days_hold#94128738]
+- *(3) Sort [cap_sort#94128621 ASC NULLS FIRST], true, 0
+- Exchange rangepartitioning(cap_sort#94128621 ASC NULLS FIRST, 200), ENSURE_REQUIREMENTS, [id=#7515468]
+- *(2) Project [turnover#94125684, cap_description#94128620 AS cap#94128683, cap_sort#94128621]
+- *(2) BroadcastHashJoin [knownfloatingpointnormalized(normalizenanandzero(cap#94125439))], [knownfloatingpointnormalized(normalizenanandzero(cast(cap#93880528 as float)))], Inner, BuildLeft, false
:- BroadcastExchange HashedRelationBroadcastMode(List(knownfloatingpointnormalized(normalizenanandzero(input[0, float, false]))),false), [id=#7515460]
: +- *(1) Filter isnotnull(cap#94125439)
: +- *(1) ColumnarToRow
: +- InMemoryTableScan [cap#94125439, turnover#94125684], [isnotnull(cap#94125439)]
: +- InMemoryRelation [cap#94125439, retIC#94125440, resretIC#94125441, numcos#94125442, numdates#94125443, annual_bmret#94125456, annual_ret#94125545, std_ret#94125546, Sharpe_ret#94125559, PctPos_ret#94125560, TR_ret#94125561, IR_ret#94125574, annual_resret#94125575, std_resret#94125636, Sharpe_resret#94125637, PctPos_resret#94125650, TR_resret#94125654, IR_resret#94125668, annual_retnet#94125672, std_retnet#94125674, Sharpe_retnet#94125676, PctPos_retnet#94125678, TR_retnet#94125680, IR_retnet#94125682, ... 2 more fields], StorageLevel(disk, memory, deserialized, 1 replicas)
: +- *(1) Project [CASE WHEN ((cap#94125227 = NA) OR (cap#94125227 = null)) THEN null ELSE cast(cap#94125227 as float) END AS cap#94125439, CASE WHEN ((retIC#94125228 = NA) OR (retIC#94125228 = null)) THEN null ELSE cast(retIC#94125228 as float) END AS retIC#94125440, CASE WHEN ((resretIC#94125229 = NA) OR (resretIC#94125229 = null)) THEN null ELSE cast(resretIC#94125229 as float) END AS resretIC#94125441, CASE WHEN ((numcos#94125230 = NA) OR (numcos#94125230 = null)) THEN null ELSE cast(numcos#94125230 as float) END AS numcos#94125442, CASE WHEN ((numdates#94125231 = NA) OR (numdates#94125231 = null)) THEN null ELSE cast(numdates#94125231 as int) END AS numdates#94125443, CASE WHEN ((annual_bmret#94125232 = NA) OR (annual_bmret#94125232 = null)) THEN null ELSE cast(annual_bmret#94125232 as float) END AS annual_bmret#94125456, CASE WHEN ((annual_ret#94125233 = NA) OR (annual_ret#94125233 = null)) THEN null ELSE cast(annual_ret#94125233 as float) END AS annual_ret#94125545, CASE WHEN ((std_ret#94125234 = NA) OR (std_ret#94125234 = null)) THEN null ELSE cast(std_ret#94125234 as float) END AS std_ret#94125546, CASE WHEN ((Sharpe_ret#94125235 = NA) OR (Sharpe_ret#94125235 = null)) THEN null ELSE cast(Sharpe_ret#94125235 as float) END AS Sharpe_ret#94125559, CASE WHEN ((PctPos_ret#94125236 = NA) OR (PctPos_ret#94125236 = null)) THEN null ELSE cast(PctPos_ret#94125236 as float) END AS PctPos_ret#94125560, CASE WHEN ((TR_ret#94125237 = NA) OR (TR_ret#94125237 = null)) THEN null ELSE cast(TR_ret#94125237 as float) END AS TR_ret#94125561, CASE WHEN ((IR_ret#94125238 = NA) OR (IR_ret#94125238 = null)) THEN null ELSE cast(IR_ret#94125238 as float) END AS IR_ret#94125574, CASE WHEN ((annual_resret#94125239 = NA) OR (annual_resret#94125239 = null)) THEN null ELSE cast(annual_resret#94125239 as float) END AS annual_resret#94125575, CASE WHEN ((std_resret#94125240 = NA) OR (std_resret#94125240 = null)) THEN null ELSE cast(std_resret#94125240 as float) END AS std_resret#94125636, CASE WHEN ((Sharpe_resret#94125241 = NA) OR (Sharpe_resret#94125241 = null)) THEN null ELSE cast(Sharpe_resret#94125241 as float) END AS Sharpe_resret#94125637, CASE WHEN ((PctPos_resret#94125242 = NA) OR (PctPos_resret#94125242 = null)) THEN null ELSE cast(PctPos_resret#94125242 as float) END AS PctPos_resret#94125650, CASE WHEN ((TR_resret#94125243 = NA) OR (TR_resret#94125243 = null)) THEN null ELSE cast(TR_resret#94125243 as float) END AS TR_resret#94125654, CASE WHEN ((IR_resret#94125244 = NA) OR (IR_resret#94125244 = null)) THEN null ELSE cast(IR_resret#94125244 as float) END AS IR_resret#94125668, CASE WHEN ((annual_retnet#94125245 = NA) OR (annual_retnet#94125245 = null)) THEN null ELSE cast(annual_retnet#94125245 as float) END AS annual_retnet#94125672, CASE WHEN ((std_retnet#94125246 = NA) OR (std_retnet#94125246 = null)) THEN null ELSE cast(std_retnet#94125246 as float) END AS std_retnet#94125674, CASE WHEN ((Sharpe_retnet#94125247 = NA) OR (Sharpe_retnet#94125247 = null)) THEN null ELSE cast(Sharpe_retnet#94125247 as float) END AS Sharpe_retnet#94125676, CASE WHEN ((PctPos_retnet#94125248 = NA) OR (PctPos_retnet#94125248 = null)) THEN null ELSE cast(PctPos_retnet#94125248 as float) END AS PctPos_retnet#94125678, CASE WHEN ((TR_retnet#94125249 = NA) OR (TR_retnet#94125249 = null)) THEN null ELSE cast(TR_retnet#94125249 as float) END AS TR_retnet#94125680, CASE WHEN ((IR_retnet#94125250 = NA) OR (IR_retnet#94125250 = null)) THEN null ELSE cast(IR_retnet#94125250 as float) END AS IR_retnet#94125682, ... 2 more fields]
: +- FileScan csv [cap#94125227,retIC#94125228,resretIC#94125229,numcos#94125230,numdates#94125231,annual_bmret#94125232,annual_ret#94125233,std_ret#94125234,Sharpe_ret#94125235,PctPos_ret#94125236,TR_ret#94125237,IR_ret#94125238,annual_resret#94125239,std_resret#94125240,Sharpe_resret#94125241,PctPos_resret#94125242,TR_resret#94125243,IR_resret#94125244,annual_retnet#94125245,std_retnet#94125246,Sharpe_retnet#94125247,PctPos_retnet#94125248,TR_retnet#94125249,IR_retnet#94125250,... 2 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/transcripts/transcript..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,retIC:string,resretIC:string,numcos:string,numdates:string,annual_bmret:string,...
+- *(2) Project [cap#93880528, description#93880533 AS cap_description#94128620, sort#93880531 AS cap_sort#94128621]
+- *(2) Filter isnotnull(cap#93880528)
+- InMemoryTableScan [cap#93880528, description#93880533, sort#93880531], [isnotnull(cap#93880528)]
+- InMemoryRelation [cap#93880528, sort#93880531, description#93880533, universe#93880535], StorageLevel(disk, memory, deserialized, 1 replicas)
+- *(1) Project [CASE WHEN ((cap#93880496 = NA) OR (cap#93880496 = null)) THEN null ELSE cast(cap#93880496 as int) END AS cap#93880528, CASE WHEN (sort#93880498 = null) THEN null ELSE sort#93880498 END AS sort#93880531, CASE WHEN (description#93880500 = null) THEN null ELSE description#93880500 END AS description#93880533, CASE WHEN ((universe#93880502 = NA) OR (universe#93880502 = null)) THEN null ELSE cast(universe#93880502 as int) END AS universe#93880535]
+- FileScan csv [cap#93880496,sort#93880498,description#93880500,universe#93880502] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/curate/curate_cap.csv], PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,sort:string,description:string,universe:string>
,None), [cap_sort#94128621 ASC NULLS FIRST]
(3) InMemoryTableScan
Output [2]: [cap#94125439, turnover#94125684]
Arguments: [cap#94125439, turnover#94125684], [isnotnull(cap#94125439)]
(4) InMemoryRelation
Arguments: [cap#94125439, retIC#94125440, resretIC#94125441, numcos#94125442, numdates#94125443, annual_bmret#94125456, annual_ret#94125545, std_ret#94125546, Sharpe_ret#94125559, PctPos_ret#94125560, TR_ret#94125561, IR_ret#94125574, annual_resret#94125575, std_resret#94125636, Sharpe_resret#94125637, PctPos_resret#94125650, TR_resret#94125654, IR_resret#94125668, annual_retnet#94125672, std_retnet#94125674, Sharpe_retnet#94125676, PctPos_retnet#94125678, TR_retnet#94125680, IR_retnet#94125682, ... 2 more fields], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((cap#94125227 = NA) OR (cap#94125227 = null)) THEN null ELSE cast(cap#94125227 as float) END AS cap#94125439, CASE WHEN ((retIC#94125228 = NA) OR (retIC#94125228 = null)) THEN null ELSE cast(retIC#94125228 as float) END AS retIC#94125440, CASE WHEN ((resretIC#94125229 = NA) OR (resretIC#94125229 = null)) THEN null ELSE cast(resretIC#94125229 as float) END AS resretIC#94125441, CASE WHEN ((numcos#94125230 = NA) OR (numcos#94125230 = null)) THEN null ELSE cast(numcos#94125230 as float) END AS numcos#94125442, CASE WHEN ((numdates#94125231 = NA) OR (numdates#94125231 = null)) THEN null ELSE cast(numdates#94125231 as int) END AS numdates#94125443, CASE WHEN ((annual_bmret#94125232 = NA) OR (annual_bmret#94125232 = null)) THEN null ELSE cast(annual_bmret#94125232 as float) END AS annual_bmret#94125456, CASE WHEN ((annual_ret#94125233 = NA) OR (annual_ret#94125233 = null)) THEN null ELSE cast(annual_ret#94125233 as float) END AS annual_ret#94125545, CASE WHEN ((std_ret#94125234 = NA) OR (std_ret#94125234 = null)) THEN null ELSE cast(std_ret#94125234 as float) END AS std_ret#94125546, CASE WHEN ((Sharpe_ret#94125235 = NA) OR (Sharpe_ret#94125235 = null)) THEN null ELSE cast(Sharpe_ret#94125235 as float) END AS Sharpe_ret#94125559, CASE WHEN ((PctPos_ret#94125236 = NA) OR (PctPos_ret#94125236 = null)) THEN null ELSE cast(PctPos_ret#94125236 as float) END AS PctPos_ret#94125560, CASE WHEN ((TR_ret#94125237 = NA) OR (TR_ret#94125237 = null)) THEN null ELSE cast(TR_ret#94125237 as float) END AS TR_ret#94125561, CASE WHEN ((IR_ret#94125238 = NA) OR (IR_ret#94125238 = null)) THEN null ELSE cast(IR_ret#94125238 as float) END AS IR_ret#94125574, CASE WHEN ((annual_resret#94125239 = NA) OR (annual_resret#94125239 = null)) THEN null ELSE cast(annual_resret#94125239 as float) END AS annual_resret#94125575, CASE WHEN ((std_resret#94125240 = NA) OR (std_resret#94125240 = null)) THEN null ELSE cast(std_resret#94125240 as float) END AS std_resret#94125636, CASE WHEN ((Sharpe_resret#94125241 = NA) OR (Sharpe_resret#94125241 = null)) THEN null ELSE cast(Sharpe_resret#94125241 as float) END AS Sharpe_resret#94125637, CASE WHEN ((PctPos_resret#94125242 = NA) OR (PctPos_resret#94125242 = null)) THEN null ELSE cast(PctPos_resret#94125242 as float) END AS PctPos_resret#94125650, CASE WHEN ((TR_resret#94125243 = NA) OR (TR_resret#94125243 = null)) THEN null ELSE cast(TR_resret#94125243 as float) END AS TR_resret#94125654, CASE WHEN ((IR_resret#94125244 = NA) OR (IR_resret#94125244 = null)) THEN null ELSE cast(IR_resret#94125244 as float) END AS IR_resret#94125668, CASE WHEN ((annual_retnet#94125245 = NA) OR (annual_retnet#94125245 = null)) THEN null ELSE cast(annual_retnet#94125245 as float) END AS annual_retnet#94125672, CASE WHEN ((std_retnet#94125246 = NA) OR (std_retnet#94125246 = null)) THEN null ELSE cast(std_retnet#94125246 as float) END AS std_retnet#94125674, CASE WHEN ((Sharpe_retnet#94125247 = NA) OR (Sharpe_retnet#94125247 = null)) THEN null ELSE cast(Sharpe_retnet#94125247 as float) END AS Sharpe_retnet#94125676, CASE WHEN ((PctPos_retnet#94125248 = NA) OR (PctPos_retnet#94125248 = null)) THEN null ELSE cast(PctPos_retnet#94125248 as float) END AS PctPos_retnet#94125678, CASE WHEN ((TR_retnet#94125249 = NA) OR (TR_retnet#94125249 = null)) THEN null ELSE cast(TR_retnet#94125249 as float) END AS TR_retnet#94125680, CASE WHEN ((IR_retnet#94125250 = NA) OR (IR_retnet#94125250 = null)) THEN null ELSE cast(IR_retnet#94125250 as float) END AS IR_retnet#94125682, ... 2 more fields]
+- FileScan csv [cap#94125227,retIC#94125228,resretIC#94125229,numcos#94125230,numdates#94125231,annual_bmret#94125232,annual_ret#94125233,std_ret#94125234,Sharpe_ret#94125235,PctPos_ret#94125236,TR_ret#94125237,IR_ret#94125238,annual_resret#94125239,std_resret#94125240,Sharpe_resret#94125241,PctPos_resret#94125242,TR_resret#94125243,IR_resret#94125244,annual_retnet#94125245,std_retnet#94125246,Sharpe_retnet#94125247,PctPos_retnet#94125248,TR_retnet#94125249,IR_retnet#94125250,... 2 more fields] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/transcripts/transcript..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,retIC:string,resretIC:string,numcos:string,numdates:string,annual_bmret:string,...
,None)
(unknown) Scan csv
Output [26]: [cap#94125227, retIC#94125228, resretIC#94125229, numcos#94125230, numdates#94125231, annual_bmret#94125232, annual_ret#94125233, std_ret#94125234, Sharpe_ret#94125235, PctPos_ret#94125236, TR_ret#94125237, IR_ret#94125238, annual_resret#94125239, std_resret#94125240, Sharpe_resret#94125241, PctPos_resret#94125242, TR_resret#94125243, IR_resret#94125244, annual_retnet#94125245, std_retnet#94125246, Sharpe_retnet#94125247, PctPos_retnet#94125248, TR_retnet#94125249, IR_retnet#94125250, turnover#94125251, coverage#94125252]
Batched: false
Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/transcripts/transcript_model_residualized/stats_cap.csv]
ReadSchema: struct<cap:string,retIC:string,resretIC:string,numcos:string,numdates:string,annual_bmret:string,annual_ret:string,std_ret:string,Sharpe_ret:string,PctPos_ret:string,TR_ret:string,IR_ret:string,annual_resret:string,std_resret:string,Sharpe_resret:string,PctPos_resret:string,TR_resret:string,IR_resret:string,annual_retnet:string,std_retnet:string,Sharpe_retnet:string,PctPos_retnet:string,TR_retnet:string,IR_retnet:string,turnover:string,coverage:string>
(unknown) Project
Output [26]: [CASE WHEN ((cap#94125227 = NA) OR (cap#94125227 = null)) THEN null ELSE cast(cap#94125227 as float) END AS cap#94125439, CASE WHEN ((retIC#94125228 = NA) OR (retIC#94125228 = null)) THEN null ELSE cast(retIC#94125228 as float) END AS retIC#94125440, CASE WHEN ((resretIC#94125229 = NA) OR (resretIC#94125229 = null)) THEN null ELSE cast(resretIC#94125229 as float) END AS resretIC#94125441, CASE WHEN ((numcos#94125230 = NA) OR (numcos#94125230 = null)) THEN null ELSE cast(numcos#94125230 as float) END AS numcos#94125442, CASE WHEN ((numdates#94125231 = NA) OR (numdates#94125231 = null)) THEN null ELSE cast(numdates#94125231 as int) END AS numdates#94125443, CASE WHEN ((annual_bmret#94125232 = NA) OR (annual_bmret#94125232 = null)) THEN null ELSE cast(annual_bmret#94125232 as float) END AS annual_bmret#94125456, CASE WHEN ((annual_ret#94125233 = NA) OR (annual_ret#94125233 = null)) THEN null ELSE cast(annual_ret#94125233 as float) END AS annual_ret#94125545, CASE WHEN ((std_ret#94125234 = NA) OR (std_ret#94125234 = null)) THEN null ELSE cast(std_ret#94125234 as float) END AS std_ret#94125546, CASE WHEN ((Sharpe_ret#94125235 = NA) OR (Sharpe_ret#94125235 = null)) THEN null ELSE cast(Sharpe_ret#94125235 as float) END AS Sharpe_ret#94125559, CASE WHEN ((PctPos_ret#94125236 = NA) OR (PctPos_ret#94125236 = null)) THEN null ELSE cast(PctPos_ret#94125236 as float) END AS PctPos_ret#94125560, CASE WHEN ((TR_ret#94125237 = NA) OR (TR_ret#94125237 = null)) THEN null ELSE cast(TR_ret#94125237 as float) END AS TR_ret#94125561, CASE WHEN ((IR_ret#94125238 = NA) OR (IR_ret#94125238 = null)) THEN null ELSE cast(IR_ret#94125238 as float) END AS IR_ret#94125574, CASE WHEN ((annual_resret#94125239 = NA) OR (annual_resret#94125239 = null)) THEN null ELSE cast(annual_resret#94125239 as float) END AS annual_resret#94125575, CASE WHEN ((std_resret#94125240 = NA) OR (std_resret#94125240 = null)) THEN null ELSE cast(std_resret#94125240 as float) END AS std_resret#94125636, CASE WHEN ((Sharpe_resret#94125241 = NA) OR (Sharpe_resret#94125241 = null)) THEN null ELSE cast(Sharpe_resret#94125241 as float) END AS Sharpe_resret#94125637, CASE WHEN ((PctPos_resret#94125242 = NA) OR (PctPos_resret#94125242 = null)) THEN null ELSE cast(PctPos_resret#94125242 as float) END AS PctPos_resret#94125650, CASE WHEN ((TR_resret#94125243 = NA) OR (TR_resret#94125243 = null)) THEN null ELSE cast(TR_resret#94125243 as float) END AS TR_resret#94125654, CASE WHEN ((IR_resret#94125244 = NA) OR (IR_resret#94125244 = null)) THEN null ELSE cast(IR_resret#94125244 as float) END AS IR_resret#94125668, CASE WHEN ((annual_retnet#94125245 = NA) OR (annual_retnet#94125245 = null)) THEN null ELSE cast(annual_retnet#94125245 as float) END AS annual_retnet#94125672, CASE WHEN ((std_retnet#94125246 = NA) OR (std_retnet#94125246 = null)) THEN null ELSE cast(std_retnet#94125246 as float) END AS std_retnet#94125674, CASE WHEN ((Sharpe_retnet#94125247 = NA) OR (Sharpe_retnet#94125247 = null)) THEN null ELSE cast(Sharpe_retnet#94125247 as float) END AS Sharpe_retnet#94125676, CASE WHEN ((PctPos_retnet#94125248 = NA) OR (PctPos_retnet#94125248 = null)) THEN null ELSE cast(PctPos_retnet#94125248 as float) END AS PctPos_retnet#94125678, CASE WHEN ((TR_retnet#94125249 = NA) OR (TR_retnet#94125249 = null)) THEN null ELSE cast(TR_retnet#94125249 as float) END AS TR_retnet#94125680, CASE WHEN ((IR_retnet#94125250 = NA) OR (IR_retnet#94125250 = null)) THEN null ELSE cast(IR_retnet#94125250 as float) END AS IR_retnet#94125682, CASE WHEN ((turnover#94125251 = NA) OR (turnover#94125251 = null)) THEN null ELSE cast(turnover#94125251 as float) END AS turnover#94125684, CASE WHEN ((coverage#94125252 = NA) OR (coverage#94125252 = null)) THEN null ELSE cast(coverage#94125252 as float) END AS coverage#94125686]
Input [26]: [cap#94125227, retIC#94125228, resretIC#94125229, numcos#94125230, numdates#94125231, annual_bmret#94125232, annual_ret#94125233, std_ret#94125234, Sharpe_ret#94125235, PctPos_ret#94125236, TR_ret#94125237, IR_ret#94125238, annual_resret#94125239, std_resret#94125240, Sharpe_resret#94125241, PctPos_resret#94125242, TR_resret#94125243, IR_resret#94125244, annual_retnet#94125245, std_retnet#94125246, Sharpe_retnet#94125247, PctPos_retnet#94125248, TR_retnet#94125249, IR_retnet#94125250, turnover#94125251, coverage#94125252]
(7) BroadcastExchange
Input [2]: [cap#94125439, turnover#94125684]
Arguments: HashedRelationBroadcastMode(List(knownfloatingpointnormalized(normalizenanandzero(input[0, float, false]))),false), [id=#7515460]
(8) InMemoryTableScan
Output [3]: [cap#93880528, description#93880533, sort#93880531]
Arguments: [cap#93880528, description#93880533, sort#93880531], [isnotnull(cap#93880528)]
(9) InMemoryRelation
Arguments: [cap#93880528, sort#93880531, description#93880533, universe#93880535], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN ((cap#93880496 = NA) OR (cap#93880496 = null)) THEN null ELSE cast(cap#93880496 as int) END AS cap#93880528, CASE WHEN (sort#93880498 = null) THEN null ELSE sort#93880498 END AS sort#93880531, CASE WHEN (description#93880500 = null) THEN null ELSE description#93880500 END AS description#93880533, CASE WHEN ((universe#93880502 = NA) OR (universe#93880502 = null)) THEN null ELSE cast(universe#93880502 as int) END AS universe#93880535]
+- FileScan csv [cap#93880496,sort#93880498,description#93880500,universe#93880502] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/curate/curate_cap.csv], PartitionFilters: [], PushedFilters: [], ReadSchema: struct<cap:string,sort:string,description:string,universe:string>
,None)
(10) Scan csv
Output [4]: [cap#93880496, sort#93880498, description#93880500, universe#93880502]
Batched: false
Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/curate/curate_cap.csv]
ReadSchema: struct<cap:string,sort:string,description:string,universe:string>
(11) Project [codegen id : 1]
Output [4]: [CASE WHEN ((cap#93880496 = NA) OR (cap#93880496 = null)) THEN null ELSE cast(cap#93880496 as int) END AS cap#93880528, CASE WHEN (sort#93880498 = null) THEN null ELSE sort#93880498 END AS sort#93880531, CASE WHEN (description#93880500 = null) THEN null ELSE description#93880500 END AS description#93880533, CASE WHEN ((universe#93880502 = NA) OR (universe#93880502 = null)) THEN null ELSE cast(universe#93880502 as int) END AS universe#93880535]
Input [4]: [cap#93880496, sort#93880498, description#93880500, universe#93880502]
(12) Filter
Input [3]: [cap#93880528, description#93880533, sort#93880531]
Condition : isnotnull(cap#93880528)
(13) Project
Output [3]: [cap#93880528, description#93880533 AS cap_description#94128620, sort#93880531 AS cap_sort#94128621]
Input [3]: [cap#93880528, description#93880533, sort#93880531]
(14) BroadcastHashJoin [codegen id : 2]
Left keys [1]: [knownfloatingpointnormalized(normalizenanandzero(cap#94125439))]
Right keys [1]: [knownfloatingpointnormalized(normalizenanandzero(cast(cap#93880528 as float)))]
Join condition: None
(15) Project [codegen id : 2]
Output [3]: [turnover#94125684, cap_description#94128620 AS cap#94128683, cap_sort#94128621]
Input [5]: [cap#94125439, turnover#94125684, cap#93880528, cap_description#94128620, cap_sort#94128621]
(16) Exchange
Input [3]: [turnover#94125684, cap#94128683, cap_sort#94128621]
Arguments: rangepartitioning(cap_sort#94128621 ASC NULLS FIRST, 200), ENSURE_REQUIREMENTS, [id=#7515468]
(17) Sort [codegen id : 3]
Input [3]: [turnover#94125684, cap#94128683, cap_sort#94128621]
Arguments: [cap_sort#94128621 ASC NULLS FIRST], true, 0
(18) Project [codegen id : 3]
Output [3]: [cap#94128683, turnover#94125684, (1.0 / cast(turnover#94125684 as double)) AS days_hold#94128738]
Input [3]: [turnover#94125684, cap#94128683, cap_sort#94128621]
(19) CollectLimit
Input [3]: [cap#94128683, turnover#94125684, days_hold#94128738]
Arguments: 10000