Project [CASE WHEN (date#94396171 = null) THEN null ELSE cast(date#94396171 as date) END AS date#94396426, CASE WHEN ((overall#94396172 = NA) OR (overall#94396172 = null)) THEN null ELSE cast(overall#94396172 as int) END AS overall#94396454, CASE WHEN ((ret#94396173 = NA) OR (ret#94396173 = null)) THEN null ELSE cast(ret#94396173 as float) END AS ret#94396487, CASE WHEN ((resret#94396174 = NA) OR (resret#94396174 = null)) THEN null ELSE cast(resret#94396174 as float) END AS resret#94396488, CASE WHEN ((retnet#94396175 = NA) OR (retnet#94396175 = null)) THEN null ELSE cast(retnet#94396175 as float) END AS retnet#94396489, CASE WHEN ((turnover#94396176 = NA) OR (turnover#94396176 = null)) THEN null ELSE cast(turnover#94396176 as float) END AS turnover#94396490, CASE WHEN ((numcos#94396177 = NA) OR (numcos#94396177 = null)) THEN null ELSE cast(numcos#94396177 as float) END AS numcos#94396504, CASE WHEN ((benchmark#94396178 = NA) OR (benchmark#94396178 = null)) THEN null ELSE cast(benchmark#94396178 as float) END AS benchmark#94396505, CASE WHEN ((excess_ret#94396179 = NA) OR (excess_ret#94396179 = null)) THEN null ELSE cast(excess_ret#94396179 as float) END AS excess_ret#94396506, CASE WHEN ((excess_resret#94396180 = NA) OR (excess_resret#94396180 = null)) THEN null ELSE cast(excess_resret#94396180 as float) END AS excess_resret#94396507, CASE WHEN ((excess_retnet#94396181 = NA) OR (excess_retnet#94396181 = null)) THEN null ELSE cast(excess_retnet#94396181 as float) END AS excess_retnet#94396508]
Filter (isnotnull(cap#94396521) AND (cast(cap#94396521 as string) = 0))
WholeStageCodegen (1)
InMemoryTableScan [cap#94396521, date#94396509, numcos#94396593], [isnotnull(cap#94396521), (cast(cap#94396521 as string) = 0)]
Project [CASE WHEN (date#94396194 = null) THEN null ELSE cast(date#94396194 as date) END AS date#94396509, CASE WHEN ((cap#94396195 = NA) OR (cap#94396195 = null)) THEN null ELSE cast(cap#94396195 as float) END AS cap#94396521, CASE WHEN ((ret#94396196 = NA) OR (ret#94396196 = null)) THEN null ELSE cast(ret#94396196 as float) END AS ret#94396522, CASE WHEN ((resret#94396197 = NA) OR (resret#94396197 = null)) THEN null ELSE cast(resret#94396197 as float) END AS resret#94396525, CASE WHEN ((retnet#94396198 = NA) OR (retnet#94396198 = null)) THEN null ELSE cast(retnet#94396198 as float) END AS retnet#94396528, CASE WHEN ((turnover#94396199 = NA) OR (turnover#94396199 = null)) THEN null ELSE cast(turnover#94396199 as float) END AS turnover#94396591, CASE WHEN ((numcos#94396200 = NA) OR (numcos#94396200 = null)) THEN null ELSE cast(numcos#94396200 as float) END AS numcos#94396593, CASE WHEN ((coverage#94396201 = NA) OR (coverage#94396201 = null)) THEN null ELSE cast(coverage#94396201 as float) END AS coverage#94396596, CASE WHEN ((benchmark#94396202 = NA) OR (benchmark#94396202 = null)) THEN null ELSE cast(benchmark#94396202 as float) END AS benchmark#94396599, CASE WHEN ((excess_ret#94396203 = NA) OR (excess_ret#94396203 = null)) THEN null ELSE cast(excess_ret#94396203 as float) END AS excess_ret#94396602, CASE WHEN ((excess_resret#94396204 = NA) OR (excess_resret#94396204 = null)) THEN null ELSE cast(excess_resret#94396204 as float) END AS excess_resret#94396604, CASE WHEN ((excess_retnet#94396205 = NA) OR (excess_retnet#94396205 = null)) THEN null ELSE cast(excess_retnet#94396205 as float) END AS excess_retnet#94396606]
== Physical Plan ==
CollectLimit (16)
+- InMemoryTableScan (1)
+- InMemoryRelation (2)
+- * Sort (15)
+- Exchange (14)
+- Union (13)
:- InMemoryTableScan (3)
: +- InMemoryRelation (4)
: +- * Project (6)
: +- Scan csv (5)
+- * Project (12)
+- * Filter (11)
+- InMemoryTableScan (7)
+- InMemoryRelation (8)
+- * Project (10)
+- Scan csv (9)
(1) InMemoryTableScan
Output [2]: [date#94396426, numcos#94396504]
Arguments: [date#94396426, numcos#94396504]
(2) InMemoryRelation
Arguments: [date#94396426, numcos#94396504], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(2) Sort [date#94396426 ASC NULLS FIRST], true, 0
+- Exchange rangepartitioning(date#94396426 ASC NULLS FIRST, 200), ENSURE_REQUIREMENTS, [id=#7536907]
+- Union
:- InMemoryTableScan [date#94396426, numcos#94396504]
: +- InMemoryRelation [date#94396426, overall#94396454, ret#94396487, resret#94396488, retnet#94396489, turnover#94396490, numcos#94396504, benchmark#94396505, excess_ret#94396506, excess_resret#94396507, excess_retnet#94396508], StorageLevel(disk, memory, deserialized, 1 replicas)
: +- *(1) Project [CASE WHEN (date#94396171 = null) THEN null ELSE cast(date#94396171 as date) END AS date#94396426, CASE WHEN ((overall#94396172 = NA) OR (overall#94396172 = null)) THEN null ELSE cast(overall#94396172 as int) END AS overall#94396454, CASE WHEN ((ret#94396173 = NA) OR (ret#94396173 = null)) THEN null ELSE cast(ret#94396173 as float) END AS ret#94396487, CASE WHEN ((resret#94396174 = NA) OR (resret#94396174 = null)) THEN null ELSE cast(resret#94396174 as float) END AS resret#94396488, CASE WHEN ((retnet#94396175 = NA) OR (retnet#94396175 = null)) THEN null ELSE cast(retnet#94396175 as float) END AS retnet#94396489, CASE WHEN ((turnover#94396176 = NA) OR (turnover#94396176 = null)) THEN null ELSE cast(turnover#94396176 as float) END AS turnover#94396490, CASE WHEN ((numcos#94396177 = NA) OR (numcos#94396177 = null)) THEN null ELSE cast(numcos#94396177 as float) END AS numcos#94396504, CASE WHEN ((benchmark#94396178 = NA) OR (benchmark#94396178 = null)) THEN null ELSE cast(benchmark#94396178 as float) END AS benchmark#94396505, CASE WHEN ((excess_ret#94396179 = NA) OR (excess_ret#94396179 = null)) THEN null ELSE cast(excess_ret#94396179 as float) END AS excess_ret#94396506, CASE WHEN ((excess_resret#94396180 = NA) OR (excess_resret#94396180 = null)) THEN null ELSE cast(excess_resret#94396180 as float) END AS excess_resret#94396507, CASE WHEN ((excess_retnet#94396181 = NA) OR (excess_retnet#94396181 = null)) THEN null ELSE cast(excess_retnet#94396181 as float) END AS excess_retnet#94396508]
: +- FileScan csv [date#94396171,overall#94396172,ret#94396173,resret#94396174,retnet#94396175,turnover#94396176,numcos#94396177,benchmark#94396178,excess_ret#94396179,excess_resret#94396180,excess_retnet#94396181] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/momentum/..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<date:string,overall:string,ret:string,resret:string,retnet:string,turnover:string,numcos:s...
+- *(1) Project [date#94396509, numcos#94396593]
+- *(1) Filter (isnotnull(cap#94396521) AND (cast(cap#94396521 as string) = 0))
+- InMemoryTableScan [cap#94396521, date#94396509, numcos#94396593], [isnotnull(cap#94396521), (cast(cap#94396521 as string) = 0)]
+- InMemoryRelation [date#94396509, cap#94396521, ret#94396522, resret#94396525, retnet#94396528, turnover#94396591, numcos#94396593, coverage#94396596, benchmark#94396599, excess_ret#94396602, excess_resret#94396604, excess_retnet#94396606], StorageLevel(disk, memory, deserialized, 1 replicas)
+- *(1) Project [CASE WHEN (date#94396194 = null) THEN null ELSE cast(date#94396194 as date) END AS date#94396509, CASE WHEN ((cap#94396195 = NA) OR (cap#94396195 = null)) THEN null ELSE cast(cap#94396195 as float) END AS cap#94396521, CASE WHEN ((ret#94396196 = NA) OR (ret#94396196 = null)) THEN null ELSE cast(ret#94396196 as float) END AS ret#94396522, CASE WHEN ((resret#94396197 = NA) OR (resret#94396197 = null)) THEN null ELSE cast(resret#94396197 as float) END AS resret#94396525, CASE WHEN ((retnet#94396198 = NA) OR (retnet#94396198 = null)) THEN null ELSE cast(retnet#94396198 as float) END AS retnet#94396528, CASE WHEN ((turnover#94396199 = NA) OR (turnover#94396199 = null)) THEN null ELSE cast(turnover#94396199 as float) END AS turnover#94396591, CASE WHEN ((numcos#94396200 = NA) OR (numcos#94396200 = null)) THEN null ELSE cast(numcos#94396200 as float) END AS numcos#94396593, CASE WHEN ((coverage#94396201 = NA) OR (coverage#94396201 = null)) THEN null ELSE cast(coverage#94396201 as float) END AS coverage#94396596, CASE WHEN ((benchmark#94396202 = NA) OR (benchmark#94396202 = null)) THEN null ELSE cast(benchmark#94396202 as float) END AS benchmark#94396599, CASE WHEN ((excess_ret#94396203 = NA) OR (excess_ret#94396203 = null)) THEN null ELSE cast(excess_ret#94396203 as float) END AS excess_ret#94396602, CASE WHEN ((excess_resret#94396204 = NA) OR (excess_resret#94396204 = null)) THEN null ELSE cast(excess_resret#94396204 as float) END AS excess_resret#94396604, CASE WHEN ((excess_retnet#94396205 = NA) OR (excess_retnet#94396205 = null)) THEN null ELSE cast(excess_retnet#94396205 as float) END AS excess_retnet#94396606]
+- FileScan csv [date#94396194,cap#94396195,ret#94396196,resret#94396197,retnet#94396198,turnover#94396199,numcos#94396200,coverage#94396201,benchmark#94396202,excess_ret#94396203,excess_resret#94396204,excess_retnet#94396205] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/momentum/..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<date:string,cap:string,ret:string,resret:string,retnet:string,turnover:string,numcos:strin...
,None), [date#94396426 ASC NULLS FIRST]
(3) InMemoryTableScan
Output [2]: [date#94396426, numcos#94396504]
Arguments: [date#94396426, numcos#94396504]
(4) InMemoryRelation
Arguments: [date#94396426, overall#94396454, ret#94396487, resret#94396488, retnet#94396489, turnover#94396490, numcos#94396504, benchmark#94396505, excess_ret#94396506, excess_resret#94396507, excess_retnet#94396508], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN (date#94396171 = null) THEN null ELSE cast(date#94396171 as date) END AS date#94396426, CASE WHEN ((overall#94396172 = NA) OR (overall#94396172 = null)) THEN null ELSE cast(overall#94396172 as int) END AS overall#94396454, CASE WHEN ((ret#94396173 = NA) OR (ret#94396173 = null)) THEN null ELSE cast(ret#94396173 as float) END AS ret#94396487, CASE WHEN ((resret#94396174 = NA) OR (resret#94396174 = null)) THEN null ELSE cast(resret#94396174 as float) END AS resret#94396488, CASE WHEN ((retnet#94396175 = NA) OR (retnet#94396175 = null)) THEN null ELSE cast(retnet#94396175 as float) END AS retnet#94396489, CASE WHEN ((turnover#94396176 = NA) OR (turnover#94396176 = null)) THEN null ELSE cast(turnover#94396176 as float) END AS turnover#94396490, CASE WHEN ((numcos#94396177 = NA) OR (numcos#94396177 = null)) THEN null ELSE cast(numcos#94396177 as float) END AS numcos#94396504, CASE WHEN ((benchmark#94396178 = NA) OR (benchmark#94396178 = null)) THEN null ELSE cast(benchmark#94396178 as float) END AS benchmark#94396505, CASE WHEN ((excess_ret#94396179 = NA) OR (excess_ret#94396179 = null)) THEN null ELSE cast(excess_ret#94396179 as float) END AS excess_ret#94396506, CASE WHEN ((excess_resret#94396180 = NA) OR (excess_resret#94396180 = null)) THEN null ELSE cast(excess_resret#94396180 as float) END AS excess_resret#94396507, CASE WHEN ((excess_retnet#94396181 = NA) OR (excess_retnet#94396181 = null)) THEN null ELSE cast(excess_retnet#94396181 as float) END AS excess_retnet#94396508]
+- FileScan csv [date#94396171,overall#94396172,ret#94396173,resret#94396174,retnet#94396175,turnover#94396176,numcos#94396177,benchmark#94396178,excess_ret#94396179,excess_resret#94396180,excess_retnet#94396181] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/momentum/..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<date:string,overall:string,ret:string,resret:string,retnet:string,turnover:string,numcos:s...
,None)
(5) Scan csv
Output [11]: [date#94396171, overall#94396172, ret#94396173, resret#94396174, retnet#94396175, turnover#94396176, numcos#94396177, benchmark#94396178, excess_ret#94396179, excess_resret#94396180, excess_retnet#94396181]
Batched: false
Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/risk_factors/momentum/longshort_overall.csv]
ReadSchema: struct<date:string,overall:string,ret:string,resret:string,retnet:string,turnover:string,numcos:string,benchmark:string,excess_ret:string,excess_resret:string,excess_retnet:string>
(6) Project [codegen id : 1]
Output [11]: [CASE WHEN (date#94396171 = null) THEN null ELSE cast(date#94396171 as date) END AS date#94396426, CASE WHEN ((overall#94396172 = NA) OR (overall#94396172 = null)) THEN null ELSE cast(overall#94396172 as int) END AS overall#94396454, CASE WHEN ((ret#94396173 = NA) OR (ret#94396173 = null)) THEN null ELSE cast(ret#94396173 as float) END AS ret#94396487, CASE WHEN ((resret#94396174 = NA) OR (resret#94396174 = null)) THEN null ELSE cast(resret#94396174 as float) END AS resret#94396488, CASE WHEN ((retnet#94396175 = NA) OR (retnet#94396175 = null)) THEN null ELSE cast(retnet#94396175 as float) END AS retnet#94396489, CASE WHEN ((turnover#94396176 = NA) OR (turnover#94396176 = null)) THEN null ELSE cast(turnover#94396176 as float) END AS turnover#94396490, CASE WHEN ((numcos#94396177 = NA) OR (numcos#94396177 = null)) THEN null ELSE cast(numcos#94396177 as float) END AS numcos#94396504, CASE WHEN ((benchmark#94396178 = NA) OR (benchmark#94396178 = null)) THEN null ELSE cast(benchmark#94396178 as float) END AS benchmark#94396505, CASE WHEN ((excess_ret#94396179 = NA) OR (excess_ret#94396179 = null)) THEN null ELSE cast(excess_ret#94396179 as float) END AS excess_ret#94396506, CASE WHEN ((excess_resret#94396180 = NA) OR (excess_resret#94396180 = null)) THEN null ELSE cast(excess_resret#94396180 as float) END AS excess_resret#94396507, CASE WHEN ((excess_retnet#94396181 = NA) OR (excess_retnet#94396181 = null)) THEN null ELSE cast(excess_retnet#94396181 as float) END AS excess_retnet#94396508]
Input [11]: [date#94396171, overall#94396172, ret#94396173, resret#94396174, retnet#94396175, turnover#94396176, numcos#94396177, benchmark#94396178, excess_ret#94396179, excess_resret#94396180, excess_retnet#94396181]
(7) InMemoryTableScan
Output [3]: [cap#94396521, date#94396509, numcos#94396593]
Arguments: [cap#94396521, date#94396509, numcos#94396593], [isnotnull(cap#94396521), (cast(cap#94396521 as string) = 0)]
(8) InMemoryRelation
Arguments: [date#94396509, cap#94396521, ret#94396522, resret#94396525, retnet#94396528, turnover#94396591, numcos#94396593, coverage#94396596, benchmark#94396599, excess_ret#94396602, excess_resret#94396604, excess_retnet#94396606], CachedRDDBuilder(org.apache.spark.sql.execution.columnar.DefaultCachedBatchSerializer@208e3fd9,StorageLevel(disk, memory, deserialized, 1 replicas),*(1) Project [CASE WHEN (date#94396194 = null) THEN null ELSE cast(date#94396194 as date) END AS date#94396509, CASE WHEN ((cap#94396195 = NA) OR (cap#94396195 = null)) THEN null ELSE cast(cap#94396195 as float) END AS cap#94396521, CASE WHEN ((ret#94396196 = NA) OR (ret#94396196 = null)) THEN null ELSE cast(ret#94396196 as float) END AS ret#94396522, CASE WHEN ((resret#94396197 = NA) OR (resret#94396197 = null)) THEN null ELSE cast(resret#94396197 as float) END AS resret#94396525, CASE WHEN ((retnet#94396198 = NA) OR (retnet#94396198 = null)) THEN null ELSE cast(retnet#94396198 as float) END AS retnet#94396528, CASE WHEN ((turnover#94396199 = NA) OR (turnover#94396199 = null)) THEN null ELSE cast(turnover#94396199 as float) END AS turnover#94396591, CASE WHEN ((numcos#94396200 = NA) OR (numcos#94396200 = null)) THEN null ELSE cast(numcos#94396200 as float) END AS numcos#94396593, CASE WHEN ((coverage#94396201 = NA) OR (coverage#94396201 = null)) THEN null ELSE cast(coverage#94396201 as float) END AS coverage#94396596, CASE WHEN ((benchmark#94396202 = NA) OR (benchmark#94396202 = null)) THEN null ELSE cast(benchmark#94396202 as float) END AS benchmark#94396599, CASE WHEN ((excess_ret#94396203 = NA) OR (excess_ret#94396203 = null)) THEN null ELSE cast(excess_ret#94396203 as float) END AS excess_ret#94396602, CASE WHEN ((excess_resret#94396204 = NA) OR (excess_resret#94396204 = null)) THEN null ELSE cast(excess_resret#94396204 as float) END AS excess_resret#94396604, CASE WHEN ((excess_retnet#94396205 = NA) OR (excess_retnet#94396205 = null)) THEN null ELSE cast(excess_retnet#94396205 as float) END AS excess_retnet#94396606]
+- FileScan csv [date#94396194,cap#94396195,ret#94396196,resret#94396197,retnet#94396198,turnover#94396199,numcos#94396200,coverage#94396201,benchmark#94396202,excess_ret#94396203,excess_resret#94396204,excess_retnet#94396205] Batched: false, DataFilters: [], Format: CSV, Location: InMemoryFileIndex(1 paths)[file:/srv/plusamp/data/default/ea-market/output/risk_factors/momentum/..., PartitionFilters: [], PushedFilters: [], ReadSchema: struct<date:string,cap:string,ret:string,resret:string,retnet:string,turnover:string,numcos:strin...
,None)
(9) Scan csv
Output [12]: [date#94396194, cap#94396195, ret#94396196, resret#94396197, retnet#94396198, turnover#94396199, numcos#94396200, coverage#94396201, benchmark#94396202, excess_ret#94396203, excess_resret#94396204, excess_retnet#94396205]
Batched: false
Location: InMemoryFileIndex [file:/srv/plusamp/data/default/ea-market/output/risk_factors/momentum/longshort_cap.csv]
ReadSchema: struct<date:string,cap:string,ret:string,resret:string,retnet:string,turnover:string,numcos:string,coverage:string,benchmark:string,excess_ret:string,excess_resret:string,excess_retnet:string>
(10) Project [codegen id : 1]
Output [12]: [CASE WHEN (date#94396194 = null) THEN null ELSE cast(date#94396194 as date) END AS date#94396509, CASE WHEN ((cap#94396195 = NA) OR (cap#94396195 = null)) THEN null ELSE cast(cap#94396195 as float) END AS cap#94396521, CASE WHEN ((ret#94396196 = NA) OR (ret#94396196 = null)) THEN null ELSE cast(ret#94396196 as float) END AS ret#94396522, CASE WHEN ((resret#94396197 = NA) OR (resret#94396197 = null)) THEN null ELSE cast(resret#94396197 as float) END AS resret#94396525, CASE WHEN ((retnet#94396198 = NA) OR (retnet#94396198 = null)) THEN null ELSE cast(retnet#94396198 as float) END AS retnet#94396528, CASE WHEN ((turnover#94396199 = NA) OR (turnover#94396199 = null)) THEN null ELSE cast(turnover#94396199 as float) END AS turnover#94396591, CASE WHEN ((numcos#94396200 = NA) OR (numcos#94396200 = null)) THEN null ELSE cast(numcos#94396200 as float) END AS numcos#94396593, CASE WHEN ((coverage#94396201 = NA) OR (coverage#94396201 = null)) THEN null ELSE cast(coverage#94396201 as float) END AS coverage#94396596, CASE WHEN ((benchmark#94396202 = NA) OR (benchmark#94396202 = null)) THEN null ELSE cast(benchmark#94396202 as float) END AS benchmark#94396599, CASE WHEN ((excess_ret#94396203 = NA) OR (excess_ret#94396203 = null)) THEN null ELSE cast(excess_ret#94396203 as float) END AS excess_ret#94396602, CASE WHEN ((excess_resret#94396204 = NA) OR (excess_resret#94396204 = null)) THEN null ELSE cast(excess_resret#94396204 as float) END AS excess_resret#94396604, CASE WHEN ((excess_retnet#94396205 = NA) OR (excess_retnet#94396205 = null)) THEN null ELSE cast(excess_retnet#94396205 as float) END AS excess_retnet#94396606]
Input [12]: [date#94396194, cap#94396195, ret#94396196, resret#94396197, retnet#94396198, turnover#94396199, numcos#94396200, coverage#94396201, benchmark#94396202, excess_ret#94396203, excess_resret#94396204, excess_retnet#94396205]
(11) Filter [codegen id : 1]
Input [3]: [cap#94396521, date#94396509, numcos#94396593]
Condition : (isnotnull(cap#94396521) AND (cast(cap#94396521 as string) = 0))
(12) Project [codegen id : 1]
Output [2]: [date#94396509, numcos#94396593]
Input [3]: [cap#94396521, date#94396509, numcos#94396593]
(13) Union
(14) Exchange
Input [2]: [date#94396426, numcos#94396504]
Arguments: rangepartitioning(date#94396426 ASC NULLS FIRST, 200), ENSURE_REQUIREMENTS, [id=#7536907]
(15) Sort [codegen id : 2]
Input [2]: [date#94396426, numcos#94396504]
Arguments: [date#94396426 ASC NULLS FIRST], true, 0
(16) CollectLimit
Input [2]: [date#94396426, numcos#94396504]
Arguments: 1000000