Github user davies commented on the pull request:
https://github.com/apache/spark/pull/12954#issuecomment-217527040
I still can't run Q41 after this PR:
```
select distinct(i_product_name)
from item i1
where i_manufact_id between 738 and 738+40
and (select count(*) as item_cnt
from item
where (i_manufact = i1.i_manufact and
(i_category = 'Women' and
(i_color = 'powder' or i_color = 'khaki') and
(i_units = 'Ounce' or i_units = 'Oz') and
(i_size = 'medium' or i_size = 'extra large')
) or
(i_category = 'Women' and
(i_color = 'brown' or i_color = 'honeydew') and
(i_units = 'Bunch' or i_units = 'Ton') and
(i_size = 'N/A' or i_size = 'small')
) or
(i_category = 'Men' and
(i_color = 'floral' or i_color = 'deep') and
(i_units = 'N/A' or i_units = 'Dozen') and
(i_size = 'petite' or i_size = 'large')
) or
(i_category = 'Men' and
(i_color = 'light' or i_color = 'cornflower') and
(i_units = 'Box' or i_units = 'Pound') and
(i_size = 'medium' or i_size = 'extra large')
))
or
(i_manufact = i1.i_manufact and
((i_category = 'Women' and
(i_color = 'midnight' or i_color = 'snow') and
(i_units = 'Pallet' or i_units = 'Gross') and
(i_size = 'medium' or i_size = 'extra large')
) or
(i_category = 'Women' and
(i_color = 'cyan' or i_color = 'papaya') and
(i_units = 'Cup' or i_units = 'Dram') and
(i_size = 'N/A' or i_size = 'small')
) or
(i_category = 'Men' and
(i_color = 'orange' or i_color = 'frosted') and
(i_units = 'Each' or i_units = 'Tbl') and
(i_size = 'petite' or i_size = 'large')
) or
(i_category = 'Men' and
(i_color = 'forest' or i_color = 'ghost') and
(i_units = 'Lb' or i_units = 'Bundle') and
(i_size = 'medium' or i_size = 'extra large')
)))) > 0
order by i_product_name
limit 100
Traceback (most recent call last):
  File "tpcds.py", line 117, in <module>
    test(sys.argv[1], 2)
  File "tpcds.py", line 83, in test
    sqlContext.sql(q).explain(False)
  File "/Users/davies/work/spark/python/pyspark/sql/context.py", line 345, in sql
    return self.sparkSession.sql(sqlQuery)
  File "/Users/davies/work/spark/python/pyspark/sql/session.py", line 505, in sql
    return DataFrame(self._jsparkSession.sql(sqlQuery), self._wrapped)
  File "//anaconda/lib/python2.7/site-packages/py4j/java_gateway.py", line 538, in __call__
    self.target_id, self.name)
  File "/Users/davies/work/spark/python/pyspark/sql/utils.py", line 63, in deco
    raise AnalysisException(s.split(': ', 1)[1], stackTrace)
pyspark.sql.utils.AnalysisException: u'The correlated scalar subquery can
only contain equality predicates: ((((i_category#215#484 = Women) &&
(((((i_manufact#217#486 = i_manufact#217) && ((i_color#220#485 = powder) ||
(i_color#220#485 = khaki))) && ((i_units#221#488 = Ounce) || (i_units#221#488 =
Oz))) && ((i_size#218#487 = medium) || (i_size#218#487 = extra large))) ||
((((i_color#220#485 = brown) || (i_color#220#485 = honeydew)) &&
((i_units#221#488 = Bunch) || (i_units#221#488 = Ton))) && ((i_size#218#487 =
N/A) || (i_size#218#487 = small))))) || ((i_category#215#484 = Men) &&
(((((i_color#220#485 = floral) || (i_color#220#485 = deep)) &&
((i_units#221#488 = N/A) || (i_units#221#488 = Dozen))) && ((i_size#218#487 =
petite) || (i_size#218#487 = large))) || ((((i_color#220#485 = light) ||
(i_color#220#485 = cornflower)) && ((i_units#221#488 = Box) || (i_units#221#488
= Pound))) && ((i_size#218#487 = medium) || (i_size#218#487 = extra large))))))
|| ((i_manufact#217#486 = i_manufact#217) &&
(((i_category#215#484 = Women) && (((((i_color#220#485 =
midnight) || (i_color#220#485 = snow)) && ((i_units#221#488 = Pallet) ||
(i_units#221#488 = Gross))) && ((i_size#218#487 = medium) || (i_size#218#487 =
extra large))) || ((((i_color#220#485 = cyan) || (i_color#220#485 = papaya)) &&
((i_units#221#488 = Cup) || (i_units#221#488 = Dram))) && ((i_size#218#487 =
N/A) || (i_size#218#487 = small))))) || ((i_category#215#484 = Men) &&
(((((i_color#220#485 = orange) || (i_color#220#485 = frosted)) &&
((i_units#221#488 = Each) || (i_units#221#488 = Tbl))) && ((i_size#218#487 =
petite) || (i_size#218#487 = large))) || ((((i_color#220#485 = forest) ||
(i_color#220#485 = ghost)) && ((i_units#221#488 = Lb) || (i_units#221#488 =
Bundle))) && ((i_size#218#487 = medium) || (i_size#218#487 = extra
large))))))));'
```
---
If your project is set up for it, you can reply to this email and have your
reply appear on GitHub as well. If your project does not have this feature
enabled and would like it enabled, or if the feature is enabled but not
working, please contact infrastructure at [email protected] or file a JIRA
ticket with INFRA.
---
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]