[
https://issues.apache.org/jira/browse/HIVEMALL-78?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
]
Makoto Yui updated HIVEMALL-78:
-------------------------------
Description:
http://www.citeulike.org/user/myui/article/12615084
https://github.com/apache/spark/blob/master/mllib/src/main/scala/org/apache/spark/mllib/evaluation/BinaryClassificationMetrics.scala
{code:sql}
-- Proposed usage: derive ROC points from (label, prob), then fold them into AUROC.
WITH roc AS (
  -- roc() is assumed to be a UDTF emitting (fpr, tpr) pairs -- TODO confirm;
  -- a multi-column UDTF result must be aliased with the parenthesised form.
  SELECT
    roc(label, prob) AS (fpr, tpr)
  FROM
    data
)
SELECT
  auc(fpr, tpr) AS auroc -- auc is UDAF, input is sorted by fpr asc
FROM (
  SELECT
    fpr,
    tpr
  FROM
    roc
  DISTRIBUTE BY
    floor(fpr / 0.2) -- 5 bins (NOTE: fpr = 1.0 maps to bucket 5, a sixth bucket)
  SORT BY
    fpr ASC
) t
{code}
was:
http://www.citeulike.org/user/myui/article/12615084
https://github.com/apache/spark/blob/master/mllib/src/main/scala/org/apache/spark/mllib/evaluation/BinaryClassificationMetrics.scala
{code:sql}
-- Previous revision: area under the curve computed directly from fp/tp in data.
SELECT
  auc(fp, tp) AS area -- auc is UDAF, input is sorted by fp asc
FROM (
  SELECT
    fp,
    tp
  FROM
    data
  DISTRIBUTE BY
    floor(fp / 0.2) -- 5 bins
  SORT BY
    fp ASC
) t
{code}
> Support AUC BinaryClassificationMetrics
> ---------------------------------------
>
> Key: HIVEMALL-78
> URL: https://issues.apache.org/jira/browse/HIVEMALL-78
> Project: Hivemall
> Issue Type: New Feature
> Reporter: Makoto Yui
> Assignee: Takuya Kitazawa
> Priority: Minor
>
> http://www.citeulike.org/user/myui/article/12615084
> https://github.com/apache/spark/blob/master/mllib/src/main/scala/org/apache/spark/mllib/evaluation/BinaryClassificationMetrics.scala
> {code:sql}
> -- Proposed usage: derive ROC points from (label, prob), then fold them into AUROC.
> WITH roc AS (
>   -- roc() is assumed to be a UDTF emitting (fpr, tpr) pairs -- TODO confirm;
>   -- a multi-column UDTF result must be aliased with the parenthesised form.
>   SELECT
>     roc(label, prob) AS (fpr, tpr)
>   FROM
>     data
> )
> SELECT
>   auc(fpr, tpr) AS auroc -- auc is UDAF, input is sorted by fpr asc
> FROM (
>   SELECT
>     fpr,
>     tpr
>   FROM
>     roc
>   DISTRIBUTE BY
>     floor(fpr / 0.2) -- 5 bins (NOTE: fpr = 1.0 maps to bucket 5, a sixth bucket)
>   SORT BY
>     fpr ASC
> ) t
> {code}
--
This message was sent by Atlassian JIRA
(v6.3.15#6346)