commit:     6f43428e3b857d6a9c642b4893334ad47bddb0f1
Author:     Alfredo Tupone <tupone <AT> gentoo <DOT> org>
AuthorDate: Tue May 16 20:40:24 2023 +0000
Commit:     Alfredo Tupone <tupone <AT> gentoo <DOT> org>
CommitDate: Tue May 16 20:40:47 2023 +0000
URL:        https://gitweb.gentoo.org/repo/gentoo.git/commit/?id=6f43428e

sci-libs/evaluate: new package, add 0.4.0

Signed-off-by: Alfredo Tupone <tupone <AT> gentoo.org>

 sci-libs/evaluate/Manifest                         |  1 +
 sci-libs/evaluate/evaluate-0.4.0.ebuild            | 43 ++++++++++++++++
 sci-libs/evaluate/files/evaluate-0.4.0-tests.patch | 60 ++++++++++++++++++++++
 sci-libs/evaluate/metadata.xml                     | 12 +++++
 4 files changed, 116 insertions(+)

diff --git a/sci-libs/evaluate/Manifest b/sci-libs/evaluate/Manifest
new file mode 100644
index 000000000000..684c25d25aa0
--- /dev/null
+++ b/sci-libs/evaluate/Manifest
@@ -0,0 +1 @@
+DIST evaluate-0.4.0.gh.tar.gz 292250 BLAKE2B 
f88428b263820c1af43d02ae676625257251476092efe624490f29e63a045d698db01e4a7a802c2330027d01bc6ccf16986f28ecf8202ecbfd943c5d7c40f6ec
 SHA512 
f2136196fc4e5717859e36e173cd49d049fc5ef50c89f466e13edd0142830574dec0b5485a4a1097eec9cb9df756a617216ff48c141db008cb0c2b85288d7fc9

diff --git a/sci-libs/evaluate/evaluate-0.4.0.ebuild 
b/sci-libs/evaluate/evaluate-0.4.0.ebuild
new file mode 100644
index 000000000000..60382685f160
--- /dev/null
+++ b/sci-libs/evaluate/evaluate-0.4.0.ebuild
@@ -0,0 +1,43 @@
+# Copyright 2023 Gentoo Authors
+# Distributed under the terms of the GNU General Public License v2
+
+EAPI=8
+
+DISTUTILS_USE_PEP517=setuptools
+PYTHON_COMPAT=( python3_11 )
+inherit distutils-r1
+
+DESCRIPTION="makes evaluating, comparing models and reporting their 
performance easier"
+HOMEPAGE="
+       https://pypi.org/project/evaluate/
+       https://github.com/huggingface/evaluate
+"
+SRC_URI="https://github.com/huggingface/${PN}/archive/refs/tags/v${PV}.tar.gz
+       -> ${P}.gh.tar.gz"
+
+LICENSE="Apache-2.0"
+SLOT="0"
+KEYWORDS="~amd64"
+
+RDEPEND="
+       dev-python/pyarrow[${PYTHON_USEDEP},parquet]
+       dev-python/unidecode[${PYTHON_USEDEP}]
+"
+BDEPEND="test? (
+       sci-libs/jiwer[${PYTHON_USEDEP}]
+       sci-libs/seqeval[${PYTHON_USEDEP}]
+)"
+
+PATCHES=( "${FILESDIR}"/${P}-tests.patch )
+
+distutils_enable_tests pytest
+
+src_prepare() {
+       # These require packages not available on gentoo
+       rm -r metrics/{bertscore,bleurt,character,charcut_mt,chrf,code_eval} || 
die
+       rm -r metrics/{competition_math,coval,google_bleu,mauve,meteor} || die
+       rm -r metrics/{nist_mt,rl_reliability,rouge,sacrebleu,sari} || die
+       rm -r metrics/{ter,trec_eval,wiki_split,xtreme_s} || die
+       rm -r measurements/word_length || die
+       distutils-r1_src_prepare
+}

diff --git a/sci-libs/evaluate/files/evaluate-0.4.0-tests.patch 
b/sci-libs/evaluate/files/evaluate-0.4.0-tests.patch
new file mode 100644
index 000000000000..1e7e808576e3
--- /dev/null
+++ b/sci-libs/evaluate/files/evaluate-0.4.0-tests.patch
@@ -0,0 +1,60 @@
+--- a/tests/test_evaluator.py  2023-05-14 11:01:54.449768849 +0200
++++ b/tests/test_evaluator.py  2023-05-14 11:06:15.182738125 +0200
+@@ -16,6 +16,7 @@
+ 
+ from time import sleep
+ from unittest import TestCase, mock
++from unittest import skip
+ 
+ from datasets import ClassLabel, Dataset, Features, Sequence, Value
+ from PIL import Image
+@@ -335,6 +335,7 @@
+         )
+         self.assertEqual(results["accuracy"], 1.0)
+ 
++    @skip("not working")
+     def test_bootstrap(self):
+         data = Dataset.from_dict({"label": [1, 0, 0], "text": ["great movie", 
"great movie", "horrible movie"]})
+ 
+@@ -368,6 +369,7 @@
+         self.assertAlmostEqual(results["samples_per_second"], len(self.data) 
/ results["total_time_in_seconds"], 5)
+         self.assertAlmostEqual(results["latency_in_seconds"], 
results["total_time_in_seconds"] / len(self.data), 5)
+ 
++    @skip("not working")
+     def test_bootstrap_and_perf(self):
+         data = Dataset.from_dict({"label": [1, 0, 0], "text": ["great movie", 
"great movie", "horrible movie"]})
+ 
+@@ -877,6 +877,7 @@
+         results = self.evaluator.compute(data=self.data)
+         self.assertIsInstance(results["unique_words"], int)
+ 
++    @skip("require nltk")
+     def test_overwrite_default_metric(self):
+         word_length = load("word_length")
+         results = self.evaluator.compute(
+@@ -939,6 +940,7 @@
+         results = self.evaluator.compute(data=self.data)
+         self.assertEqual(results["bleu"], 0)
+ 
++    @skip("require rouge_score")
+     def test_overwrite_default_metric(self):
+         rouge = load("rouge")
+         results = self.evaluator.compute(
+@@ -949,6 +952,7 @@
+         )
+         self.assertEqual(results["rouge1"], 1.0)
+ 
++    @skip("require rouge_score")
+     def test_summarization(self):
+         pipe = DummyText2TextGenerationPipeline(task="summarization", 
prefix="summary")
+         e = evaluator("summarization")
+--- a/tests/test_trainer_evaluator_parity.py   2023-05-14 17:50:29.224525549 
+0200
++++ b/tests/test_trainer_evaluator_parity.py   2023-05-14 17:37:40.947501195 
+0200
+@@ -269,6 +269,7 @@
+         self.assertEqual(transformers_results["eval_HasAns_f1"], 
evaluator_results["HasAns_f1"])
+         self.assertEqual(transformers_results["eval_NoAns_f1"], 
evaluator_results["NoAns_f1"])
+ 
++    @unittest.skip('require eval_results.json')
+     def test_token_classification_parity(self):
+         model_name = "hf-internal-testing/tiny-bert-for-token-classification"
+         n_samples = 500

diff --git a/sci-libs/evaluate/metadata.xml b/sci-libs/evaluate/metadata.xml
new file mode 100644
index 000000000000..f1e8571190f9
--- /dev/null
+++ b/sci-libs/evaluate/metadata.xml
@@ -0,0 +1,12 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE pkgmetadata SYSTEM "https://www.gentoo.org/dtd/metadata.dtd";>
+<pkgmetadata>
+       <maintainer type="person">
+               <email>[email protected]</email>
+               <name>Tupone Alfredo</name>
+       </maintainer>
+       <upstream>
+               <remote-id type="pypi">evaluate</remote-id>
+               <remote-id type="github">huggingface/evaluate</remote-id>
+       </upstream>
+</pkgmetadata>

Reply via email to