├── .github ├── hub │ ├── push_evaluations_to_hub.py │ └── requirements.txt └── workflows │ ├── build_documentation.yml │ ├── build_pr_documentation.yml │ ├── ci.yml │ ├── delete_doc_comment.yml │ ├── python-release.yml │ ├── trufflehog.yml │ └── update_spaces.yml ├── .gitignore ├── AUTHORS ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── LICENSE ├── Makefile ├── README.md ├── additional-tests-requirements.txt ├── comparisons ├── exact_match │ ├── README.md │ ├── app.py │ ├── exact_match.py │ └── requirements.txt ├── mcnemar │ ├── README.md │ ├── app.py │ ├── mcnemar.py │ └── requirements.txt └── wilcoxon │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── wilcoxon.py ├── docs ├── README.md └── source │ ├── _toctree.yml │ ├── a_quick_tour.mdx │ ├── base_evaluator.mdx │ ├── choosing_a_metric.mdx │ ├── considerations.mdx │ ├── creating_and_sharing.mdx │ ├── custom_evaluator.mdx │ ├── evaluation_suite.mdx │ ├── index.mdx │ ├── installation.mdx │ ├── keras_integrations.md │ ├── package_reference │ ├── evaluator_classes.mdx │ ├── hub_methods.mdx │ ├── loading_methods.mdx │ ├── logging_methods.mdx │ ├── main_classes.mdx │ ├── saving_methods.mdx │ └── visualization_methods.mdx │ ├── sklearn_integrations.mdx │ ├── transformers_integrations.mdx │ └── types_of_evaluations.mdx ├── measurements ├── honest │ ├── README.md │ ├── app.py │ ├── honest.py │ └── requirements.txt ├── label_distribution │ ├── README.md │ ├── app.py │ ├── label_distribution.py │ └── requirements.txt ├── perplexity │ ├── README.md │ ├── app.py │ ├── perplexity.py │ └── requirements.txt ├── regard │ ├── README.md │ ├── app.py │ ├── regard.py │ └── requirements.txt ├── text_duplicates │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── text_duplicates.py ├── toxicity │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── toxicity.py ├── word_count │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── word_count.py └── word_length │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── word_length.py ├── metrics ├── accuracy │ ├── README.md │ ├── accuracy.py │ ├── app.py │ └── requirements.txt ├── bertscore │ ├── README.md │ ├── app.py │ ├── bertscore.py │ └── requirements.txt ├── bleu │ ├── README.md │ ├── app.py │ ├── bleu.py │ ├── requirements.txt │ └── tokenizer_13a.py ├── bleurt │ ├── README.md │ ├── app.py │ ├── bleurt.py │ └── requirements.txt ├── brier_score │ ├── README.md │ ├── app.py │ ├── brier_score.py │ └── requirements.txt ├── cer │ ├── README.md │ ├── app.py │ ├── cer.py │ ├── requirements.txt │ └── test_cer.py ├── character │ ├── README.md │ ├── app.py │ ├── character.py │ └── requirements.txt ├── charcut_mt │ ├── README.md │ ├── app.py │ ├── charcut_mt.py │ └── requirements.txt ├── chrf │ ├── README.md │ ├── app.py │ ├── chrf.py │ └── requirements.txt ├── code_eval │ ├── README.md │ ├── app.py │ ├── code_eval.py │ ├── execute.py │ └── requirements.txt ├── comet │ ├── README.md │ ├── app.py │ ├── comet.py │ └── requirements.txt ├── competition_math │ ├── README.md │ ├── app.py │ ├── competition_math.py │ └── requirements.txt ├── confusion_matrix │ ├── README.md │ ├── app.py │ ├── confusion_matrix.py │ └── requirements.txt ├── coval │ ├── README.md │ ├── app.py │ ├── coval.py │ └── requirements.txt ├── cuad │ ├── README.md │ ├── app.py │ ├── compute_score.py │ ├── cuad.py │ └── requirements.txt ├── exact_match │ ├── README.md │ ├── app.py │ ├── exact_match.py │ └── requirements.txt ├── f1 │ ├── README.md │ ├── app.py │ ├── f1.py │ └── requirements.txt ├── fever │ ├── README.md │ ├── app.py │ ├── fever.py │ ├── requirements.txt │ └── test_fever.py ├── frugalscore │ ├── README.md │ ├── app.py │ ├── frugalscore.py │ └── requirements.txt ├── glue │ ├── README.md │ ├── app.py │ ├── glue.py │ └── requirements.txt ├── google_bleu │ ├── README.md │ ├── app.py │ ├── google_bleu.py │ ├── requirements.txt │ └── tokenizer_13a.py ├── indic_glue │ ├── README.md │ ├── app.py │ ├── indic_glue.py │ └── requirements.txt ├── mae │ ├── README.md │ ├── app.py │ ├── mae.py │ └── requirements.txt ├── mahalanobis │ ├── README.md │ ├── app.py │ ├── mahalanobis.py │ └── requirements.txt ├── mape │ ├── README.md │ ├── app.py │ ├── mape.py │ └── requirements.txt ├── mase │ ├── README.md │ ├── app.py │ ├── mase.py │ └── requirements.txt ├── matthews_correlation │ ├── README.md │ ├── app.py │ ├── matthews_correlation.py │ └── requirements.txt ├── mauve │ ├── README.md │ ├── app.py │ ├── mauve.py │ └── requirements.txt ├── mean_iou │ ├── README.md │ ├── app.py │ ├── mean_iou.py │ └── requirements.txt ├── meteor │ ├── README.md │ ├── app.py │ ├── meteor.py │ └── requirements.txt ├── mse │ ├── README.md │ ├── app.py │ ├── mse.py │ └── requirements.txt ├── nist_mt │ ├── README.md │ ├── app.py │ ├── nist_mt.py │ ├── requirements.txt │ └── tests.py ├── pearsonr │ ├── README.md │ ├── app.py │ ├── pearsonr.py │ └── requirements.txt ├── perplexity │ ├── README.md │ ├── app.py │ ├── perplexity.py │ └── requirements.txt ├── poseval │ ├── README.md │ ├── app.py │ ├── poseval.py │ └── requirements.txt ├── precision │ ├── README.md │ ├── app.py │ ├── precision.py │ └── requirements.txt ├── r_squared │ ├── README.md │ ├── app.py │ ├── r_squared.py │ └── requirements.txt ├── recall │ ├── README.md │ ├── app.py │ ├── recall.py │ └── requirements.txt ├── rl_reliability │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── rl_reliability.py ├── roc_auc │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── roc_auc.py ├── rouge │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── rouge.py ├── sacrebleu │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── sacrebleu.py ├── sari │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── sari.py ├── seqeval │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── seqeval.py ├── smape │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── smape.py ├── spearmanr │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── spearmanr.py ├── squad │ ├── README.md │ ├── app.py │ ├── compute_score.py │ ├── requirements.txt │ └── squad.py ├── squad_v2 │ ├── README.md │ ├── app.py │ ├── compute_score.py │ ├── requirements.txt │ └── squad_v2.py ├── super_glue │ ├── README.md │ ├── app.py │ ├── record_evaluation.py │ ├── requirements.txt │ └── super_glue.py ├── ter │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── ter.py ├── trec_eval │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── trec_eval.py ├── wer │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── wer.py ├── wiki_split │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── wiki_split.py ├── xnli │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── xnli.py └── xtreme_s │ ├── README.md │ ├── app.py │ ├── requirements.txt │ └── xtreme_s.py ├── setup.cfg ├── setup.py ├── src └── evaluate │ ├── __init__.py │ ├── commands │ ├── __init__.py │ └── evaluate_cli.py │ ├── config.py │ ├── evaluation_suite │ └── __init__.py │ ├── evaluator │ ├── __init__.py │ ├── audio_classification.py │ ├── automatic_speech_recognition.py │ ├── base.py │ ├── image_classification.py │ ├── question_answering.py │ ├── text2text_generation.py │ ├── text_classification.py │ ├── text_generation.py │ ├── token_classification.py │ └── utils.py │ ├── hub.py │ ├── info.py │ ├── inspect.py │ ├── loading.py │ ├── module.py │ ├── naming.py │ ├── saving.py │ ├── utils │ ├── __init__.py │ ├── file_utils.py │ ├── gradio.py │ └── logging.py │ └── visualization.py ├── templates ├── cookiecutter.json └── {{ cookiecutter.module_slug }} │ ├── README.md │ ├── app.py │ ├── requirements.txt │ ├── tests.py │ └── {{ cookiecutter.module_slug }}.py └── tests ├── __init__.py ├── conftest.py ├── test_evaluation_suite.py ├── test_evaluator.py ├── test_file_utils.py ├── test_hub.py ├── test_load.py ├── test_metric.py ├── test_metric_common.py ├── test_save.py ├── test_trainer_evaluator_parity.py ├── test_viz.py └── utils.py /.github/hub/push_evaluations_to_hub.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/.github/hub/push_evaluations_to_hub.py -------------------------------------------------------------------------------- /.github/hub/requirements.txt: -------------------------------------------------------------------------------- 1 | huggingface_hub -------------------------------------------------------------------------------- /.github/workflows/build_documentation.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/.github/workflows/build_documentation.yml -------------------------------------------------------------------------------- /.github/workflows/build_pr_documentation.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/.github/workflows/build_pr_documentation.yml -------------------------------------------------------------------------------- /.github/workflows/ci.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/.github/workflows/ci.yml -------------------------------------------------------------------------------- /.github/workflows/delete_doc_comment.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/.github/workflows/delete_doc_comment.yml -------------------------------------------------------------------------------- /.github/workflows/python-release.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/.github/workflows/python-release.yml -------------------------------------------------------------------------------- /.github/workflows/trufflehog.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/.github/workflows/trufflehog.yml -------------------------------------------------------------------------------- /.github/workflows/update_spaces.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/.github/workflows/update_spaces.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/.gitignore -------------------------------------------------------------------------------- /AUTHORS: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/AUTHORS -------------------------------------------------------------------------------- /CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/LICENSE -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/Makefile -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/README.md -------------------------------------------------------------------------------- /additional-tests-requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/additional-tests-requirements.txt -------------------------------------------------------------------------------- /comparisons/exact_match/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/comparisons/exact_match/README.md -------------------------------------------------------------------------------- /comparisons/exact_match/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/comparisons/exact_match/app.py -------------------------------------------------------------------------------- /comparisons/exact_match/exact_match.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/comparisons/exact_match/exact_match.py -------------------------------------------------------------------------------- /comparisons/exact_match/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scipy -------------------------------------------------------------------------------- /comparisons/mcnemar/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/comparisons/mcnemar/README.md -------------------------------------------------------------------------------- /comparisons/mcnemar/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/comparisons/mcnemar/app.py -------------------------------------------------------------------------------- /comparisons/mcnemar/mcnemar.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/comparisons/mcnemar/mcnemar.py -------------------------------------------------------------------------------- /comparisons/mcnemar/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scipy -------------------------------------------------------------------------------- /comparisons/wilcoxon/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/comparisons/wilcoxon/README.md -------------------------------------------------------------------------------- /comparisons/wilcoxon/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/comparisons/wilcoxon/app.py -------------------------------------------------------------------------------- /comparisons/wilcoxon/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/comparisons/wilcoxon/requirements.txt -------------------------------------------------------------------------------- /comparisons/wilcoxon/wilcoxon.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/comparisons/wilcoxon/wilcoxon.py -------------------------------------------------------------------------------- /docs/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/README.md -------------------------------------------------------------------------------- /docs/source/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/_toctree.yml -------------------------------------------------------------------------------- /docs/source/a_quick_tour.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/a_quick_tour.mdx -------------------------------------------------------------------------------- /docs/source/base_evaluator.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/base_evaluator.mdx -------------------------------------------------------------------------------- /docs/source/choosing_a_metric.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/choosing_a_metric.mdx -------------------------------------------------------------------------------- /docs/source/considerations.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/considerations.mdx -------------------------------------------------------------------------------- /docs/source/creating_and_sharing.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/creating_and_sharing.mdx -------------------------------------------------------------------------------- /docs/source/custom_evaluator.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/custom_evaluator.mdx -------------------------------------------------------------------------------- /docs/source/evaluation_suite.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/evaluation_suite.mdx -------------------------------------------------------------------------------- /docs/source/index.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/index.mdx -------------------------------------------------------------------------------- /docs/source/installation.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/installation.mdx -------------------------------------------------------------------------------- /docs/source/keras_integrations.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/keras_integrations.md -------------------------------------------------------------------------------- /docs/source/package_reference/evaluator_classes.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/package_reference/evaluator_classes.mdx -------------------------------------------------------------------------------- /docs/source/package_reference/hub_methods.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/package_reference/hub_methods.mdx -------------------------------------------------------------------------------- /docs/source/package_reference/loading_methods.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/package_reference/loading_methods.mdx -------------------------------------------------------------------------------- /docs/source/package_reference/logging_methods.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/package_reference/logging_methods.mdx -------------------------------------------------------------------------------- /docs/source/package_reference/main_classes.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/package_reference/main_classes.mdx -------------------------------------------------------------------------------- /docs/source/package_reference/saving_methods.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/package_reference/saving_methods.mdx -------------------------------------------------------------------------------- /docs/source/package_reference/visualization_methods.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/package_reference/visualization_methods.mdx -------------------------------------------------------------------------------- /docs/source/sklearn_integrations.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/sklearn_integrations.mdx -------------------------------------------------------------------------------- /docs/source/transformers_integrations.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/transformers_integrations.mdx -------------------------------------------------------------------------------- /docs/source/types_of_evaluations.mdx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/docs/source/types_of_evaluations.mdx -------------------------------------------------------------------------------- /measurements/honest/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/honest/README.md -------------------------------------------------------------------------------- /measurements/honest/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/honest/app.py -------------------------------------------------------------------------------- /measurements/honest/honest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/honest/honest.py -------------------------------------------------------------------------------- /measurements/honest/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | transformers 3 | unidecode==1.3.4 4 | torch 5 | -------------------------------------------------------------------------------- /measurements/label_distribution/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/label_distribution/README.md -------------------------------------------------------------------------------- /measurements/label_distribution/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/label_distribution/app.py -------------------------------------------------------------------------------- /measurements/label_distribution/label_distribution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/label_distribution/label_distribution.py -------------------------------------------------------------------------------- /measurements/label_distribution/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scipy 3 | -------------------------------------------------------------------------------- /measurements/perplexity/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/perplexity/README.md -------------------------------------------------------------------------------- /measurements/perplexity/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/perplexity/app.py -------------------------------------------------------------------------------- /measurements/perplexity/perplexity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/perplexity/perplexity.py -------------------------------------------------------------------------------- /measurements/perplexity/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | torch 3 | transformers -------------------------------------------------------------------------------- /measurements/regard/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/regard/README.md -------------------------------------------------------------------------------- /measurements/regard/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/regard/app.py -------------------------------------------------------------------------------- /measurements/regard/regard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/regard/regard.py -------------------------------------------------------------------------------- /measurements/regard/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate.git@{COMMIT_PLACEHOLDER} 2 | transformers 3 | torch 4 | -------------------------------------------------------------------------------- /measurements/text_duplicates/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/text_duplicates/README.md -------------------------------------------------------------------------------- /measurements/text_duplicates/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/text_duplicates/app.py -------------------------------------------------------------------------------- /measurements/text_duplicates/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate.git@{COMMIT_PLACEHOLDER} 2 | -------------------------------------------------------------------------------- /measurements/text_duplicates/text_duplicates.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/text_duplicates/text_duplicates.py -------------------------------------------------------------------------------- /measurements/toxicity/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/toxicity/README.md -------------------------------------------------------------------------------- /measurements/toxicity/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/toxicity/app.py -------------------------------------------------------------------------------- /measurements/toxicity/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | transformers 3 | torch 4 | -------------------------------------------------------------------------------- /measurements/toxicity/toxicity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/toxicity/toxicity.py -------------------------------------------------------------------------------- /measurements/word_count/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/word_count/README.md -------------------------------------------------------------------------------- /measurements/word_count/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/word_count/app.py -------------------------------------------------------------------------------- /measurements/word_count/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate.git@{COMMIT_PLACEHOLDER} 2 | scikit-learn~=0.0 3 | -------------------------------------------------------------------------------- /measurements/word_count/word_count.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/word_count/word_count.py -------------------------------------------------------------------------------- /measurements/word_length/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/word_length/README.md -------------------------------------------------------------------------------- /measurements/word_length/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/word_length/app.py -------------------------------------------------------------------------------- /measurements/word_length/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate.git@{COMMIT_PLACEHOLDER} 2 | nltk~=3.7 3 | -------------------------------------------------------------------------------- /measurements/word_length/word_length.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/measurements/word_length/word_length.py -------------------------------------------------------------------------------- /metrics/accuracy/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/accuracy/README.md -------------------------------------------------------------------------------- /metrics/accuracy/accuracy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/accuracy/accuracy.py -------------------------------------------------------------------------------- /metrics/accuracy/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/accuracy/app.py -------------------------------------------------------------------------------- /metrics/accuracy/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/bertscore/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/bertscore/README.md -------------------------------------------------------------------------------- /metrics/bertscore/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/bertscore/app.py -------------------------------------------------------------------------------- /metrics/bertscore/bertscore.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/bertscore/bertscore.py -------------------------------------------------------------------------------- /metrics/bertscore/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | bert_score -------------------------------------------------------------------------------- /metrics/bleu/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/bleu/README.md -------------------------------------------------------------------------------- /metrics/bleu/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/bleu/app.py -------------------------------------------------------------------------------- /metrics/bleu/bleu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/bleu/bleu.py -------------------------------------------------------------------------------- /metrics/bleu/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} -------------------------------------------------------------------------------- /metrics/bleu/tokenizer_13a.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/bleu/tokenizer_13a.py -------------------------------------------------------------------------------- /metrics/bleurt/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/bleurt/README.md -------------------------------------------------------------------------------- /metrics/bleurt/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/bleurt/app.py -------------------------------------------------------------------------------- /metrics/bleurt/bleurt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/bleurt/bleurt.py -------------------------------------------------------------------------------- /metrics/bleurt/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/bleurt/requirements.txt -------------------------------------------------------------------------------- /metrics/brier_score/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/brier_score/README.md -------------------------------------------------------------------------------- /metrics/brier_score/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/brier_score/app.py -------------------------------------------------------------------------------- /metrics/brier_score/brier_score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/brier_score/brier_score.py -------------------------------------------------------------------------------- /metrics/brier_score/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/cer/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/cer/README.md -------------------------------------------------------------------------------- /metrics/cer/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/cer/app.py -------------------------------------------------------------------------------- /metrics/cer/cer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/cer/cer.py -------------------------------------------------------------------------------- /metrics/cer/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | jiwer -------------------------------------------------------------------------------- /metrics/cer/test_cer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/cer/test_cer.py -------------------------------------------------------------------------------- /metrics/character/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/character/README.md -------------------------------------------------------------------------------- /metrics/character/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/character/app.py -------------------------------------------------------------------------------- /metrics/character/character.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/character/character.py -------------------------------------------------------------------------------- /metrics/character/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | cer>=1.2.0 3 | -------------------------------------------------------------------------------- /metrics/charcut_mt/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/charcut_mt/README.md -------------------------------------------------------------------------------- /metrics/charcut_mt/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/charcut_mt/app.py -------------------------------------------------------------------------------- /metrics/charcut_mt/charcut_mt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/charcut_mt/charcut_mt.py -------------------------------------------------------------------------------- /metrics/charcut_mt/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | charcut>=1.1.1 3 | -------------------------------------------------------------------------------- /metrics/chrf/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/chrf/README.md -------------------------------------------------------------------------------- /metrics/chrf/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/chrf/app.py -------------------------------------------------------------------------------- /metrics/chrf/chrf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/chrf/chrf.py -------------------------------------------------------------------------------- /metrics/chrf/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | sacrebleu -------------------------------------------------------------------------------- /metrics/code_eval/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/code_eval/README.md -------------------------------------------------------------------------------- /metrics/code_eval/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/code_eval/app.py -------------------------------------------------------------------------------- /metrics/code_eval/code_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/code_eval/code_eval.py -------------------------------------------------------------------------------- /metrics/code_eval/execute.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/code_eval/execute.py -------------------------------------------------------------------------------- /metrics/code_eval/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} -------------------------------------------------------------------------------- /metrics/comet/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/comet/README.md -------------------------------------------------------------------------------- /metrics/comet/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/comet/app.py -------------------------------------------------------------------------------- /metrics/comet/comet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/comet/comet.py -------------------------------------------------------------------------------- /metrics/comet/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | unbabel-comet 3 | torch -------------------------------------------------------------------------------- /metrics/competition_math/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/competition_math/README.md -------------------------------------------------------------------------------- /metrics/competition_math/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/competition_math/app.py -------------------------------------------------------------------------------- /metrics/competition_math/competition_math.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/competition_math/competition_math.py -------------------------------------------------------------------------------- /metrics/competition_math/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/competition_math/requirements.txt -------------------------------------------------------------------------------- /metrics/confusion_matrix/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/confusion_matrix/README.md -------------------------------------------------------------------------------- /metrics/confusion_matrix/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/confusion_matrix/app.py -------------------------------------------------------------------------------- /metrics/confusion_matrix/confusion_matrix.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/confusion_matrix/confusion_matrix.py -------------------------------------------------------------------------------- /metrics/confusion_matrix/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/coval/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/coval/README.md -------------------------------------------------------------------------------- /metrics/coval/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/coval/app.py -------------------------------------------------------------------------------- /metrics/coval/coval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/coval/coval.py -------------------------------------------------------------------------------- /metrics/coval/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/coval/requirements.txt -------------------------------------------------------------------------------- /metrics/cuad/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/cuad/README.md -------------------------------------------------------------------------------- /metrics/cuad/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/cuad/app.py -------------------------------------------------------------------------------- /metrics/cuad/compute_score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/cuad/compute_score.py -------------------------------------------------------------------------------- /metrics/cuad/cuad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/cuad/cuad.py -------------------------------------------------------------------------------- /metrics/cuad/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} -------------------------------------------------------------------------------- /metrics/exact_match/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/exact_match/README.md -------------------------------------------------------------------------------- /metrics/exact_match/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/exact_match/app.py -------------------------------------------------------------------------------- /metrics/exact_match/exact_match.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/exact_match/exact_match.py -------------------------------------------------------------------------------- /metrics/exact_match/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} -------------------------------------------------------------------------------- /metrics/f1/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/f1/README.md -------------------------------------------------------------------------------- /metrics/f1/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/f1/app.py -------------------------------------------------------------------------------- /metrics/f1/f1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/f1/f1.py -------------------------------------------------------------------------------- /metrics/f1/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/fever/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/fever/README.md -------------------------------------------------------------------------------- /metrics/fever/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/fever/app.py -------------------------------------------------------------------------------- /metrics/fever/fever.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/fever/fever.py -------------------------------------------------------------------------------- /metrics/fever/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} -------------------------------------------------------------------------------- /metrics/fever/test_fever.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/fever/test_fever.py -------------------------------------------------------------------------------- /metrics/frugalscore/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/frugalscore/README.md -------------------------------------------------------------------------------- /metrics/frugalscore/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/frugalscore/app.py -------------------------------------------------------------------------------- /metrics/frugalscore/frugalscore.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/frugalscore/frugalscore.py -------------------------------------------------------------------------------- /metrics/frugalscore/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | torch 3 | transformers -------------------------------------------------------------------------------- /metrics/glue/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/glue/README.md -------------------------------------------------------------------------------- /metrics/glue/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/glue/app.py -------------------------------------------------------------------------------- /metrics/glue/glue.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/glue/glue.py -------------------------------------------------------------------------------- /metrics/glue/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/glue/requirements.txt -------------------------------------------------------------------------------- /metrics/google_bleu/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/google_bleu/README.md -------------------------------------------------------------------------------- /metrics/google_bleu/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/google_bleu/app.py -------------------------------------------------------------------------------- /metrics/google_bleu/google_bleu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/google_bleu/google_bleu.py -------------------------------------------------------------------------------- /metrics/google_bleu/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | nltk -------------------------------------------------------------------------------- /metrics/google_bleu/tokenizer_13a.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/google_bleu/tokenizer_13a.py -------------------------------------------------------------------------------- /metrics/indic_glue/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/indic_glue/README.md -------------------------------------------------------------------------------- /metrics/indic_glue/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/indic_glue/app.py -------------------------------------------------------------------------------- /metrics/indic_glue/indic_glue.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/indic_glue/indic_glue.py -------------------------------------------------------------------------------- /metrics/indic_glue/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/indic_glue/requirements.txt -------------------------------------------------------------------------------- /metrics/mae/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mae/README.md -------------------------------------------------------------------------------- /metrics/mae/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mae/app.py -------------------------------------------------------------------------------- /metrics/mae/mae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mae/mae.py -------------------------------------------------------------------------------- /metrics/mae/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/mahalanobis/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mahalanobis/README.md -------------------------------------------------------------------------------- /metrics/mahalanobis/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mahalanobis/app.py -------------------------------------------------------------------------------- /metrics/mahalanobis/mahalanobis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mahalanobis/mahalanobis.py -------------------------------------------------------------------------------- /metrics/mahalanobis/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} -------------------------------------------------------------------------------- /metrics/mape/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mape/README.md -------------------------------------------------------------------------------- /metrics/mape/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mape/app.py -------------------------------------------------------------------------------- /metrics/mape/mape.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mape/mape.py -------------------------------------------------------------------------------- /metrics/mape/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn 3 | -------------------------------------------------------------------------------- /metrics/mase/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mase/README.md -------------------------------------------------------------------------------- /metrics/mase/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mase/app.py -------------------------------------------------------------------------------- /metrics/mase/mase.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mase/mase.py -------------------------------------------------------------------------------- /metrics/mase/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn 3 | -------------------------------------------------------------------------------- /metrics/matthews_correlation/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/matthews_correlation/README.md -------------------------------------------------------------------------------- /metrics/matthews_correlation/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/matthews_correlation/app.py -------------------------------------------------------------------------------- /metrics/matthews_correlation/matthews_correlation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/matthews_correlation/matthews_correlation.py -------------------------------------------------------------------------------- /metrics/matthews_correlation/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/mauve/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mauve/README.md -------------------------------------------------------------------------------- /metrics/mauve/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mauve/app.py -------------------------------------------------------------------------------- /metrics/mauve/mauve.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mauve/mauve.py -------------------------------------------------------------------------------- /metrics/mauve/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | faiss-cpu 3 | scikit-learn 4 | mauve-text -------------------------------------------------------------------------------- /metrics/mean_iou/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mean_iou/README.md -------------------------------------------------------------------------------- /metrics/mean_iou/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mean_iou/app.py -------------------------------------------------------------------------------- /metrics/mean_iou/mean_iou.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mean_iou/mean_iou.py -------------------------------------------------------------------------------- /metrics/mean_iou/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} -------------------------------------------------------------------------------- /metrics/meteor/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/meteor/README.md -------------------------------------------------------------------------------- /metrics/meteor/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/meteor/app.py -------------------------------------------------------------------------------- /metrics/meteor/meteor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/meteor/meteor.py -------------------------------------------------------------------------------- /metrics/meteor/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | nltk -------------------------------------------------------------------------------- /metrics/mse/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mse/README.md -------------------------------------------------------------------------------- /metrics/mse/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mse/app.py -------------------------------------------------------------------------------- /metrics/mse/mse.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/mse/mse.py -------------------------------------------------------------------------------- /metrics/mse/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/nist_mt/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/nist_mt/README.md -------------------------------------------------------------------------------- /metrics/nist_mt/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/nist_mt/app.py -------------------------------------------------------------------------------- /metrics/nist_mt/nist_mt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/nist_mt/nist_mt.py -------------------------------------------------------------------------------- /metrics/nist_mt/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | nltk 3 | -------------------------------------------------------------------------------- /metrics/nist_mt/tests.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/nist_mt/tests.py -------------------------------------------------------------------------------- /metrics/pearsonr/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/pearsonr/README.md -------------------------------------------------------------------------------- /metrics/pearsonr/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/pearsonr/app.py -------------------------------------------------------------------------------- /metrics/pearsonr/pearsonr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/pearsonr/pearsonr.py -------------------------------------------------------------------------------- /metrics/pearsonr/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scipy -------------------------------------------------------------------------------- /metrics/perplexity/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/perplexity/README.md -------------------------------------------------------------------------------- /metrics/perplexity/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/perplexity/app.py -------------------------------------------------------------------------------- /metrics/perplexity/perplexity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/perplexity/perplexity.py -------------------------------------------------------------------------------- /metrics/perplexity/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/perplexity/requirements.txt -------------------------------------------------------------------------------- /metrics/poseval/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/poseval/README.md -------------------------------------------------------------------------------- /metrics/poseval/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/poseval/app.py -------------------------------------------------------------------------------- /metrics/poseval/poseval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/poseval/poseval.py -------------------------------------------------------------------------------- /metrics/poseval/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/precision/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/precision/README.md -------------------------------------------------------------------------------- /metrics/precision/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/precision/app.py -------------------------------------------------------------------------------- /metrics/precision/precision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/precision/precision.py -------------------------------------------------------------------------------- /metrics/precision/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/r_squared/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/r_squared/README.md -------------------------------------------------------------------------------- /metrics/r_squared/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/r_squared/app.py -------------------------------------------------------------------------------- /metrics/r_squared/r_squared.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/r_squared/r_squared.py -------------------------------------------------------------------------------- /metrics/r_squared/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | -------------------------------------------------------------------------------- /metrics/recall/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/recall/README.md -------------------------------------------------------------------------------- /metrics/recall/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/recall/app.py -------------------------------------------------------------------------------- /metrics/recall/recall.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/recall/recall.py -------------------------------------------------------------------------------- /metrics/recall/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/rl_reliability/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/rl_reliability/README.md -------------------------------------------------------------------------------- /metrics/rl_reliability/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/rl_reliability/app.py -------------------------------------------------------------------------------- /metrics/rl_reliability/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/rl_reliability/requirements.txt -------------------------------------------------------------------------------- /metrics/rl_reliability/rl_reliability.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/rl_reliability/rl_reliability.py -------------------------------------------------------------------------------- /metrics/roc_auc/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/roc_auc/README.md -------------------------------------------------------------------------------- /metrics/roc_auc/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/roc_auc/app.py -------------------------------------------------------------------------------- /metrics/roc_auc/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/roc_auc/roc_auc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/roc_auc/roc_auc.py -------------------------------------------------------------------------------- /metrics/rouge/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/rouge/README.md -------------------------------------------------------------------------------- /metrics/rouge/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/rouge/app.py -------------------------------------------------------------------------------- /metrics/rouge/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | absl-py 3 | nltk 4 | rouge_score>=0.1.2 -------------------------------------------------------------------------------- /metrics/rouge/rouge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/rouge/rouge.py -------------------------------------------------------------------------------- /metrics/sacrebleu/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/sacrebleu/README.md -------------------------------------------------------------------------------- /metrics/sacrebleu/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/sacrebleu/app.py -------------------------------------------------------------------------------- /metrics/sacrebleu/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | sacrebleu -------------------------------------------------------------------------------- /metrics/sacrebleu/sacrebleu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/sacrebleu/sacrebleu.py -------------------------------------------------------------------------------- /metrics/sari/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/sari/README.md -------------------------------------------------------------------------------- /metrics/sari/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/sari/app.py -------------------------------------------------------------------------------- /metrics/sari/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/sari/requirements.txt -------------------------------------------------------------------------------- /metrics/sari/sari.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/sari/sari.py -------------------------------------------------------------------------------- /metrics/seqeval/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/seqeval/README.md -------------------------------------------------------------------------------- /metrics/seqeval/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/seqeval/app.py -------------------------------------------------------------------------------- /metrics/seqeval/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | seqeval -------------------------------------------------------------------------------- /metrics/seqeval/seqeval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/seqeval/seqeval.py -------------------------------------------------------------------------------- /metrics/smape/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/smape/README.md -------------------------------------------------------------------------------- /metrics/smape/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/smape/app.py -------------------------------------------------------------------------------- /metrics/smape/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn 3 | -------------------------------------------------------------------------------- /metrics/smape/smape.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/smape/smape.py -------------------------------------------------------------------------------- /metrics/spearmanr/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/spearmanr/README.md -------------------------------------------------------------------------------- /metrics/spearmanr/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/spearmanr/app.py -------------------------------------------------------------------------------- /metrics/spearmanr/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scipy -------------------------------------------------------------------------------- /metrics/spearmanr/spearmanr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/spearmanr/spearmanr.py -------------------------------------------------------------------------------- /metrics/squad/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/squad/README.md -------------------------------------------------------------------------------- /metrics/squad/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/squad/app.py -------------------------------------------------------------------------------- /metrics/squad/compute_score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/squad/compute_score.py -------------------------------------------------------------------------------- /metrics/squad/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} -------------------------------------------------------------------------------- /metrics/squad/squad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/squad/squad.py -------------------------------------------------------------------------------- /metrics/squad_v2/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/squad_v2/README.md -------------------------------------------------------------------------------- /metrics/squad_v2/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/squad_v2/app.py -------------------------------------------------------------------------------- /metrics/squad_v2/compute_score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/squad_v2/compute_score.py -------------------------------------------------------------------------------- /metrics/squad_v2/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} -------------------------------------------------------------------------------- /metrics/squad_v2/squad_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/squad_v2/squad_v2.py -------------------------------------------------------------------------------- /metrics/super_glue/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/super_glue/README.md -------------------------------------------------------------------------------- /metrics/super_glue/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/super_glue/app.py -------------------------------------------------------------------------------- /metrics/super_glue/record_evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/super_glue/record_evaluation.py -------------------------------------------------------------------------------- /metrics/super_glue/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/super_glue/super_glue.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/super_glue/super_glue.py -------------------------------------------------------------------------------- /metrics/ter/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/ter/README.md -------------------------------------------------------------------------------- /metrics/ter/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/ter/app.py -------------------------------------------------------------------------------- /metrics/ter/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | sacrebleu -------------------------------------------------------------------------------- /metrics/ter/ter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/ter/ter.py -------------------------------------------------------------------------------- /metrics/trec_eval/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/trec_eval/README.md -------------------------------------------------------------------------------- /metrics/trec_eval/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/trec_eval/app.py -------------------------------------------------------------------------------- /metrics/trec_eval/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | trectools -------------------------------------------------------------------------------- /metrics/trec_eval/trec_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/trec_eval/trec_eval.py -------------------------------------------------------------------------------- /metrics/wer/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/wer/README.md -------------------------------------------------------------------------------- /metrics/wer/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/wer/app.py -------------------------------------------------------------------------------- /metrics/wer/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | jiwer -------------------------------------------------------------------------------- /metrics/wer/wer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/wer/wer.py -------------------------------------------------------------------------------- /metrics/wiki_split/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/wiki_split/README.md -------------------------------------------------------------------------------- /metrics/wiki_split/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/wiki_split/app.py -------------------------------------------------------------------------------- /metrics/wiki_split/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/wiki_split/requirements.txt -------------------------------------------------------------------------------- /metrics/wiki_split/wiki_split.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/wiki_split/wiki_split.py -------------------------------------------------------------------------------- /metrics/xnli/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/xnli/README.md -------------------------------------------------------------------------------- /metrics/xnli/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/xnli/app.py -------------------------------------------------------------------------------- /metrics/xnli/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} -------------------------------------------------------------------------------- /metrics/xnli/xnli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/xnli/xnli.py -------------------------------------------------------------------------------- /metrics/xtreme_s/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/xtreme_s/README.md -------------------------------------------------------------------------------- /metrics/xtreme_s/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/xtreme_s/app.py -------------------------------------------------------------------------------- /metrics/xtreme_s/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@{COMMIT_PLACEHOLDER} 2 | scikit-learn -------------------------------------------------------------------------------- /metrics/xtreme_s/xtreme_s.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/metrics/xtreme_s/xtreme_s.py -------------------------------------------------------------------------------- /setup.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/setup.cfg -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/setup.py -------------------------------------------------------------------------------- /src/evaluate/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/__init__.py -------------------------------------------------------------------------------- /src/evaluate/commands/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/evaluate/commands/evaluate_cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/commands/evaluate_cli.py -------------------------------------------------------------------------------- /src/evaluate/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/config.py -------------------------------------------------------------------------------- /src/evaluate/evaluation_suite/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluation_suite/__init__.py -------------------------------------------------------------------------------- /src/evaluate/evaluator/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluator/__init__.py -------------------------------------------------------------------------------- /src/evaluate/evaluator/audio_classification.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluator/audio_classification.py -------------------------------------------------------------------------------- /src/evaluate/evaluator/automatic_speech_recognition.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluator/automatic_speech_recognition.py -------------------------------------------------------------------------------- /src/evaluate/evaluator/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluator/base.py -------------------------------------------------------------------------------- /src/evaluate/evaluator/image_classification.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluator/image_classification.py -------------------------------------------------------------------------------- /src/evaluate/evaluator/question_answering.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluator/question_answering.py -------------------------------------------------------------------------------- /src/evaluate/evaluator/text2text_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluator/text2text_generation.py -------------------------------------------------------------------------------- /src/evaluate/evaluator/text_classification.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluator/text_classification.py -------------------------------------------------------------------------------- /src/evaluate/evaluator/text_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluator/text_generation.py -------------------------------------------------------------------------------- /src/evaluate/evaluator/token_classification.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluator/token_classification.py -------------------------------------------------------------------------------- /src/evaluate/evaluator/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/evaluator/utils.py -------------------------------------------------------------------------------- /src/evaluate/hub.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/hub.py -------------------------------------------------------------------------------- /src/evaluate/info.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/info.py -------------------------------------------------------------------------------- /src/evaluate/inspect.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/inspect.py -------------------------------------------------------------------------------- /src/evaluate/loading.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/loading.py -------------------------------------------------------------------------------- /src/evaluate/module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/module.py -------------------------------------------------------------------------------- /src/evaluate/naming.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/naming.py -------------------------------------------------------------------------------- /src/evaluate/saving.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/saving.py -------------------------------------------------------------------------------- /src/evaluate/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/utils/__init__.py -------------------------------------------------------------------------------- /src/evaluate/utils/file_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/utils/file_utils.py -------------------------------------------------------------------------------- /src/evaluate/utils/gradio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/utils/gradio.py -------------------------------------------------------------------------------- /src/evaluate/utils/logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/utils/logging.py -------------------------------------------------------------------------------- /src/evaluate/visualization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/src/evaluate/visualization.py -------------------------------------------------------------------------------- /templates/cookiecutter.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/templates/cookiecutter.json -------------------------------------------------------------------------------- /templates/{{ cookiecutter.module_slug }}/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/templates/{{ cookiecutter.module_slug }}/README.md -------------------------------------------------------------------------------- /templates/{{ cookiecutter.module_slug }}/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/templates/{{ cookiecutter.module_slug }}/app.py -------------------------------------------------------------------------------- /templates/{{ cookiecutter.module_slug }}/requirements.txt: -------------------------------------------------------------------------------- 1 | git+https://github.com/huggingface/evaluate@main -------------------------------------------------------------------------------- /templates/{{ cookiecutter.module_slug }}/tests.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/templates/{{ cookiecutter.module_slug }}/tests.py -------------------------------------------------------------------------------- /templates/{{ cookiecutter.module_slug }}/{{ cookiecutter.module_slug }}.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/templates/{{ cookiecutter.module_slug }}/{{ cookiecutter.module_slug }}.py -------------------------------------------------------------------------------- /tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/conftest.py -------------------------------------------------------------------------------- /tests/test_evaluation_suite.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/test_evaluation_suite.py -------------------------------------------------------------------------------- /tests/test_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/test_evaluator.py -------------------------------------------------------------------------------- /tests/test_file_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/test_file_utils.py -------------------------------------------------------------------------------- /tests/test_hub.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/test_hub.py -------------------------------------------------------------------------------- /tests/test_load.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/test_load.py -------------------------------------------------------------------------------- /tests/test_metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/test_metric.py -------------------------------------------------------------------------------- /tests/test_metric_common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/test_metric_common.py -------------------------------------------------------------------------------- /tests/test_save.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/test_save.py -------------------------------------------------------------------------------- /tests/test_trainer_evaluator_parity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/test_trainer_evaluator_parity.py -------------------------------------------------------------------------------- /tests/test_viz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/test_viz.py -------------------------------------------------------------------------------- /tests/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/huggingface/evaluate/HEAD/tests/utils.py --------------------------------------------------------------------------------