..
|
huggingface-evaluation.ipynb
|
qa-evaluation.ipynb
|
rag-evaluation.ipynb
|
README.md
|
evaluate_on_binary_classifier.py
|
evaluate_on_multiclass_classifier.py
|
evaluate_on_regressor.py
|
evaluate_with_custom_code_metrics.py
|
evaluate_with_custom_metrics.py
|
evaluate_with_custom_metrics_comprehensive.py
|
evaluate_with_function.py
|
evaluate_with_llm_judge.py
|
evaluate_with_model_validation.py
|
evaluate_with_qa_metrics.py
|
evaluate_with_static_dataset.py
|