Update README.md
Browse files
README.md
CHANGED
@@ -63,7 +63,7 @@ match_result = f1_match(reference_answer, candidate_answer, threshold=0.5)
|
|
63 |
print("F1 Match: ", match_result)
|
64 |
```
|
65 |
|
66 |
-
####
|
67 |
```python
|
68 |
from qa_metrics.cfm import CFMatcher
|
69 |
|
@@ -76,13 +76,13 @@ print("Score: %s; bert Match: %s" % (scores, match_result))
|
|
76 |
|
77 |
If you find this repo useful, please cite our paper:
|
78 |
```bibtex
|
79 |
-
@misc{
|
80 |
-
|
81 |
-
|
82 |
-
|
83 |
-
|
84 |
-
|
85 |
-
|
86 |
}
|
87 |
```
|
88 |
|
|
|
63 |
print("F1 Match: ", match_result)
|
64 |
```
|
65 |
|
66 |
+
#### PANDA
|
67 |
```python
|
68 |
from qa_metrics.cfm import CFMatcher
|
69 |
|
|
|
76 |
|
77 |
If you find this repo useful, please cite our paper:
|
78 |
```bibtex
|
79 |
+
@misc{li2024panda,
|
80 |
+
title={PANDA (Pedantic ANswer-correctness Determination and Adjudication): Improving Automatic Evaluation for Question Answering and Text Generation},
|
81 |
+
author={Zongxia Li and Ishani Mondal and Yijun Liang and Huy Nghiem and Jordan Lee Boyd-Graber},
|
82 |
+
year={2024},
|
83 |
+
eprint={2402.11161},
|
84 |
+
archivePrefix={arXiv},
|
85 |
+
primaryClass={cs.CL}
|
86 |
}
|
87 |
```
|
88 |
|