Spaces:
Running
Running
Commit
·
faceee1
1
Parent(s):
553b217
[MODIFY] Cross-evaluation framework column names
Browse files
- src/about.py +12 -12
- src/populate.py +3 -3
src/about.py
CHANGED
|
@@ -64,10 +64,10 @@ class MedicalSummarizationColumn:
|
|
| 64 |
col_name: str
|
| 65 |
|
| 66 |
class MedicalSummarizationColumns(Enum):
|
| 67 |
-
medical_summarization_column0 = MedicalSummarizationColumn("
|
| 68 |
-
medical_summarization_column1 = MedicalSummarizationColumn("
|
| 69 |
-
medical_summarization_column2 = MedicalSummarizationColumn("
|
| 70 |
-
medical_summarization_column3 = MedicalSummarizationColumn("
|
| 71 |
|
| 72 |
@dataclass
|
| 73 |
class ACIColumn:
|
|
@@ -76,10 +76,10 @@ class ACIColumn:
|
|
| 76 |
col_name: str
|
| 77 |
|
| 78 |
class ACIColumns(Enum):
|
| 79 |
-
aci_column0 = ACIColumn("
|
| 80 |
-
aci_column1 = ACIColumn("
|
| 81 |
-
aci_column2 = ACIColumn("
|
| 82 |
-
aci_column3 = ACIColumn("
|
| 83 |
|
| 84 |
@dataclass
|
| 85 |
class SOAPColumn:
|
|
@@ -88,10 +88,10 @@ class SOAPColumn:
|
|
| 88 |
col_name: str
|
| 89 |
|
| 90 |
class SOAPColumns(Enum):
|
| 91 |
-
soap_column0 = SOAPColumn("
|
| 92 |
-
soap_column1 = SOAPColumn("
|
| 93 |
-
soap_column2 = SOAPColumn("
|
| 94 |
-
soap_column3 = SOAPColumn("
|
| 95 |
|
| 96 |
NUM_FEWSHOT = 0 # Change with your few shot
|
| 97 |
# ---------------------------------------------------
|
|
|
|
| 64 |
col_name: str
|
| 65 |
|
| 66 |
class MedicalSummarizationColumns(Enum):
|
| 67 |
+
medical_summarization_column0 = MedicalSummarizationColumn("coverage", "score", "Coverage")
|
| 68 |
+
medical_summarization_column1 = MedicalSummarizationColumn("conform", "score", "Conformity")
|
| 69 |
+
medical_summarization_column2 = MedicalSummarizationColumn("fact", "score", "Consistency")
|
| 70 |
+
medical_summarization_column3 = MedicalSummarizationColumn("brief", "score", "Conciseness")
|
| 71 |
|
| 72 |
@dataclass
|
| 73 |
class ACIColumn:
|
|
|
|
| 76 |
col_name: str
|
| 77 |
|
| 78 |
class ACIColumns(Enum):
|
| 79 |
+
aci_column0 = ACIColumn("coverage", "score", "Coverage")
|
| 80 |
+
aci_column1 = ACIColumn("conform", "score", "Conformity")
|
| 81 |
+
aci_column2 = ACIColumn("fact", "score", "Consistency")
|
| 82 |
+
aci_column3 = ACIColumn("brief", "score", "Conciseness")
|
| 83 |
|
| 84 |
@dataclass
|
| 85 |
class SOAPColumn:
|
|
|
|
| 88 |
col_name: str
|
| 89 |
|
| 90 |
class SOAPColumns(Enum):
|
| 91 |
+
soap_column0 = SOAPColumn("coverage", "score", "Coverage")
|
| 92 |
+
soap_column1 = SOAPColumn("conform", "score", "Conformity")
|
| 93 |
+
soap_column2 = SOAPColumn("fact", "score", "Consistency")
|
| 94 |
+
soap_column3 = SOAPColumn("brief", "score", "Conciseness")
|
| 95 |
|
| 96 |
NUM_FEWSHOT = 0 # Change with your few shot
|
| 97 |
# ---------------------------------------------------
|
src/populate.py
CHANGED
|
@@ -25,11 +25,11 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
|
|
| 25 |
elif subset == "open_ended":
|
| 26 |
df = df.sort_values(by=["ELO"], ascending=False)
|
| 27 |
elif subset == "medical_summarization":
|
| 28 |
-
df = df.sort_values(by=["Coverage
|
| 29 |
elif subset == "aci":
|
| 30 |
-
df = df.sort_values(by=["Coverage
|
| 31 |
elif subset == "soap":
|
| 32 |
-
df = df.sort_values(by=["Coverage
|
| 33 |
cols = list(set(df.columns).intersection(set(cols)))
|
| 34 |
df = df[cols].round(decimals=2)
|
| 35 |
# filter out if any of the benchmarks have not been produced
|
|
|
|
| 25 |
elif subset == "open_ended":
|
| 26 |
df = df.sort_values(by=["ELO"], ascending=False)
|
| 27 |
elif subset == "medical_summarization":
|
| 28 |
+
df = df.sort_values(by=["Coverage"], ascending=False)
|
| 29 |
elif subset == "aci":
|
| 30 |
+
df = df.sort_values(by=["Coverage"], ascending=False)
|
| 31 |
elif subset == "soap":
|
| 32 |
+
df = df.sort_values(by=["Coverage"], ascending=False)
|
| 33 |
cols = list(set(df.columns).intersection(set(cols)))
|
| 34 |
df = df[cols].round(decimals=2)
|
| 35 |
# filter out if any of the benchmarks have not been produced
|