Spaces:

unitxt
/

metric

Running

App Files Files Community

Elron committed on Mar 24, 2024

Commit

8320ba9

verified ·

1 Parent(s): c57223d

Upload standard.py with huggingface_hub

Browse files

Files changed (1) hide show

standard.py +19 -3

standard.py CHANGED Viewed

@@ -1,7 +1,7 @@
 from typing import List
 from .card import TaskCard
-from .dataclass import Field, InternalField, OptionalField
 from .formats import Format, SystemFormat
 from .logging_utils import get_logger
 from .operator import SourceSequentialOperator, StreamingOperator
@@ -29,6 +29,8 @@ class BaseRecipe(Recipe, SourceSequentialOperator):
     template: Template = None
     system_prompt: SystemPrompt = Field(default_factory=EmptySystemPrompt)
     format: Format = Field(default_factory=SystemFormat)
     loader_limit: int = None
@@ -107,6 +109,18 @@ class BaseRecipe(Recipe, SourceSequentialOperator):
         self.test_refiner.apply_to_streams = ["test"]
         self.steps.append(self.test_refiner)
     def prepare(self):
         self.steps = [
             self.card.loader,
@@ -173,12 +187,12 @@ class BaseRecipe(Recipe, SourceSequentialOperator):
         if self.augmentor.augment_model_input:
             self.steps.append(self.augmentor)
-        postprocessors = self.template.get_postprocessors()
         self.steps.append(
             ToUnitxtGroup(
                 group="unitxt",
-                metrics=self.card.task.metrics,
                 postprocessors=postprocessors,
             )
         )
@@ -222,6 +236,8 @@ class StandardRecipe(StandardRecipeWithIndexes):
         system_prompt (SystemPrompt, optional): SystemPrompt object to be used for the recipe.
         loader_limit (int, optional): Specifies the maximum number of instances per stream to be returned from the loader (used to reduce loading time in large datasets)
         format (SystemFormat, optional): SystemFormat object to be used for the recipe.
         train_refiner (StreamRefiner, optional): Train refiner to be used in the recipe.
         max_train_instances (int, optional): Maximum training instances for the refiner.
         validation_refiner (StreamRefiner, optional): Validation refiner to be used in the recipe.

 from typing import List
 from .card import TaskCard
+from .dataclass import Field, InternalField, NonPositionalField, OptionalField
 from .formats import Format, SystemFormat
 from .logging_utils import get_logger
 from .operator import SourceSequentialOperator, StreamingOperator
     template: Template = None
     system_prompt: SystemPrompt = Field(default_factory=EmptySystemPrompt)
     format: Format = Field(default_factory=SystemFormat)
+    metrics: List[str] = NonPositionalField(default=None)
+    postprocessors: List[str] = NonPositionalField(default=None)
     loader_limit: int = None
         self.test_refiner.apply_to_streams = ["test"]
         self.steps.append(self.test_refiner)
+    def prepare_metrics_and_postprocessors(self):
+        """Resolve the metrics and postprocessors to use for this recipe.
+
+        A value set explicitly on the recipe (``self.postprocessors`` /
+        ``self.metrics`` being anything other than ``None``) is used as is.
+        Otherwise the value falls back to ``self.template.get_postprocessors()``
+        and ``self.card.task.metrics`` respectively.
+
+        Returns:
+            A ``(metrics, postprocessors)`` tuple, in that order.
+        """
+        # The checks are ``is None`` rather than truthiness tests, so an
+        # explicitly supplied empty list is kept and not replaced by the default.
+        if self.postprocessors is None:
+            postprocessors = self.template.get_postprocessors()
+        else:
+            postprocessors = self.postprocessors
+        if self.metrics is None:
+            metrics = self.card.task.metrics
+        else:
+            metrics = self.metrics
+        return metrics, postprocessors
     def prepare(self):
         self.steps = [
             self.card.loader,
         if self.augmentor.augment_model_input:
             self.steps.append(self.augmentor)
+        metrics, postprocessors = self.prepare_metrics_and_postprocessors()
         self.steps.append(
             ToUnitxtGroup(
                 group="unitxt",
+                metrics=metrics,
                 postprocessors=postprocessors,
             )
         )
         system_prompt (SystemPrompt, optional): SystemPrompt object to be used for the recipe.
         loader_limit (int, optional): Specifies the maximum number of instances per stream to be returned from the loader (used to reduce loading time in large datasets)
         format (SystemFormat, optional): SystemFormat object to be used for the recipe.
+        metrics (List[str]): list of catalog metrics to use with this recipe.
+        postprocessors (List[str]): list of catalog processors to apply at post processing. (Not recommended to use from here)
         train_refiner (StreamRefiner, optional): Train refiner to be used in the recipe.
         max_train_instances (int, optional): Maximum training instances for the refiner.
         validation_refiner (StreamRefiner, optional): Validation refiner to be used in the recipe.