File size: 1,624 Bytes
d389578 2e00cda f2b3434 16273a7 f2b3434 2e00cda 16273a7 b462f85 d389578 f2b3434 d08fbc6 527a33e 24df49f 527a33e f2b3434 370e1f5 b462f85 d389578 88c61d3 16273a7 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 |
from typing import Dict, List, Union
from .artifact import Artifact
from .dataclass import OptionalField
from .loaders import Loader
from .operator import StreamingOperator
from .splitters import RandomSampler, Sampler
from .task import Task
from .templates import Template, TemplatesDict, TemplatesList
class TaskCard(Artifact):
    """Describe how a source dataset becomes model input and how model output is scored.

    A TaskCard groups the phases of that transformation (loading, preprocessing,
    task definition and templating) together with the metrics, carried by the
    task, that are used to evaluate the model output.

    Args:
        loader:
            names the source address and the loading operator that can access
            that source and turn it into a unitxt multistream.
        preprocess_steps:
            list of unitxt operators that process the data source into model
            input. Defaults to None.
        task:
            names the fields (of the already (pre)processed instance) that make
            up the inputs, the fields that make up the outputs, and the metrics
            used to evaluate the model output.
        templates:
            format strings applied to the input fields (as specified by the
            task) and to the output fields. A template also carries the
            instructions and the list of postprocessing steps to apply to the
            model output. Defaults to None.
        default_template:
            a single default template, meant for tasks whose template is
            specific to that task or dataset. Defaults to None.
        sampler:
            a Sampler; when not supplied, the field's default_factory provides
            a RandomSampler.
    """

    loader: Loader
    preprocess_steps: List[StreamingOperator] = None
    task: Task
    # Either one of the project's template containers or a plain dict/list of templates.
    templates: Union[
        TemplatesDict,
        TemplatesList,
        Dict[str, Template],
        List[Template],
    ] = None
    default_template: Template = None
    sampler: Sampler = OptionalField(default_factory=RandomSampler)
|