
scandeval.benchmark_modules.base

"""Abstract benchmark module class that the model classes inherit from."""

import collections.abc as c
import logging
import sys
import typing as t
from abc import ABC, abstractmethod
from functools import cached_property, partial

from datasets import DatasetDict
from torch import nn
from tqdm.auto import tqdm
from transformers import PreTrainedTokenizer, Trainer

from ..data_models import (
    BenchmarkConfig,
    DatasetConfig,
    GenerativeModelOutput,
    ModelConfig,
    Task,
)
from ..enums import BatchingPreference, GenerativeType, TaskGroup
from ..exceptions import NeedsEnvironmentVariable, NeedsExtraInstalled
from ..task_utils import (
    question_answering,
    sequence_classification,
    text_to_text,
    token_classification,
)
from ..types import ComputeMetricsFunction, ExtractLabelsFunction
from ..utils import log_once

logger = logging.getLogger("scandeval")


class BenchmarkModule(ABC):
    """Abstract class for a benchmark module.

    Attributes:
        model_config:
            The model configuration.
        dataset_config:
            The dataset configuration.
        benchmark_config:
            The benchmark configuration.
        buffer:
            A buffer to store temporary data.
    """

    fresh_model: bool
    batching_preference: BatchingPreference
    high_priority: bool

    def __init__(
        self,
        model_config: ModelConfig,
        dataset_config: DatasetConfig,
        benchmark_config: BenchmarkConfig,
    ) -> None:
        """Initialise the benchmark module.

        Args:
            model_config:
                The model configuration.
            dataset_config:
                The dataset configuration.
            benchmark_config:
                The benchmark configuration.
        """
        self.model_config = model_config
        self.dataset_config = dataset_config
        self.benchmark_config = benchmark_config
        self.buffer: dict[str, t.Any] = dict()
        self._log_metadata()

    def _log_metadata(self) -> None:
        """Log the metadata of the model."""
        # Silence logging when running under the test suite; otherwise set
        # the logging level based on the configured verbosity
        if hasattr(sys, "_called_from_test"):
            logging_level = logging.CRITICAL
        elif self.benchmark_config.verbose:
            logging_level = logging.DEBUG
        else:
            logging_level = logging.INFO
        logger.setLevel(logging_level)

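        # A negative value acts as an "unknown" sentinel for `num_params`,
        # `vocab_size` and `model_max_length`, hence the sign checks below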
        logging_msg: str = ""
        if self.num_params < 0:
            logging_msg += "The model has an unknown number of parameters, "
        else:
            logging_msg += f"The model has {self.num_params:,} parameters, "
        if self.vocab_size < 0:
            logging_msg += "an unknown vocabulary size, "
        else:
            logging_msg += f"a vocabulary size of {self.vocab_size:,}, "
        if self.model_max_length < 0:
            logging_msg += "and an unknown maximum sequence length."
        else:
            logging_msg += f"and a maximum context length of {self.model_max_length:,}."
        log_once(message=logging_msg, level=logging.INFO)

    def get_pytorch_module(self) -> "nn.Module":
        """Get the underlying PyTorch module.

        Returns:
            The PyTorch module.
        """
        if hasattr(self, "_model"):
            return self._model
        raise NotImplementedError(
            "The `get_pytorch_module` method has not been implemented for "
            f"{self.__class__.__name__}."
        )

    def get_tokenizer(self) -> "PreTrainedTokenizer":
        """Get the underlying tokenizer.

        Returns:
            The tokenizer.
        """
        if hasattr(self, "_tokenizer"):
            return self._tokenizer
        raise NotImplementedError(
            "The `get_tokenizer` method has not been implemented for "
            f"{self.__class__.__name__}."
        )

    @cached_property
    @abstractmethod
    def num_params(self) -> int:
        """The number of parameters in the model.

        Returns:
            The number of parameters in the model.
        """
        ...

    @property
    @abstractmethod
    def generative_type(self) -> GenerativeType | None:
        """Get the generative type of the model.

        Returns:
            The generative type of the model, or None if the model is not generative.
        """
        ...

    @cached_property
    @abstractmethod
    def vocab_size(self) -> int:
        """The vocabulary size of the model.

        Returns:
            The vocabulary size of the model.
        """
        ...

    @cached_property
    @abstractmethod
    def model_max_length(self) -> int:
        """The maximum length of the model.

        Returns:
            The maximum length of the model.
        """
        ...

    @property
    @abstractmethod
    def data_collator(self) -> c.Callable[[list[t.Any]], dict[str, t.Any]]:
        """The data collator used to prepare samples during finetuning.

        Returns:
            The data collator.
        """
        ...

    @property
    def compute_metrics(self) -> ComputeMetricsFunction:
        """The function used to compute the metrics.

        Returns:
            The function used to compute the metrics.
        """
        match self.dataset_config.task.task_group:
            case (
                TaskGroup.SEQUENCE_CLASSIFICATION
                | TaskGroup.MULTIPLE_CHOICE_CLASSIFICATION
            ):
                return partial(
                    sequence_classification.compute_metrics,
                    dataset_config=self.dataset_config,
                    benchmark_config=self.benchmark_config,
                )
            case TaskGroup.TEXT_TO_TEXT:
                return partial(
                    text_to_text.compute_metrics,
                    dataset_config=self.dataset_config,
                    benchmark_config=self.benchmark_config,
                )
            case TaskGroup.TOKEN_CLASSIFICATION:
                return partial(
                    token_classification.compute_metrics,
                    has_misc_tags=self.buffer.get("has_misc_tags", True),
                    dataset_config=self.dataset_config,
                    benchmark_config=self.benchmark_config,
                )
            case TaskGroup.QUESTION_ANSWERING:
                return partial(
                    question_answering.compute_metrics,
                    dataset_config=self.dataset_config,
                    benchmark_config=self.benchmark_config,
                )
            case _:
                raise NotImplementedError(
                    f"Unsupported task group: {self.dataset_config.task.task_group}."
                )

    @property
    @abstractmethod
    def extract_labels_from_generation(self) -> ExtractLabelsFunction:
        """The function used to extract the labels from the generated output.

        Returns:
            The function used to extract the labels from the generated output.
        """
        ...

    @property
    @abstractmethod
    def trainer_class(self) -> t.Type["Trainer"]:
        """The Trainer class to use for finetuning.

        Returns:
            The Trainer class.
        """
        ...

    def prepare_datasets(
        self, datasets: list[DatasetDict], task: Task
    ) -> list[DatasetDict]:
        """Prepare the datasets for the model.

        This includes things like tokenisation.

        Args:
            datasets:
                The datasets to prepare.
            task:
                The task to prepare the datasets for.

        Returns:
            The prepared datasets.
        """
        for idx, dataset in enumerate(
            tqdm(iterable=datasets, desc="Preparing datasets")
        ):
            prepared_dataset = self.prepare_dataset(
                dataset=dataset, task=task, itr_idx=idx
            )
            if self.dataset_config.task.task_group == TaskGroup.TOKEN_CLASSIFICATION:
                # Record whether the training split contains MISC tags, since
                # `compute_metrics` needs this to evaluate datasets that lack
                # a MISC category
                labels_in_train: set[str] = {
                    tag for tag_list in dataset["train"]["labels"] for tag in tag_list
                }
                self.buffer["has_misc_tags"] = (
                    "B-MISC" in labels_in_train or "I-MISC" in labels_in_train
                )
            datasets[idx] = DatasetDict(
                dict(
                    train=prepared_dataset["train"],
                    val=prepared_dataset["val"],
                    test=prepared_dataset["test"],
                    original_train=dataset["train"],
                    original_val=dataset["val"],
                    original_test=dataset["test"],
                )
            )
        return datasets

    @abstractmethod
    def prepare_dataset(
        self, dataset: DatasetDict, task: Task, itr_idx: int
    ) -> DatasetDict:
        """Prepare the dataset for the model.

        This includes things like tokenisation.

        Args:
            dataset:
                The dataset to prepare.
            task:
                The task to prepare the dataset for.
            itr_idx:
                The index of the dataset in the iterator.

        Returns:
            The prepared dataset.
        """
        ...

    def generate(self, inputs: dict) -> GenerativeModelOutput:
        """Generate outputs from the model.

        Args:
            inputs:
                A batch of inputs to pass through the model.

        Returns:
            The generated model outputs.
        """
        raise NotImplementedError(
            "The `generate` method has not been implemented for "
            f"{self.__class__.__name__}."
        )

    @classmethod
    @abstractmethod
    def model_exists(
        cls, model_id: str, benchmark_config: BenchmarkConfig
    ) -> bool | NeedsExtraInstalled | NeedsEnvironmentVariable:
        """Check if a model exists.

        Args:
            model_id:
                The model ID.
            benchmark_config:
                The benchmark configuration.

        Returns:
            Whether the model exists, or an error describing why we cannot check
            whether the model exists.
        """
        ...

    @classmethod
    @abstractmethod
    def get_model_config(
        cls, model_id: str, benchmark_config: BenchmarkConfig
    ) -> ModelConfig:
        """Fetch the model configuration.

        Args:
            model_id:
                The model ID.
            benchmark_config:
                The benchmark configuration.

        Returns:
            The model configuration.
        """
        ...
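

# The following is an illustrative sketch, not part of the module: a minimal,
# hypothetical subclass showing which members a concrete benchmark module has
# to provide. The class name and all return values are assumptions chosen for
# demonstration only; the real implementations live in the sibling modules of
# this package.
class _SketchBenchmarkModule(BenchmarkModule):
    fresh_model = False
    high_priority = False
    # Hypothetical choice; a real module picks the fitting member explicitly
    batching_preference = list(BatchingPreference)[0]

    @cached_property
    def num_params(self) -> int:
        return -1  # negative sentinel: unknown

    @property
    def generative_type(self) -> GenerativeType | None:
        return None  # not a generative model

    @cached_property
    def vocab_size(self) -> int:
        return -1  # negative sentinel: unknown

    @cached_property
    def model_max_length(self) -> int:
        return 512  # assumed context length for the sketch

    @property
    def data_collator(self) -> c.Callable[[list[t.Any]], dict[str, t.Any]]:
        return lambda samples: dict()  # no-op collator

    @property
    def extract_labels_from_generation(self) -> ExtractLabelsFunction:
        raise NotImplementedError  # only needed for generative models

    @property
    def trainer_class(self) -> t.Type[Trainer]:
        return Trainer

    def prepare_dataset(
        self, dataset: DatasetDict, task: Task, itr_idx: int
    ) -> DatasetDict:
        return dataset  # a real module would tokenise the samples here

    @classmethod
    def model_exists(
        cls, model_id: str, benchmark_config: BenchmarkConfig
    ) -> bool | NeedsExtraInstalled | NeedsEnvironmentVariable:
        return True  # a real module would query its model hub

    @classmethod
    def get_model_config(
        cls, model_id: str, benchmark_config: BenchmarkConfig
    ) -> ModelConfig:
        raise NotImplementedError  # construction of `ModelConfig` omitted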