scandeval.benchmark_modules.fresh

docs module scandeval.benchmark_modules.fresh
"""Freshly initialised encoder models."""importosfromfunctoolsimportcached_propertyfromjsonimportJSONDecodeErrorfromtransformersimport(AutoConfig,AutoTokenizer,ElectraForQuestionAnswering,ElectraForSequenceClassification,ElectraForTokenClassification,PretrainedConfig,PreTrainedModel,PreTrainedTokenizer,XLMRobertaForQuestionAnswering,XLMRobertaForSequenceClassification,XLMRobertaForTokenClassification,)from..data_modelsimportBenchmarkConfig,DatasetConfig,ModelConfigfrom..enumsimportInferenceBackend,ModelType,TaskGroupfrom..exceptionsimport(InvalidBenchmark,InvalidModel,NeedsEnvironmentVariable,NeedsExtraInstalled,)from..utilsimportblock_terminal_output,create_model_cache_dirfrom.hfimport(HuggingFaceEncoderModel,align_model_and_tokenizer,setup_model_for_question_answering,)classFreshEncoderModel(HuggingFaceEncoderModel):docs
    """A freshly initialised encoder model."""fresh_model=Truedef__init__(self,model_config:ModelConfig,dataset_config:DatasetConfig,benchmark_config:BenchmarkConfig,)->None:        """Initialise the model.        Args:            model_config:                The model configuration.            dataset_config:                The dataset configuration.            benchmark_config:                The benchmark configuration.        """# This is already set when calling `super.__init__`, but we need it to get a# value from `self.model_max_length`, so we set it here as well.self.model_config=model_configmodel,tokenizer=load_model_and_tokenizer(model_config=model_config,dataset_config=dataset_config,benchmark_config=benchmark_config,model_max_length=self.model_max_length,)self._model:PreTrainedModel=modelself._tokenizer:PreTrainedTokenizer=tokenizerself._model,self._tokenizer=align_model_and_tokenizer(model=self._model,tokenizer=self._tokenizer,model_max_length=self.model_max_length,raise_errors=benchmark_config.raise_errors,)# We specify `HuggingFaceEncoderModel` here instead of `VLLMModel`, as we want# to call the `__init__` method of the `BenchmarkModule` class.super(HuggingFaceEncoderModel,self).__init__(model_config=model_config,dataset_config=dataset_config,benchmark_config=benchmark_config,)@cached_propertydefnum_params(self)->int:docs
        """The number of parameters in the model.        Returns:            The number of parameters in the model.        """matchself.model_config.model_id:case"fresh-xlm-roberta-base":return278_885_778case"fresh-electra-small":return13_738_755case _:raiseNotImplementedError(f"Number of parameters for model {self.model_config.model_id} is ""not implemented.")@cached_propertydefvocab_size(self)->int:docs
        """The vocabulary size of the model.        Returns:            The vocabulary size of the model.        """matchself.model_config.model_id:case"fresh-xlm-roberta-base":return250_002case"fresh-electra-small":return32_000case _:raiseNotImplementedError(f"Vocabulary size for model {self.model_config.model_id} is not ""implemented.")@cached_propertydefmodel_max_length(self)->int:docs
        """The maximum context length of the model.        Returns:            The maximum context length of the model.        """matchself.model_config.model_id:case"fresh-xlm-roberta-base":return512case"fresh-electra-small":return128case _:raiseNotImplementedError(f"Maximum context length for model {self.model_config.model_id} is ""not implemented.")@classmethoddefmodel_exists(docs
cls,model_id:str,benchmark_config:BenchmarkConfig)->bool|NeedsExtraInstalled|NeedsEnvironmentVariable:        """Check if a model exists.        Args:            model_id:                The model ID.            benchmark_config:                The benchmark configuration.        Returns:            Whether the model exists, or an error describing why we cannot check            whether the model exists.        """valid_models=["fresh-electra-small","fresh-xlm-roberta-base"]returnmodel_idinvalid_models@classmethoddefget_model_config(docs
cls,model_id:str,benchmark_config:BenchmarkConfig)->ModelConfig:        """Fetch the model configuration.        Args:            model_id:                The model ID.            benchmark_config:                The benchmark configuration.        Returns:            The model configuration.        """returnModelConfig(model_id=model_id,task="fill-mask",languages=list(),revision="main",merge=False,inference_backend=InferenceBackend.TRANSFORMERS,model_type=ModelType.ENCODER,fresh=True,model_cache_dir=create_model_cache_dir(cache_dir=benchmark_config.cache_dir,model_id=model_id),adapter_base_model_id=None,)defload_model_and_tokenizer(docs
model_config:ModelConfig,dataset_config:DatasetConfig,benchmark_config:BenchmarkConfig,model_max_length:int,)->tuple[PreTrainedModel,PreTrainedTokenizer]:    """Load the model and tokenizer.    Args:        model_config:            The model configuration.        dataset_config:            The dataset configuration.        benchmark_config:            The benchmark configuration.        model_max_length:            The maximum context length of the model.    Returns:        The loaded model and tokenizer.    """config:"PretrainedConfig"block_terminal_output()# Get the fresh model ID and the corresponding real model IDmodel_id=model_config.model_id.replace("-","_")fresh_to_real_model_id_mapping=dict(fresh_xlm_roberta_base="FacebookAI/xlm-roberta-base",fresh_electra_small="google/electra-small-discriminator",)real_model_id=fresh_to_real_model_id_mapping[model_id]matchdataset_config.task.task_group:case(TaskGroup.SEQUENCE_CLASSIFICATION|TaskGroup.MULTIPLE_CHOICE_CLASSIFICATION):model_cls_mapping=dict(fresh_xlm_roberta_base=XLMRobertaForSequenceClassification,fresh_electra_small=ElectraForSequenceClassification,)caseTaskGroup.TOKEN_CLASSIFICATION:model_cls_mapping=dict(fresh_xlm_roberta_base=XLMRobertaForTokenClassification,fresh_electra_small=ElectraForTokenClassification,)caseTaskGroup.QUESTION_ANSWERING:model_cls_mapping=dict(fresh_xlm_roberta_base=XLMRobertaForQuestionAnswering,fresh_electra_small=ElectraForQuestionAnswering,)case _:raiseInvalidBenchmark(f"Task group {dataset_config.task.task_group} is not "f"supported for model {model_config.model_id}.")model_cls=model_cls_mapping[model_id]config=AutoConfig.from_pretrained(real_model_id,token=benchmark_config.api_keyoros.getenv("HUGGINGFACE_API_KEY")orTrue,num_labels=dataset_config.num_labels,id2label=dataset_config.id2label,label2id=dataset_config.label2id,cache_dir=model_config.model_cache_dir,trust_remote_code=benchmark_config.trust_remote_code,)model=model_cls(config)ifdataset_config.task.task_group==TaskGroup.QUESTION_ANSWERING:model=setup_model_for_question_answering(model=model)# Load the tokenizer. If the model is a subclass of a RoBERTa model then we# have to add a prefix space to the tokens, by the way the model is constructedprefix_models=["Roberta","GPT","Deberta"]prefix=any(model_typeintype(model).__name__formodel_typeinprefix_models)try:tokenizer:"PreTrainedTokenizer"=AutoTokenizer.from_pretrained(real_model_id,revision=model_config.revision,token=benchmark_config.api_keyoros.getenv("HUGGINGFACE_API_KEY")orTrue,add_prefix_space=prefix,cache_dir=model_config.model_cache_dir,use_fast=True,verbose=False,trust_remote_code=benchmark_config.trust_remote_code,)except(JSONDecodeError,OSError):raiseInvalidModel(f"Could not load tokenizer for model {real_model_id!r}.")model,tokenizer=align_model_and_tokenizer(model=model,tokenizer=tokenizer,model_max_length=model_max_length,raise_errors=benchmark_config.raise_errors,)returnmodel,tokenizer