From 6a48d07b66262ea065a9339be89bbf82df7d0a35 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Marcos=20Mart=C3=ADnez=20Galindo?= Date: Tue, 23 Jul 2024 15:59:40 +0100 Subject: [PATCH] :bug: Fix trust_remote_code=True bug in tests MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: Marcos Martínez Galindo --- zshot/evaluation/dataset/fewrel/fewrel.py | 2 +- zshot/evaluation/dataset/med_mentions/med_mentions.py | 2 +- zshot/evaluation/dataset/ontonotes/onto_notes.py | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/zshot/evaluation/dataset/fewrel/fewrel.py b/zshot/evaluation/dataset/fewrel/fewrel.py index d3da23f..e7a80f5 100644 --- a/zshot/evaluation/dataset/fewrel/fewrel.py +++ b/zshot/evaluation/dataset/fewrel/fewrel.py @@ -25,7 +25,7 @@ def get_entity_data(e, tokenized_sentence): def load_few_rel_zs(split: Optional[Union[str, Split]] = "val_wiki") -> Union[Dict[DatasetWithRelations, Dataset], Dataset]: - dataset = load_dataset("few_rel", split=split) + dataset = load_dataset("few_rel", split=split, trust_remote_code=True) relations_descriptions = dataset["names"] tokenized_sentences = dataset["tokens"] sentences = [" ".join(tokens) for tokens in tokenized_sentences] diff --git a/zshot/evaluation/dataset/med_mentions/med_mentions.py b/zshot/evaluation/dataset/med_mentions/med_mentions.py index 3e94eda..5b32e35 100644 --- a/zshot/evaluation/dataset/med_mentions/med_mentions.py +++ b/zshot/evaluation/dataset/med_mentions/med_mentions.py @@ -13,7 +13,7 @@ def load_medmentions_zs(split: Optional[Union[str, Split]] = None, **kwargs) -> Union[DatasetDict, Dataset]: - dataset = load_dataset(REPO_ID, split=split, **kwargs) + dataset = load_dataset(REPO_ID, split=split, trust_remote_code=True, **kwargs) entities_file = hf_hub_download(repo_id=REPO_ID, repo_type='dataset', filename=ENTITIES_FN) diff --git a/zshot/evaluation/dataset/ontonotes/onto_notes.py b/zshot/evaluation/dataset/ontonotes/onto_notes.py index f2569c9..b48e43b 100644 --- a/zshot/evaluation/dataset/ontonotes/onto_notes.py +++ b/zshot/evaluation/dataset/ontonotes/onto_notes.py @@ -58,7 +58,7 @@ def remove_out_of_split(sentence, split): def load_ontonotes_zs(split: Optional[Union[str, Split]] = None, **kwargs) -> Union[Dict[DatasetWithEntities, Dataset], Dataset]: dataset_zs = load_dataset("conll2012_ontonotesv5", "english_v12", - split=split, verification_mode='no_checks', **kwargs) + split=split, verification_mode='no_checks', trust_remote_code=True, **kwargs) if split: ontonotes_zs = preprocess_spit(dataset_zs, get_simple_split(split)) else: