From ecf6d441336f65e0627545ae7fdf43fb5deaff50 Mon Sep 17 00:00:00 2001 From: gongjy <2474590974@qq.com> Date: Sat, 14 Sep 2024 14:05:41 +0800 Subject: [PATCH] update model/dataset.py --- model/dataset.py | 10 +++++++++- 1 file changed, 9 insertions(+), 1 deletion(-) diff --git a/model/dataset.py b/model/dataset.py index 47387d5..f3cc897 100644 --- a/model/dataset.py +++ b/model/dataset.py @@ -8,6 +8,7 @@ from torch.utils.data import Dataset, DataLoader import torch from sklearn.model_selection import train_test_split import os + os.environ["TOKENIZERS_PARALLELISM"] = "false" @@ -68,10 +69,17 @@ class SFTDataset(Dataset): last_index = i return last_index + def safe_eval(self, s): + try: + res = eval(s) + except Exception as e: + return [] + return res + def __getitem__(self, index: int): # sample = self.df.iloc[index] - history = eval(sample['history']) + history = self.safe_eval(sample['history']) q = sample['q'] a = sample['a']