RangiLyu committed on
Commit
d1b2b44
·
1 Parent(s): 844e150

remove end string

Browse files
mmgpt/datasets/dolly_dataset.py CHANGED
@@ -66,7 +66,7 @@ class DollyDataset(Dataset):
66
 
67
  def tokenize(self, text):
68
  res = self.tokenizer(
69
- text["instruction"] + text["answer"] + "### End.",
70
  return_tensors=None,
71
  padding="do_not_pad",
72
  truncation=True,
 
66
 
67
  def tokenize(self, text):
68
  res = self.tokenizer(
69
+ text["instruction"] + text["answer"],
70
  return_tensors=None,
71
  padding="do_not_pad",
72
  truncation=True,
mmgpt/datasets/vqa_dataset.py CHANGED
@@ -127,7 +127,7 @@ class VQADataset(Dataset):
127
 
128
  def tokenize(self, text):
129
  res = self.tokenizer(
130
- text["instruction"] + text["answer"] + "### End.",
131
  return_tensors=None,
132
  padding="do_not_pad",
133
  truncation=True,
 
127
 
128
  def tokenize(self, text):
129
  res = self.tokenizer(
130
+ text["instruction"] + text["answer"],
131
  return_tensors=None,
132
  padding="do_not_pad",
133
  truncation=True,