From 791c977ab2c74fe204bb25f1e6c44f4faf88bf06 Mon Sep 17 00:00:00 2001 From: YuzaChongyi <490083538@qq.com> Date: Sun, 11 Aug 2024 13:20:29 +0800 Subject: [PATCH] fix 2.6 slice placeholder --- finetune/dataset.py | 11 ++++++++--- 1 file changed, 8 insertions(+), 3 deletions(-) diff --git a/finetune/dataset.py b/finetune/dataset.py index 38d05d4..09dadcc 100644 --- a/finetune/dataset.py +++ b/finetune/dataset.py @@ -485,9 +485,14 @@ def split_to_patches(image, grid): def get_grid_placeholder(tokenizer, grid, query_num, new_schema=False): - image_placeholder = ( - tokenizer.im_start + tokenizer.unk_token * query_num + tokenizer.im_end - ) + if new_schema: + image_placeholder = ( + tokenizer.slice_start + tokenizer.unk_token * query_num + tokenizer.slice_end + ) + else: + image_placeholder = ( + tokenizer.im_start + tokenizer.unk_token * query_num + tokenizer.im_end + ) cols = grid[0] rows = grid[1]