[Feature] Add multimodal (mm) token usage (#4570)

* add multimodal (mm) token usage

* fix unit test

* fix unit test

* fix unit test

* fix model path

* fix unit test

* fix unit test

* fix unit test

* remove uncomment

* change var name

* fix code style

* fix code style

* fix code style

* fix code style

* fix unit test
This commit is contained in:
ApplEOFDiscord
2025-10-29 14:37:12 +08:00
committed by GitHub
parent fc5cd1adb1
commit 14f8cddaf1
9 changed files with 70 additions and 20 deletions

View File

@@ -142,6 +142,8 @@ class DataProcessor:
"labels": [],
"cur_position": 0,
"video_cnt": 0,
"num_input_image_tokens": 0,
"num_input_video_tokens": 0,
"fps": [],
"mm_positions": [],
"mm_hashes": [],
@@ -351,6 +353,7 @@ class DataProcessor:
outputs["mm_positions"].append(ImagePosition(len(outputs["input_ids"]), num_tokens))
outputs["input_ids"].extend([self.image_token_id] * num_tokens)
outputs["token_type_ids"].extend([IDS_TYPE_FLAG["image"]] * num_tokens)
outputs["num_input_image_tokens"] += int(num_tokens)
outputs["images"].append(ret["pixel_values"])
if not uuid:
@@ -409,6 +412,7 @@ class DataProcessor:
outputs["mm_positions"].append(ImagePosition(len(outputs["input_ids"]), num_tokens))
outputs["input_ids"].extend([self.video_token_id] * num_tokens)
outputs["token_type_ids"].extend([IDS_TYPE_FLAG["video"]] * num_tokens)
outputs["num_input_video_tokens"] += int(num_tokens)
outputs["images"].append(ret["pixel_values"])
if not uuid: