From a70e19df5d2cc2f8d1652b9e251c0aa143d6dee3 Mon Sep 17 00:00:00 2001 From: Colin <> Date: Sun, 10 Aug 2025 15:25:14 +0800 Subject: [PATCH] Init status. --- wit/train.py | 13 ++++++++----- 1 file changed, 8 insertions(+), 5 deletions(-) diff --git a/wit/train.py b/wit/train.py index 48a6c99..a1f6989 100644 --- a/wit/train.py +++ b/wit/train.py @@ -7,7 +7,7 @@ from model.modeling_rwkv7 import RWKVLMHeadModel from logger import TBLogger import configuration -import dataset.dataset as ds +import meaning as m import numpy as np if __name__ == "__main__": @@ -29,10 +29,13 @@ if __name__ == "__main__": conf.seed = 42 conf.dataloader_works = 2 - conf.dataset.meaning.start = 800 - conf.dataset.meaning.size = 200000 + conf.dataset.meaning.start = 10000 + conf.dataset.meaning.end = 200000 + conf.dataset.meaning.size = None conf.dataset.meaning.min_subitem = 2 - conf.dataset.meaning.max_subitem = 4 + conf.dataset.meaning.max_subitem = 6 + conf.dataset.meaning.stride = 1 + conf.dataset.meaning.with_tree = False conf.dataset.meaning.val_mask_level = [0, 1, 2] conf.dataset.meaning.val_mask_idx = [0, 0, -1] @@ -50,7 +53,7 @@ if __name__ == "__main__": # model = RWKVLMHeadModel(conf.model_config) qwen = LightModule(conf, model) - train_dataloader, val_dataloader = ds.InitDataset(conf) + train_dataloader, val_dataloader = m.InitDataset(conf) # for i in range(len(train_dataloader)): # print(train_dataloader.print_mapping(i))