parent
							
								
									f8480678d8
								
							
						
					
					
						commit
						c92db47135
					
				| 
						 | 
				
			
			@@ -47,7 +47,6 @@ def InitDataset(config):
 | 
			
		|||
            print(f"INFO: Load dataset end")
 | 
			
		||||
        else:
 | 
			
		||||
            raw_dataset = MeaningDataset(start, start + size, vocab, None, conf.level_ratio, conf.min_subitem)
 | 
			
		||||
            print("INFO: raw_dataset.token_frequency" + raw_dataset.token_frequency())
 | 
			
		||||
            raw_dataset.set_mask(conf.mask_level, conf.mask_idx)
 | 
			
		||||
            train_dataset, val_dataset = raw_dataset.split(0.9)
 | 
			
		||||
            torch.save(train_dataset, trainfile)
 | 
			
		||||
| 
						 | 
				
			
			
 | 
			
		|||
		Loading…
	
		Reference in New Issue