mirror of https://github.com/InternLM/InternLM
				
				
				
			feat(data/utils.py): add new dataset type code for streaming dataset (#225)
							parent
							
								
									94b2aa28fc
								
							
						
					
					
						commit
						fd28bcab58
					
				| 
						 | 
				
			
			@ -5,7 +5,7 @@ import torch
 | 
			
		|||
 | 
			
		||||
from internlm.core.context import global_context as gpc
 | 
			
		||||
 | 
			
		||||
DATASET_TYPE_IDS_MAP = {"en": 0, "cn": 1}
 | 
			
		||||
DATASET_TYPE_IDS_MAP = {"en": 0, "cn": 1, "code": 2}
 | 
			
		||||
 | 
			
		||||
 | 
			
		||||
def get_dataset_type_id(path):
 | 
			
		||||
| 
						 | 
				
			
			
 | 
			
		|||
		Loading…
	
		Reference in New Issue