1515from .rope2d import get_rope_index_2 , get_rope_index_25
1616
# Define placeholder paths and settings for each dataset split.
# Configuration for the IIGN dataset stored under `mp3d_split1`.
# NOTE(review): "height", "pitch_1" and "pitch_2" look like camera height and
# pitch settings; their units are not visible in this file — confirm against
# the code that consumes them.
IIGN_split1 = {
    "data_path": "projects/VL-LN-Bench/traj_data/mp3d_split1",
    "height": 125,
    "pitch_1": 0,
    "pitch_2": 30,
}
2424
# Configuration for the IIGN dataset stored under `mp3d_split2`.
# NOTE(review): "height", "pitch_1" and "pitch_2" look like camera height and
# pitch settings; their units are not visible in this file — confirm against
# the code that consumes them.
IIGN_split2 = {
    "data_path": "projects/VL-LN-Bench/traj_data/mp3d_split2",
    "height": 125,
    "pitch_1": 0,
    "pitch_2": 30,
}
3131
# Configuration for the IIGN dataset stored under `mp3d_split3`.
# NOTE(review): "height", "pitch_1" and "pitch_2" look like camera height and
# pitch settings; their units are not visible in this file — confirm against
# the code that consumes them.
IIGN_split3 = {
    "data_path": "projects/VL-LN-Bench/traj_data/mp3d_split3",
    "height": 125,
    "pitch_1": 0,
    "pitch_2": 30,
}
3838
# Registry mapping dataset names to their configuration dicts.
# NOTE(review): presumably these are the names accepted in
# `data_args.iign_dataset_use` and resolved by `data_list` — confirm there.
# Keys carry no surrounding whitespace so that names split out of a
# comma-separated string can match them exactly.
data_dict = {
    "iign_split1": IIGN_split1,
    "iign_split2": IIGN_split2,
    "iign_split3": IIGN_split3,
}
4444
# Sentinel label value for positions that should be ignored.
# NOTE(review): presumably chosen to match the default `ignore_index` (-100)
# of torch.nn.CrossEntropyLoss — confirm at the use site.
IGNORE_INDEX = -100
5555
5656class VLLNDataset (Dataset ):
5757 """
58- Dataset for 'Vision-Language'-'Language-Navigation' (VL-LN) / IION -style training.
58+ Dataset for 'Vision-Language'-'Language-Navigation' (VL-LN) / IIGN -style training.
5959
6060 Args:
6161 tokenizer (transformers.PreTrainedTokenizer): Tokenizer used to encode
6262 the chat template and produce `input_ids` / `labels`.
6363 data_args: A config-like object that must provide at least:
64- - iion_dataset_use (str): comma-separated dataset names, optionally
65- with sampling rate suffix like `iion_split1 %50`.
64+ - iign_dataset_use (str): comma-separated dataset names, optionally
65+ with sampling rate suffix like `iign_split1 %50`.
6666 - model_type (str): decides which rope-index function to use.
6767 - sample_step (int): stride for sampling start frames.
6868 - pixel_goal_only (bool): whether to keep only pixel-goal samples.
@@ -74,7 +74,7 @@ class VLLNDataset(Dataset):
7474
7575 def __init__ (self , tokenizer : transformers .PreTrainedTokenizer , data_args ):
7676 super (VLLNDataset , self ).__init__ ()
77- dataset = data_args .iion_dataset_use .split ("," )
77+ dataset = data_args .iign_dataset_use .split ("," )
7878 dataset_list = data_list (dataset )
7979 rank0_print (f"Loading datasets: { dataset_list } " )
8080 self .video_max_total_pixels = getattr (data_args , "video_max_total_pixels" , 1664 * 28 * 28 )
0 commit comments