123 committed on Jan 12

Commit

addbf21

1 Parent(s): 3192c09

upload ckpts

Files changed (26) hide show

100_percent/LLM-Augmented-MTR/best_eval_record.txt +40 -0
100_percent/LLM-Augmented-MTR/checkpoint_epoch_26.pth +3 -0
100_percent/LLM-Augmented-MTR/log_train_20240516-100200.txt +0 -0
100_percent/LLM-Augmented-MTR/log_train_20240516-143350.txt +0 -0
100_percent/LLM-Augmented-MTR/log_train_20240518-102918.txt +1038 -0
100_percent/LLM-Augmented-MTR/log_train_20240518-104841.txt +0 -0
100_percent/MTR/best_eval_record.txt +40 -0
100_percent/MTR/checkpoint_epoch_30.pth +3 -0
100_percent/MTR/log_train_20230318-135944.txt +0 -0
100_percent/MTR/log_train_20230323-015050.txt +0 -0
100_percent/MTR/log_train_20230324-224338.txt +0 -0
20_percent/LLM-Augmented-MTR/best_eval_record.txt +42 -0
20_percent/LLM-Augmented-MTR/checkpoint_epoch_29.pth +3 -0
20_percent/LLM-Augmented-MTR/log_train_20240227-140250.txt +0 -0
20_percent/MTR/best_eval_record.txt +42 -0
20_percent/MTR/checkpoint_epoch_29.pth +3 -0
20_percent/MTR/log_train_20240315-005422.txt +0 -0
20_percent/MTR/log_train_20240315-075642.txt +0 -0
5_percent/LLM-Augmented-MTR/best_eval_record.txt +40 -0
5_percent/LLM-Augmented-MTR/checkpoint_epoch_28.pth +3 -0
5_percent/LLM-Augmented-MTR/log_train_20240519-174533.txt +0 -0
5_percent/LLM-Augmented-MTR/log_train_20240520-084733.txt +0 -0
5_percent/MTR/best_eval_record.txt +42 -0
5_percent/MTR/checkpoint_epoch_28.pth +3 -0
5_percent/MTR/log_train_20240429-093927.txt +0 -0
README.md +60 -0

100_percent/LLM-Augmented-MTR/best_eval_record.txt ADDED Viewed

	@@ -0,0 +1,40 @@

+epoch_1 mAP 0.23161921567387053
+best_epoch_1 mAP 0.23161921567387053
+epoch_4 mAP 0.3319349918100569
+best_epoch_4 mAP 0.3319349918100569
+epoch_6 mAP 0.3404955714941025
+best_epoch_6 mAP 0.3404955714941025
+epoch_8 mAP 0.37202317184872097
+best_epoch_8 mAP 0.37202317184872097
+epoch_10 mAP 0.3758834236198001
+best_epoch_10 mAP 0.3758834236198001
+epoch_12 mAP 0.37917777564790517
+best_epoch_12 mAP 0.37917777564790517
+epoch_14 mAP 0.37314530710379284
+best_epoch_12 mAP 0.37917777564790517
+epoch_16 mAP 0.39642529024018175
+best_epoch_16 mAP 0.39642529024018175
+epoch_18 mAP 0.40432000160217285
+best_epoch_18 mAP 0.40432000160217285
+epoch_20 mAP 0.4059317045741611
+best_epoch_20 mAP 0.4059317045741611
+epoch_21 mAP 0.40459092126952273
+best_epoch_20 mAP 0.4059317045741611
+epoch_22 mAP 0.4035279485914442
+best_epoch_20 mAP 0.4059317045741611
+epoch_23 mAP 0.4111773471037547
+best_epoch_23 mAP 0.4111773471037547
+epoch_24 mAP 0.41981253690189785
+best_epoch_24 mAP 0.41981253690189785
+epoch_25 mAP 0.4195335838529799
+best_epoch_24 mAP 0.41981253690189785
+epoch_26 mAP 0.4268754555119409
+best_epoch_26 mAP 0.4268754555119409
+epoch_27 mAP 0.42183637287881637
+best_epoch_26 mAP 0.4268754555119409
+epoch_28 mAP 0.4209697412119972
+best_epoch_26 mAP 0.4268754555119409
+epoch_29 mAP 0.4222996963395012
+best_epoch_26 mAP 0.4268754555119409
+epoch_30 mAP 0.4242007202572293
+best_epoch_26 mAP 0.4268754555119409

100_percent/LLM-Augmented-MTR/checkpoint_epoch_26.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc53c6fbae714165ac201d28f8b6ea1fd558ffb45a9bca22cdfab00484d60d1e
+size 843700702

100_percent/LLM-Augmented-MTR/log_train_20240516-100200.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

100_percent/LLM-Augmented-MTR/log_train_20240516-143350.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

100_percent/LLM-Augmented-MTR/log_train_20240518-102918.txt ADDED Viewed

	@@ -0,0 +1,1038 @@

+2024-05-18 10:29:18,049   INFO  **********************Start logging**********************
+2024-05-18 10:29:18,049   INFO  CUDA_VISIBLE_DEVICES=4,5,6,7
+2024-05-18 10:29:18,050   INFO  total_batch_size: 52
+2024-05-18 10:29:18,050   INFO  cfg_file         cfgs/waymo/mtr+100_percent_data_llm_augmented.yaml
+2024-05-18 10:29:18,050   INFO  batch_size       13
+2024-05-18 10:29:18,050   INFO  epochs           30
+2024-05-18 10:29:18,050   INFO  workers          8
+2024-05-18 10:29:18,050   INFO  extra_tag        llm_augmented_mtr+100_percent_attn_loop_learned_gate_inside+change_context_window_8_layer_4
+2024-05-18 10:29:18,050   INFO  ckpt             None
+2024-05-18 10:29:18,050   INFO  pretrained_model None
+2024-05-18 10:29:18,050   INFO  launcher         pytorch
+2024-05-18 10:29:18,050   INFO  tcp_port         18888
+2024-05-18 10:29:18,050   INFO  without_sync_bn  False
+2024-05-18 10:29:18,050   INFO  fix_random_seed  False
+2024-05-18 10:29:18,050   INFO  ckpt_save_interval 2
+2024-05-18 10:29:18,050   INFO  local_rank       0
+2024-05-18 10:29:18,050   INFO  max_ckpt_save_num 5
+2024-05-18 10:29:18,050   INFO  merge_all_iters_to_one_epoch False
+2024-05-18 10:29:18,050   INFO  set_cfgs         None
+2024-05-18 10:29:18,050   INFO  max_waiting_mins 0
+2024-05-18 10:29:18,050   INFO  start_epoch      0
+2024-05-18 10:29:18,050   INFO  save_to_file     False
+2024-05-18 10:29:18,050   INFO  not_eval_with_train False
+2024-05-18 10:29:18,050   INFO  logger_iter_interval 50
+2024-05-18 10:29:18,050   INFO  ckpt_save_time_interval 300
+2024-05-18 10:29:18,050   INFO  add_worker_init_fn False
+2024-05-18 10:29:18,051   INFO  dataset_type
+2024-05-18 10:29:18,051   INFO  cfg.ROOT_DIR: /home/aidrive/zhengxj/projects_new/MTR_new
+2024-05-18 10:29:18,051   INFO  cfg.LOCAL_RANK: 0
+2024-05-18 10:29:18,051   INFO
+cfg.DATA_CONFIG = edict()
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.DATASET: WaymoDataset
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.OBJECT_TYPE: ['TYPE_VEHICLE', 'TYPE_PEDESTRIAN', 'TYPE_CYCLIST']
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.DATA_ROOT: /home/DISCOVER/yanzj/workspace/code/MTR/data/waymo/mtr_processed
+2024-05-18 10:29:18,055   INFO
+cfg.DATA_CONFIG.SPLIT_DIR = edict()
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.SPLIT_DIR.train: processed_scenarios_training
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.SPLIT_DIR.valid: processed_scenarios_validation
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.SPLIT_DIR.test: processed_scenarios_testing
+2024-05-18 10:29:18,055   INFO
+cfg.DATA_CONFIG.INFO_FILE = edict()
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.INFO_FILE.train: processed_scenarios_training_infos.pkl
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.INFO_FILE.valid: processed_scenarios_val_infos.pkl
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.INFO_FILE.test: processed_scenarios_test_infos.pkl
+2024-05-18 10:29:18,055   INFO
+cfg.DATA_CONFIG.SAMPLE_INTERVAL = edict()
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.SAMPLE_INTERVAL.train: 1
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.SAMPLE_INTERVAL.valid: 1
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.SAMPLE_INTERVAL.test: 1
+2024-05-18 10:29:18,055   INFO
+cfg.DATA_CONFIG.INFO_FILTER_DICT = edict()
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.INFO_FILTER_DICT.filter_info_by_object_type: ['TYPE_VEHICLE', 'TYPE_PEDESTRIAN', 'TYPE_CYCLIST']
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.POINT_SAMPLED_INTERVAL: 1
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.NUM_POINTS_EACH_POLYLINE: 20
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.VECTOR_BREAK_DIST_THRESH: 1.0
+2024-05-18 10:29:18,055   INFO  cfg.DATA_CONFIG.NUM_OF_SRC_POLYLINES: 768
+2024-05-18 10:29:18,056   INFO  cfg.DATA_CONFIG.CENTER_OFFSET_OF_MAP: [30.0, 0]
+2024-05-18 10:29:18,056   INFO  cfg.DATA_CONFIG.LOAD_CONTEXT_DATA: True
+2024-05-18 10:29:18,056   INFO  cfg.DATA_CONFIG.GENERATE_EMBEDDING: False
+2024-05-18 10:29:18,056   INFO  cfg.DATA_CONFIG.RETRIEVAL_WINDOW_SIZE: 8
+2024-05-18 10:29:18,056   INFO  cfg.DATA_CONFIG.ENCODER_FOR_CONTEXT: 100
+2024-05-18 10:29:18,056   INFO
+cfg.MODEL = edict()
+2024-05-18 10:29:18,056   INFO
+cfg.MODEL.CONTEXT_ENCODER = edict()
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.NAME: MTREncoder
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.NUM_OF_ATTN_NEIGHBORS: 16
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.NUM_INPUT_ATTR_AGENT: 29
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.NUM_INPUT_ATTR_MAP: 9
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.NUM_CHANNEL_IN_MLP_AGENT: 256
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.NUM_CHANNEL_IN_MLP_MAP: 64
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.NUM_LAYER_IN_MLP_AGENT: 3
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.NUM_LAYER_IN_MLP_MAP: 5
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.NUM_LAYER_IN_PRE_MLP_MAP: 3
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.D_MODEL: 256
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.NUM_ATTN_LAYERS: 6
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.NUM_ATTN_HEAD: 8
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.DROPOUT_OF_ATTN: 0.1
+2024-05-18 10:29:18,056   INFO  cfg.MODEL.CONTEXT_ENCODER.USE_LOCAL_ATTN: True
+2024-05-18 10:29:18,056   INFO
+cfg.MODEL.MOTION_DECODER = edict()
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.NAME: MTRDecoder
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.OBJECT_TYPE: ['TYPE_VEHICLE', 'TYPE_PEDESTRIAN', 'TYPE_CYCLIST']
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.CENTER_OFFSET_OF_MAP: [30.0, 0]
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.NUM_FUTURE_FRAMES: 80
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.NUM_MOTION_MODES: 6
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.INTENTION_POINTS_FILE: data/waymo/cluster_64_center_dict.pkl
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.D_MODEL: 512
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.NUM_DECODER_LAYERS: 6
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.NUM_ATTN_HEAD: 8
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.MAP_D_MODEL: 256
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.DROPOUT_OF_ATTN: 0.1
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.NUM_BASE_MAP_POLYLINES: 256
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.NUM_WAYPOINT_MAP_POLYLINES: 128
+2024-05-18 10:29:18,057   INFO
+cfg.MODEL.MOTION_DECODER.LOSS_WEIGHTS = edict()
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.LOSS_WEIGHTS.cls: 1.0
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.LOSS_WEIGHTS.reg: 1.0
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.LOSS_WEIGHTS.vel: 0.5
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.NMS_DIST_THRESH: 2.5
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.LOAD_CONTEXT_DATA: True
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.MOTION_DECODER.RETRIEVAL_WINDOW_SIZE: 8
+2024-05-18 10:29:18,057   INFO  cfg.MODEL.GENERATE_EMBEDDING: False
+2024-05-18 10:29:18,057   INFO
+cfg.OPTIMIZATION = edict()
+2024-05-18 10:29:18,057   INFO  cfg.OPTIMIZATION.BATCH_SIZE_PER_GPU: 10
+2024-05-18 10:29:18,057   INFO  cfg.OPTIMIZATION.NUM_EPOCHS: 30
+2024-05-18 10:29:18,058   INFO  cfg.OPTIMIZATION.OPTIMIZER: AdamW
+2024-05-18 10:29:18,058   INFO  cfg.OPTIMIZATION.LR: 0.0001
+2024-05-18 10:29:18,058   INFO  cfg.OPTIMIZATION.WEIGHT_DECAY: 0.01
+2024-05-18 10:29:18,058   INFO  cfg.OPTIMIZATION.SCHEDULER: lambdaLR
+2024-05-18 10:29:18,058   INFO  cfg.OPTIMIZATION.DECAY_STEP_LIST: [22, 24, 26, 28]
+2024-05-18 10:29:18,058   INFO  cfg.OPTIMIZATION.LR_DECAY: 0.5
+2024-05-18 10:29:18,058   INFO  cfg.OPTIMIZATION.LR_CLIP: 1e-06
+2024-05-18 10:29:18,058   INFO  cfg.OPTIMIZATION.GRAD_NORM_CLIP: 1000.0
+2024-05-18 10:29:18,058   INFO  cfg.TAG: mtr+100_percent_data_llm_augmented
+2024-05-18 10:29:18,058   INFO  cfg.EXP_GROUP_PATH: waymo
+2024-05-18 10:29:18,135   INFO  Start to load infos from /home/DISCOVER/yanzj/workspace/code/MTR/data/waymo/mtr_processed/processed_scenarios_training_infos.pkl
+2024-05-18 10:29:31,419   INFO  Total scenes before filters: 487002
+2024-05-18 10:29:41,038   INFO  Total scenes after filter_info_by_object_type: 487002
+2024-05-18 10:29:41,063   INFO  Total scenes after filters: 487002
+2024-05-18 10:29:41,064   INFO  Start to load context from /home/aidrive/zhengxj/projects_new/MTR_new/LLM_integrate/context_data/train/context_data_encoder_100.pkl
+2024-05-18 10:30:18,067   INFO  Total scenes in context info file: 487002
+2024-05-18 10:31:55,387   INFO  ==> Loading parameters from checkpoint /home/aidrive/zhengxj/projects_new/MTR_new/output/waymo/mtr+100_percent_data_llm_augmented/llm_augmented_mtr+100_percent_attn_loop_learned_gate_inside+change_context_window_8_layer_4/ckpt/latest_model.pth to CPU
+2024-05-18 10:31:57,791   INFO  ==> Loading optimizer parameters from checkpoint /home/aidrive/zhengxj/projects_new/MTR_new/output/waymo/mtr+100_percent_data_llm_augmented/llm_augmented_mtr+100_percent_attn_loop_learned_gate_inside+change_context_window_8_layer_4/ckpt/latest_model.pth to CPU
+2024-05-18 10:31:59,104   INFO  ==> Done (loaded 894/894)
+2024-05-18 10:32:00,840   INFO  DistributedDataParallel(
+  (module): MotionTransformer(
+    (context_encoder): MTREncoder(
+      (agent_polyline_encoder): PointNetPolylineEncoder(
+        (pre_mlps): Sequential(
+          (0): Linear(in_features=30, out_features=256, bias=False)
+          (1): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+        )
+        (mlps): Sequential(
+          (0): Linear(in_features=512, out_features=256, bias=False)
+          (1): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=256, out_features=256, bias=False)
+          (4): SyncBatchNorm(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+        )
+        (out_mlps): Sequential(
+          (0): Linear(in_features=256, out_features=256, bias=True)
+          (1): ReLU()
+          (2): Linear(in_features=256, out_features=256, bias=True)
+        )
+      )
+      (map_polyline_encoder): PointNetPolylineEncoder(
+        (pre_mlps): Sequential(
+          (0): Linear(in_features=9, out_features=64, bias=False)
+          (1): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=64, out_features=64, bias=False)
+          (4): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=64, out_features=64, bias=False)
+          (7): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (8): ReLU()
+        )
+        (mlps): Sequential(
+          (0): Linear(in_features=128, out_features=64, bias=False)
+          (1): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=64, out_features=64, bias=False)
+          (4): SyncBatchNorm(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+        )
+        (out_mlps): Sequential(
+          (0): Linear(in_features=64, out_features=64, bias=True)
+          (1): ReLU()
+          (2): Linear(in_features=64, out_features=256, bias=True)
+        )
+      )
+      (self_attn_layers): ModuleList(
+        (0): TransformerEncoderLayer(
+          (self_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (dropout2): Dropout(p=0.1, inplace=False)
+        )
+        (1): TransformerEncoderLayer(
+          (self_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (dropout2): Dropout(p=0.1, inplace=False)
+        )
+        (2): TransformerEncoderLayer(
+          (self_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (dropout2): Dropout(p=0.1, inplace=False)
+        )
+        (3): TransformerEncoderLayer(
+          (self_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (dropout2): Dropout(p=0.1, inplace=False)
+        )
+        (4): TransformerEncoderLayer(
+          (self_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (dropout2): Dropout(p=0.1, inplace=False)
+        )
+        (5): TransformerEncoderLayer(
+          (self_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (dropout2): Dropout(p=0.1, inplace=False)
+        )
+      )
+    )
+    (motion_decoder): MTRDecoder(
+      (in_proj_center_obj): Sequential(
+        (0): Linear(in_features=256, out_features=512, bias=True)
+        (1): ReLU()
+        (2): Linear(in_features=512, out_features=512, bias=True)
+      )
+      (in_proj_obj): Sequential(
+        (0): Linear(in_features=256, out_features=512, bias=True)
+        (1): ReLU()
+        (2): Linear(in_features=512, out_features=512, bias=True)
+      )
+      (obj_decoder_layers): ModuleList(
+        (0): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (norm1): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=512, out_features=512, bias=True)
+          (cross_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (linear1): Linear(in_features=512, out_features=2048, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=2048, out_features=512, bias=True)
+          (norm2): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+        (1): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (norm1): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=512, out_features=512, bias=True)
+          (cross_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (linear1): Linear(in_features=512, out_features=2048, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=2048, out_features=512, bias=True)
+          (norm2): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+        (2): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (norm1): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=512, out_features=512, bias=True)
+          (cross_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (linear1): Linear(in_features=512, out_features=2048, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=2048, out_features=512, bias=True)
+          (norm2): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+        (3): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (norm1): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=512, out_features=512, bias=True)
+          (cross_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (linear1): Linear(in_features=512, out_features=2048, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=2048, out_features=512, bias=True)
+          (norm2): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+        (4): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (norm1): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=512, out_features=512, bias=True)
+          (cross_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (linear1): Linear(in_features=512, out_features=2048, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=2048, out_features=512, bias=True)
+          (norm2): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+        (5): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (sa_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (norm1): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kcontent_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_kpos_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_v_proj): Linear(in_features=512, out_features=512, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=512, out_features=512, bias=True)
+          (cross_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=512, out_features=512, bias=True)
+          )
+          (linear1): Linear(in_features=512, out_features=2048, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=2048, out_features=512, bias=True)
+          (norm2): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+      )
+      (in_proj_map): Sequential(
+        (0): Linear(in_features=256, out_features=256, bias=True)
+        (1): ReLU()
+        (2): Linear(in_features=256, out_features=256, bias=True)
+      )
+      (map_decoder_layers): ModuleList(
+        (0): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=256, out_features=256, bias=True)
+          (cross_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+        (1): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=256, out_features=256, bias=True)
+          (cross_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+        (2): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=256, out_features=256, bias=True)
+          (cross_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+        (3): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=256, out_features=256, bias=True)
+          (cross_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+        (4): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=256, out_features=256, bias=True)
+          (cross_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+        (5): TransformerDecoderLayer(
+          (sa_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (sa_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (self_attn): MultiheadAttention(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout1): Dropout(p=0.1, inplace=False)
+          (ca_qcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kcontent_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_kpos_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_v_proj): Linear(in_features=256, out_features=256, bias=True)
+          (ca_qpos_sine_proj): Linear(in_features=256, out_features=256, bias=True)
+          (cross_attn): MultiheadAttentionLocal(
+            (out_proj): Linear(in_features=256, out_features=256, bias=True)
+          )
+          (linear1): Linear(in_features=256, out_features=1024, bias=True)
+          (dropout): Dropout(p=0.1, inplace=False)
+          (linear2): Linear(in_features=1024, out_features=256, bias=True)
+          (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (norm3): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
+          (dropout2): Dropout(p=0.1, inplace=False)
+          (dropout3): Dropout(p=0.1, inplace=False)
+        )
+      )
+      (map_query_content_mlps): ModuleList(
+        (0): Linear(in_features=512, out_features=256, bias=True)
+        (1): Linear(in_features=512, out_features=256, bias=True)
+        (2): Linear(in_features=512, out_features=256, bias=True)
+        (3): Linear(in_features=512, out_features=256, bias=True)
+        (4): Linear(in_features=512, out_features=256, bias=True)
+        (5): Linear(in_features=512, out_features=256, bias=True)
+      )
+      (map_query_embed_mlps): Linear(in_features=512, out_features=256, bias=True)
+      (obj_pos_encoding_layer): Sequential(
+        (0): Linear(in_features=2, out_features=512, bias=True)
+        (1): ReLU()
+        (2): Linear(in_features=512, out_features=512, bias=True)
+        (3): ReLU()
+        (4): Linear(in_features=512, out_features=512, bias=True)
+      )
+      (dense_future_head): Sequential(
+        (0): Linear(in_features=1024, out_features=512, bias=False)
+        (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+        (2): ReLU()
+        (3): Linear(in_features=512, out_features=512, bias=False)
+        (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+        (5): ReLU()
+        (6): Linear(in_features=512, out_features=560, bias=True)
+      )
+      (future_traj_mlps): Sequential(
+        (0): Linear(in_features=320, out_features=512, bias=True)
+        (1): ReLU()
+        (2): Linear(in_features=512, out_features=512, bias=True)
+        (3): ReLU()
+        (4): Linear(in_features=512, out_features=512, bias=True)
+      )
+      (traj_fusion_mlps): Sequential(
+        (0): Linear(in_features=1024, out_features=512, bias=True)
+        (1): ReLU()
+        (2): Linear(in_features=512, out_features=512, bias=True)
+        (3): ReLU()
+        (4): Linear(in_features=512, out_features=512, bias=True)
+      )
+      (intention_query_mlps): Sequential(
+        (0): Linear(in_features=512, out_features=512, bias=False)
+        (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+        (2): ReLU()
+        (3): Linear(in_features=512, out_features=512, bias=True)
+      )
+      (context_proj_layer): Sequential(
+        (0): Linear(in_features=17, out_features=512, bias=True)
+        (1): ReLU()
+        (2): Linear(in_features=512, out_features=512, bias=True)
+      )
+      (context_multi_head_attn): ModuleList(
+        (0): MultiheadAttention(
+          (out_proj): NonDynamicallyQuantizableLinear(in_features=512, out_features=512, bias=True)
+        )
+        (1): MultiheadAttention(
+          (out_proj): NonDynamicallyQuantizableLinear(in_features=512, out_features=512, bias=True)
+        )
+        (2): MultiheadAttention(
+          (out_proj): NonDynamicallyQuantizableLinear(in_features=512, out_features=512, bias=True)
+        )
+        (3): MultiheadAttention(
+          (out_proj): NonDynamicallyQuantizableLinear(in_features=512, out_features=512, bias=True)
+        )
+      )
+      (gate_proj_layers): ModuleList(
+        (0): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=1, bias=True)
+        )
+        (1): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=1, bias=True)
+        )
+        (2): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=1, bias=True)
+        )
+        (3): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=1, bias=True)
+        )
+      )
+      (query_feature_fusion_layers): ModuleList(
+        (0): Sequential(
+          (0): Linear(in_features=1280, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=True)
+        )
+        (1): Sequential(
+          (0): Linear(in_features=1280, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=True)
+        )
+        (2): Sequential(
+          (0): Linear(in_features=1280, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=True)
+        )
+        (3): Sequential(
+          (0): Linear(in_features=1280, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=True)
+        )
+        (4): Sequential(
+          (0): Linear(in_features=1280, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=True)
+        )
+        (5): Sequential(
+          (0): Linear(in_features=1280, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=True)
+        )
+      )
+      (motion_reg_heads): ModuleList(
+        (0): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=560, bias=True)
+        )
+        (1): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=560, bias=True)
+        )
+        (2): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=560, bias=True)
+        )
+        (3): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=560, bias=True)
+        )
+        (4): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=560, bias=True)
+        )
+        (5): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=560, bias=True)
+        )
+      )
+      (motion_cls_heads): ModuleList(
+        (0): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=1, bias=True)
+        )
+        (1): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=1, bias=True)
+        )
+        (2): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=1, bias=True)
+        )
+        (3): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=1, bias=True)
+        )
+        (4): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=1, bias=True)
+        )
+        (5): Sequential(
+          (0): Linear(in_features=512, out_features=512, bias=False)
+          (1): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (2): ReLU()
+          (3): Linear(in_features=512, out_features=512, bias=False)
+          (4): SyncBatchNorm(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
+          (5): ReLU()
+          (6): Linear(in_features=512, out_features=1, bias=True)
+        )
+      )
+    )
+  )
+)
+2024-05-18 10:32:00,849   INFO  Total number of parameters: 71310426
+2024-05-18 10:32:00,850   INFO  Start to load infos from /home/DISCOVER/yanzj/workspace/code/MTR/data/waymo/mtr_processed/processed_scenarios_val_infos.pkl
+2024-05-18 10:32:01,586   INFO  Total scenes before filters: 44097
+2024-05-18 10:32:02,404   INFO  Total scenes after filter_info_by_object_type: 44097
+2024-05-18 10:32:02,409   INFO  Total scenes after filters: 44097
+2024-05-18 10:32:02,409   INFO  Start to load context from /home/aidrive/zhengxj/projects_new/MTR_new/LLM_integrate/context_data/valid/context_data_encoder_100.pkl
+2024-05-18 10:32:09,467   INFO  Total scenes in context info file: 44097
+2024-05-18 10:32:18,343   INFO  **********************Start training waymo/mtr+100_percent_data_llm_augmented(llm_augmented_mtr+100_percent_attn_loop_learned_gate_inside+change_context_window_8_layer_4)**********************
+2024-05-18 10:32:32,868   INFO  epoch: 21/30, acc_iter=131034, cur_iter=9275/9366, batch_size=13, iter_cost=8.56s, time_cost(epoch): 00:08/12:58, time_cost(all): 00:14/178:16:33, ade_TYPE_VEHICLE_layer_5=0.691, ade_TYPE_PEDESTRIAN_layer_5=0.178, ade_TYPE_CYCLIST_layer_5=0.385, loss=106.815, lr=0.0001
+2024-05-18 10:32:53,257   INFO  epoch: 21/30, acc_iter=131050, cur_iter=9291/9366, batch_size=13, iter_cost=1.70s, time_cost(epoch): 00:28/02:07, time_cost(all): 00:34/35:28:21, ade_TYPE_VEHICLE_layer_5=0.765, ade_TYPE_PEDESTRIAN_layer_5=0.331, ade_TYPE_CYCLIST_layer_5=0.484, loss=93.268, lr=0.0001
+2024-05-18 10:33:52,925   INFO  epoch: 21/30, acc_iter=131100, cur_iter=9341/9366, batch_size=13, iter_cost=1.32s, time_cost(epoch): 01:28/00:33, time_cost(all): 01:34/27:32:10, ade_TYPE_VEHICLE_layer_5=0.654, ade_TYPE_PEDESTRIAN_layer_5=0.322, ade_TYPE_CYCLIST_layer_5=0.868, loss=54.603, lr=0.0001
+2024-05-18 10:34:20,693   INFO  epoch: 21/30, acc_iter=131124, cur_iter=9365/9366, batch_size=13, iter_cost=1.28s, time_cost(epoch): 01:56/00:01, time_cost(all): 02:02/26:37:06, ade_TYPE_VEHICLE_layer_5=0.588, ade_TYPE_PEDESTRIAN_layer_5=0.244, ade_TYPE_CYCLIST_layer_5=0.272, loss=42.187, lr=0.0001
+2024-05-18 10:34:36,717   INFO  *************** EPOCH 22 EVALUATION *****************
+2024-05-18 10:34:40,366   INFO  eval: epoch=22, batch_iter=0/849, batch_size=13, iter_cost=3.64s, time_cost: 00:03/51:31,
+2024-05-18 10:34:42,700   INFO  eval: epoch=22, batch_iter=10/849, batch_size=13, iter_cost=0.60s, time_cost: 00:05/08:21,
+2024-05-18 10:34:45,003   INFO  eval: epoch=22, batch_iter=20/849, batch_size=13, iter_cost=0.41s, time_cost: 00:08/05:43,
+2024-05-18 10:34:47,257   INFO  eval: epoch=22, batch_iter=30/849, batch_size=13, iter_cost=0.35s, time_cost: 00:10/04:47,
+2024-05-18 10:34:49,694   INFO  eval: epoch=22, batch_iter=40/849, batch_size=13, iter_cost=0.32s, time_cost: 00:12/04:22,
+2024-05-18 10:34:52,057   INFO  eval: epoch=22, batch_iter=50/849, batch_size=13, iter_cost=0.31s, time_cost: 00:15/04:05,
+2024-05-18 10:34:54,463   INFO  eval: epoch=22, batch_iter=60/849, batch_size=13, iter_cost=0.30s, time_cost: 00:17/03:53,
+2024-05-18 10:34:56,687   INFO  eval: epoch=22, batch_iter=70/849, batch_size=13, iter_cost=0.29s, time_cost: 00:19/03:42,
+2024-05-18 10:34:59,094   INFO  eval: epoch=22, batch_iter=80/849, batch_size=13, iter_cost=0.28s, time_cost: 00:22/03:35,
+2024-05-18 10:35:01,361   INFO  eval: epoch=22, batch_iter=90/849, batch_size=13, iter_cost=0.27s, time_cost: 00:24/03:27,
+2024-05-18 10:35:03,720   INFO  eval: epoch=22, batch_iter=100/849, batch_size=13, iter_cost=0.27s, time_cost: 00:26/03:22,
+2024-05-18 10:35:06,003   INFO  eval: epoch=22, batch_iter=110/849, batch_size=13, iter_cost=0.27s, time_cost: 00:29/03:16,
+2024-05-18 10:35:08,339   INFO  eval: epoch=22, batch_iter=120/849, batch_size=13, iter_cost=0.26s, time_cost: 00:31/03:12,
+2024-05-18 10:35:10,738   INFO  eval: epoch=22, batch_iter=130/849, batch_size=13, iter_cost=0.26s, time_cost: 00:34/03:08,
+2024-05-18 10:35:13,110   INFO  eval: epoch=22, batch_iter=140/849, batch_size=13, iter_cost=0.26s, time_cost: 00:36/03:04,
+2024-05-18 10:35:15,416   INFO  eval: epoch=22, batch_iter=150/849, batch_size=13, iter_cost=0.26s, time_cost: 00:38/03:00,
+2024-05-18 10:35:17,712   INFO  eval: epoch=22, batch_iter=160/849, batch_size=13, iter_cost=0.26s, time_cost: 00:40/02:56,
+2024-05-18 10:35:20,083   INFO  eval: epoch=22, batch_iter=170/849, batch_size=13, iter_cost=0.26s, time_cost: 00:43/02:53,
+2024-05-18 10:35:22,418   INFO  eval: epoch=22, batch_iter=180/849, batch_size=13, iter_cost=0.25s, time_cost: 00:45/02:49,
+2024-05-18 10:35:24,709   INFO  eval: epoch=22, batch_iter=190/849, batch_size=13, iter_cost=0.25s, time_cost: 00:47/02:46,
+2024-05-18 10:35:27,086   INFO  eval: epoch=22, batch_iter=200/849, batch_size=13, iter_cost=0.25s, time_cost: 00:50/02:43,
+2024-05-18 10:35:29,527   INFO  eval: epoch=22, batch_iter=210/849, batch_size=13, iter_cost=0.25s, time_cost: 00:52/02:40,
+2024-05-18 10:35:31,772   INFO  eval: epoch=22, batch_iter=220/849, batch_size=13, iter_cost=0.25s, time_cost: 00:55/02:37,
+2024-05-18 10:35:34,195   INFO  eval: epoch=22, batch_iter=230/849, batch_size=13, iter_cost=0.25s, time_cost: 00:57/02:34,
+2024-05-18 10:35:36,580   INFO  eval: epoch=22, batch_iter=240/849, batch_size=13, iter_cost=0.25s, time_cost: 00:59/02:31,
+2024-05-18 10:35:38,983   INFO  eval: epoch=22, batch_iter=250/849, batch_size=13, iter_cost=0.25s, time_cost: 01:02/02:29,
+2024-05-18 10:35:41,266   INFO  eval: epoch=22, batch_iter=260/849, batch_size=13, iter_cost=0.25s, time_cost: 01:04/02:26,
+2024-05-18 10:35:43,514   INFO  eval: epoch=22, batch_iter=270/849, batch_size=13, iter_cost=0.25s, time_cost: 01:06/02:23,
+2024-05-18 10:35:45,727   INFO  eval: epoch=22, batch_iter=280/849, batch_size=13, iter_cost=0.25s, time_cost: 01:09/02:20,
+2024-05-18 10:35:48,131   INFO  eval: epoch=22, batch_iter=290/849, batch_size=13, iter_cost=0.25s, time_cost: 01:11/02:17,
+2024-05-18 10:35:50,573   INFO  eval: epoch=22, batch_iter=300/849, batch_size=13, iter_cost=0.25s, time_cost: 01:13/02:15,
+2024-05-18 10:35:53,226   INFO  eval: epoch=22, batch_iter=310/849, batch_size=13, iter_cost=0.25s, time_cost: 01:16/02:13,
+2024-05-18 10:35:55,819   INFO  eval: epoch=22, batch_iter=320/849, batch_size=13, iter_cost=0.25s, time_cost: 01:19/02:10,
+2024-05-18 10:35:58,139   INFO  eval: epoch=22, batch_iter=330/849, batch_size=13, iter_cost=0.25s, time_cost: 01:21/02:08,
+2024-05-18 10:36:00,685   INFO  eval: epoch=22, batch_iter=340/849, batch_size=13, iter_cost=0.25s, time_cost: 01:23/02:05,
+2024-05-18 10:36:03,115   INFO  eval: epoch=22, batch_iter=350/849, batch_size=13, iter_cost=0.25s, time_cost: 01:26/02:03,
+2024-05-18 10:36:05,615   INFO  eval: epoch=22, batch_iter=360/849, batch_size=13, iter_cost=0.25s, time_cost: 01:28/02:00,
+2024-05-18 10:36:08,071   INFO  eval: epoch=22, batch_iter=370/849, batch_size=13, iter_cost=0.25s, time_cost: 01:31/01:58,
+2024-05-18 10:36:10,403   INFO  eval: epoch=22, batch_iter=380/849, batch_size=13, iter_cost=0.25s, time_cost: 01:33/01:55,
+2024-05-18 10:36:12,569   INFO  eval: epoch=22, batch_iter=390/849, batch_size=13, iter_cost=0.25s, time_cost: 01:35/01:52,
+2024-05-18 10:36:14,866   INFO  eval: epoch=22, batch_iter=400/849, batch_size=13, iter_cost=0.25s, time_cost: 01:38/01:50,
+2024-05-18 10:36:17,176   INFO  eval: epoch=22, batch_iter=410/849, batch_size=13, iter_cost=0.25s, time_cost: 01:40/01:47,
+2024-05-18 10:36:19,662   INFO  eval: epoch=22, batch_iter=420/849, batch_size=13, iter_cost=0.25s, time_cost: 01:42/01:45,
+2024-05-18 10:36:22,073   INFO  eval: epoch=22, batch_iter=430/849, batch_size=13, iter_cost=0.24s, time_cost: 01:45/01:42,
+2024-05-18 10:36:24,591   INFO  eval: epoch=22, batch_iter=440/849, batch_size=13, iter_cost=0.25s, time_cost: 01:47/01:40,
+2024-05-18 10:36:27,184   INFO  eval: epoch=22, batch_iter=450/849, batch_size=13, iter_cost=0.25s, time_cost: 01:50/01:37,
+2024-05-18 10:36:29,425   INFO  eval: epoch=22, batch_iter=460/849, batch_size=13, iter_cost=0.25s, time_cost: 01:52/01:35,
+2024-05-18 10:36:31,789   INFO  eval: epoch=22, batch_iter=470/849, batch_size=13, iter_cost=0.24s, time_cost: 01:55/01:32,
+2024-05-18 10:36:33,958   INFO  eval: epoch=22, batch_iter=480/849, batch_size=13, iter_cost=0.24s, time_cost: 01:57/01:30,
+2024-05-18 10:36:36,304   INFO  eval: epoch=22, batch_iter=490/849, batch_size=13, iter_cost=0.24s, time_cost: 01:59/01:27,
+2024-05-18 10:36:38,745   INFO  eval: epoch=22, batch_iter=500/849, batch_size=13, iter_cost=0.24s, time_cost: 02:02/01:25,
+2024-05-18 10:36:40,967   INFO  eval: epoch=22, batch_iter=510/849, batch_size=13, iter_cost=0.24s, time_cost: 02:04/01:22,
+2024-05-18 10:36:43,271   INFO  eval: epoch=22, batch_iter=520/849, batch_size=13, iter_cost=0.24s, time_cost: 02:06/01:20,
+2024-05-18 10:36:45,723   INFO  eval: epoch=22, batch_iter=530/849, batch_size=13, iter_cost=0.24s, time_cost: 02:08/01:17,
+2024-05-18 10:36:48,064   INFO  eval: epoch=22, batch_iter=540/849, batch_size=13, iter_cost=0.24s, time_cost: 02:11/01:15,
+2024-05-18 10:36:50,563   INFO  eval: epoch=22, batch_iter=550/849, batch_size=13, iter_cost=0.24s, time_cost: 02:13/01:12,
+2024-05-18 10:36:52,891   INFO  eval: epoch=22, batch_iter=560/849, batch_size=13, iter_cost=0.24s, time_cost: 02:16/01:10,
+2024-05-18 10:36:55,339   INFO  eval: epoch=22, batch_iter=570/849, batch_size=13, iter_cost=0.24s, time_cost: 02:18/01:07,
+2024-05-18 10:36:57,667   INFO  eval: epoch=22, batch_iter=580/849, batch_size=13, iter_cost=0.24s, time_cost: 02:20/01:05,
+2024-05-18 10:37:08,450   INFO  eval: epoch=22, batch_iter=590/849, batch_size=13, iter_cost=0.26s, time_cost: 02:31/01:06,
+2024-05-18 10:37:10,837   INFO  eval: epoch=22, batch_iter=600/849, batch_size=13, iter_cost=0.26s, time_cost: 02:34/01:03,
+2024-05-18 10:37:13,271   INFO  eval: epoch=22, batch_iter=610/849, batch_size=13, iter_cost=0.26s, time_cost: 02:36/01:01,
+2024-05-18 10:37:15,605   INFO  eval: epoch=22, batch_iter=620/849, batch_size=13, iter_cost=0.26s, time_cost: 02:38/00:58,
+2024-05-18 10:37:17,972   INFO  eval: epoch=22, batch_iter=630/849, batch_size=13, iter_cost=0.26s, time_cost: 02:41/00:56,
+2024-05-18 10:37:20,274   INFO  eval: epoch=22, batch_iter=640/849, batch_size=13, iter_cost=0.26s, time_cost: 02:43/00:53,
+2024-05-18 10:37:22,605   INFO  eval: epoch=22, batch_iter=650/849, batch_size=13, iter_cost=0.26s, time_cost: 02:45/00:50,
+2024-05-18 10:37:28,257   INFO  eval: epoch=22, batch_iter=660/849, batch_size=13, iter_cost=0.26s, time_cost: 02:51/00:49,
+2024-05-18 10:37:30,781   INFO  eval: epoch=22, batch_iter=670/849, batch_size=13, iter_cost=0.26s, time_cost: 02:54/00:46,
+2024-05-18 10:37:33,194   INFO  eval: epoch=22, batch_iter=680/849, batch_size=13, iter_cost=0.26s, time_cost: 02:56/00:43,
+2024-05-18 10:37:35,626   INFO  eval: epoch=22, batch_iter=690/849, batch_size=13, iter_cost=0.26s, time_cost: 02:58/00:41,
+2024-05-18 10:37:40,710   INFO  eval: epoch=22, batch_iter=700/849, batch_size=13, iter_cost=0.26s, time_cost: 03:03/00:39,
+2024-05-18 10:37:43,109   INFO  eval: epoch=22, batch_iter=710/849, batch_size=13, iter_cost=0.26s, time_cost: 03:06/00:36,
+2024-05-18 10:37:48,904   INFO  eval: epoch=22, batch_iter=720/849, batch_size=13, iter_cost=0.27s, time_cost: 03:12/00:34,
+2024-05-18 10:37:51,449   INFO  eval: epoch=22, batch_iter=730/849, batch_size=13, iter_cost=0.27s, time_cost: 03:14/00:31,
+2024-05-18 10:37:53,735   INFO  eval: epoch=22, batch_iter=740/849, batch_size=13, iter_cost=0.27s, time_cost: 03:17/00:29,
+2024-05-18 10:37:56,387   INFO  eval: epoch=22, batch_iter=750/849, batch_size=13, iter_cost=0.27s, time_cost: 03:19/00:26,
+2024-05-18 10:38:03,692   INFO  eval: epoch=22, batch_iter=760/849, batch_size=13, iter_cost=0.27s, time_cost: 03:26/00:24,
+2024-05-18 10:38:06,114   INFO  eval: epoch=22, batch_iter=770/849, batch_size=13, iter_cost=0.27s, time_cost: 03:29/00:21,
+2024-05-18 10:38:08,584   INFO  eval: epoch=22, batch_iter=780/849, batch_size=13, iter_cost=0.27s, time_cost: 03:31/00:18,
+2024-05-18 10:38:11,063   INFO  eval: epoch=22, batch_iter=790/849, batch_size=13, iter_cost=0.27s, time_cost: 03:34/00:16,
+2024-05-18 10:38:13,663   INFO  eval: epoch=22, batch_iter=800/849, batch_size=13, iter_cost=0.27s, time_cost: 03:36/00:13,
+2024-05-18 10:38:16,095   INFO  eval: epoch=22, batch_iter=810/849, batch_size=13, iter_cost=0.27s, time_cost: 03:39/00:10,
+2024-05-18 10:38:18,534   INFO  eval: epoch=22, batch_iter=820/849, batch_size=13, iter_cost=0.27s, time_cost: 03:41/00:07,
+2024-05-18 10:38:26,364   INFO  eval: epoch=22, batch_iter=830/849, batch_size=13, iter_cost=0.28s, time_cost: 03:49/00:05,
+2024-05-18 10:38:28,723   INFO  eval: epoch=22, batch_iter=840/849, batch_size=13, iter_cost=0.28s, time_cost: 03:51/00:02,
+2024-05-18 10:38:30,428   INFO  eval: epoch=22, batch_iter=848/849, batch_size=1, iter_cost=0.28s, time_cost: 03:53/00:00,
+2024-05-18 10:38:47,235   INFO  Total number of samples before merging from multiple GPUs: 11025
+2024-05-18 10:38:57,649   INFO  Total number of samples after merging from multiple GPUs (removing duplicate): 44097
+2024-05-18 10:38:57,652   INFO  *************** Performance of EPOCH 22 *****************
+2024-05-18 10:38:57,652   INFO  Generate label finished(sec_per_example: 0.0059 second).
+2024-05-18 10:45:37,545   INFO
+minADE - TYPE_VEHICLE_5	: 0.3506
+minADE - TYPE_VEHICLE_9	: 0.7024
+minADE - TYPE_VEHICLE_15	: 1.3107
+minADE - TYPE_PEDESTRIAN_5	: 0.1675
+minADE - TYPE_PEDESTRIAN_9	: 0.3248
+minADE - TYPE_PEDESTRIAN_15	: 0.5732
+minADE - TYPE_CYCLIST_5	: 0.3610
+minADE - TYPE_CYCLIST_9	: 0.6543
+minADE - TYPE_CYCLIST_15	: 1.1300
+minFDE - TYPE_VEHICLE_5	: 0.6329
+minFDE - TYPE_VEHICLE_9	: 1.3764
+minFDE - TYPE_VEHICLE_15	: 2.7524
+minFDE - TYPE_PEDESTRIAN_5	: 0.3164
+minFDE - TYPE_PEDESTRIAN_9	: 0.6600
+minFDE - TYPE_PEDESTRIAN_15	: 1.2651
+minFDE - TYPE_CYCLIST_5	: 0.6524
+minFDE - TYPE_CYCLIST_9	: 1.2579
+minFDE - TYPE_CYCLIST_15	: 2.4358
+MissRate - TYPE_VEHICLE_5	: 0.1215
+MissRate - TYPE_VEHICLE_9	: 0.1591
+MissRate - TYPE_VEHICLE_15	: 0.2118
+MissRate - TYPE_PEDESTRIAN_5	: 0.0584
+MissRate - TYPE_PEDESTRIAN_9	: 0.0730
+MissRate - TYPE_PEDESTRIAN_15	: 0.0951
+MissRate - TYPE_CYCLIST_5	: 0.1826
+MissRate - TYPE_CYCLIST_9	: 0.1779
+MissRate - TYPE_CYCLIST_15	: 0.2000
+OverlapRate - TYPE_VEHICLE_5	: 0.0058
+OverlapRate - TYPE_VEHICLE_9	: 0.0158
+OverlapRate - TYPE_VEHICLE_15	: 0.0405
+OverlapRate - TYPE_PEDESTRIAN_5	: 0.0553
+OverlapRate - TYPE_PEDESTRIAN_9	: 0.0652
+OverlapRate - TYPE_PEDESTRIAN_15	: 0.0782
+OverlapRate - TYPE_CYCLIST_5	: 0.0173
+OverlapRate - TYPE_CYCLIST_9	: 0.0339
+OverlapRate - TYPE_CYCLIST_15	: 0.0562
+mAP - TYPE_VEHICLE_5	: 0.5047
+mAP - TYPE_VEHICLE_9	: 0.4322
+mAP - TYPE_VEHICLE_15	: 0.3590
+mAP - TYPE_PEDESTRIAN_5	: 0.5245
+mAP - TYPE_PEDESTRIAN_9	: 0.4485
+mAP - TYPE_PEDESTRIAN_15	: 0.4139
+mAP - TYPE_CYCLIST_5	: 0.3606
+mAP - TYPE_CYCLIST_9	: 0.3207
+mAP - TYPE_CYCLIST_15	: 0.2677
+-------------------------------------------------------------: 0.0000
+minADE - VEHICLE: 0.7879
+minADE - PEDESTRIAN: 0.3552
+minADE - CYCLIST: 0.7151
+minFDE - VEHICLE: 1.5872
+minFDE - PEDESTRIAN: 0.7471
+minFDE - CYCLIST: 1.4487
+MissRate - VEHICLE: 0.1641
+MissRate - PEDESTRIAN: 0.0755
+MissRate - CYCLIST: 0.1868
+OverlapRate - VEHICLE: 0.0207
+OverlapRate - PEDESTRIAN: 0.0663
+OverlapRate - CYCLIST: 0.0358
+mAP - VEHICLE: 0.4320
+mAP - PEDESTRIAN: 0.4623
+mAP - CYCLIST: 0.3163
+--------------------------------------------------------------: 0.0000
+minADE: 0.6194
+minFDE: 1.2610
+MissRate: 0.1422
+mAP: 0.4035
+---------------------------------------------------------------: 0.0000
+TYPE_UNSET: 0.0000
+TYPE_VEHICLE: 165676.0000
+TYPE_PEDESTRIAN: 21068.0000
+TYPE_CYCLIST: 5428.0000
+TYPE_OTHER: 0.0000
+-----Note that this evaluation may have marginal differences with the official Waymo evaluation server-----: 0.0000
+       Waymo          mAP       minADE       minFDE     MissRate
+      VEHICLE      0.4320,      0.7879,      1.5872,      0.1641,
+   PEDESTRIAN      0.4623,      0.3552,      0.7471,      0.0755,
+      CYCLIST      0.3163,      0.7151,      1.4487,      0.1868,
+          Avg      0.4035,      0.6194,      1.2610,      0.1422,
+2024-05-18 10:45:37,550   INFO  Result is save to /home/aidrive/zhengxj/projects_new/MTR_new/output/waymo/mtr+100_percent_data_llm_augmented/llm_augmented_mtr+100_percent_attn_loop_learned_gate_inside+change_context_window_8_layer_4/eval/eval_with_train
+2024-05-18 10:45:37,550   INFO  ****************Evaluation done.*****************
+2024-05-18 10:45:48,643   INFO  epoch: 22/30, acc_iter=131125, cur_iter=0/9366, batch_size=13, iter_cost=2.71s, time_cost(epoch): 00:02/7:03:27, time_cost(all): 13:30/56:27:43, ade_TYPE_VEHICLE_layer_5=0.609, ade_TYPE_PEDESTRIAN_layer_5=0.244, ade_TYPE_CYCLIST_layer_5=-0.000, loss=84.691, lr=0.0001
+2024-05-18 10:46:17,916   INFO  epoch: 22/30, acc_iter=131150, cur_iter=25/9366, batch_size=13, iter_cost=1.23s, time_cost(epoch): 00:31/3:11:31, time_cost(all): 13:59/25:35:47, ade_TYPE_VEHICLE_layer_5=0.673, ade_TYPE_PEDESTRIAN_layer_5=0.205, ade_TYPE_CYCLIST_layer_5=0.427, loss=127.063, lr=0.0001
+2024-05-18 10:47:16,199   INFO  epoch: 22/30, acc_iter=131200, cur_iter=75/9366, batch_size=13, iter_cost=1.19s, time_cost(epoch): 01:30/3:03:55, time_cost(all): 14:57/24:41:45, ade_TYPE_VEHICLE_layer_5=0.635, ade_TYPE_PEDESTRIAN_layer_5=0.233, ade_TYPE_CYCLIST_layer_5=0.486, loss=94.115, lr=0.0001

100_percent/LLM-Augmented-MTR/log_train_20240518-104841.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

100_percent/MTR/best_eval_record.txt ADDED Viewed

	@@ -0,0 +1,40 @@

+epoch_2 mAP 0.2698469476567374
+best_epoch_2 mAP 0.2698469476567374
+epoch_4 mAP 0.30147600008381736
+best_epoch_4 mAP 0.30147600008381736
+epoch_6 mAP 0.31303117838170796
+best_epoch_6 mAP 0.31303117838170796
+epoch_8 mAP 0.3235940817329619
+best_epoch_8 mAP 0.3235940817329619
+epoch_10 mAP 0.36777884099218583
+best_epoch_10 mAP 0.36777884099218583
+epoch_12 mAP 0.3643510788679123
+best_epoch_10 mAP 0.36777884099218583
+epoch_14 mAP 0.3607478638490041
+best_epoch_10 mAP 0.36777884099218583
+epoch_16 mAP 0.3673184762398402
+best_epoch_10 mAP 0.36777884099218583
+epoch_18 mAP 0.3678972903225157
+best_epoch_18 mAP 0.3678972903225157
+epoch_20 mAP 0.3698185649183061
+best_epoch_20 mAP 0.3698185649183061
+epoch_21 mAP 0.3756412830617693
+best_epoch_21 mAP 0.3756412830617693
+epoch_22 mAP 0.384421490960651
+best_epoch_22 mAP 0.384421490960651
+epoch_23 mAP 0.3798180388079749
+best_epoch_22 mAP 0.384421490960651
+epoch_24 mAP 0.39770102169778615
+best_epoch_24 mAP 0.39770102169778615
+epoch_25 mAP 0.38524179326163405
+best_epoch_24 mAP 0.39770102169778615
+epoch_26 mAP 0.40852043694920015
+best_epoch_26 mAP 0.40852043694920015
+epoch_27 mAP 0.4085294571187761
+best_epoch_27 mAP 0.4085294571187761
+epoch_28 mAP 0.41052143772443134
+best_epoch_28 mAP 0.41052143772443134
+epoch_29 mAP 0.4173127942615085
+best_epoch_29 mAP 0.4173127942615085
+epoch_30 mAP 0.4181843135091994
+best_epoch_30 mAP 0.4181843135091994

100_percent/MTR/checkpoint_epoch_30.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f14858a1ce6b4098eef8230db39f014b337ef5e158b591e0febe722d7ae4667a
+size 777075481

100_percent/MTR/log_train_20230318-135944.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

100_percent/MTR/log_train_20230323-015050.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

100_percent/MTR/log_train_20230324-224338.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

20_percent/LLM-Augmented-MTR/best_eval_record.txt ADDED Viewed

	@@ -0,0 +1,42 @@

+epoch_1 mAP 0.20280200242996216 minADE 1.121805641386244 minFDE 2.3629365298483105 MissRate0.32461252974139315
+best_epoch_1 mAP 0.20280200242996216 minADE 1.121805641386244 minFDE 2.3629365298483105 MissRate0.32461252974139315
+epoch_2 mAP 0.2108259747425715 minADE 1.0475726491875117 minFDE 2.1439842118157277 MissRate0.28972430196073323
+best_epoch_2 mAP 0.2108259747425715 minADE 1.0475726491875117 minFDE 2.1439842118157277 MissRate0.28972430196073323
+epoch_4 mAP 0.2567381891939375 minADE 0.8995593041181564 minFDE 1.8451896177397833 MissRate0.24359686755471763
+best_epoch_4 mAP 0.2567381891939375 minADE 0.8995593041181564 minFDE 1.8451896177397833 MissRate0.24359686755471763
+epoch_6 mAP 0.280468452307913 minADE 0.8129338771104813 minFDE 1.6794896456930373 MissRate0.21835642390780982
+best_epoch_6 mAP 0.280468452307913 minADE 0.8129338771104813 minFDE 1.6794896456930373 MissRate0.21835642390780982
+epoch_8 mAP 0.3066303845908907 minADE 0.8265427615907458 minFDE 1.6715423862139385 MissRate0.20962182266844642
+best_epoch_8 mAP 0.3066303845908907 minADE 0.8265427615907458 minFDE 1.6715423862139385 MissRate0.20962182266844642
+epoch_10 mAP 0.30340896215703755 minADE 0.7995703717072805 minFDE 1.6467467910713618 MissRate0.21301125652260247
+best_epoch_8 mAP 0.3066303845908907 minADE 0.8265427615907458 minFDE 1.6715423862139385 MissRate0.20962182266844642
+epoch_12 mAP 0.2987242821190092 minADE 0.7453566574388081 minFDE 1.527520441346698 MissRate0.19389896177583274
+best_epoch_8 mAP 0.3066303845908907 minADE 0.8265427615907458 minFDE 1.6715423862139385 MissRate0.20962182266844642
+epoch_14 mAP 0.3013038718038135 minADE 0.7638516972462336 minFDE 1.539596176809735 MissRate0.19799110210604134
+best_epoch_8 mAP 0.3066303845908907 minADE 0.8265427615907458 minFDE 1.6715423862139385 MissRate0.20962182266844642
+epoch_16 mAP 0.31712262829144794 minADE 0.7448720667097305 minFDE 1.4916071097056072 MissRate0.18731188111835054
+best_epoch_16 mAP 0.31712262829144794 minADE 0.7448720667097305 minFDE 1.4916071097056072 MissRate0.18731188111835054
+epoch_18 mAP 0.29922616150644094 minADE 0.7549243850840464 minFDE 1.5041462249226043 MissRate0.19184935175710252
+best_epoch_16 mAP 0.31712262829144794 minADE 0.7448720667097305 minFDE 1.4916071097056072 MissRate0.18731188111835054
+epoch_20 mAP 0.32285115122795105 minADE 0.7543421751923031 minFDE 1.4892633656660716 MissRate0.18655251794391212
+best_epoch_20 mAP 0.32285115122795105 minADE 0.7543421751923031 minFDE 1.4892633656660716 MissRate0.18655251794391212
+epoch_21 mAP 0.3209489054150052 minADE 0.721488227446874 minFDE 1.4614114463329315 MissRate0.18441139078802535
+best_epoch_20 mAP 0.32285115122795105 minADE 0.7543421751923031 minFDE 1.4892633656660716 MissRate0.18655251794391212
+epoch_22 mAP 0.32682062354352737 minADE 0.7124388366937637 minFDE 1.4540120561917622 MissRate0.18042861835824117
+best_epoch_22 mAP 0.32682062354352737 minADE 0.7124388366937637 minFDE 1.4540120561917622 MissRate0.18042861835824117
+epoch_23 mAP 0.340921809275945 minADE 0.7024568070967993 minFDE 1.4272008803155687 MissRate0.17437677664889228
+best_epoch_23 mAP 0.340921809275945 minADE 0.7024568070967993 minFDE 1.4272008803155687 MissRate0.17437677664889228
+epoch_24 mAP 0.3347405940294266 minADE 0.7021272778511047 minFDE 1.405790156788296 MissRate0.17520727548334333
+best_epoch_23 mAP 0.340921809275945 minADE 0.7024568070967993 minFDE 1.4272008803155687 MissRate0.17437677664889228
+epoch_25 mAP 0.34384024805492824 minADE 0.6872262193097008 minFDE 1.386270996597078 MissRate0.1706915605399344
+best_epoch_25 mAP 0.34384024805492824 minADE 0.6872262193097008 minFDE 1.386270996597078 MissRate0.1706915605399344
+epoch_26 mAP 0.35064262317286604 minADE 0.6828386121326022 minFDE 1.3688042196962567 MissRate0.17072225858767828
+best_epoch_26 mAP 0.35064262317286604 minADE 0.6828386121326022 minFDE 1.3688042196962567 MissRate0.17072225858767828
+epoch_27 mAP 0.34423224296834737 minADE 0.6811849905384911 minFDE 1.3747731546560924 MissRate0.16926835477352142
+best_epoch_26 mAP 0.35064262317286604 minADE 0.6828386121326022 minFDE 1.3688042196962567 MissRate0.17072225858767828
+epoch_28 mAP 0.3391927546925015 minADE 0.6855861726734372 minFDE 1.3797330624527404 MissRate0.17102102521393037
+best_epoch_26 mAP 0.35064262317286604 minADE 0.6828386121326022 minFDE 1.3688042196962567 MissRate0.17072225858767828
+epoch_29 mAP 0.35265530480278867 minADE 0.6794825990994772 minFDE 1.3695374263657465 MissRate0.1699780879749192
+best_epoch_29 mAP 0.35265530480278867 minADE 0.6794825990994772 minFDE 1.3695374263657465 MissRate0.1699780879749192
+epoch_30 mAP 0.3505900684330199 minADE 0.6841080155637528 minFDE 1.3792778882715437 MissRate0.17003927462630805
+best_epoch_29 mAP 0.35265530480278867 minADE 0.6794825990994772 minFDE 1.3695374263657465 MissRate0.1699780879749192

20_percent/LLM-Augmented-MTR/checkpoint_epoch_29.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:528da69183bab17fd3ac0d8afafdd38d5d970e652f1d0af1fd52decd32066ab8
+size 890718577

20_percent/LLM-Augmented-MTR/log_train_20240227-140250.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

20_percent/MTR/best_eval_record.txt ADDED Viewed

	@@ -0,0 +1,42 @@

+epoch_1 mAP 0.1780766099691391 minADE 1.2116148041354284 minFDE 2.463306056128608 MissRate0.34856364462110734
+best_epoch_1 mAP 0.1780766099691391 minADE 1.2116148041354284 minFDE 2.463306056128608 MissRate0.34856364462110734
+epoch_2 mAP 0.20629685951603782 minADE 1.029665822784106 minFDE 2.1169575320349803 MissRate0.2860292113489575
+best_epoch_2 mAP 0.20629685951603782 minADE 1.029665822784106 minFDE 2.1169575320349803 MissRate0.2860292113489575
+epoch_4 mAP 0.237494428952535 minADE 0.8865823778841232 minFDE 1.837194714281294 MissRate0.24316217501958212
+best_epoch_4 mAP 0.237494428952535 minADE 0.8865823778841232 minFDE 1.837194714281294 MissRate0.24316217501958212
+epoch_6 mAP 0.24996380673514473 minADE 0.8017858978774811 minFDE 1.6643226312266457 MissRate0.2179658810297648
+best_epoch_6 mAP 0.24996380673514473 minADE 0.8017858978774811 minFDE 1.6643226312266457 MissRate0.2179658810297648
+epoch_8 mAP 0.29360215034749776 minADE 0.7573151406314639 minFDE 1.578547431363 MissRate0.19708167016506195
+best_epoch_8 mAP 0.29360215034749776 minADE 0.7573151406314639 minFDE 1.578547431363 MissRate0.19708167016506195
+epoch_10 mAP 0.30071333050727844 minADE 0.7649337003628413 minFDE 1.5673650403817494 MissRate0.20276714944177202
+best_epoch_10 mAP 0.30071333050727844 minADE 0.7649337003628413 minFDE 1.5673650403817494 MissRate0.20276714944177202
+epoch_12 mAP 0.292175743314955 minADE 0.7380434456798767 minFDE 1.5039872195985582 MissRate0.18972881303893196
+best_epoch_10 mAP 0.30071333050727844 minADE 0.7649337003628413 minFDE 1.5673650403817494 MissRate0.20276714944177202
+epoch_14 mAP 0.31314270695050556 minADE 0.7305420802699195 minFDE 1.4838222993744745 MissRate0.18249268995391
+best_epoch_14 mAP 0.31314270695050556 minADE 0.7305420802699195 minFDE 1.4838222993744745 MissRate0.18249268995391
+epoch_16 mAP 0.31479272080792325 minADE 0.7203008400069343 minFDE 1.4792389836576252 MissRate0.18043349352147842
+best_epoch_16 mAP 0.31479272080792325 minADE 0.7203008400069343 minFDE 1.4792389836576252 MissRate0.18043349352147842
+epoch_18 mAP 0.30901829567220473 minADE 0.7110151019361285 minFDE 1.4722885092099507 MissRate0.1831517426504029
+best_epoch_16 mAP 0.31479272080792325 minADE 0.7203008400069343 minFDE 1.4792389836576252 MissRate0.18043349352147842
+epoch_20 mAP 0.3403045965565576 minADE 0.6804299834701751 minFDE 1.4013747837808397 MissRate0.1693890881207254
+best_epoch_20 mAP 0.3403045965565576 minADE 0.6804299834701751 minFDE 1.4013747837808397 MissRate0.1693890881207254
+epoch_21 mAP 0.34428356422318357 minADE 0.6813108093208736 minFDE 1.3953127794795568 MissRate0.1662339808212386
+best_epoch_21 mAP 0.34428356422318357 minADE 0.6813108093208736 minFDE 1.3953127794795568 MissRate0.1662339808212386
+epoch_22 mAP 0.34294628765847945 minADE 0.6738415045870675 minFDE 1.3911531501346166 MissRate0.165701354543368
+best_epoch_21 mAP 0.34428356422318357 minADE 0.6813108093208736 minFDE 1.3953127794795568 MissRate0.1662339808212386
+epoch_23 mAP 0.34789742694960707 minADE 0.6705604626072778 minFDE 1.3779481848080952 MissRate0.16484576877620485
+best_epoch_23 mAP 0.34789742694960707 minADE 0.6705604626072778 minFDE 1.3779481848080952 MissRate0.16484576877620485
+epoch_24 mAP 0.33808205359511906 minADE 0.6704978479279412 minFDE 1.3809854719373915 MissRate0.16550052000416648
+best_epoch_23 mAP 0.34789742694960707 minADE 0.6705604626072778 minFDE 1.3779481848080952 MissRate0.16484576877620485
+epoch_25 mAP 0.34635144968827564 minADE 0.6702178435193168 minFDE 1.374932004345788 MissRate0.16507353136936823
+best_epoch_23 mAP 0.34789742694960707 minADE 0.6705604626072778 minFDE 1.3779481848080952 MissRate0.16484576877620485
+epoch_26 mAP 0.3466732932461632 minADE 0.6752092076672448 minFDE 1.3828196260664196 MissRate0.16483944985601637
+best_epoch_23 mAP 0.34789742694960707 minADE 0.6705604626072778 minFDE 1.3779481848080952 MissRate0.16484576877620485
+epoch_27 mAP 0.34161571330494356 minADE 0.6706651995579401 minFDE 1.3762814667489793 MissRate0.1658488561709722
+best_epoch_23 mAP 0.34789742694960707 minADE 0.6705604626072778 minFDE 1.3779481848080952 MissRate0.16484576877620485
+epoch_28 mAP 0.3456234435240428 minADE 0.672044810321596 minFDE 1.3780042330423992 MissRate0.16570446474684608
+best_epoch_23 mAP 0.34789742694960707 minADE 0.6705604626072778 minFDE 1.3779481848080952 MissRate0.16484576877620485
+epoch_29 mAP 0.34985576404465574 minADE 0.6696184790796704 minFDE 1.377215094036526 MissRate0.1654756905304061
+best_epoch_29 mAP 0.34985576404465574 minADE 0.6696184790796704 minFDE 1.377215094036526 MissRate0.1654756905304061
+epoch_30 mAP 0.34322212139765423 minADE 0.6689203000730939 minFDE 1.3752210405137806 MissRate0.16523590435584387
+best_epoch_29 mAP 0.34985576404465574 minADE 0.6696184790796704 minFDE 1.377215094036526 MissRate0.1654756905304061

20_percent/MTR/checkpoint_epoch_29.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0eb5c77d846d4d2d9ed8f4cd832cf8419a5d4481020e444575e0e0d389f633c8
+size 777075481

20_percent/MTR/log_train_20240315-005422.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

20_percent/MTR/log_train_20240315-075642.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

5_percent/LLM-Augmented-MTR/best_eval_record.txt ADDED Viewed

	@@ -0,0 +1,40 @@

+epoch_2 mAP 0.14707461351321804
+best_epoch_2 mAP 0.14707461351321804
+epoch_4 mAP 0.19665334704849455
+best_epoch_4 mAP 0.19665334704849455
+epoch_6 mAP 0.24278521206643844
+best_epoch_6 mAP 0.24278521206643844
+epoch_8 mAP 0.2573127862479952
+best_epoch_8 mAP 0.2573127862479952
+epoch_10 mAP 0.2338909415735139
+best_epoch_8 mAP 0.2573127862479952
+epoch_12 mAP 0.2445411466889911
+best_epoch_8 mAP 0.2573127862479952
+epoch_14 mAP 0.2600547605090671
+best_epoch_14 mAP 0.2600547605090671
+epoch_16 mAP 0.2669246411985821
+best_epoch_16 mAP 0.2669246411985821
+epoch_18 mAP 0.25567510227362317
+best_epoch_16 mAP 0.2669246411985821
+epoch_20 mAP 0.27623524599605137
+best_epoch_20 mAP 0.27623524599605137
+epoch_21 mAP 0.291039678785536
+best_epoch_21 mAP 0.291039678785536
+epoch_22 mAP 0.26954489284091526
+best_epoch_21 mAP 0.291039678785536
+epoch_23 mAP 0.28672027587890625
+best_epoch_21 mAP 0.291039678785536
+epoch_24 mAP 0.2953291071785821
+best_epoch_24 mAP 0.2953291071785821
+epoch_25 mAP 0.2961776968505648
+best_epoch_25 mAP 0.2961776968505648
+epoch_26 mAP 0.2938236908780204
+best_epoch_25 mAP 0.2961776968505648
+epoch_27 mAP 0.29479679961999256
+best_epoch_25 mAP 0.2961776968505648
+epoch_28 mAP 0.30382166306177777
+best_epoch_28 mAP 0.30382166306177777
+epoch_29 mAP 0.2993926422463523
+best_epoch_28 mAP 0.30382166306177777
+epoch_30 mAP 0.2966313726372189
+best_epoch_28 mAP 0.30382166306177777

5_percent/LLM-Augmented-MTR/checkpoint_epoch_28.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e693293b7e1054056229c0b119921fa673c48f50148fdea3fd00af72829dca0a
+size 793251102

5_percent/LLM-Augmented-MTR/log_train_20240519-174533.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

5_percent/LLM-Augmented-MTR/log_train_20240520-084733.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

5_percent/MTR/best_eval_record.txt ADDED Viewed

	@@ -0,0 +1,42 @@

+epoch_1 mAP 0.11289571225643158
+best_epoch_1 mAP 0.11289571225643158
+epoch_2 mAP 0.15150262746546006
+best_epoch_2 mAP 0.15150262746546006
+epoch_4 mAP 0.19338538083765242
+best_epoch_4 mAP 0.19338538083765242
+epoch_6 mAP 0.20877731011973488
+best_epoch_6 mAP 0.20877731011973488
+epoch_8 mAP 0.2264716509315703
+best_epoch_8 mAP 0.2264716509315703
+epoch_10 mAP 0.23379969514078566
+best_epoch_10 mAP 0.23379969514078566
+epoch_12 mAP 0.2377154164844089
+best_epoch_12 mAP 0.2377154164844089
+epoch_14 mAP 0.23920134041044447
+best_epoch_14 mAP 0.23920134041044447
+epoch_16 mAP 0.19992810570531425
+best_epoch_14 mAP 0.23920134041044447
+epoch_18 mAP 0.23819062610467276
+best_epoch_14 mAP 0.23920134041044447
+epoch_20 mAP 0.24969915880097282
+best_epoch_20 mAP 0.24969915880097282
+epoch_21 mAP 0.2677012417051527
+best_epoch_21 mAP 0.2677012417051527
+epoch_22 mAP 0.2480028718709946
+best_epoch_21 mAP 0.2677012417051527
+epoch_23 mAP 0.26686604486571414
+best_epoch_21 mAP 0.2677012417051527
+epoch_24 mAP 0.27477139068974393
+best_epoch_24 mAP 0.27477139068974393
+epoch_25 mAP 0.2842640694644716
+best_epoch_25 mAP 0.2842640694644716
+epoch_26 mAP 0.28255397578080493
+best_epoch_25 mAP 0.2842640694644716
+epoch_27 mAP 0.2821702079640494
+best_epoch_25 mAP 0.2842640694644716
+epoch_28 mAP 0.2909945597251256
+best_epoch_28 mAP 0.2909945597251256
+epoch_29 mAP 0.284342681368192
+best_epoch_28 mAP 0.2909945597251256
+epoch_30 mAP 0.28522086474630565
+best_epoch_28 mAP 0.2909945597251256

5_percent/MTR/checkpoint_epoch_28.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d7a7b99f064fea4af5c28c5118346042c977b9f549a1e4464074f8079b936651
+size 777282554

5_percent/MTR/log_train_20240429-093927.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

README.md CHANGED Viewed

@@ -1,3 +1,63 @@
 ---
 license: mit
 ---

 ---
 license: mit
 ---
+Here we provide checkpoints for the baseline model (MTR) and for our model (LLM-Augmented-MTR).
+The checkpoints are grouped into three settings according to the fraction of the training data used:
+## 5%
+MTR's performance (epoch_28):
+```
+       Waymo          mAP       minADE       minFDE     MissRate
+      VEHICLE      0.3288,      0.9097,      1.8636,      0.2156,
+   PEDESTRIAN      0.3192,      0.4202,      0.8957,      0.1134,
+      CYCLIST      0.2250,      0.9298,      1.9409,      0.2736,
+          Avg      0.2910,      0.7532,      1.5668,      0.2008,
+```
+LLM-Augmented-MTR's performance (epoch_28):
+```
+       Waymo          mAP       minADE       minFDE     MissRate
+      VEHICLE      0.3367,      0.9216,      1.8960,      0.2236,
+   PEDESTRIAN      0.3613,      0.4295,      0.9059,      0.1103,
+      CYCLIST      0.2135,      0.9166,      1.9246,      0.2693,
+          Avg      0.3038,      0.7559,      1.5755,      0.2011,
+```
+## 20%
+MTR's performance (epoch_29):
+```
+       Waymo          mAP       minADE       minFDE     MissRate
+      VEHICLE      0.3912,      0.8239,      1.6778,      0.1800,
+   PEDESTRIAN      0.3608,      0.3829,      0.8091,      0.0935,
+      CYCLIST      0.2975,      0.8020,      1.6448,      0.2230,
+          Avg      0.3499,      0.6696,      1.3772,      0.1655,
+```
+LLM-Augmented-MTR's performance (epoch_29):
+```
+       Waymo          mAP       minADE       minFDE     MissRate
+      VEHICLE      0.4028,      0.8090,      1.5943,      0.1711,
+   PEDESTRIAN      0.3621,      0.3880,      0.8107,      0.0958,
+      CYCLIST      0.2930,      0.8415,      1.7036,      0.2430,
+          Avg      0.3527,      0.6795,      1.3695,      0.1700,
+```
+## 100%
+MTR's performance (epoch_30):
+```
+       Waymo          mAP       minADE       minFDE     MissRate
+      VEHICLE      0.4464,      0.7545,      1.5161,      0.1523,
+   PEDESTRIAN      0.4149,      0.3456,      0.7252,      0.0750,
+      CYCLIST      0.3933,      0.6849,      1.3869,      0.1795,
+          Avg      0.4182,      0.5950,      1.2094,      0.1356,
+```
+LLM-Augmented-MTR's performance (epoch_26):
+```
+       Waymo          mAP       minADE       minFDE     MissRate
+      VEHICLE      0.4578,      0.7570,      1.5308,      0.1523,
+   PEDESTRIAN      0.4794,      0.3535,      0.7376,      0.0765,
+      CYCLIST      0.3434,      0.7062,      1.4260,      0.1827,
+          Avg      0.4269,      0.6056,      1.2315,      0.1371,
+```