| CUDA_VISIBLE_DEVICES=4,5,6,7,3,1 NPROC_PER_NODE=6 xtuner train \ | |
| configs/slidechat/experiments_token_compressor/stage2_token_compressor_lgg.py \ | |
| --deepspeed configs/deepspeed/deepspeed_zero2.json \ | |
| --work-dir /data/qingq/PathVLM/baselines/github/SlideChat/models/outputs/lgg_orignal_2048maxlength_train_token_compressor \ | |
| --local_rank 0 | |
| CUDA_VISIBLE_DEVICES=4,5,6,7,3,1 NPROC_PER_NODE=6 xtuner train \ | |
| configs/slidechat/experiments_attn/stage2_reducer_attn_lgg.py \ | |
| --deepspeed configs/deepspeed/deepspeed_zero2.json \ | |
| --work-dir /data/qingq/PathVLM/baselines/github/SlideChat/models/outputs/lgg_original_2048maxlength_train_token_reducer_attn \ | |
| --local_rank 0 | |
| CUDA_VISIBLE_DEVICES=4,5,6,7,3,1 NPROC_PER_NODE=6 xtuner train \ | |
| configs/slidechat/experiments_attn/stage2_reducer_attn_luad.py \ | |
| --deepspeed configs/deepspeed/deepspeed_zero2.json \ | |
| --work-dir /data/qingq/PathVLM/baselines/github/SlideChat/models/outputs/luad_original_2048maxlength_train_token_reducer_attn \ | |
| --local_rank 0 |