---
# Prediction/evaluation configuration: runs `local_predict` on the `test`
# split of COIN using the action-segmentation processors, model, metric and
# predictor named below.
#
# NOTE(review): this file was restored from a copy whose newlines and
# indentation had been collapsed onto one line. The nesting below is
# reconstructed from key grouping; confirm it against the consumer's schema,
# in particular that `model`, `eval`, `metric` and `predictor` are top-level.

slurm_config: big
task_type: local_predict

# Data source and the processor classes used to load and align it.
dataset:
  split: test
  video_processor: VideoProcessor
  aligner: COINActionSegmentationAligner
  bert_name: bert-base-uncased
  test_path: data/coin/COIN.json
  meta_processor: COINActionSegmentationMetaProcessor
  vfeat_dir: data/feat/feat_coin_s3d
  text_processor: COINActionSegmentationTextProcessor
  num_iso_layer: 12
  sliding_window: 16
  sliding_window_size: 32
  max_video_len: 32
  max_len: 96

# Options grouped under `fairseq` (presumably forwarded to fairseq's own
# `dataset` / `common_eval` config groups; verify against the loader).
fairseq:
  dataset:
    batch_size: 1
    valid_subset: test
    num_workers: 2
  common_eval:
    # Checkpoint to evaluate.
    path: runs/mtm/vlm/coin/checkpoint_best.pt

# Model and encoder classes to instantiate.
model:
  model_cls: MMFusionActionSegmentation
  mm_encoder_cls: MMBertForTokenClassification
  use_seg_emb: true

# Evaluation output location.
eval:
  save_path: runs/mtm/vlm/coin/eval

metric: COINActionSegmentationMetric
predictor: COINPredictor