---
# Run configuration for the "softmaskedbert4csc" model.
# One key per line: the sections below are nested block mappings, and every
# comment sits on its own line so it cannot swallow the keys that follow it.

MODEL:
  BERT_CKPT: "bert-base-chinese"
  DEVICE: "cuda"
  NAME: "softmaskedbert4csc"
  GPU_IDS: [0]
  # HYPER_PARAMS layout: [loss_coefficient]
  HYPER_PARAMS: [0.8]
  # Example of a checkpoint path (kept for reference, disabled):
  # WEIGHTS: "output/softmaskedbert4csc/epoch=2-val_loss=0.07.ckpt"
  # Empty string here; presumably means "no checkpoint to load" -- confirm
  # against the code that reads MODEL.WEIGHTS.
  WEIGHTS: ""

DATASETS:
  TRAIN: "output/train.json"
  VALID: "output/dev.json"
  TEST: "output/test.json"

SOLVER:
  BASE_LR: 0.0001
  # Written with an explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML)
  # resolve a bare `5e-8` as a string, not a float.
  WEIGHT_DECAY: 5.0e-8
  BATCH_SIZE: 32
  MAX_EPOCHS: 10
  ACCUMULATE_GRAD_BATCHES: 4

# NOTE(review): OUTPUT_DIR and MODE are placed at the top level (not under
# SOLVER); the nesting is reconstructed -- confirm against the config schema.
OUTPUT_DIR: "output/softmaskedbert4csc"
MODE: ["train", "test"]