# sl.yaml
# Global random seed for the run.
# NOTE(review): which RNGs are seeded from this value is decided by the
# consuming code, which is not visible here — confirm.
seed: 3407

# Dataset selection and file locations.
# NOTE(review): `name` is presumably a registry key resolved by the loader and
# `args` its constructor arguments — confirm against the consuming code.
dataset:
  name: 'SLData'
  args:
    # All paths are absolute; both annotation CSVs live under data_root.
    data_root: '/dataset160x14'
    # Annotation file for the training split.
    train_anno_file: '/dataset160x14/train.csv'
    # Annotation file for the validation split.
    val_anno_file: '/dataset160x14/valid.csv'

# Batch-loading settings.
# NOTE(review): the key names match torch.utils.data.DataLoader keyword
# arguments, so these are presumably forwarded to it — confirm.
dataloader:
  batch_size: 8
  num_workers: 4
  pin_memory: true
  # NOTE(review): only one `shuffle` flag is defined; check whether the
  # consumer also applies it to the validation loader.
  shuffle: true

# Model selection and constructor arguments.
# NOTE(review): `name` is presumably a registry key and `args` the keyword
# arguments handed to that model — confirm against the consuming code.
model:
  name: 'SLTransformer'
  args:
    # seq_lens (160) and embed_dim (14) mirror the "160x14" in the dataset
    # paths — presumably the per-sample shape; confirm before changing either.
    seq_lens: 160
    num_classes: 10
    embed_dim: 14
    depth: 6
    num_heads: 1
    mlp_ratio: 4.0
    qkv_bias: true
    # null: no explicit value is supplied here.
    # NOTE(review): presumably the model then uses its own default — confirm.
    qk_scale: null
    # All three drop ratios are set to zero.
    drop_ratio: 0.0
    attn_drop_ratio: 0.0
    drop_path_ratio: 0.0
    # null: no explicit layer type is supplied for either entry.
    norm_layer: null
    act_layer: null

# Training/validation driver settings. The optimizer, lr_scheduler, loss and
# logger sections are nested under `solver`, as siblings of its `args`.
solver:
  name: 'SLSolver'
  args:
    # NOTE(review): lr_scheduler.args.epochs below carries the same value (100);
    # presumably the two must be kept in sync — confirm.
    epoch: 100
    # null: no value is set for either entry.
    # NOTE(review): these look like resume/checkpoint inputs — confirm semantics.
    base_on: null
    model_path: null
    # Absolute paths to validation-time resources.
    val_image_path: '/labeled/valid/image'
    val_go_path: '/go_res/valid'
    val_map_path: '/dataset160x14/create_map.json'
    # TrueType font file; the key name suggests it is used when drawing output.
    draw_font_path: '/dataset160x14/STZHONGS.TTF'
    thresholds: 0.5

  optimizer:
    name: 'Adam'
    args:
      # The explicit !!float tag is deliberate: YAML 1.1 loaders such as PyYAML
      # resolve a bare `1e-3` (no decimal point) as a string, not a float.
      lr: !!float 1e-3
      # weight_decay: !!float 5e-5

  lr_scheduler:
    name: 'CosineLR'
    args:
      epochs: 100
      # NOTE(review): presumably the final-LR factor relative to the base lr —
      # confirm against the scheduler implementation.
      lrf: 0.1

  loss:
    # Active loss; the commented-out names below are alternatives left in place.
    name: 'MaskedSigmoidFocalLoss'
    # name: 'SigmoidFocalLoss'
    # name: 'CrossEntropyLoss'
    args:
      reduction: "mean"
      alpha: 0.8

  logger:
    log_root: '/logs'
    # NOTE(review): 'sl-6-1' presumably encodes model depth=6 / num_heads=1 —
    # update it if those model settings change.
    suffix: 'sl-6-1'