# default.yml
#
# Default configuration: data pipeline, training schedule, evaluation tasks,
# checkpointing, and run-level settings.
#
# Notation used below (OmegaConf-style; NOTE(review): confirm the loader):
#   ${a.b}  interpolates the value of another key in this file
#   ???     marks a required value that has no default here

data:
  batch_size: 256
  pin_memory: true
  num_workers: 1
  # Thomas said it should be at least about 5-10x your batch size; beyond that,
  # the differences become academic.
  shuffle_buffer: 10000
  # Interpolated from train.seed further down in this file.
  seed: ${train.seed}
  # NOTE(review): machine-specific absolute path; override per environment.
  bpe_path: /mnt/vos-s9gjtkm2/reid/groupvit/GroupViT/datasets/bpe_simple_vocab_16e6.txt.gz
  dataset:
    # Catalogue of known datasets; the `train` and `val` lists below select
    # entries from it by key.
    meta:
      gcc3m:
        type: img_txt_pair
        path: local_data/gcc3m_shards
        # NOTE(review): the two range bounds are zero-padded to different
        # widths (6 vs 5 digits); confirm the expansion yields the intended
        # shard names.
        prefix: gcc-train-{000000..00436}.tar
        length: 2891445
      gcc12m:
        type: img_txt_pair
        path: local_data/gcc12m_shards
        prefix: gcc-conceptual-12m-{000000..001943}.tar
        length: 11156203
      yfcc14m:
        type: img_txt_pair
        path: local_data/yfcc14m_shards
        prefix: yfcc14m-{000000..001888}.tar
        length: 14615499
      redcap12m:
        type: img_txt_pair
        path: local_data/redcap12m_shards
        prefix: redcap12m-{000000..001211}.tar
        length: 11866987
      imagenet:
        type: img_cls_pair
        path: local_data/imagenet_shards
        prefix: imagenet-val-{000000..000049}.tar
        length: 50000
      cuhkpedes_train:
        name: CUHK-PEDES
        type: img_txt_pair
        path: local_data/cuhkpedes_shards
        prefix: cuhkpedes-train-{000000..000004}.tar
        length: 34054
      cuhkpedes_val:
        # raw_path: /home/linkslinks/dataset/
        # NOTE(review): machine-specific absolute path; override per
        # environment.
        raw_path: /mnt/vos-s9gjtkm2/reid/dataset/cross_reid/
        name: CUHK-PEDES
        type: img_txt_pair
        path: local_data/cuhkpedes_shards
        prefix: cuhkpedes-val-{000000..000000}.tar
        length: 3078
    # Datasets used for training (keys of `meta` above).
    train:
      # - gcc3m
      # - gcc12m
      # - yfcc14m
      - cuhkpedes_train
    # Datasets used for validation (keys of `meta` above).
    val:
      # - imagenet
      - cuhkpedes_val
  img_aug:
    deit_aug: true
    img_size: 224
    img_scale: [0.08, 1.0]
    interpolation: bilinear
    color_jitter: 0.4
    auto_augment: 'rand-m9-mstd0.5-inc1'
    re_prob: 0.25
    re_mode: 'pixel'
    re_count: 1
  text_aug:
    max_seq_len: 77
    multi_label: 0
    word_type: 'noun'

train:
  start_epoch: 0
  epochs: 30
  warmup_epochs: 2
  # Exponent floats are written with an explicit decimal point: YAML 1.1
  # resolvers (e.g. PyYAML's default) treat a mantissa without a dot, such as
  # `4e-6`, as a string rather than a float.
  base_lr: 1.6e-3
  weight_decay: 0.05
  warmup_lr: 4.0e-6
  min_lr: 4.0e-5
  clip_grad: 5.0
  accumulation_steps: 0
  amp_opt_level: O2
  # Also referenced by data.seed through interpolation.
  seed: 0
  lr_scheduler:
    name: cosine
  optimizer:
    name: adamw
    eps: 1.0e-8
    betas: [0.9, 0.999]

evaluate:
  eval_only: false
  eval_freq: 1
  # Enabled evaluation tasks; each has a same-named settings block below.
  task:
    # - cls
    # - seg
    - reid
  cls:
    save_best: true
    template: subset
  seg:
    save_best: true
    cfg: segmentation/configs/_base_/datasets/pascal_voc12.py
    template: simple
    opts: []
  reid:
    save_best: true
    template: simple
    opts: []

checkpoint:
  auto_resume: true
  resume: ''
  freq: 1
  max_kept: -1
  save_freq: 1

model_name: ''  # display name in the logger
# Required; no default is provided in this file.
output: ???
tag: default
print_freq: 10
seed: 0
wandb: false
# Required; no default is provided in this file.
local_rank: ???
vis: []