-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathtrain_config.yaml
597 lines (597 loc) · 12.5 KB
/
train_config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
# Checkpoint settings. Every key below is a child of CHECKPOINT; the nesting
# is restored here so the keys no longer sit at the top level of the document.
CHECKPOINT:
  APPEND_DISTR_RUN_ID: false
  AUTO_RESUME: true
  BACKEND: disk
  # Units are not stated in this file — presumably epochs/phases; confirm.
  CHECKPOINT_FREQUENCY: 5
  # NOTE(review): -1 looks like a "disabled" sentinel — confirm.
  CHECKPOINT_ITER_FREQUENCY: -1
  # Relative path; presumably resolved against the working directory.
  DIR: .
  LATEST_CHECKPOINT_RESUME_FILE_NUM: 1
  OVERWRITE_EXISTING: false
  USE_SYMLINK_CHECKPOINT_FOR_RESUME: false
# ClusterFit settings. Nesting restored from the sorted key order:
# SEED belongs to DATA_LIMIT_SAMPLING, and DATASET_NAME..TEST_PARTITION
# belong to FEATURES.
CLUSTERFIT:
  CLUSTER_BACKEND: faiss
  # NOTE(review): -1 looks like a "no limit" sentinel — confirm.
  DATA_LIMIT: -1
  DATA_LIMIT_SAMPLING:
    SEED: 0
  FEATURES:
    DATASET_NAME: ''
    DATA_PARTITION: TRAIN
    DIMENSIONALITY_REDUCTION: 0
    EXTRACT: false
    LAYER_NAME: ''
    PATH: .
    TEST_PARTITION: TEST
  NUM_CLUSTERS: 16000
  NUM_ITER: 50
  OUTPUT_DIR: .
# Data loading settings. Holds a few loader-wide options plus one
# sub-mapping per split (TEST, TRAIN). Nesting is restored so that the two
# splits no longer overwrite each other's keys.
DATA:
  DDP_BUCKET_CAP_MB: 25
  ENABLE_ASYNC_GPU_COPY: true
  NUM_DATALOADER_WORKERS: 5
  PIN_MEMORY: true
  # Test split. DATA_PATHS and DATA_SOURCES are empty here and the top-level
  # TEST_MODEL flag in this file is false.
  TEST:
    BASE_DATASET: generic_ssl
    BATCHSIZE_PER_REPLICA: 256
    COLLATE_FUNCTION: default_collate
    COLLATE_FUNCTION_PARAMS: {}
    COPY_DESTINATION_DIR: ''
    COPY_TO_LOCAL_DISK: false
    DATASET_NAMES:
    - imagenet1k_folder
    DATA_LIMIT: -1
    DATA_LIMIT_SAMPLING:
      IS_BALANCED: false
      SEED: 0
      SKIP_NUM_SAMPLES: 0
    DATA_PATHS: []
    DATA_SOURCES: []
    DEFAULT_GRAY_IMG_SIZE: 224
    DROP_LAST: false
    ENABLE_QUEUE_DATASET: false
    INPUT_KEY_NAMES:
    - data
    LABEL_PATHS: []
    LABEL_SOURCES: []
    LABEL_TYPE: sample_index
    MMAP_MODE: true
    NEW_IMG_PATH_PREFIX: ''
    RANDOM_SYNTHETIC_IMAGES: false
    REMOVE_IMG_PATH_PREFIX: ''
    TARGET_KEY_NAMES:
    - label
    TRANSFORMS: []
    USE_DEBUGGING_SAMPLER: false
    USE_STATEFUL_DISTRIBUTED_SAMPLER: false
  # Train split.
  TRAIN:
    BASE_DATASET: generic_ssl
    BATCHSIZE_PER_REPLICA: 64
    COLLATE_FUNCTION: simclr_collator
    COLLATE_FUNCTION_PARAMS: {}
    # A destination is set, but COPY_TO_LOCAL_DISK below is false.
    COPY_DESTINATION_DIR: /tmp/imagenet1k/
    COPY_TO_LOCAL_DISK: false
    DATASET_NAMES:
    - imagenet1k_folder
    DATA_LIMIT: -1
    DATA_LIMIT_SAMPLING:
      IS_BALANCED: false
      SEED: 0
      SKIP_NUM_SAMPLES: 0
    DATA_PATHS: []
    DATA_SOURCES:
    - disk_folder
    DEFAULT_GRAY_IMG_SIZE: 224
    DROP_LAST: true
    ENABLE_QUEUE_DATASET: false
    INPUT_KEY_NAMES:
    - data
    LABEL_PATHS: []
    LABEL_SOURCES: []
    LABEL_TYPE: sample_index
    MMAP_MODE: true
    NEW_IMG_PATH_PREFIX: ''
    RANDOM_SYNTHETIC_IMAGES: false
    REMOVE_IMG_PATH_PREFIX: ''
    TARGET_KEY_NAMES:
    - label
    # List of transform specs; each item is a mapping with a `name` plus
    # that transform's arguments. Presumably applied in the listed order —
    # confirm against the consumer.
    TRANSFORMS:
    - name: ImgReplicatePil
      num_times: 2
    - name: RandomResizedCrop
      size: 224
    - name: RandomHorizontalFlip
      p: 0.5
    - name: ImgPilColorDistortion
      strength: 1.0
    - name: ImgPilGaussianBlur
      p: 0.5
      radius_max: 2.0
      radius_min: 0.1
    - name: ToTensor
    # Keys are sorted, so `mean` precedes `name` in this item.
    - mean:
      - 0.485
      - 0.456
      - 0.406
      name: Normalize
      std:
      - 0.229
      - 0.224
      - 0.225
    USE_DEBUGGING_SAMPLER: false
    USE_STATEFUL_DISTRIBUTED_SAMPLER: false
# Distributed-run settings; all keys below are children of DISTRIBUTED.
DISTRIBUTED:
  BACKEND: nccl
  BROADCAST_BUFFERS: true
  INIT_METHOD: tcp
  MANUAL_GRADIENT_REDUCTION: false
  NCCL_DEBUG: true
  # Empty string, i.e. no value supplied.
  NCCL_SOCKET_NTHREADS: ''
  # 8 nodes x 8 processes per node = 64, which matches the `world_size: 64`
  # entries under LOSS in this file.
  NUM_NODES: 8
  NUM_PROC_PER_NODE: 8
  # Placeholder value as found in the file.
  RUN_ID: xxxxxxxxxxxxxxxxxxxxxxxxxxxx
# Feature-extraction settings; both keys are children of EXTRACT_FEATURES.
EXTRACT_FEATURES:
  CHUNK_THRESHOLD: 0
  # Empty string, i.e. no output directory supplied here.
  OUTPUT_DIR: ''
# Training hook settings: two flags followed by four nested option groups
# (MEMORY_SUMMARY, MODEL_COMPLEXITY, PERF_STATS, TENSORBOARD_SETUP).
HOOKS:
  CHECK_NAN: true
  LOG_GPU_STATS: true
  MEMORY_SUMMARY:
    DUMP_MEMORY_ON_EXCEPTION: false
    LOG_ITERATION_NUM: 0
    PRINT_MEMORY_SUMMARY: true
  MODEL_COMPLEXITY:
    COMPUTE_COMPLEXITY: false
    # Three-element shape; presumably (channels, height, width) — confirm.
    INPUT_SHAPE:
    - 3
    - 224
    - 224
  PERF_STATS:
    MONITOR_PERF_STATS: true
    PERF_STAT_FREQUENCY: -1
    ROLLING_BTIME_FREQ: 313
  TENSORBOARD_SETUP:
    EXPERIMENT_LOG_DIR: tensorboard
    FLUSH_EVERY_N_MIN: 5
    LOG_DIR: .
    LOG_PARAMS: true
    LOG_PARAMS_EVERY_N_ITERS: 310
    LOG_PARAMS_GRADIENTS: true
    # The options above are configured, but TensorBoard itself is off.
    USE_TENSORBOARD: false
# Image-retrieval evaluation settings; all keys below are children of
# IMG_RETRIEVAL.
IMG_RETRIEVAL:
  CROP_QUERY_ROI: false
  DATASET_PATH: ''
  DEBUG_MODE: false
  EVAL_BINARY_PATH: ''
  EVAL_DATASET_NAME: Paris
  FEATS_PROCESSING_TYPE: ''
  GEM_POOL_POWER: 4.0
  IMG_SCALINGS:
  - 1
  NORMALIZE_FEATURES: true
  # NOTE(review): the -1 sample counts look like "use all" sentinels — confirm.
  NUM_DATABASE_SAMPLES: -1
  NUM_QUERY_SAMPLES: -1
  NUM_TRAINING_SAMPLES: -1
  N_PCA: 512
  RESIZE_IMG: 1024
  SAVE_FEATURES: false
  SAVE_RETRIEVAL_RANKINGS_SCORES: true
  SIMILARITY_MEASURE: cosine_similarity
  SPATIAL_LEVELS: 3
  TRAIN_DATASET_NAME: Oxford
  TRAIN_PCA_WHITENING: true
  USE_DISTRACTORS: false
  WHITEN_IMG_LIST: ''
# Top-level logging interval. Units are not stated in this file —
# presumably training iterations; confirm against the consumer.
LOG_FREQUENCY: 10
# Loss settings: one sub-mapping per loss type plus a `name` key.
# Nesting is restored so that repeated keys (temperature, embedding_dim,
# num_crops, queue, ...) live under their own loss instead of colliding.
LOSS:
  CrossEntropyLoss:
    ignore_index: -1
  barlow_twins_loss:
    embedding_dim: 8192
    lambda_: 0.0051
    scale_loss: 0.024
  bce_logits_multiple_output_single_target:
    normalize_output: false
    # Plain scalar `none` is a string in YAML, not null.
    reduction: none
    world_size: 1
  cross_entropy_multiple_output_single_target:
    ignore_index: -1
    normalize_output: false
    reduction: mean
    temperature: 1.0
    weight: null
  deepclusterv2_loss:
    BATCHSIZE_PER_REPLICA: 256
    DROP_LAST: true
    kmeans_iters: 10
    memory_params:
      crops_for_mb:
      - 0
      embedding_dim: 128
    num_clusters:
    - 3000
    - 3000
    - 3000
    num_crops: 2
    num_train_samples: -1
    temperature: 0.1
  dino_loss:
    crops_for_teacher:
    - 0
    - 1
    ema_center: 0.9
    momentum: 0.996
    normalize_last_layer: true
    output_dim: 65536
    student_temp: 0.1
    teacher_temp_max: 0.07
    teacher_temp_min: 0.04
    teacher_temp_warmup_iters: 37500
  moco_loss:
    embedding_dim: 128
    momentum: 0.999
    queue_size: 65536
    temperature: 0.2
  multicrop_simclr_info_nce_loss:
    buffer_params:
      effective_batch_size: 4096
      embedding_dim: 128
      world_size: 64
    num_crops: 2
    temperature: 0.1
  # Presumably selects which of the sibling sections is the active loss —
  # confirm against the consumer.
  name: simclr_info_nce_loss
  nce_loss_with_memory:
    loss_type: nce
    loss_weights:
    - 1.0
    memory_params:
      embedding_dim: 128
      memory_size: -1
      momentum: 0.5
      norm_init: true
      update_mem_on_forward: true
    negative_sampling_params:
      num_negatives: 16000
      type: random
    norm_constant: -1
    norm_embedding: true
    num_train_samples: -1
    temperature: 0.07
    update_mem_with_emb_index: -100
  simclr_info_nce_loss:
    buffer_params:
      # 8192 = 64 (DATA.TRAIN.BATCHSIZE_PER_REPLICA) x 64 (world_size)
      # x 2 (ImgReplicatePil num_times); presumably derived that way — confirm.
      effective_batch_size: 8192
      embedding_dim: 128
      world_size: 64
    temperature: 0.1
  swav_loss:
    crops_for_assign:
    - 0
    - 1
    embedding_dim: 128
    epsilon: 0.05
    normalize_last_layer: true
    num_crops: 2
    num_iters: 3
    num_prototypes:
    - 3000
    output_dir: .
    queue:
      local_queue_length: 0
      queue_length: 0
      start_iter: 0
    temp_hard_assignment_iters: 0
    temperature: 0.1
    use_double_precision: false
  swav_momentum_loss:
    crops_for_assign:
    - 0
    - 1
    embedding_dim: 128
    epsilon: 0.05
    momentum: 0.99
    momentum_eval_mode_iter_start: 0
    normalize_last_layer: true
    num_crops: 2
    num_iters: 3
    num_prototypes:
    - 3000
    queue:
      local_queue_length: 0
      queue_length: 0
      start_iter: 0
    temperature: 0.1
    use_double_precision: false
# Machine settings; DEVICE is a child of MACHINE.
MACHINE:
  DEVICE: gpu
# Meter (metric) settings: one sub-mapping per meter type plus a few
# METERS-level keys (enable_training_meter, model_output_mask, name, names).
METERS:
  accuracy_list_meter:
    meter_names: []
    num_meters: 1
    topk_values:
    - 1
  enable_training_meter: true
  mean_ap_list_meter:
    max_cpu_capacity: -1
    meter_names: []
    num_classes: 9605
    num_meters: 1
  model_output_mask: false
  # Both `name` and `names` are empty, i.e. no meter is named here.
  name: ''
  names: []
  precision_at_k_list_meter:
    meter_names: []
    num_meters: 1
    topk_values:
    - 1
  recall_at_k_list_meter:
    meter_names: []
    num_meters: 1
    topk_values:
    - 1
# Model settings: trunk/head architecture, precision, sharding, sync-BN and
# weight initialisation. Nesting is restored from the sorted key order of
# each mapping.
MODEL:
  ACTIVATION_CHECKPOINTING:
    NUM_ACTIVATION_CHECKPOINTING_SPLITS: 2
    USE_ACTIVATION_CHECKPOINTING: false
  AMP_PARAMS:
    AMP_ARGS:
      # Letter "O" followed by the digit 1 (a string).
      opt_level: O1
    AMP_TYPE: apex
    USE_AMP: false
  BASE_MODEL_NAME: multi_input_output_model
  CUDA_CACHE:
    CLEAR_CUDA_CACHE: false
    CLEAR_FREQ: 100
  # NOTE(review): EVAL_MODE_ON and FREEZE_TRUNK_ONLY are both true while
  # TRAINER.TASK_NAME in this file is self_supervision_task — confirm that
  # training with a frozen trunk is intended.
  FEATURE_EVAL_SETTINGS:
    EVAL_MODE_ON: true
    EVAL_TRUNK_AND_HEAD: false
    EXTRACT_TRUNK_FEATURES_ONLY: true
    FREEZE_TRUNK_AND_HEAD: false
    FREEZE_TRUNK_ONLY: true
    LINEAR_EVAL_FEAT_POOL_OPS_MAP: []
    SHOULD_FLATTEN_FEATS: false
  FSDP_CONFIG:
    AUTO_WRAP_THRESHOLD: 0
    bucket_cap_mb: 0
    clear_autocast_cache: true
    compute_dtype: float32
    flatten_parameters: true
    fp32_reduce_scatter: false
    mixed_precision: true
    verbose: true
  GRAD_CLIP:
    MAX_NORM: 1
    NORM_TYPE: 2
    USE_GRAD_CLIP: false
  HEAD:
    BATCHNORM_EPS: 1.0e-05
    BATCHNORM_MOMENTUM: 0.1
    # List of heads; each head is a two-item list: [type, arguments].
    PARAMS:
    - - mlp
      - dims:
        - 2048
        - 2048
        skip_last_layer_relu_bn: false
        use_relu: true
    - - mlp
      - dims:
        - 2048
        - 128
    PARAMS_MULTIPLIER: 1.0
  INPUT_TYPE: rgb
  MULTI_INPUT_HEAD_MAPPING: []
  NON_TRAINABLE_PARAMS: []
  SHARDED_DDP_SETUP:
    USE_SDP: false
    reduce_buffer_size: -1
  SINGLE_PASS_EVERY_CROP: false
  SYNC_BN_CONFIG:
    CONVERT_BN_TO_SYNC_BN: true
    # 8 equals DISTRIBUTED.NUM_PROC_PER_NODE in this file.
    GROUP_SIZE: 8
    SYNC_BN_TYPE: apex
  TEMP_FROZEN_PARAMS_ITER_MAP: []
  TRUNK:
    CONVIT:
      CLASS_TOKEN_IN_LOCAL_LAYERS: false
      LOCALITY_DIM: 10
      LOCALITY_STRENGTH: 1.0
      N_GPSA_LAYERS: 10
      USE_LOCAL_INIT: true
    EFFICIENT_NETS: {}
    # Presumably selects which sibling architecture section is used —
    # confirm against the consumer.
    NAME: resnet
    REGNET: {}
    RESNETS:
      DEPTH: 50
      GROUPNORM_GROUPS: 32
      GROUPS: 1
      LAYER4_STRIDE: 2
      NORM: BatchNorm
      STANDARDIZE_CONVOLUTIONS: false
      WIDTH_MULTIPLIER: 1
      WIDTH_PER_GROUP: 64
      ZERO_INIT_RESIDUAL: false
    VISION_TRANSFORMERS:
      ATTENTION_DROPOUT_RATE: 0
      CLASSIFIER: token
      DROPOUT_RATE: 0
      DROP_PATH_RATE: 0
      HIDDEN_DIM: 768
      IMAGE_SIZE: 224
      MLP_DIM: 3072
      NUM_HEADS: 12
      NUM_LAYERS: 12
      PATCH_SIZE: 16
      QKV_BIAS: false
      QK_SCALE: false
      name: null
    XCIT:
      ATTENTION_DROPOUT_RATE: 0
      DROPOUT_RATE: 0
      DROP_PATH_RATE: 0.05
      ETA: 1
      HIDDEN_DIM: 384
      IMAGE_SIZE: 224
      NUM_HEADS: 8
      NUM_LAYERS: 12
      PATCH_SIZE: 16
      QKV_BIAS: true
      QK_SCALE: false
      TOKENS_NORM: true
      name: null
  WEIGHTS_INIT:
    APPEND_PREFIX: ''
    # Absolute, machine-specific path.
    PARAMS_FILE: /home/thu/data/sg_data/vissl_model_ckpt/model_final_checkpoint_phase999.torch
    REMOVE_PREFIX: ''
    SKIP_LAYERS:
    - num_batches_tracked
    STATE_DICT_KEY_NAME: classy_state_dict
  _MODEL_INIT_SEED: 0
# Monitoring settings; the key below is a child of MONITORING.
MONITORING:
  # Integer 0, not a boolean; NOTE(review): presumably 0 means "off" — confirm.
  MONITOR_ACTIVATION_STATISTICS: 0
# Top-level scalar: multiprocessing method name.
MULTI_PROCESSING_METHOD: forkserver
# Nearest-neighbour evaluation settings; all keys are children of
# NEAREST_NEIGHBOR.
NEAREST_NEIGHBOR:
  L2_NORM_FEATS: false
  SIGMA: 0.1
  TOPK: 200
# Optimizer settings, including two learning-rate schedules under
# param_schedulers (`lr` and `lr_head`). Nesting is restored; the anchors
# defined under `lr` (&id001..&id005) and the aliases used under `lr_head`
# are kept exactly as they were.
OPTIMIZER:
  betas:
  - 0.9
  - 0.999
  construct_single_param_group_only: false
  head_optimizer_params:
    use_different_lr: false
    use_different_wd: false
    weight_decay: 1.0e-06
  larc_config:
    clip: false
    eps: 1.0e-08
    trust_coefficient: 0.001
  momentum: 0.9
  name: sgd
  nesterov: false
  non_regularized_parameters: []
  num_epochs: 100
  param_schedulers:
    lr:
      auto_lr_scaling:
        auto_scale: true
        base_lr_batch_size: 256
        # 0.3 x (4096 / 256) = 4.8, the peak value in `schedulers` below,
        # where 4096 = 64 per replica x 64 processes. Presumably the
        # schedule values were produced by this linear scaling — confirm.
        base_value: 0.3
        scaling_type: linear
      end_value: 0.0
      interval_scaling: &id001
      - rescaled
      - fixed
      # Two entries, one per item in `schedulers`.
      lengths: &id002
      - 0.1
      - 0.9
      # NOTE(review): milestones/values/value/start_value/end_value sit
      # next to `name: composite`; presumably leftovers for other scheduler
      # types — confirm before relying on them.
      milestones: &id003
      - 30
      - 60
      name: composite
      schedulers: &id004
      - end_value: 4.8
        name: linear
        start_value: 0.6
      - end_value: 0.0
        name: cosine
        start_value: 4.8
      start_value: 0.1
      update_interval: step
      value: 0.1
      values: &id005
      - 0.1
      - 0.01
      - 0.001
    # Same scalars as `lr`; the list-valued keys are aliases of the
    # anchors defined under `lr`.
    lr_head:
      auto_lr_scaling:
        auto_scale: true
        base_lr_batch_size: 256
        base_value: 0.3
        scaling_type: linear
      end_value: 0.0
      interval_scaling: *id001
      lengths: *id002
      milestones: *id003
      name: composite
      schedulers: *id004
      start_value: 0.1
      update_interval: step
      value: 0.1
      values: *id005
  regularize_bias: true
  regularize_bn: true
  use_larc: true
  use_zero: false
  weight_decay: 1.0e-06
# Profiling settings with two nested groups (MEMORY_PROFILING,
# RUNTIME_PROFILING). Both group switches shown here are false.
PROFILING:
  MEMORY_PROFILING:
    TRACK_BY_LAYER_MEMORY: false
  NUM_ITERATIONS: 10
  OUTPUT_FOLDER: .
  PROFILED_RANKS:
  - 0
  - 1
  RUNTIME_PROFILING:
    LEGACY_PROFILER: false
    PROFILE_CPU: true
    PROFILE_GPU: true
    USE_PROFILER: false
  START_ITERATION: 0
  STOP_TRAINING_AFTER_PROFILING: false
  WARMUP_ITERATIONS: 0
# Reproducibility settings; both keys are children of REPRODUCIBILITY.
REPRODUCIBILITY:
  # Key spelling ("CUDDN") is kept exactly as found; the consumer looks
  # keys up by name, so do not "correct" it here.
  CUDDN_DETERMINISTIC: false
  SEED_VALUE: 0
# SLURM job settings; all keys are children of SLURM. USE_SLURM is false
# in this file.
SLURM:
  ADDITIONAL_PARAMETERS: {}
  COMMENT: vissl job
  CONSTRAINT: ''
  LOG_FOLDER: .
  MEM_GB: 250
  NAME: vissl
  NUM_CPU_PER_PROC: 8
  PARTITION: ''
  PORT_ID: 40050
  TIME_HOURS: 72
  TIME_MINUTES: 0
  USE_SLURM: false
# SVM evaluation settings with two nested groups (`costs`, `low_shot`).
SVM:
  cls_list: []
  costs:
    base: -1.0
    costs_list:
    - 0.1
    - 0.01
    power_range:
    - 4
    - 20
  cross_val_folds: 3
  dual: true
  force_retrain: false
  loss: squared_hinge
  low_shot:
    dataset_name: voc
    k_values:
    - 1
    - 2
    - 4
    - 8
    - 16
    - 32
    - 64
    - 96
    sample_inds:
    - 1
    - 2
    - 3
    - 4
    - 5
  max_iter: 2000
  normalize: true
  penalty: l2
# Top-level test-phase switches. TEST_MODEL and TEST_ONLY are both false
# here; TEST_EVERY_NUM_EPOCH presumably only matters when testing is
# enabled — confirm against the consumer.
TEST_EVERY_NUM_EPOCH: 1
TEST_MODEL: false
TEST_ONLY: false
# Trainer settings; both keys are children of TRAINER.
TRAINER:
  TASK_NAME: self_supervision_task
  TRAIN_STEP_NAME: standard_train_step
# Top-level verbosity flag.
VERBOSE: false