Upload all DRIP model checkpoints
Browse files- .gitattributes +3 -0
- BioCLIP_DRIP-10x/checkpoints/epoch_30.pt +3 -0
- BioCLIP_DRIP-10x/checkpoints/results.jsonl +30 -0
- BioCLIP_DRIP-10x/out.log +3 -0
- BioCLIP_DRIP-10x/params.txt +93 -0
- BioCLIP_DRIP-10x/tensorboard/events.out.tfevents.1760642379.a0014.ten.osc.edu.3376070.0 +3 -0
- BioCLIP_DRIP-4x/checkpoints/epoch_30.pt +3 -0
- BioCLIP_DRIP-4x/checkpoints/results.jsonl +30 -0
- BioCLIP_DRIP-4x/out.log +3 -0
- BioCLIP_DRIP-4x/params.txt +93 -0
- BioCLIP_DRIP-4x/tensorboard/events.out.tfevents.1760670988.a0006.ten.osc.edu.1543726.0 +3 -0
- BioCLIP_ViT/checkpoints/epoch_30.pt +3 -0
- BioCLIP_ViT/checkpoints/results.jsonl +30 -0
- BioCLIP_ViT/out.log +3 -0
- BioCLIP_ViT/params.txt +93 -0
- BioCLIP_ViT/tensorboard/events.out.tfevents.1760540395.a0001.ten.osc.edu.3717549.0 +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
BioCLIP_DRIP-10x/out.log filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
BioCLIP_DRIP-4x/out.log filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
BioCLIP_ViT/out.log filter=lfs diff=lfs merge=lfs -text
|
BioCLIP_DRIP-10x/checkpoints/epoch_30.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6be7b97b330e20b964ffa25791763ec02feaf621d9f3425d0236b9331ceab600
|
| 3 |
+
size 1805275869
|
BioCLIP_DRIP-10x/checkpoints/results.jsonl
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"clip_val_loss": 2.5046207904815674, "epoch": 1, "num_samples": 501656}
|
| 2 |
+
{"clip_val_loss": 2.0657501220703125, "epoch": 2, "num_samples": 501656}
|
| 3 |
+
{"clip_val_loss": 1.882075309753418, "epoch": 3, "num_samples": 501656}
|
| 4 |
+
{"clip_val_loss": 1.8267585039138794, "epoch": 4, "num_samples": 501656}
|
| 5 |
+
{"clip_val_loss": 1.7504688501358032, "epoch": 5, "num_samples": 501656}
|
| 6 |
+
{"clip_val_loss": 1.6859045028686523, "epoch": 6, "num_samples": 501656}
|
| 7 |
+
{"clip_val_loss": 1.6518208980560303, "epoch": 7, "num_samples": 501656}
|
| 8 |
+
{"clip_val_loss": 1.6349964141845703, "epoch": 8, "num_samples": 501656}
|
| 9 |
+
{"clip_val_loss": 1.6101164817810059, "epoch": 9, "num_samples": 501656}
|
| 10 |
+
{"clip_val_loss": 1.5724177360534668, "epoch": 10, "num_samples": 501656}
|
| 11 |
+
{"clip_val_loss": 1.5524085760116577, "epoch": 11, "num_samples": 501656}
|
| 12 |
+
{"clip_val_loss": 1.5449659824371338, "epoch": 12, "num_samples": 501656}
|
| 13 |
+
{"clip_val_loss": 1.5371925830841064, "epoch": 13, "num_samples": 501656}
|
| 14 |
+
{"clip_val_loss": 1.5129188299179077, "epoch": 14, "num_samples": 501656}
|
| 15 |
+
{"clip_val_loss": 1.4954185485839844, "epoch": 15, "num_samples": 501656}
|
| 16 |
+
{"clip_val_loss": 1.5068094730377197, "epoch": 16, "num_samples": 501656}
|
| 17 |
+
{"clip_val_loss": 1.4935302734375, "epoch": 17, "num_samples": 501656}
|
| 18 |
+
{"clip_val_loss": 1.4834712743759155, "epoch": 18, "num_samples": 501656}
|
| 19 |
+
{"clip_val_loss": 1.4744983911514282, "epoch": 19, "num_samples": 501656}
|
| 20 |
+
{"clip_val_loss": 1.4724007844924927, "epoch": 20, "num_samples": 501656}
|
| 21 |
+
{"clip_val_loss": 1.4541399478912354, "epoch": 21, "num_samples": 501656}
|
| 22 |
+
{"clip_val_loss": 1.454805612564087, "epoch": 22, "num_samples": 501656}
|
| 23 |
+
{"clip_val_loss": 1.4473918676376343, "epoch": 23, "num_samples": 501656}
|
| 24 |
+
{"clip_val_loss": 1.4373340606689453, "epoch": 24, "num_samples": 501656}
|
| 25 |
+
{"clip_val_loss": 1.4387410879135132, "epoch": 25, "num_samples": 501656}
|
| 26 |
+
{"clip_val_loss": 1.4473508596420288, "epoch": 26, "num_samples": 501656}
|
| 27 |
+
{"clip_val_loss": 1.4411402940750122, "epoch": 27, "num_samples": 501656}
|
| 28 |
+
{"clip_val_loss": 1.4423558712005615, "epoch": 28, "num_samples": 501656}
|
| 29 |
+
{"clip_val_loss": 1.4383875131607056, "epoch": 29, "num_samples": 501656}
|
| 30 |
+
{"clip_val_loss": 1.4349430799484253, "epoch": 30, "num_samples": 501656}
|
BioCLIP_DRIP-10x/out.log
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eda17b8d4847681579765cdafc26446d68dee3fb198be4c8985d0962ee4b73e9
|
| 3 |
+
size 16101804
|
BioCLIP_DRIP-10x/params.txt
ADDED
|
@@ -0,0 +1,93 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
DTP: False
|
| 2 |
+
accum_freq: 2
|
| 3 |
+
aug_cfg: {}
|
| 4 |
+
batch_size: 512
|
| 5 |
+
beta1: 0.9
|
| 6 |
+
beta2: 0.98
|
| 7 |
+
checkpoint_path: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_16-15_19_30-model_ViT-B-16-lr_0.0001-b_512-j_8-p_amp/checkpoints
|
| 8 |
+
coca_caption_loss_weight: 2.0
|
| 9 |
+
coca_contrastive_loss_weight: 1.0
|
| 10 |
+
copy_codebase: False
|
| 11 |
+
csv_caption_key: title
|
| 12 |
+
csv_img_key: filepath
|
| 13 |
+
csv_separator:
|
| 14 |
+
dataset_resampled: True
|
| 15 |
+
dataset_type: webdataset
|
| 16 |
+
ddp_static_graph: False
|
| 17 |
+
debug: False
|
| 18 |
+
delete_previous_checkpoint: False
|
| 19 |
+
device: cuda:0
|
| 20 |
+
dist_backend: nccl
|
| 21 |
+
dist_url: env://
|
| 22 |
+
distill: False
|
| 23 |
+
distill_model: None
|
| 24 |
+
distill_pretrained: None
|
| 25 |
+
distributed: True
|
| 26 |
+
epochs: 30
|
| 27 |
+
epochs_cooldown: None
|
| 28 |
+
eps: 1e-06
|
| 29 |
+
force_custom_text: False
|
| 30 |
+
force_image_size: None
|
| 31 |
+
force_patch_dropout: None
|
| 32 |
+
force_quick_gelu: False
|
| 33 |
+
gather_with_grad: False
|
| 34 |
+
grad_checkpointing: False
|
| 35 |
+
grad_clip_norm: None
|
| 36 |
+
horovod: False
|
| 37 |
+
image_mean: [0.485, 0.456, 0.406]
|
| 38 |
+
image_std: [0.229, 0.224, 0.225]
|
| 39 |
+
imagenet_v2: None
|
| 40 |
+
imagenet_val: None
|
| 41 |
+
local_loss: False
|
| 42 |
+
local_rank: 0
|
| 43 |
+
lock_image: False
|
| 44 |
+
lock_image_freeze_bn_stats: False
|
| 45 |
+
lock_image_unlocked_groups: 0
|
| 46 |
+
lock_text: False
|
| 47 |
+
lock_text_freeze_layer_norm: False
|
| 48 |
+
lock_text_unlocked_layers: 0
|
| 49 |
+
log_every_n_steps: 1
|
| 50 |
+
log_level: 20
|
| 51 |
+
log_local: False
|
| 52 |
+
log_path: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_16-15_19_30-model_ViT-B-16-lr_0.0001-b_512-j_8-p_amp/out.log
|
| 53 |
+
logs: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP
|
| 54 |
+
lr: 0.0001
|
| 55 |
+
lr_cooldown_end: 0.0
|
| 56 |
+
lr_cooldown_power: 1.0
|
| 57 |
+
lr_scheduler: cosine
|
| 58 |
+
model: ViT-B-16
|
| 59 |
+
name: 2025_10_16-15_19_30-model_ViT-B-16-lr_0.0001-b_512-j_8-p_amp
|
| 60 |
+
no_set_device_rank: False
|
| 61 |
+
precision: amp
|
| 62 |
+
pretrained: /fs/scratch/PAS2836/yusenpeng_checkpoint/CLIP/DRIP_10x_16_ViT_4_8/checkpoints/epoch_15.pt
|
| 63 |
+
pretrained_image: False
|
| 64 |
+
rank: 0
|
| 65 |
+
remote_sync: None
|
| 66 |
+
remote_sync_frequency: 300
|
| 67 |
+
remote_sync_protocol: s3
|
| 68 |
+
report_to: tensorboard
|
| 69 |
+
resume: None
|
| 70 |
+
save_frequency: 1
|
| 71 |
+
save_most_recent: False
|
| 72 |
+
seed: 0
|
| 73 |
+
skip_scheduler: False
|
| 74 |
+
tensorboard: True
|
| 75 |
+
tensorboard_path: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_16-15_19_30-model_ViT-B-16-lr_0.0001-b_512-j_8-p_amp/tensorboard
|
| 76 |
+
text_type: random
|
| 77 |
+
torchscript: False
|
| 78 |
+
trace: False
|
| 79 |
+
train_data: /fs/scratch/PAS2836/yusenpeng_dataset/bioclip/data/TreeOfLife-10M/dataset/evobio10m-CVPR-2024/224x224/train/shard-{000000..000164}.tar
|
| 80 |
+
train_data_upsampling_factors: None
|
| 81 |
+
train_num_samples: 10000000
|
| 82 |
+
use_bn_sync: False
|
| 83 |
+
val_data: /fs/scratch/PAS2836/yusenpeng_dataset/bioclip/data/TreeOfLife-10M/dataset/evobio10m-CVPR-2024/224x224/val/shard-{000000..000034}.tar
|
| 84 |
+
val_frequency: 1
|
| 85 |
+
val_num_samples: 500000
|
| 86 |
+
wandb: False
|
| 87 |
+
wandb_notes:
|
| 88 |
+
wandb_project_name: open-clip
|
| 89 |
+
warmup: 1000
|
| 90 |
+
wd: 0.2
|
| 91 |
+
workers: 8
|
| 92 |
+
world_size: 4
|
| 93 |
+
zeroshot_frequency: 2
|
BioCLIP_DRIP-10x/tensorboard/events.out.tfevents.1760642379.a0014.ten.osc.edu.3376070.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98fbd0a60dadd69cb856761e94b28c6eea3158471680dabb050a79829fe9c9ff
|
| 3 |
+
size 33453186
|
BioCLIP_DRIP-4x/checkpoints/epoch_30.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25e9b64f8b572e5cf5aed00ea5c3b9075f89f879d9ab700f7de225593ff6867f
|
| 3 |
+
size 1805275869
|
BioCLIP_DRIP-4x/checkpoints/results.jsonl
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"clip_val_loss": 2.4348039627075195, "epoch": 1, "num_samples": 501656}
|
| 2 |
+
{"clip_val_loss": 2.004694700241089, "epoch": 2, "num_samples": 501656}
|
| 3 |
+
{"clip_val_loss": 1.859370470046997, "epoch": 3, "num_samples": 501656}
|
| 4 |
+
{"clip_val_loss": 1.9185363054275513, "epoch": 4, "num_samples": 501656}
|
| 5 |
+
{"clip_val_loss": 1.7297427654266357, "epoch": 5, "num_samples": 501656}
|
| 6 |
+
{"clip_val_loss": 1.6583002805709839, "epoch": 6, "num_samples": 501656}
|
| 7 |
+
{"clip_val_loss": 1.6416922807693481, "epoch": 7, "num_samples": 501656}
|
| 8 |
+
{"clip_val_loss": 1.619407057762146, "epoch": 8, "num_samples": 501656}
|
| 9 |
+
{"clip_val_loss": 1.6424254179000854, "epoch": 9, "num_samples": 501656}
|
| 10 |
+
{"clip_val_loss": 1.562835454940796, "epoch": 10, "num_samples": 501656}
|
| 11 |
+
{"clip_val_loss": 1.5434213876724243, "epoch": 11, "num_samples": 501656}
|
| 12 |
+
{"clip_val_loss": 1.530497431755066, "epoch": 12, "num_samples": 501656}
|
| 13 |
+
{"clip_val_loss": 1.5290805101394653, "epoch": 13, "num_samples": 501656}
|
| 14 |
+
{"clip_val_loss": 1.490039587020874, "epoch": 14, "num_samples": 501656}
|
| 15 |
+
{"clip_val_loss": 1.4832487106323242, "epoch": 15, "num_samples": 501656}
|
| 16 |
+
{"clip_val_loss": 1.4945603609085083, "epoch": 16, "num_samples": 501656}
|
| 17 |
+
{"clip_val_loss": 1.47165846824646, "epoch": 17, "num_samples": 501656}
|
| 18 |
+
{"clip_val_loss": 1.4712049961090088, "epoch": 18, "num_samples": 501656}
|
| 19 |
+
{"clip_val_loss": 1.4639668464660645, "epoch": 19, "num_samples": 501656}
|
| 20 |
+
{"clip_val_loss": 1.452162742614746, "epoch": 20, "num_samples": 501656}
|
| 21 |
+
{"clip_val_loss": 1.4360315799713135, "epoch": 21, "num_samples": 501656}
|
| 22 |
+
{"clip_val_loss": 1.4377144575119019, "epoch": 22, "num_samples": 501656}
|
| 23 |
+
{"clip_val_loss": 1.4283307790756226, "epoch": 23, "num_samples": 501656}
|
| 24 |
+
{"clip_val_loss": 1.4263763427734375, "epoch": 24, "num_samples": 501656}
|
| 25 |
+
{"clip_val_loss": 1.4236398935317993, "epoch": 25, "num_samples": 501656}
|
| 26 |
+
{"clip_val_loss": 1.4321935176849365, "epoch": 26, "num_samples": 501656}
|
| 27 |
+
{"clip_val_loss": 1.4234939813613892, "epoch": 27, "num_samples": 501656}
|
| 28 |
+
{"clip_val_loss": 1.4241715669631958, "epoch": 28, "num_samples": 501656}
|
| 29 |
+
{"clip_val_loss": 1.420454740524292, "epoch": 29, "num_samples": 501656}
|
| 30 |
+
{"clip_val_loss": 1.4174911975860596, "epoch": 30, "num_samples": 501656}
|
BioCLIP_DRIP-4x/out.log
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d77b5c115a40ac98712496616d4f6f0cacfa60ebd1c33ab40144e06b35de8c1d
|
| 3 |
+
size 16101300
|
BioCLIP_DRIP-4x/params.txt
ADDED
|
@@ -0,0 +1,93 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
DTP: False
|
| 2 |
+
accum_freq: 2
|
| 3 |
+
aug_cfg: {}
|
| 4 |
+
batch_size: 512
|
| 5 |
+
beta1: 0.9
|
| 6 |
+
beta2: 0.98
|
| 7 |
+
checkpoint_path: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_16-23_16_19-model_ViT-B-16-lr_0.0001-b_512-j_8-p_amp/checkpoints
|
| 8 |
+
coca_caption_loss_weight: 2.0
|
| 9 |
+
coca_contrastive_loss_weight: 1.0
|
| 10 |
+
copy_codebase: False
|
| 11 |
+
csv_caption_key: title
|
| 12 |
+
csv_img_key: filepath
|
| 13 |
+
csv_separator:
|
| 14 |
+
dataset_resampled: True
|
| 15 |
+
dataset_type: webdataset
|
| 16 |
+
ddp_static_graph: False
|
| 17 |
+
debug: False
|
| 18 |
+
delete_previous_checkpoint: False
|
| 19 |
+
device: cuda:0
|
| 20 |
+
dist_backend: nccl
|
| 21 |
+
dist_url: env://
|
| 22 |
+
distill: False
|
| 23 |
+
distill_model: None
|
| 24 |
+
distill_pretrained: None
|
| 25 |
+
distributed: True
|
| 26 |
+
epochs: 30
|
| 27 |
+
epochs_cooldown: None
|
| 28 |
+
eps: 1e-06
|
| 29 |
+
force_custom_text: False
|
| 30 |
+
force_image_size: None
|
| 31 |
+
force_patch_dropout: None
|
| 32 |
+
force_quick_gelu: False
|
| 33 |
+
gather_with_grad: False
|
| 34 |
+
grad_checkpointing: False
|
| 35 |
+
grad_clip_norm: None
|
| 36 |
+
horovod: False
|
| 37 |
+
image_mean: [0.485, 0.456, 0.406]
|
| 38 |
+
image_std: [0.229, 0.224, 0.225]
|
| 39 |
+
imagenet_v2: None
|
| 40 |
+
imagenet_val: None
|
| 41 |
+
local_loss: False
|
| 42 |
+
local_rank: 0
|
| 43 |
+
lock_image: False
|
| 44 |
+
lock_image_freeze_bn_stats: False
|
| 45 |
+
lock_image_unlocked_groups: 0
|
| 46 |
+
lock_text: False
|
| 47 |
+
lock_text_freeze_layer_norm: False
|
| 48 |
+
lock_text_unlocked_layers: 0
|
| 49 |
+
log_every_n_steps: 1
|
| 50 |
+
log_level: 20
|
| 51 |
+
log_local: False
|
| 52 |
+
log_path: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_16-23_16_19-model_ViT-B-16-lr_0.0001-b_512-j_8-p_amp/out.log
|
| 53 |
+
logs: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP
|
| 54 |
+
lr: 0.0001
|
| 55 |
+
lr_cooldown_end: 0.0
|
| 56 |
+
lr_cooldown_power: 1.0
|
| 57 |
+
lr_scheduler: cosine
|
| 58 |
+
model: ViT-B-16
|
| 59 |
+
name: 2025_10_16-23_16_19-model_ViT-B-16-lr_0.0001-b_512-j_8-p_amp
|
| 60 |
+
no_set_device_rank: False
|
| 61 |
+
precision: amp
|
| 62 |
+
pretrained: /fs/scratch/PAS2836/yusenpeng_checkpoint/CLIP/DRIP_4x_16_ViT_4_8/checkpoints/epoch_15.pt
|
| 63 |
+
pretrained_image: False
|
| 64 |
+
rank: 0
|
| 65 |
+
remote_sync: None
|
| 66 |
+
remote_sync_frequency: 300
|
| 67 |
+
remote_sync_protocol: s3
|
| 68 |
+
report_to: tensorboard
|
| 69 |
+
resume: None
|
| 70 |
+
save_frequency: 1
|
| 71 |
+
save_most_recent: False
|
| 72 |
+
seed: 0
|
| 73 |
+
skip_scheduler: False
|
| 74 |
+
tensorboard: True
|
| 75 |
+
tensorboard_path: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_16-23_16_19-model_ViT-B-16-lr_0.0001-b_512-j_8-p_amp/tensorboard
|
| 76 |
+
text_type: random
|
| 77 |
+
torchscript: False
|
| 78 |
+
trace: False
|
| 79 |
+
train_data: /fs/scratch/PAS2836/yusenpeng_dataset/bioclip/data/TreeOfLife-10M/dataset/evobio10m-CVPR-2024/224x224/train/shard-{000000..000164}.tar
|
| 80 |
+
train_data_upsampling_factors: None
|
| 81 |
+
train_num_samples: 10000000
|
| 82 |
+
use_bn_sync: False
|
| 83 |
+
val_data: /fs/scratch/PAS2836/yusenpeng_dataset/bioclip/data/TreeOfLife-10M/dataset/evobio10m-CVPR-2024/224x224/val/shard-{000000..000034}.tar
|
| 84 |
+
val_frequency: 1
|
| 85 |
+
val_num_samples: 500000
|
| 86 |
+
wandb: False
|
| 87 |
+
wandb_notes:
|
| 88 |
+
wandb_project_name: open-clip
|
| 89 |
+
warmup: 1000
|
| 90 |
+
wd: 0.2
|
| 91 |
+
workers: 8
|
| 92 |
+
world_size: 4
|
| 93 |
+
zeroshot_frequency: 2
|
BioCLIP_DRIP-4x/tensorboard/events.out.tfevents.1760670988.a0006.ten.osc.edu.1543726.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bb4c8f348f805080f0d6b9f71b7c17cf658032a128a14859b46e11972863c6d7
|
| 3 |
+
size 33453186
|
BioCLIP_ViT/checkpoints/epoch_30.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d4301d903dfa2c82741380f8cb59fc2192c8e9f9f26ada02b5d14f6919b50228
|
| 3 |
+
size 1795825309
|
BioCLIP_ViT/checkpoints/results.jsonl
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"clip_val_loss": 2.8370041847229004, "epoch": 1, "num_samples": 501656}
|
| 2 |
+
{"clip_val_loss": 2.304974317550659, "epoch": 2, "num_samples": 501656}
|
| 3 |
+
{"clip_val_loss": 2.104631185531616, "epoch": 3, "num_samples": 501656}
|
| 4 |
+
{"clip_val_loss": 2.0347816944122314, "epoch": 4, "num_samples": 501656}
|
| 5 |
+
{"clip_val_loss": 1.9566813707351685, "epoch": 5, "num_samples": 501656}
|
| 6 |
+
{"clip_val_loss": 1.8931668996810913, "epoch": 6, "num_samples": 501656}
|
| 7 |
+
{"clip_val_loss": 1.8396780490875244, "epoch": 7, "num_samples": 501656}
|
| 8 |
+
{"clip_val_loss": 1.8291608095169067, "epoch": 8, "num_samples": 501656}
|
| 9 |
+
{"clip_val_loss": 1.7909398078918457, "epoch": 9, "num_samples": 501656}
|
| 10 |
+
{"clip_val_loss": 1.7643558979034424, "epoch": 10, "num_samples": 501656}
|
| 11 |
+
{"clip_val_loss": 1.7463152408599854, "epoch": 11, "num_samples": 501656}
|
| 12 |
+
{"clip_val_loss": 1.7283272743225098, "epoch": 12, "num_samples": 501656}
|
| 13 |
+
{"clip_val_loss": 1.7322763204574585, "epoch": 13, "num_samples": 501656}
|
| 14 |
+
{"clip_val_loss": 1.7056169509887695, "epoch": 14, "num_samples": 501656}
|
| 15 |
+
{"clip_val_loss": 1.687942624092102, "epoch": 15, "num_samples": 501656}
|
| 16 |
+
{"clip_val_loss": 1.6953397989273071, "epoch": 16, "num_samples": 501656}
|
| 17 |
+
{"clip_val_loss": 1.679396629333496, "epoch": 17, "num_samples": 501656}
|
| 18 |
+
{"clip_val_loss": 1.672758936882019, "epoch": 18, "num_samples": 501656}
|
| 19 |
+
{"clip_val_loss": 1.6576241254806519, "epoch": 19, "num_samples": 501656}
|
| 20 |
+
{"clip_val_loss": 1.6537834405899048, "epoch": 20, "num_samples": 501656}
|
| 21 |
+
{"clip_val_loss": 1.6339473724365234, "epoch": 21, "num_samples": 501656}
|
| 22 |
+
{"clip_val_loss": 1.6412723064422607, "epoch": 22, "num_samples": 501656}
|
| 23 |
+
{"clip_val_loss": 1.6292186975479126, "epoch": 23, "num_samples": 501656}
|
| 24 |
+
{"clip_val_loss": 1.627284049987793, "epoch": 24, "num_samples": 501656}
|
| 25 |
+
{"clip_val_loss": 1.6244851350784302, "epoch": 25, "num_samples": 501656}
|
| 26 |
+
{"clip_val_loss": 1.6293575763702393, "epoch": 26, "num_samples": 501656}
|
| 27 |
+
{"clip_val_loss": 1.6238917112350464, "epoch": 27, "num_samples": 501656}
|
| 28 |
+
{"clip_val_loss": 1.6230109930038452, "epoch": 28, "num_samples": 501656}
|
| 29 |
+
{"clip_val_loss": 1.6196156740188599, "epoch": 29, "num_samples": 501656}
|
| 30 |
+
{"clip_val_loss": 1.6169296503067017, "epoch": 30, "num_samples": 501656}
|
BioCLIP_ViT/out.log
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d864f7effd89f4bdbceb94e28070af5503f3ab724966330380a1f955e4da318
|
| 3 |
+
size 16162494
|
BioCLIP_ViT/params.txt
ADDED
|
@@ -0,0 +1,93 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
DTP: False
|
| 2 |
+
accum_freq: 1
|
| 3 |
+
aug_cfg: {}
|
| 4 |
+
batch_size: 1024
|
| 5 |
+
beta1: 0.9
|
| 6 |
+
beta2: 0.98
|
| 7 |
+
checkpoint_path: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_15-10_59_47-model_ViT-B-16-lr_0.0001-b_1024-j_8-p_amp/checkpoints
|
| 8 |
+
coca_caption_loss_weight: 2.0
|
| 9 |
+
coca_contrastive_loss_weight: 1.0
|
| 10 |
+
copy_codebase: False
|
| 11 |
+
csv_caption_key: title
|
| 12 |
+
csv_img_key: filepath
|
| 13 |
+
csv_separator:
|
| 14 |
+
dataset_resampled: True
|
| 15 |
+
dataset_type: webdataset
|
| 16 |
+
ddp_static_graph: False
|
| 17 |
+
debug: False
|
| 18 |
+
delete_previous_checkpoint: False
|
| 19 |
+
device: cuda:0
|
| 20 |
+
dist_backend: nccl
|
| 21 |
+
dist_url: env://
|
| 22 |
+
distill: False
|
| 23 |
+
distill_model: None
|
| 24 |
+
distill_pretrained: None
|
| 25 |
+
distributed: True
|
| 26 |
+
epochs: 30
|
| 27 |
+
epochs_cooldown: None
|
| 28 |
+
eps: 1e-06
|
| 29 |
+
force_custom_text: False
|
| 30 |
+
force_image_size: None
|
| 31 |
+
force_patch_dropout: None
|
| 32 |
+
force_quick_gelu: False
|
| 33 |
+
gather_with_grad: True
|
| 34 |
+
grad_checkpointing: True
|
| 35 |
+
grad_clip_norm: None
|
| 36 |
+
horovod: False
|
| 37 |
+
image_mean: [0.485, 0.456, 0.406]
|
| 38 |
+
image_std: [0.229, 0.224, 0.225]
|
| 39 |
+
imagenet_v2: None
|
| 40 |
+
imagenet_val: None
|
| 41 |
+
local_loss: True
|
| 42 |
+
local_rank: 0
|
| 43 |
+
lock_image: False
|
| 44 |
+
lock_image_freeze_bn_stats: False
|
| 45 |
+
lock_image_unlocked_groups: 0
|
| 46 |
+
lock_text: False
|
| 47 |
+
lock_text_freeze_layer_norm: False
|
| 48 |
+
lock_text_unlocked_layers: 0
|
| 49 |
+
log_every_n_steps: 1
|
| 50 |
+
log_level: 20
|
| 51 |
+
log_local: False
|
| 52 |
+
log_path: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_15-10_59_47-model_ViT-B-16-lr_0.0001-b_1024-j_8-p_amp/out.log
|
| 53 |
+
logs: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP
|
| 54 |
+
lr: 0.0001
|
| 55 |
+
lr_cooldown_end: 0.0
|
| 56 |
+
lr_cooldown_power: 1.0
|
| 57 |
+
lr_scheduler: cosine
|
| 58 |
+
model: ViT-B-16
|
| 59 |
+
name: 2025_10_15-10_59_47-model_ViT-B-16-lr_0.0001-b_1024-j_8-p_amp
|
| 60 |
+
no_set_device_rank: False
|
| 61 |
+
precision: amp
|
| 62 |
+
pretrained: /fs/scratch/PAS2836/yusenpeng_checkpoint/CLIP/ViT_B_16/checkpoints/epoch_15.pt
|
| 63 |
+
pretrained_image: False
|
| 64 |
+
rank: 0
|
| 65 |
+
remote_sync: None
|
| 66 |
+
remote_sync_frequency: 300
|
| 67 |
+
remote_sync_protocol: s3
|
| 68 |
+
report_to: tensorboard
|
| 69 |
+
resume: None
|
| 70 |
+
save_frequency: 1
|
| 71 |
+
save_most_recent: False
|
| 72 |
+
seed: 0
|
| 73 |
+
skip_scheduler: False
|
| 74 |
+
tensorboard: True
|
| 75 |
+
tensorboard_path: /fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_15-10_59_47-model_ViT-B-16-lr_0.0001-b_1024-j_8-p_amp/tensorboard
|
| 76 |
+
text_type: random
|
| 77 |
+
torchscript: False
|
| 78 |
+
trace: False
|
| 79 |
+
train_data: /fs/scratch/PAS2836/yusenpeng_dataset/bioclip/data/TreeOfLife-10M/dataset/evobio10m-CVPR-2024/224x224/train/shard-{000000..000164}.tar
|
| 80 |
+
train_data_upsampling_factors: None
|
| 81 |
+
train_num_samples: 10000000
|
| 82 |
+
use_bn_sync: False
|
| 83 |
+
val_data: /fs/scratch/PAS2836/yusenpeng_dataset/bioclip/data/TreeOfLife-10M/dataset/evobio10m-CVPR-2024/224x224/val/shard-{000000..000034}.tar
|
| 84 |
+
val_frequency: 1
|
| 85 |
+
val_num_samples: 500000
|
| 86 |
+
wandb: False
|
| 87 |
+
wandb_notes:
|
| 88 |
+
wandb_project_name: open-clip
|
| 89 |
+
warmup: 1000
|
| 90 |
+
wd: 0.2
|
| 91 |
+
workers: 8
|
| 92 |
+
world_size: 4
|
| 93 |
+
zeroshot_frequency: 2
|
BioCLIP_ViT/tensorboard/events.out.tfevents.1760540395.a0001.ten.osc.edu.3717549.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f65828551ea71f8a48d2fc929f24ac5980751560a34bd4e6bffdd8e47df73392
|
| 3 |
+
size 33508146
|