best quick_fid_4096=59.362679 step=150000 at 20260311-122222-UTC
Browse files- .gitattributes +4 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/_CHECKPOINT_METADATA +1 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/_METADATA +0 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/_sharding +0 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/array_metadatas/process_0 +0 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/config.json +64 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/d/43f95ef628a8342d9c49e3fc30f1e386 +0 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/manifest.ocdbt +0 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/1924c26392e8cc48779df647479bcb99 +3 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/9486cd8a2c6c9bd8ab4b71a041b10281 +3 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/96529a28ac8ec27455670714ec4fae6c +0 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/96e654fff8d0ea948576eeb603b1a2c3 +3 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/b6e84a529c42d835f1a7f08ba9080c89 +3 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/eaa1055cf70f11c4cebd24c720d24718 +0 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/ed32b9c4ab957e7fb24d7ce85fe39f7c +0 -0
- jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/manifest.ocdbt +0 -0
.gitattributes
CHANGED
|
@@ -98,3 +98,7 @@ jepa2_run_warmup/best/step_50000_20260311-080223-UTC/ocdbt.process_0/d/e0fcbd164
|
|
| 98 |
jepa2_run_warmup/best/step_100000_20260311-101214-UTC/ocdbt.process_0/d/af335ae3c50ff8d26037bb13f10a7ad1 filter=lfs diff=lfs merge=lfs -text
|
| 99 |
jepa2_run_warmup/best/step_100000_20260311-101214-UTC/ocdbt.process_0/d/c648870cdcdcae425310ec02077584dc filter=lfs diff=lfs merge=lfs -text
|
| 100 |
jepa2_run_warmup/best/step_100000_20260311-101214-UTC/ocdbt.process_0/d/fadc696d14b122186f4956687b5284cc filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 98 |
jepa2_run_warmup/best/step_100000_20260311-101214-UTC/ocdbt.process_0/d/af335ae3c50ff8d26037bb13f10a7ad1 filter=lfs diff=lfs merge=lfs -text
|
| 99 |
jepa2_run_warmup/best/step_100000_20260311-101214-UTC/ocdbt.process_0/d/c648870cdcdcae425310ec02077584dc filter=lfs diff=lfs merge=lfs -text
|
| 100 |
jepa2_run_warmup/best/step_100000_20260311-101214-UTC/ocdbt.process_0/d/fadc696d14b122186f4956687b5284cc filter=lfs diff=lfs merge=lfs -text
|
| 101 |
+
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/1924c26392e8cc48779df647479bcb99 filter=lfs diff=lfs merge=lfs -text
|
| 102 |
+
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/9486cd8a2c6c9bd8ab4b71a041b10281 filter=lfs diff=lfs merge=lfs -text
|
| 103 |
+
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/96e654fff8d0ea948576eeb603b1a2c3 filter=lfs diff=lfs merge=lfs -text
|
| 104 |
+
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/b6e84a529c42d835f1a7f08ba9080c89 filter=lfs diff=lfs merge=lfs -text
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/_CHECKPOINT_METADATA
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"item_handlers": "orbax.checkpoint._src.handlers.pytree_checkpoint_handler.PyTreeCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1773231724610703405, "commit_timestamp_nsecs": 1773231742718358933, "custom_metadata": {}}
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/_METADATA
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/_sharding
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/array_metadatas/process_0
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/config.json
ADDED
|
@@ -0,0 +1,64 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"mode": "jepa2",
|
| 3 |
+
"data_dir": "/kaggle/input/datasets/bangchi/miniimagenet256-latents-arrayrecord-sdvae",
|
| 4 |
+
"num_classes": 100,
|
| 5 |
+
"patch_size": 2,
|
| 6 |
+
"hidden_size": 768,
|
| 7 |
+
"depth": 12,
|
| 8 |
+
"num_heads": 12,
|
| 9 |
+
"mlp_ratio": 4.0,
|
| 10 |
+
"opt": "adam",
|
| 11 |
+
"lr": 0.0001,
|
| 12 |
+
"beta1": 0.9,
|
| 13 |
+
"beta2": 0.99,
|
| 14 |
+
"weight_decay": 0.07,
|
| 15 |
+
"global_batch": 128,
|
| 16 |
+
"steps": 150000,
|
| 17 |
+
"seed": 42,
|
| 18 |
+
"class_dropout_prob": 0.2,
|
| 19 |
+
"aug_flip_p": 0.5,
|
| 20 |
+
"aug_jitter_eps": 0.01,
|
| 21 |
+
"t_schedule": "uniform",
|
| 22 |
+
"t_lognorm_mean": -0.4,
|
| 23 |
+
"t_lognorm_std": 1.0,
|
| 24 |
+
"lambda_jepa": 0.1,
|
| 25 |
+
"ema_decay": 0.999,
|
| 26 |
+
"mask_ratio": 0.25,
|
| 27 |
+
"student_layer": 3,
|
| 28 |
+
"teacher_layer": 7,
|
| 29 |
+
"lambda_jepa2": 8.0,
|
| 30 |
+
"jepa2_fm_warmup_steps": 10000,
|
| 31 |
+
"jepa2_split_layer": 4,
|
| 32 |
+
"jepa2_mask_lo": 0.2,
|
| 33 |
+
"jepa2_mask_hi": 0.4,
|
| 34 |
+
"jepa2_t_shift": 1.0,
|
| 35 |
+
"jepa2_alpha_lo": 1.4,
|
| 36 |
+
"jepa2_alpha_hi": 2.0,
|
| 37 |
+
"jepa2_sigreg_slices": 512,
|
| 38 |
+
"jepa2_sigreg_sigma": 1.0,
|
| 39 |
+
"jepa2_sigreg_num_points": 17,
|
| 40 |
+
"jepa2_sigreg_domain_lo": -5.0,
|
| 41 |
+
"jepa2_sigreg_domain_hi": 5.0,
|
| 42 |
+
"cfg_scale": 3.0,
|
| 43 |
+
"sample_steps": 128,
|
| 44 |
+
"num_sample_images": 16,
|
| 45 |
+
"fid_n": 4096,
|
| 46 |
+
"fid_cache_path": "checkpoints/fid_real_stats_4096.npz",
|
| 47 |
+
"fid_decode_batch": 128,
|
| 48 |
+
"fid_inception_batch": 128,
|
| 49 |
+
"log_every": 1000,
|
| 50 |
+
"eval_every": 5000,
|
| 51 |
+
"sample_every": 10000,
|
| 52 |
+
"fid_every": 50000,
|
| 53 |
+
"ckpt_every": 100000,
|
| 54 |
+
"run_name": "jepa2_run_warmup",
|
| 55 |
+
"ckpt_dir": "/kaggle/working/checkpoints_jepa2",
|
| 56 |
+
"best_metric": "quick_fid_4096",
|
| 57 |
+
"hf_repo_id": "",
|
| 58 |
+
"hf_username": "Bangchis",
|
| 59 |
+
"hf_repo_name": "soft-jepa-flow",
|
| 60 |
+
"hf_private": false,
|
| 61 |
+
"latent_size": 32,
|
| 62 |
+
"latent_channels": 4,
|
| 63 |
+
"vae_scaling_factor": 0.18215
|
| 64 |
+
}
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/d/43f95ef628a8342d9c49e3fc30f1e386
ADDED
|
Binary file (7.1 kB). View file
|
|
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/manifest.ocdbt
ADDED
|
Binary file (118 Bytes). View file
|
|
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/1924c26392e8cc48779df647479bcb99
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a4cbd2379a4cdbab1606f3325110c79dbf90247116f7fcee0ca67a277f3ac08
|
| 3 |
+
size 440815616
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/9486cd8a2c6c9bd8ab4b71a041b10281
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c04fb579b64d01eba75d185f5a3fb6e7d91b7b1b45fec43fc36b8fd38fedcac1
|
| 3 |
+
size 141516800
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/96529a28ac8ec27455670714ec4fae6c
ADDED
|
Binary file (787 Bytes). View file
|
|
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/96e654fff8d0ea948576eeb603b1a2c3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8e38c65b9e2b2485704030eea9029e0b19c02baf9626c67045da1c497fa8a79e
|
| 3 |
+
size 808329216
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/b6e84a529c42d835f1a7f08ba9080c89
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af9129280163db2eb586fdd4768c75edc0196005792e52a2a2129fa33a8475a4
|
| 3 |
+
size 531689472
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/eaa1055cf70f11c4cebd24c720d24718
ADDED
|
Binary file (198 Bytes). View file
|
|
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/d/ed32b9c4ab957e7fb24d7ce85fe39f7c
ADDED
|
Binary file (672 Bytes). View file
|
|
|
jepa2_run_warmup/best/step_150000_20260311-122222-UTC/ocdbt.process_0/manifest.ocdbt
ADDED
|
Binary file (408 Bytes). View file
|
|
|