Bangchis committed on
Commit
2e12f13
·
verified ·
1 Parent(s): 2c3e42c

best quick_fid_4096=74.421463 step=100000 at 20260310-125131-UTC

Browse files
.gitattributes CHANGED
@@ -72,3 +72,6 @@ jepa2_run/best/step_50000_20260310-104055-UTC/ocdbt.process_0/d/9cc28e3a4be684b9
72
  baseline_run_5/best/step_100000_20260310-113201-UTC/ocdbt.process_0/d/346b7e9c71ff142679ce581d849b2e0c filter=lfs diff=lfs merge=lfs -text
73
  baseline_run_5/best/step_100000_20260310-113201-UTC/ocdbt.process_0/d/675f4cf59ea1574eaf996914ea5cf049 filter=lfs diff=lfs merge=lfs -text
74
  baseline_run_5/best/step_100000_20260310-113201-UTC/ocdbt.process_0/d/d8c5ebcc3d3dfe7926042ffd5ea55592 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
72
  baseline_run_5/best/step_100000_20260310-113201-UTC/ocdbt.process_0/d/346b7e9c71ff142679ce581d849b2e0c filter=lfs diff=lfs merge=lfs -text
73
  baseline_run_5/best/step_100000_20260310-113201-UTC/ocdbt.process_0/d/675f4cf59ea1574eaf996914ea5cf049 filter=lfs diff=lfs merge=lfs -text
74
  baseline_run_5/best/step_100000_20260310-113201-UTC/ocdbt.process_0/d/d8c5ebcc3d3dfe7926042ffd5ea55592 filter=lfs diff=lfs merge=lfs -text
75
+ jepa2_run/best/step_100000_20260310-125131-UTC/ocdbt.process_0/d/2bdc3bcacc90dfaab07acc73936c810b filter=lfs diff=lfs merge=lfs -text
76
+ jepa2_run/best/step_100000_20260310-125131-UTC/ocdbt.process_0/d/862470d06a242d6137ad8eb42f6b5272 filter=lfs diff=lfs merge=lfs -text
77
+ jepa2_run/best/step_100000_20260310-125131-UTC/ocdbt.process_0/d/f24c5ceed4131d644e375425ec254cbd filter=lfs diff=lfs merge=lfs -text
jepa2_run/best/step_100000_20260310-125131-UTC/_CHECKPOINT_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"item_handlers": "orbax.checkpoint._src.handlers.pytree_checkpoint_handler.PyTreeCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1773147071629372152, "commit_timestamp_nsecs": 1773147091097202257, "custom_metadata": {}}
jepa2_run/best/step_100000_20260310-125131-UTC/_METADATA ADDED
The diff for this file is too large to render. See raw diff
 
jepa2_run/best/step_100000_20260310-125131-UTC/_sharding ADDED
The diff for this file is too large to render. See raw diff
 
jepa2_run/best/step_100000_20260310-125131-UTC/array_metadatas/process_0 ADDED
The diff for this file is too large to render. See raw diff
 
jepa2_run/best/step_100000_20260310-125131-UTC/config.json ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "mode": "jepa2",
3
+ "data_dir": "/kaggle/input/datasets/bangchi/miniimagenet256-latents-arrayrecord-sdvae",
4
+ "num_classes": 100,
5
+ "patch_size": 2,
6
+ "hidden_size": 768,
7
+ "depth": 12,
8
+ "num_heads": 12,
9
+ "mlp_ratio": 4.0,
10
+ "opt": "adam",
11
+ "lr": 0.0001,
12
+ "beta1": 0.9,
13
+ "beta2": 0.99,
14
+ "weight_decay": 0.06,
15
+ "global_batch": 128,
16
+ "steps": 200000,
17
+ "seed": 42,
18
+ "class_dropout_prob": 0.2,
19
+ "aug_flip_p": 0.5,
20
+ "aug_jitter_eps": 0.01,
21
+ "t_schedule": "uniform",
22
+ "t_lognorm_mean": -0.4,
23
+ "t_lognorm_std": 1.0,
24
+ "lambda_jepa": 0.1,
25
+ "ema_decay": 0.999,
26
+ "mask_ratio": 0.25,
27
+ "student_layer": 3,
28
+ "teacher_layer": 7,
29
+ "lambda_jepa2": 1.0,
30
+ "jepa2_split_layer": 4,
31
+ "jepa2_mask_lo": 0.2,
32
+ "jepa2_mask_hi": 0.4,
33
+ "jepa2_t_shift": 1.0,
34
+ "jepa2_alpha_lo": 1.4,
35
+ "jepa2_alpha_hi": 2.0,
36
+ "jepa2_sigreg_slices": 512,
37
+ "jepa2_sigreg_sigma": 1.0,
38
+ "jepa2_sigreg_num_points": 17,
39
+ "jepa2_sigreg_domain_lo": -5.0,
40
+ "jepa2_sigreg_domain_hi": 5.0,
41
+ "cfg_scale": 2.0,
42
+ "sample_steps": 128,
43
+ "num_sample_images": 16,
44
+ "fid_n": 4096,
45
+ "fid_cache_path": "checkpoints/fid_real_stats_4096.npz",
46
+ "fid_decode_batch": 128,
47
+ "fid_inception_batch": 128,
48
+ "log_every": 1000,
49
+ "eval_every": 5000,
50
+ "sample_every": 10000,
51
+ "fid_every": 50000,
52
+ "ckpt_every": 100000,
53
+ "run_name": "jepa2_run",
54
+ "ckpt_dir": "/kaggle/working/checkpoints_jepa2",
55
+ "best_metric": "quick_fid_4096",
56
+ "hf_repo_id": "",
57
+ "hf_username": "Bangchis",
58
+ "hf_repo_name": "soft-jepa-flow",
59
+ "hf_private": false,
60
+ "latent_size": 32,
61
+ "latent_channels": 4,
62
+ "vae_scaling_factor": 0.18215
63
+ }
jepa2_run/best/step_100000_20260310-125131-UTC/d/97cb25eab30ee92423f006c6f8ba08c5 ADDED
Binary file (7.53 kB). View file
 
jepa2_run/best/step_100000_20260310-125131-UTC/manifest.ocdbt ADDED
Binary file (118 Bytes). View file
 
jepa2_run/best/step_100000_20260310-125131-UTC/ocdbt.process_0/d/2bdc3bcacc90dfaab07acc73936c810b ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f96b68a8d4abda980dcc0af37c6c8e77813eba7c943dc147638f5a93ee367c14
3
+ size 866451456
jepa2_run/best/step_100000_20260310-125131-UTC/ocdbt.process_0/d/862470d06a242d6137ad8eb42f6b5272 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b4e9cbf1b28b95fa0325f7e832987e444fb004a43f1d5336f9553dc13167c52
3
+ size 8863744
jepa2_run/best/step_100000_20260310-125131-UTC/ocdbt.process_0/d/89c5a8d4ac4c0d673ae40bc4de67d168 ADDED
Binary file (765 Bytes). View file
 
jepa2_run/best/step_100000_20260310-125131-UTC/ocdbt.process_0/d/acdf8a577316864b77411371774cbc82 ADDED
Binary file (859 Bytes). View file
 
jepa2_run/best/step_100000_20260310-125131-UTC/ocdbt.process_0/d/eca71dd76536bd23caaa4a7886319138 ADDED
Binary file (240 Bytes). View file
 
jepa2_run/best/step_100000_20260310-125131-UTC/ocdbt.process_0/d/f24c5ceed4131d644e375425ec254cbd ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f20ed5a04280fe13cd9702b7c214f2c0b9ce2334a37581ccc4880115287d0f0c
3
+ size 1042079744
jepa2_run/best/step_100000_20260310-125131-UTC/ocdbt.process_0/manifest.ocdbt ADDED
Binary file (357 Bytes). View file