taufeeque committed on
Commit
811a8b4
•
1 Parent(s): 50e331d

Update models cache

Browse files
Files changed (18) hide show
  1. cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/act_count_ft_tkns.pkl +0 -3
  2. cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/cb_acts.pkl +0 -3
  3. cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/info.txt +0 -10
  4. cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/metrics.npy +0 -3
  5. cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/act_count_ft_tkns.pkl +0 -3
  6. cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/cb_acts.pkl +0 -3
  7. cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/demo_codes.txt +0 -12
  8. cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/info.txt +0 -10
  9. cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/metrics.npy +0 -3
  10. cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/act_count_ft_tkns.pkl +0 -0
  11. cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/cb_acts.pkl +0 -0
  12. cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/demo_codes.txt +0 -0
  13. cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/info.txt +0 -0
  14. cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/metrics.npy +0 -0
  15. cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/act_count_ft_tkns.pkl +0 -0
  16. cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/cb_acts.pkl +0 -0
  17. cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/info.txt +0 -0
  18. cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/metrics.npy +0 -0
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/act_count_ft_tkns.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3761ef12e28333f43574b945a544fbc0d2e58e9171f8c818a234c1c0cc05503
3
- size 400172
 
 
 
 
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/cb_acts.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f980fd5b9410f146d8c96c10d6782b0d2d091b3557ec204cc5deb7666ad29247
3
- size 819200181
 
 
 
 
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/info.txt DELETED
@@ -1,10 +0,0 @@
1
- num_codes: 50000
2
- cb_at: mlp
3
- ccb: False
4
- n_layers: 1
5
- n_heads: 16
6
- model_name: roneneldan/TinyStories-1Layer-21M
7
- pretrained_path: /shared/outputs/2023-08-17/03-53-15/output_main/checkpoint-10000/
8
- seed: 42
9
- max_samples: 2000
10
- dataset_name: roneneldan/TinyStories
 
 
 
 
 
 
 
 
 
 
 
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/metrics.npy DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:950f175d9e284e6efbfe7a23d2d17477a337d04005d61fbf389e683c4537219e
3
- size 619
 
 
 
 
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/act_count_ft_tkns.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5454a081fbaf5abca451fc9e913e0a239d20e4fa4ddbe889330b73780a152ee
3
- size 3201565
 
 
 
 
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/cb_acts.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8ce533d002762ea010334c8308cce352cb78aecdd035d5a4be5a20629dd0e0f
3
- size 1048577327
 
 
 
 
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/demo_codes.txt DELETED
@@ -1,12 +0,0 @@
1
-
2
- # fear and worry:
3
- layer: 0, head: 0, code: 3, num_acts: 238
4
-
5
- # where people / things have been:
6
- layer: 0, head: 0, code: 4, num_acts: 13
7
-
8
- # describing newly introduced things:
9
- layer: 0, head: 0, code: 5, num_acts: 114
10
-
11
- # dialogue that starts with "You are/must/can…":
12
- layer: 0, head: 0, code: 6, num_acts: 556
 
 
 
 
 
 
 
 
 
 
 
 
 
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/info.txt DELETED
@@ -1,10 +0,0 @@
1
- num_codes: 25000
2
- cb_at: attn_preproj
3
- ccb: True
4
- n_layers: 1
5
- n_heads: 16
6
- model_name: roneneldan/TinyStories-1Layer-21M
7
- pretrained_path: /shared/outputs/2023-08-17/03-43-18/output_main/
8
- seed: 42
9
- max_samples: 2000
10
- dataset_name: roneneldan/TinyStories
 
 
 
 
 
 
 
 
 
 
 
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/metrics.npy DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:06b515fcc353399ce82bff99ac0a9882480482d40b772cf6b7f7750bca32a7f1
3
- size 619
 
 
 
 
cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/act_count_ft_tkns.pkl RENAMED
File without changes
cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/cb_acts.pkl RENAMED
File without changes
cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/demo_codes.txt RENAMED
File without changes
cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/info.txt RENAMED
File without changes
cache/models/{TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47 → TinyStories-1Layer-21M_ccb_attn_preproj_2023-08-18_23-08-47}/metrics.npy RENAMED
File without changes
cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/act_count_ft_tkns.pkl RENAMED
File without changes
cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/cb_acts.pkl RENAMED
File without changes
cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/info.txt RENAMED
File without changes
cache/models/{TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56 → TinyStories-1Layer-21M_vcb_mlp_2023-08-19_02-15-56}/metrics.npy RENAMED
File without changes