taufeeque committed on
Commit
50e331d
1 Parent(s): 8e86792

Add tinystories model cache files

Browse files
Files changed (18) hide show
  1. cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/act_count_ft_tkns.pkl +3 -0
  2. cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/cb_acts.pkl +3 -0
  3. cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/info.txt +10 -0
  4. cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/metrics.npy +3 -0
  5. cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/act_count_ft_tkns.pkl +3 -0
  6. cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/cb_acts.pkl +3 -0
  7. cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/info.txt +10 -0
  8. cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/metrics.npy +3 -0
  9. cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/act_count_ft_tkns.pkl +3 -0
  10. cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/cb_acts.pkl +3 -0
  11. cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/demo_codes.txt +9 -0
  12. cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/info.txt +10 -0
  13. cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/metrics.npy +3 -0
  14. cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/act_count_ft_tkns.pkl +3 -0
  15. cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/cb_acts.pkl +3 -0
  16. cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/demo_codes.txt +12 -0
  17. cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/info.txt +10 -0
  18. cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/metrics.npy +3 -0
cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/act_count_ft_tkns.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a8780a33abdec2f60358bed0fd21a8a5610f35c3e3b0759f517b7bdde11ebe4
3
+ size 400172
cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/cb_acts.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15ab7ae8de8dcd8559b6858a8559c722e1c2887b063e371355dbde1a5d362ad5
3
+ size 819200181
cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/info.txt ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ num_codes: 50000
2
+ cb_at: mlp
3
+ ccb: False
4
+ n_layers: 1
5
+ n_heads: 16
6
+ model_name: roneneldan/TinyStories-1Layer-21M
7
+ pretrained_path: /shared/outputs/2023-08-17/03-53-15/output_main/
8
+ seed: 42
9
+ max_samples: 2000
10
+ dataset_name: roneneldan/TinyStories
cache/models/TinyStories-1Layer-21M#100ksteps_vcb_mlp_2023-08-19_02-15-56/metrics.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8131533bfd013b6ce186d936cb63e697c598037c97add794ab0933bb89adf690
3
+ size 619
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/act_count_ft_tkns.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3761ef12e28333f43574b945a544fbc0d2e58e9171f8c818a234c1c0cc05503
3
+ size 400172
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/cb_acts.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f980fd5b9410f146d8c96c10d6782b0d2d091b3557ec204cc5deb7666ad29247
3
+ size 819200181
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/info.txt ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ num_codes: 50000
2
+ cb_at: mlp
3
+ ccb: False
4
+ n_layers: 1
5
+ n_heads: 16
6
+ model_name: roneneldan/TinyStories-1Layer-21M
7
+ pretrained_path: /shared/outputs/2023-08-17/03-53-15/output_main/checkpoint-10000/
8
+ seed: 42
9
+ max_samples: 2000
10
+ dataset_name: roneneldan/TinyStories
cache/models/TinyStories-1Layer-21M#10ksteps_vcb_mlp_2023-08-19_02-35-26/metrics.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:950f175d9e284e6efbfe7a23d2d17477a337d04005d61fbf389e683c4537219e
3
+ size 619
cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/act_count_ft_tkns.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e758972a97ebdbe4ef6bffb70239519df798fc9c3dea334c0701fb8001463c3
3
+ size 3201565
cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/cb_acts.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c6510084cfa3824b07dafed7ab4af4751ba3155fcf53417475a4ce6791e0d40
3
+ size 1048577327
cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/demo_codes.txt ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+
2
+ # Catch/Grab/Pick:
3
+ layer: 0, head: 0, code: 1, num_acts: 234
4
+
5
+ # scared / fear:
6
+ layer: 0, head: 0, code: 3, num_acts: 428
7
+
8
+ # Dialogue that starts with "You are/must/can...":
9
+ layer: 0, head: 0, code: 6, num_acts: 654
cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/info.txt ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ num_codes: 25000
2
+ cb_at: attn_preproj
3
+ ccb: True
4
+ n_layers: 1
5
+ n_heads: 16
6
+ model_name: roneneldan/TinyStories-1Layer-21M
7
+ pretrained_path: /shared/outputs/2023-08-17/03-43-18/output_main/
8
+ seed: 42
9
+ max_samples: 2000
10
+ dataset_name: roneneldan/TinyStories
cache/models/TinyStories-1Layer-21M#new-100ksteps_ccb_attn_preproj_2023-08-18_23-08-47/metrics.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5a804661a5ce3e58e7a52455cff44d412e7a93904ec4bacb2bc6d08c41ad801
3
+ size 619
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/act_count_ft_tkns.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5454a081fbaf5abca451fc9e913e0a239d20e4fa4ddbe889330b73780a152ee
3
+ size 3201565
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/cb_acts.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8ce533d002762ea010334c8308cce352cb78aecdd035d5a4be5a20629dd0e0f
3
+ size 1048577327
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/demo_codes.txt ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ # fear and worry:
3
+ layer: 0, head: 0, code: 3, num_acts: 238
4
+
5
+ # where people / things have been:
6
+ layer: 0, head: 0, code: 4, num_acts: 13
7
+
8
+ # describing newly introduced things:
9
+ layer: 0, head: 0, code: 5, num_acts: 114
10
+
11
+ # dialogue that starts with "You are/must/can…":
12
+ layer: 0, head: 0, code: 6, num_acts: 556
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/info.txt ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ num_codes: 25000
2
+ cb_at: attn_preproj
3
+ ccb: True
4
+ n_layers: 1
5
+ n_heads: 16
6
+ model_name: roneneldan/TinyStories-1Layer-21M
7
+ pretrained_path: /shared/outputs/2023-08-17/03-43-18/output_main/
8
+ seed: 42
9
+ max_samples: 2000
10
+ dataset_name: roneneldan/TinyStories
cache/models/TinyStories-1Layer-21M#new-10ksteps_ccb_attn_preproj_2023-08-18_23-45-01/metrics.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06b515fcc353399ce82bff99ac0a9882480482d40b772cf6b7f7750bca32a7f1
3
+ size 619