nev commited on
Commit
6f58daf
·
verified ·
1 Parent(s): 595da92

Add files using upload-large-folder tool

Browse files
Files changed (50) hide show
  1. dense_features.json +1 -0
  2. latents/layers.0.post_attention_layernorm/0_26213.safetensors +3 -0
  3. latents/layers.0.post_attention_layernorm/104857_131071.safetensors +3 -0
  4. latents/layers.0.post_attention_layernorm/26214_52427.safetensors +3 -0
  5. latents/layers.0.post_attention_layernorm/52428_78642.safetensors +3 -0
  6. latents/layers.0.post_attention_layernorm/78643_104856.safetensors +3 -0
  7. latents/layers.0.post_attention_layernorm/config.json +11 -0
  8. latents/layers.1.post_attention_layernorm/0_26213.safetensors +3 -0
  9. latents/layers.1.post_attention_layernorm/104857_131071.safetensors +3 -0
  10. latents/layers.1.post_attention_layernorm/26214_52427.safetensors +3 -0
  11. latents/layers.1.post_attention_layernorm/52428_78642.safetensors +3 -0
  12. latents/layers.1.post_attention_layernorm/78643_104856.safetensors +3 -0
  13. latents/layers.1.post_attention_layernorm/config.json +11 -0
  14. latents/layers.10.post_attention_layernorm/104857_131071.safetensors +3 -0
  15. latents/layers.10.post_attention_layernorm/config.json +11 -0
  16. latents/layers.11.post_attention_layernorm/104857_131071.safetensors +3 -0
  17. latents/layers.11.post_attention_layernorm/52428_78642.safetensors +3 -0
  18. latents/layers.11.post_attention_layernorm/config.json +11 -0
  19. latents/layers.12.post_attention_layernorm/config.json +11 -0
  20. latents/layers.13.post_attention_layernorm/config.json +11 -0
  21. latents/layers.14.post_attention_layernorm/0_26213.safetensors +3 -0
  22. latents/layers.14.post_attention_layernorm/104857_131071.safetensors +3 -0
  23. latents/layers.14.post_attention_layernorm/26214_52427.safetensors +3 -0
  24. latents/layers.14.post_attention_layernorm/52428_78642.safetensors +3 -0
  25. latents/layers.14.post_attention_layernorm/78643_104856.safetensors +3 -0
  26. latents/layers.14.post_attention_layernorm/config.json +11 -0
  27. latents/layers.15.post_attention_layernorm/0_26213.safetensors +3 -0
  28. latents/layers.15.post_attention_layernorm/104857_131071.safetensors +3 -0
  29. latents/layers.15.post_attention_layernorm/26214_52427.safetensors +3 -0
  30. latents/layers.15.post_attention_layernorm/52428_78642.safetensors +3 -0
  31. latents/layers.15.post_attention_layernorm/78643_104856.safetensors +3 -0
  32. latents/layers.15.post_attention_layernorm/config.json +11 -0
  33. latents/layers.2.post_attention_layernorm/0_26213.safetensors +3 -0
  34. latents/layers.2.post_attention_layernorm/104857_131071.safetensors +3 -0
  35. latents/layers.2.post_attention_layernorm/26214_52427.safetensors +3 -0
  36. latents/layers.2.post_attention_layernorm/52428_78642.safetensors +3 -0
  37. latents/layers.2.post_attention_layernorm/78643_104856.safetensors +3 -0
  38. latents/layers.2.post_attention_layernorm/config.json +11 -0
  39. latents/layers.3.post_attention_layernorm/78643_104856.safetensors +3 -0
  40. latents/layers.3.post_attention_layernorm/config.json +11 -0
  41. latents/layers.4.post_attention_layernorm/0_26213.safetensors +3 -0
  42. latents/layers.4.post_attention_layernorm/26214_52427.safetensors +3 -0
  43. latents/layers.4.post_attention_layernorm/52428_78642.safetensors +3 -0
  44. latents/layers.4.post_attention_layernorm/config.json +11 -0
  45. latents/layers.5.post_attention_layernorm/config.json +11 -0
  46. latents/layers.6.post_attention_layernorm/config.json +11 -0
  47. latents/layers.7.post_attention_layernorm/config.json +11 -0
  48. latents/layers.8.post_attention_layernorm/config.json +11 -0
  49. latents/layers.9.post_attention_layernorm/config.json +11 -0
  50. run_config.json +66 -0
dense_features.json ADDED
@@ -0,0 +1 @@
 
 
1
+ [[5, 1502], [5, 2643], [5, 3283], [5, 5066], [5, 6263], [5, 6495], [5, 7194], [5, 9852], [5, 10223], [5, 12349], [5, 13552], [5, 17441], [5, 20347], [5, 20459], [5, 20768], [5, 21874], [5, 21888], [5, 22105], [5, 22622], [5, 24470], [5, 25077], [5, 25452], [5, 26573], [5, 27016], [5, 27593], [5, 27995], [5, 28373], [5, 30938], [5, 31326], [5, 31658], [5, 34072], [5, 34242], [5, 34376], [5, 34578], [5, 35796], [5, 36709], [5, 38481], [5, 39216], [5, 39736], [5, 39815], [5, 40240], [5, 40249], [5, 40445], [5, 40752], [5, 40776], [5, 42813], [5, 44170], [5, 45423], [5, 45735], [5, 46595], [5, 48000], [5, 48790], [5, 48817], [5, 48962], [5, 50756], [5, 51320], [5, 53481], [5, 54808], [5, 56285], [5, 56835], [5, 56845], [5, 58332], [5, 60711], [5, 61675], [5, 62382], [5, 63563], [5, 63885], [5, 64300], [5, 64872], [5, 65447], [5, 66409], [5, 66655], [5, 66936], [5, 67530], [5, 67873], [5, 68308], [5, 70931], [5, 71376], [5, 72812], [5, 72823], [5, 73514], [5, 73885], [5, 74021], [5, 74605], [5, 74632], [5, 75393], [5, 75701], [5, 76075], [5, 77842], [5, 79766], [5, 79779], [5, 80104], [5, 80200], [5, 80218], [5, 80617], [5, 80689], [5, 82296], [5, 82895], [5, 83517], [5, 83755], [5, 83783], [5, 84911], [5, 89781], [5, 91830], [5, 91954], [5, 93260], [5, 95615], [5, 96708], [5, 98594], [5, 101470], [5, 105371], [5, 105661], [5, 105843], [5, 109010], [5, 110776], [5, 110945], [5, 111138], [5, 111593], [5, 113927], [5, 114059], [5, 114156], [5, 116263], [5, 117377], [5, 118412], [5, 120671], [5, 121090], [5, 121404], [5, 123074], [5, 125286], [5, 125433], [5, 127568], [5, 127725], [5, 128665], [5, 129435], [5, 129523], [5, 130523], [8, 1191], [8, 1290], [8, 2845], [8, 2980], [8, 4568], [8, 6379], [8, 7183], [8, 8242], [8, 8412], [8, 9062], [8, 9144], [8, 9201], [8, 9219], [8, 9619], [8, 9821], [8, 10360], [8, 10442], [8, 10510], [8, 11968], [8, 12610], [8, 13610], [8, 13846], [8, 15108], [8, 15522], [8, 15575], [8, 15741], [8, 15887], [8, 16196], [8, 16479], [8, 16639], [8, 17435], [8, 18167], [8, 18544], [8, 22095], [8, 22470], [8, 23374], [8, 23530], [8, 24694], [8, 25373], [8, 25639], [8, 26161], [8, 26246], [8, 26783], [8, 28947], [8, 29124], [8, 29277], [8, 29403], [8, 29588], [8, 30086], [8, 34056], [8, 34079], [8, 34273], [8, 34274], [8, 36284], [8, 37543], [8, 38820], [8, 38929], [8, 40347], [8, 43409], [8, 43685], [8, 44299], [8, 44817], [8, 45069], [8, 46960], [8, 48984], [8, 49058], [8, 49287], [8, 49719], [8, 50782], [8, 50973], [8, 51501], [8, 52913], [8, 54597], [8, 55203], [8, 55434], [8, 57573], [8, 58608], [8, 58786], [8, 59749], [8, 60848], [8, 61805], [8, 61924], [8, 63085], [8, 63748], [8, 63964], [8, 64130], [8, 64832], [8, 65726], [8, 67215], [8, 67644], [8, 69130], [8, 69643], [8, 69795], [8, 72570], [8, 74864], [8, 75362], [8, 76578], [8, 77436], [8, 77534], [8, 78749], [8, 79181], [8, 79618], [8, 80002], [8, 80769], [8, 80993], [8, 83511], [8, 84431], [8, 85713], [8, 86398], [8, 86545], [8, 87079], [8, 87248], [8, 87316], [8, 87709], [8, 88250], [8, 89585], [8, 89615], [8, 90801], [8, 91036], [8, 91682], [8, 92519], [8, 92996], [8, 94179], [8, 94200], [8, 97317], [8, 97627], [8, 98011], [8, 98486], [8, 99554], [8, 100503], [8, 101328], [8, 101559], [8, 105263], [8, 105487], [8, 105736], [8, 106004], [8, 106372], [8, 106988], [8, 107315], [8, 107467], [8, 108077], [8, 108125], [8, 108418], [8, 108639], [8, 110803], [8, 110829], [8, 112967], [8, 115080], [8, 115540], [8, 116028], [8, 116560], [8, 117193], [8, 117652], [8, 118478], [8, 118510], [8, 118522], [8, 118628], [8, 120376], [8, 120841], [8, 121886], [8, 122671], [8, 123244], [8, 123578], [8, 123776], [8, 124545], [8, 124605], [8, 125088], [8, 125760], [8, 126909], [8, 127241], [8, 128540], [8, 129421], [8, 129696], [8, 130431], [8, 130589], [8, 131039], [11, 814], [11, 2689], [11, 2933], [11, 3490], [11, 4566], [11, 4740], [11, 5121], [11, 6000], [11, 7090], [11, 8159], [11, 9375], [11, 9895], [11, 10071], [11, 10160], [11, 10554], [11, 11909], [11, 12576], [11, 12805], [11, 14418], [11, 15850], [11, 17555], [11, 17665], [11, 18046], [11, 20473], [11, 20900], [11, 20949], [11, 21331], [11, 21334], [11, 21404], [11, 22424], [11, 24095], [11, 24392], [11, 25340], [11, 26092], [11, 27910], [11, 28223], [11, 28821], [11, 29168], [11, 30134], [11, 30532], [11, 30625], [11, 30897], [11, 31580], [11, 33722], [11, 33878], [11, 34828], [11, 35524], [11, 35854], [11, 36112], [11, 36365], [11, 38370], [11, 38641], [11, 38677], [11, 39745], [11, 41685], [11, 42534], [11, 42569], [11, 42790], [11, 43916], [11, 44016], [11, 44707], [11, 44759], [11, 45422], [11, 47312], [11, 47777], [11, 48303], [11, 49897], [11, 51175], [11, 52507], [11, 55107], [11, 55906], [11, 56301], [11, 56769], [11, 56944], [11, 58111], [11, 58972], [11, 59638], [11, 61560], [11, 62857], [11, 63219], [11, 63761], [11, 66767], [11, 67072], [11, 68470], [11, 70069], [11, 70127], [11, 70568], [11, 72143], [11, 73154], [11, 73469], [11, 74399], [11, 74897], [11, 75396], [11, 75486], [11, 77275], [11, 77649], [11, 77792], [11, 78224], [11, 78792], [11, 79600], [11, 80210], [11, 80229], [11, 81406], [11, 81624], [11, 82858], [11, 85078], [11, 86717], [11, 87021], [11, 87164], [11, 87716], [11, 87725], [11, 87987], [11, 89226], [11, 89515], [11, 89526], [11, 89760], [11, 89938], [11, 90041], [11, 90792], [11, 91014], [11, 91366], [11, 91917], [11, 91988], [11, 92512], [11, 92672], [11, 93771], [11, 93963], [11, 94803], [11, 96644], [11, 96781], [11, 98330], [11, 99684], [11, 100261], [11, 101543], [11, 101671], [11, 101747], [11, 102464], [11, 102847], [11, 103055], [11, 104091], [11, 104292], [11, 104375], [11, 104571], [11, 105474], [11, 105478], [11, 106622], [11, 106718], [11, 107633], [11, 108901], [11, 109243], [11, 110477], [11, 110851], [11, 111069], [11, 111197], [11, 113056], [11, 113119], [11, 114055], [11, 115931], [11, 116379], [11, 116522], [11, 116879], [11, 117421], [11, 118014], [11, 122255], [11, 122385], [11, 122468], [11, 122640], [11, 123171], [11, 123187], [11, 126509], [11, 126681], [11, 129284], [11, 129310], [11, 130198], [11, 130568], [9, 763], [9, 3270], [9, 5040], [9, 6970], [9, 7422], [9, 7921], [9, 8325], [9, 8638], [9, 8737], [9, 8743], [9, 8938], [9, 9374], [9, 10017], [9, 13117], [9, 13349], [9, 14515], [9, 16193], [9, 17219], [9, 17776], [9, 17981], [9, 18894], [9, 19189], [9, 19336], [9, 19390], [9, 19661], [9, 19914], [9, 20354], [9, 22596], [9, 24206], [9, 24539], [9, 25236], [9, 25531], [9, 27463], [9, 28155], [9, 28875], [9, 29015], [9, 30213], [9, 30735], [9, 31147], [9, 31974], [9, 32458], [9, 33649], [9, 34464], [9, 34748], [9, 35575], [9, 36812], [9, 37136], [9, 38138], [9, 38928], [9, 39128], [9, 39553], [9, 42062], [9, 42841], [9, 44470], [9, 44721], [9, 46217], [9, 46963], [9, 47336], [9, 47397], [9, 48529], [9, 50448], [9, 50552], [9, 50593], [9, 53811], [9, 54965], [9, 57988], [9, 58211], [9, 59009], [9, 59841], [9, 59991], [9, 60533], [9, 61969], [9, 61976], [9, 62092], [9, 62465], [9, 62979], [9, 64986], [9, 66649], [9, 67867], [9, 70340], [9, 73285], [9, 74964], [9, 77568], [9, 77724], [9, 79045], [9, 79302], [9, 79723], [9, 79828], [9, 79971], [9, 81107], [9, 81232], [9, 81995], [9, 84621], [9, 86299], [9, 87051], [9, 87127], [9, 87666], [9, 90562], [9, 93224], [9, 93225], [9, 95481], [9, 97139], [9, 100974], [9, 101188], [9, 102504], [9, 102516], [9, 102616], [9, 103172], [9, 104881], [9, 105279], [9, 108444], [9, 109110], [9, 109636], [9, 111986], [9, 113371], [9, 114033], [9, 114070], [9, 114884], [9, 116687], [9, 117087], [9, 117722], [9, 119319], [9, 119863], [9, 120320], [9, 120902], [9, 120989], [9, 123277], [9, 124050], [9, 124223], [9, 126884], [9, 128322], [13, 2198], [13, 2680], [13, 4197], [13, 5403], [13, 7088], [13, 7221], [13, 7348], [13, 7986], [13, 8392], [13, 9190], [13, 9856], [13, 10254], [13, 11271], [13, 12824], [13, 13510], [13, 13628], [13, 13795], [13, 14062], [13, 15029], [13, 15358], [13, 15964], [13, 16121], [13, 16423], [13, 16597], [13, 16803], [13, 16868], [13, 18278], [13, 18791], [13, 19970], [13, 20605], [13, 23766], [13, 24997], [13, 25417], [13, 27100], [13, 27773], [13, 28225], [13, 29391], [13, 29683], [13, 31104], [13, 32191], [13, 32694], [13, 33028], [13, 33704], [13, 34256], [13, 34350], [13, 34618], [13, 35338], [13, 35891], [13, 36099], [13, 36148], [13, 36797], [13, 36841], [13, 38087], [13, 38402], [13, 39430], [13, 39855], [13, 40829], [13, 41028], [13, 42104], [13, 42468], [13, 42894], [13, 43491], [13, 44663], [13, 45413], [13, 46248], [13, 46591], [13, 46727], [13, 47683], [13, 49068], [13, 49516], [13, 50177], [13, 50316], [13, 52115], [13, 52159], [13, 53238], [13, 54682], [13, 54848], [13, 56632], [13, 58176], [13, 59254], [13, 60597], [13, 60639], [13, 63843], [13, 64913], [13, 65271], [13, 65652], [13, 66117], [13, 66896], [13, 68192], [13, 69134], [13, 71554], [13, 73447], [13, 74312], [13, 74913], [13, 75020], [13, 75498], [13, 78691], [13, 79380], [13, 79861], [13, 80111], [13, 80571], [13, 80641], [13, 84266], [13, 86076], [13, 86918], [13, 87411], [13, 89408], [13, 89519], [13, 91086], [13, 94233], [13, 95901], [13, 96469], [13, 96976], [13, 97540], [13, 98164], [13, 98713], [13, 102291], [13, 103358], [13, 104180], [13, 104393], [13, 104558], [13, 105595], [13, 106378], [13, 106616], [13, 106833], [13, 107874], [13, 108003], [13, 108395], [13, 108636], [13, 108683], [13, 109256], [13, 109431], [13, 109970], [13, 110632], [13, 110711], [13, 111036], [13, 111604], [13, 112048], [13, 114560], [13, 114574], [13, 115453], [13, 116125], [13, 116442], [13, 116564], [13, 117909], [13, 119442], [13, 119661], [13, 119903], [13, 120011], [13, 120985], [13, 121392], [13, 121704], [13, 123573], [13, 123990], [13, 124866], [13, 125637], [13, 125862], [13, 126307], [13, 126360], [13, 127585], [13, 127985], [13, 128352], [13, 129146], [13, 129296], [13, 130984], [1, 29498], [1, 36059], [12, 1092], [12, 1223], [12, 1244], [12, 2775], [12, 2806], [12, 3241], [12, 3354], [12, 3454], [12, 3465], [12, 4330], [12, 5204], [12, 5974], [12, 6211], [12, 7383], [12, 7683], [12, 8173], [12, 8681], [12, 10038], [12, 10630], [12, 10906], [12, 11538], [12, 11991], [12, 12205], [12, 12659], [12, 12776], [12, 13118], [12, 13597], [12, 13652], [12, 14012], [12, 14273], [12, 14382], [12, 15172], [12, 15618], [12, 15981], [12, 16795], [12, 16929], [12, 17029], [12, 17768], [12, 17829], [12, 18315], [12, 18763], [12, 19848], [12, 20402], [12, 20866], [12, 21365], [12, 22237], [12, 22386], [12, 22707], [12, 23121], [12, 24110], [12, 24330], [12, 24616], [12, 26421], [12, 26595], [12, 26788], [12, 27161], [12, 27329], [12, 28202], [12, 28641], [12, 29057], [12, 29434], [12, 29757], [12, 31555], [12, 32124], [12, 32183], [12, 32553], [12, 32677], [12, 33020], [12, 33138], [12, 34768], [12, 35534], [12, 35919], [12, 36159], [12, 36455], [12, 36696], [12, 36821], [12, 37012], [12, 37113], [12, 37314], [12, 38387], [12, 38815], [12, 38959], [12, 39227], [12, 40335], [12, 40506], [12, 41469], [12, 41942], [12, 42282], [12, 42435], [12, 43168], [12, 43441], [12, 43946], [12, 44758], [12, 45051], [12, 45443], [12, 45556], [12, 47043], [12, 47567], [12, 47902], [12, 48530], [12, 48609], [12, 48975], [12, 49121], [12, 49897], [12, 51605], [12, 52937], [12, 53621], [12, 53970], [12, 54678], [12, 55425], [12, 55477], [12, 55707], [12, 56058], [12, 56119], [12, 57025], [12, 58568], [12, 59005], [12, 59703], [12, 59991], [12, 60422], [12, 60889], [12, 61191], [12, 61487], [12, 62184], [12, 62725], [12, 63279], [12, 64640], [12, 64792], [12, 65335], [12, 65447], [12, 66083], [12, 66308], [12, 66998], [12, 67220], [12, 67341], [12, 67507], [12, 67969], [12, 68121], [12, 68265], [12, 68472], [12, 68476], [12, 68761], [12, 70062], [12, 70628], [12, 71376], [12, 72696], [12, 73598], [12, 73931], [12, 74239], [12, 75136], [12, 75715], [12, 78988], [12, 79350], [12, 79410], [12, 79505], [12, 80122], [12, 80827], [12, 81712], [12, 82946], [12, 83048], [12, 83347], [12, 83768], [12, 84570], [12, 84633], [12, 84992], [12, 85286], [12, 86243], [12, 86387], [12, 86467], [12, 87805], [12, 88747], [12, 89133], [12, 89311], [12, 89400], [12, 89555], [12, 91794], [12, 95065], [12, 95780], [12, 96268], [12, 96509], [12, 96657], [12, 97465], [12, 97620], [12, 98401], [12, 98808], [12, 99302], [12, 99329], [12, 99397], [12, 99683], [12, 100034], [12, 100548], [12, 101765], [12, 102862], [12, 103370], [12, 104666], [12, 105153], [12, 105590], [12, 106350], [12, 107320], [12, 107334], [12, 107811], [12, 108209], [12, 108668], [12, 108722], [12, 109175], [12, 109551], [12, 109563], [12, 109754], [12, 110045], [12, 110606], [12, 111355], [12, 111377], [12, 111624], [12, 112147], [12, 112374], [12, 112394], [12, 112488], [12, 112813], [12, 113323], [12, 113369], [12, 114790], [12, 115076], [12, 115517], [12, 115531], [12, 115969], [12, 116544], [12, 117660], [12, 118312], [12, 118594], [12, 118907], [12, 119360], [12, 120199], [12, 120248], [12, 120374], [12, 120825], [12, 122655], [12, 123149], [12, 123253], [12, 123901], [12, 124285], [12, 124466], [12, 125814], [12, 126419], [12, 126494], [12, 127886], [12, 128003], [12, 128746], [12, 129892], [12, 130562], [3, 399], [3, 1582], [3, 3109], [3, 3372], [3, 3479], [3, 4158], [3, 4173], [3, 5800], [3, 6116], [3, 6880], [3, 8579], [3, 9092], [3, 9107], [3, 9755], [3, 13873], [3, 14419], [3, 15875], [3, 16867], [3, 18992], [3, 22232], [3, 23044], [3, 28353], [3, 30099], [3, 30318], [3, 30652], [3, 30968], [3, 32193], [3, 33171], [3, 34739], [3, 34749], [3, 36402], [3, 36956], [3, 39446], [3, 42073], [3, 42083], [3, 42942], [3, 43598], [3, 44093], [3, 44457], [3, 48287], [3, 48305], [3, 48835], [3, 51263], [3, 52210], [3, 52495], [3, 53500], [3, 53806], [3, 54472], [3, 55220], [3, 55495], [3, 56175], [3, 58079], [3, 59885], [3, 61224], [3, 61326], [3, 61857], [3, 62737], [3, 66279], [3, 68979], [3, 69633], [3, 69749], [3, 70439], [3, 72948], [3, 73589], [3, 75081], [3, 75194], [3, 75629], [3, 75952], [3, 76321], [3, 76408], [3, 77238], [3, 78053], [3, 80823], [3, 85235], [3, 86858], [3, 86963], [3, 87238], [3, 89231], [3, 89701], [3, 89831], [3, 90804], [3, 91348], [3, 96969], [3, 99016], [3, 100119], [3, 100785], [3, 100999], [3, 105723], [3, 106721], [3, 107014], [3, 107623], [3, 108421], [3, 110621], [3, 110760], [3, 111635], [3, 112276], [3, 112354], [3, 114374], [3, 114718], [3, 117945], [3, 120123], [3, 120680], [3, 122778], [3, 123375], [3, 124341], [3, 124525], [3, 124651], [3, 128021], [3, 129121], [3, 129699], [3, 129911], [10, 615], [10, 813], [10, 1259], [10, 3894], [10, 3899], [10, 4195], [10, 4291], [10, 6967], [10, 7355], [10, 9173], [10, 11449], [10, 15731], [10, 18210], [10, 18551], [10, 21529], [10, 22354], [10, 23793], [10, 23915], [10, 24548], [10, 24665], [10, 25037], [10, 29571], [10, 30403], [10, 31123], [10, 31561], [10, 32370], [10, 32576], [10, 32770], [10, 33498], [10, 33632], [10, 34553], [10, 35679], [10, 39052], [10, 39542], [10, 39823], [10, 41282], [10, 41603], [10, 42118], [10, 42244], [10, 42949], [10, 45984], [10, 47385], [10, 49623], [10, 49719], [10, 51438], [10, 51812], [10, 56016], [10, 60323], [10, 60475], [10, 61077], [10, 62001], [10, 62675], [10, 64859], [10, 65069], [10, 65071], [10, 65573], [10, 68127], [10, 69221], [10, 70311], [10, 70326], [10, 71849], [10, 72338], [10, 72622], [10, 73252], [10, 76282], [10, 81342], [10, 83469], [10, 84288], [10, 84363], [10, 85519], [10, 86865], [10, 88198], [10, 88693], [10, 92011], [10, 92044], [10, 92149], [10, 92455], [10, 92968], [10, 93004], [10, 93370], [10, 93410], [10, 93890], [10, 94223], [10, 94351], [10, 94711], [10, 96451], [10, 99165], [10, 100763], [10, 101648], [10, 102333], [10, 103375], [10, 108049], [10, 108347], [10, 109242], [10, 109809], [10, 111978], [10, 113467], [10, 114596], [10, 116886], [10, 117209], [10, 118222], [10, 118663], [10, 118839], [10, 119263], [10, 119291], [10, 119469], [10, 119940], [10, 120527], [10, 121378], [10, 122092], [10, 123056], [10, 123327], [10, 123499], [10, 123739], [10, 124016], [10, 125751], [10, 127463], [10, 128934], [10, 129279], [10, 129669], [10, 130705], [10, 130936], [15, 5655], [15, 7806], [15, 15684], [15, 27613], [15, 31718], [15, 31806], [15, 35345], [15, 38337], [15, 44841], [15, 49221], [15, 51207], [15, 53342], [15, 60525], [15, 61338], [15, 68593], [15, 69805], [15, 70569], [15, 71672], [15, 72888], [15, 79140], [15, 97560], [15, 106143], [15, 115479], [15, 117247], [15, 117621], [15, 119319], [15, 121948], [15, 121959], [6, 2342], [6, 2501], [6, 2568], [6, 4804], [6, 5608], [6, 6226], [6, 6274], [6, 7032], [6, 7890], [6, 8623], [6, 8631], [6, 10239], [6, 10896], [6, 12317], [6, 12544], [6, 12933], [6, 13140], [6, 14344], [6, 15605], [6, 16656], [6, 17235], [6, 17358], [6, 17807], [6, 19396], [6, 19497], [6, 19726], [6, 19992], [6, 20396], [6, 23403], [6, 23484], [6, 23870], [6, 23929], [6, 24341], [6, 24372], [6, 25498], [6, 26140], [6, 26668], [6, 27650], [6, 28046], [6, 29116], [6, 29601], [6, 30750], [6, 31220], [6, 31613], [6, 33632], [6, 33637], [6, 33701], [6, 34389], [6, 35855], [6, 37121], [6, 39122], [6, 39595], [6, 40034], [6, 41534], [6, 41916], [6, 42542], [6, 43114], [6, 43335], [6, 43459], [6, 44044], [6, 44419], [6, 47772], [6, 50450], [6, 51250], [6, 51657], [6, 51797], [6, 52051], [6, 53839], [6, 55172], [6, 56394], [6, 56861], [6, 58047], [6, 59298], [6, 60093], [6, 60235], [6, 60623], [6, 61394], [6, 61798], [6, 63416], [6, 64018], [6, 64167], [6, 64232], [6, 64869], [6, 66612], [6, 68939], [6, 69883], [6, 70278], [6, 71091], [6, 71464], [6, 71607], [6, 76720], [6, 79601], [6, 80743], [6, 81090], [6, 81119], [6, 82528], [6, 82884], [6, 83506], [6, 83791], [6, 85060], [6, 85309], [6, 85922], [6, 86521], [6, 87641], [6, 87669], [6, 87718], [6, 88914], [6, 89117], [6, 89730], [6, 91283], [6, 93868], [6, 94845], [6, 94892], [6, 95379], [6, 95972], [6, 97365], [6, 97436], [6, 97978], [6, 98126], [6, 98478], [6, 99529], [6, 100055], [6, 102723], [6, 104486], [6, 104960], [6, 106582], [6, 107481], [6, 107955], [6, 112128], [6, 114106], [6, 114839], [6, 114925], [6, 116366], [6, 117615], [6, 118909], [6, 119213], [6, 119425], [6, 119819], [6, 122942], [6, 123539], [6, 125623], [6, 125805], [6, 127416], [6, 127941], [6, 128100], [2, 5087], [2, 5605], [2, 9085], [2, 9565], [2, 12375], [2, 14067], [2, 14396], [2, 15537], [2, 17373], [2, 18533], [2, 19372], [2, 20716], [2, 24659], [2, 26393], [2, 26641], [2, 30905], [2, 31346], [2, 34287], [2, 35803], [2, 35910], [2, 37229], [2, 40340], [2, 40362], [2, 43165], [2, 47244], [2, 49519], [2, 50620], [2, 50940], [2, 52792], [2, 53131], [2, 53795], [2, 56031], [2, 56717], [2, 57930], [2, 60206], [2, 66344], [2, 66431], [2, 66785], [2, 66822], [2, 67088], [2, 68219], [2, 68722], [2, 68882], [2, 69717], [2, 69927], [2, 70832], [2, 70836], [2, 70887], [2, 74155], [2, 74323], [2, 78650], [2, 81749], [2, 82502], [2, 83362], [2, 84123], [2, 86163], [2, 86492], [2, 88552], [2, 88878], [2, 89299], [2, 89424], [2, 89433], [2, 89776], [2, 90306], [2, 92117], [2, 93062], [2, 93721], [2, 94163], [2, 94358], [2, 94827], [2, 95358], [2, 96552], [2, 96757], [2, 98987], [2, 100072], [2, 100188], [2, 101693], [2, 102112], [2, 104719], [2, 108062], [2, 108366], [2, 109651], [2, 110099], [2, 110480], [2, 112325], [2, 113087], [2, 119717], [2, 121175], [2, 121227], [2, 122817], [2, 123668], [2, 124659], [2, 125262], [2, 127226], [2, 127306], [2, 128070], [2, 129849], [4, 263], [4, 617], [4, 3666], [4, 7339], [4, 9419], [4, 9598], [4, 10747], [4, 11134], [4, 13162], [4, 16673], [4, 17291], [4, 18964], [4, 19540], [4, 21858], [4, 23349], [4, 23787], [4, 24580], [4, 26593], [4, 27071], [4, 29659], [4, 29927], [4, 32080], [4, 32178], [4, 35997], [4, 36375], [4, 38708], [4, 39099], [4, 41357], [4, 41593], [4, 41695], [4, 43604], [4, 46561], [4, 49682], [4, 51016], [4, 51842], [4, 51886], [4, 53623], [4, 54311], [4, 54540], [4, 55131], [4, 57286], [4, 62798], [4, 65190], [4, 66880], [4, 69683], [4, 69726], [4, 69974], [4, 70511], [4, 76366], [4, 76822], [4, 77488], [4, 78318], [4, 79730], [4, 80497], [4, 83655], [4, 85670], [4, 88360], [4, 91468], [4, 93563], [4, 95104], [4, 96048], [4, 98420], [4, 102769], [4, 104288], [4, 105171], [4, 106768], [4, 107481], [4, 110242], [4, 110245], [4, 110318], [4, 110617], [4, 111824], [4, 114310], [4, 114749], [4, 116151], [4, 117471], [4, 118260], [4, 123070], [4, 128617], [4, 129834], [4, 130009], [4, 130098], [4, 130492], [4, 130637], [7, 410], [7, 1862], [7, 1883], [7, 2496], [7, 3131], [7, 3246], [7, 3546], [7, 4260], [7, 4307], [7, 6168], [7, 6537], [7, 7081], [7, 7154], [7, 7693], [7, 8842], [7, 10301], [7, 13885], [7, 14998], [7, 15165], [7, 15280], [7, 18481], [7, 19714], [7, 20258], [7, 21719], [7, 22081], [7, 23368], [7, 23426], [7, 25608], [7, 25613], [7, 25836], [7, 28279], [7, 28486], [7, 28945], [7, 28995], [7, 29194], [7, 29267], [7, 30131], [7, 31751], [7, 32801], [7, 33970], [7, 36312], [7, 36846], [7, 38730], [7, 39516], [7, 41095], [7, 41640], [7, 44254], [7, 46074], [7, 48464], [7, 50283], [7, 51545], [7, 53009], [7, 53241], [7, 53977], [7, 54488], [7, 55678], [7, 57285], [7, 57582], [7, 57717], [7, 58980], [7, 59206], [7, 59353], [7, 59790], [7, 65574], [7, 68282], [7, 68904], [7, 69407], [7, 69767], [7, 70473], [7, 72326], [7, 73018], [7, 73124], [7, 73515], [7, 75386], [7, 76290], [7, 76843], [7, 77395], [7, 83817], [7, 85231], [7, 86643], [7, 88586], [7, 88949], [7, 90245], [7, 90768], [7, 91029], [7, 94115], [7, 95749], [7, 96802], [7, 97331], [7, 99056], [7, 99316], [7, 99689], [7, 102511], [7, 102908], [7, 103967], [7, 105923], [7, 109197], [7, 110546], [7, 112451], [7, 112531], [7, 114600], [7, 115952], [7, 120645], [7, 122342], [7, 122478], [7, 124415], [7, 125075], [7, 127764], [14, 3591], [14, 4765], [14, 6094], [14, 7114], [14, 8233], [14, 8772], [14, 10021], [14, 12024], [14, 12216], [14, 13329], [14, 15450], [14, 15739], [14, 16623], [14, 17038], [14, 24281], [14, 25522], [14, 27358], [14, 28280], [14, 29225], [14, 29242], [14, 29916], [14, 33437], [14, 37364], [14, 39775], [14, 41291], [14, 42192], [14, 44878], [14, 45057], [14, 46894], [14, 47146], [14, 49800], [14, 53524], [14, 54854], [14, 55163], [14, 55635], [14, 60532], [14, 62227], [14, 63524], [14, 64482], [14, 66760], [14, 67115], [14, 71071], [14, 71921], [14, 74748], [14, 75248], [14, 76760], [14, 79502], [14, 79538], [14, 80435], [14, 81965], [14, 82231], [14, 84853], [14, 86009], [14, 88088], [14, 89964], [14, 90978], [14, 93323], [14, 94074], [14, 95160], [14, 100004], [14, 103008], [14, 105532], [14, 105606], [14, 107886], [14, 110705], [14, 115817], [14, 118135], [14, 118264], [14, 118384], [14, 118682], [14, 122798], [14, 123134], [14, 123788], [14, 124408], [14, 124422], [14, 127475], [14, 129414], [14, 129767], [0, 14767]]
latents/layers.0.post_attention_layernorm/0_26213.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:806300d482218e0fe4fde02ceab2e9f981466de7b227fd8e9054738b4429e3fa
3
+ size 446183072
latents/layers.0.post_attention_layernorm/104857_131071.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:425ba375fba55c6a01f8dc3012ca19e8de17146ac429a68d7ff687dd71e08b02
3
+ size 448580320
latents/layers.0.post_attention_layernorm/26214_52427.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ab6576fe449d360d311b7fdb2e10e439b453022221a4df7c6e855a9855c6ad9
3
+ size 449512344
latents/layers.0.post_attention_layernorm/52428_78642.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5624727b42e22dfed4baa82d5dfe9f8dfda707eabdee47e5c294c19e6d57d485
3
+ size 443482768
latents/layers.0.post_attention_layernorm/78643_104856.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5727c8a60150141ba8aeb2e1f1cde1e2bc79c2054dd9dcd7b9a731b39418e1c
3
+ size 452728768
latents/layers.0.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.1.post_attention_layernorm/0_26213.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19fa708856966684080700b797603cb7dbd9073b5bc0cebb98563c4887dd9222
3
+ size 362624376
latents/layers.1.post_attention_layernorm/104857_131071.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e83257cc54a1d6d14ccf69f42f5d39f8e3a8568d7f5356fe39f895c3f062a99
3
+ size 359946000
latents/layers.1.post_attention_layernorm/26214_52427.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db974367d10cc3c4cc8c446ecefb8b78681f1d8540da8380dfde9bbecdc3de64
3
+ size 359193424
latents/layers.1.post_attention_layernorm/52428_78642.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71f277e76b5951a9ccc8253325c535bcfb79a527f8bbf5440874ed14289dc0df
3
+ size 358352824
latents/layers.1.post_attention_layernorm/78643_104856.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4b890646baa3b98bc49975ee4e643a0b413d340e52c38e0bf1880aa039b77be
3
+ size 363455120
latents/layers.1.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.10.post_attention_layernorm/104857_131071.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40b5de25c616447c582807e12c5fd2124650dff026306443bafbb8a070f14b69
3
+ size 710479648
latents/layers.10.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.11.post_attention_layernorm/104857_131071.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c504bfda93c6bc5725115fe466418045487d8f0f0a06a55277e4aa6933bc5c49
3
+ size 701753352
latents/layers.11.post_attention_layernorm/52428_78642.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd758adeb823db3fbe9e6618a045324e22406230343a122d7efee05988f77321
3
+ size 695182032
latents/layers.11.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.12.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.13.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.14.post_attention_layernorm/0_26213.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a12614861d79575fdd456644728f91c844f4e4fde474c1df805aaf0f25fb7b01
3
+ size 558420376
latents/layers.14.post_attention_layernorm/104857_131071.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e000945666616566a605c8a8970529eefa510b12a2d623148e8807f9e55470e
3
+ size 561086328
latents/layers.14.post_attention_layernorm/26214_52427.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44491f2fa857bb8a9ba0f1bde210c949fcd2c7a42c9b08f333ecc0889eb42d90
3
+ size 560728656
latents/layers.14.post_attention_layernorm/52428_78642.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ece2650f5221a5298fb7578d104bcabad7309a29787ecf15f3473e5b213e90e
3
+ size 553822416
latents/layers.14.post_attention_layernorm/78643_104856.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e7a5c2de038abd89ff448bbdfd493d4a1d0a6e2db95759918008928b2de61c5
3
+ size 549315520
latents/layers.14.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.15.post_attention_layernorm/0_26213.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b6d2fc859e7ff0d8b02aa4d038d00974e4c65cbc5285fabd07b9f56255687b2
3
+ size 247012152
latents/layers.15.post_attention_layernorm/104857_131071.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71a3080ae26d5fb517f074861082db16664ff8a95d1d658a6063b81de02bcc23
3
+ size 255860032
latents/layers.15.post_attention_layernorm/26214_52427.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:801a7a8a91000d4329dac2870835adbecde9db579ecd967aef9ab30c6844560b
3
+ size 254321752
latents/layers.15.post_attention_layernorm/52428_78642.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74f5d0945352cff03d12b7f41fcbebd618205c77cf555d8c089f1a6a73465afb
3
+ size 252963400
latents/layers.15.post_attention_layernorm/78643_104856.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3864370dad4463f1a2ecb815d948b7e8b3fae3347591274716e4547ca9c3986
3
+ size 245325512
latents/layers.15.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.2.post_attention_layernorm/0_26213.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a63afaf01a8634f51cbd8ada590d6795e52f50769797b0414e07dcaec635f325
3
+ size 636166024
latents/layers.2.post_attention_layernorm/104857_131071.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ad093c1f2b7adaaf95faf0453c9ecc131e7d973baa56603af48bdbdcab158c4
3
+ size 659874152
latents/layers.2.post_attention_layernorm/26214_52427.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:461b810ddc3ac051e1668d456534f950033bbf348f9365243167b9d1e1a50ceb
3
+ size 635751200
latents/layers.2.post_attention_layernorm/52428_78642.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8acab34c3bf7e12691763682d7c05a93720478f1b6ae2ad81846a917c6df67f5
3
+ size 638273648
latents/layers.2.post_attention_layernorm/78643_104856.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af7527870b6432b9505e7c0841d18f893293037442b48380b011ab6b1bb8d3a0
3
+ size 670748176
latents/layers.2.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.3.post_attention_layernorm/78643_104856.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbb44966c3b2024cd90f35d552f80f7d7478b3b05f0ebc36f5eda345b86d1771
3
+ size 695601824
latents/layers.3.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.4.post_attention_layernorm/0_26213.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52cba7207b6852cdd3b12ee61481e2e5825fbdec545d08927165543bb504b2b0
3
+ size 714295352
latents/layers.4.post_attention_layernorm/26214_52427.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:389c7854e0a1573f16f9eeef37020eaba5d039194a6f5f559fc601bb886f6876
3
+ size 702580200
latents/layers.4.post_attention_layernorm/52428_78642.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45a7b317279e8e040bc1827cd0b08c2b8edba341e127c3e4ca67cfade61e3400
3
+ size 692593552
latents/layers.4.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.5.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.6.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.7.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.8.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
latents/layers.9.post_attention_layernorm/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
3
+ "dataset_split": "train",
4
+ "dataset_name": "",
5
+ "dataset_column": "text",
6
+ "batch_size": 16,
7
+ "cache_ctx_len": 256,
8
+ "n_tokens": 10000000,
9
+ "n_splits": 5,
10
+ "model_name": "meta-llama/Llama-3.2-1B"
11
+ }
run_config.json ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cache_cfg": {
3
+ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
4
+ "dataset_split": "train",
5
+ "dataset_name": "",
6
+ "dataset_column": "text",
7
+ "batch_size": 16,
8
+ "cache_ctx_len": 256,
9
+ "n_tokens": 10000000,
10
+ "n_splits": 5
11
+ },
12
+ "constructor_cfg": {
13
+ "faiss_embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
14
+ "faiss_embedding_cache_dir": ".embedding_cache",
15
+ "faiss_embedding_cache_enabled": true,
16
+ "example_ctx_len": 32,
17
+ "min_examples": 200,
18
+ "n_non_activating": 50,
19
+ "center_examples": true,
20
+ "non_activating_source": "random",
21
+ "neighbours_type": "co-occurrence"
22
+ },
23
+ "sampler_cfg": {
24
+ "n_examples_train": 40,
25
+ "n_examples_test": 50,
26
+ "n_quantiles": 10,
27
+ "train_type": "quantiles",
28
+ "test_type": "quantiles",
29
+ "ratio_top": 0.2
30
+ },
31
+ "model": "meta-llama/Llama-3.2-1B",
32
+ "sparse_model": "results/llama-mntss-relu",
33
+ "hookpoints": [
34
+ "layers.0.mlp",
35
+ "layers.1.mlp",
36
+ "layers.2.mlp",
37
+ "layers.3.mlp",
38
+ "layers.4.mlp",
39
+ "layers.5.mlp",
40
+ "layers.6.mlp",
41
+ "layers.7.mlp",
42
+ "layers.8.mlp",
43
+ "layers.9.mlp",
44
+ "layers.10.mlp",
45
+ "layers.11.mlp",
46
+ "layers.12.mlp",
47
+ "layers.13.mlp",
48
+ "layers.14.mlp",
49
+ "layers.15.mlp"
50
+ ],
51
+ "explainer_model": "hugging-quants/Meta-Llama-3.1-70B-Instruct-AWQ-INT4",
52
+ "explainer_model_max_len": 5120,
53
+ "explainer_provider": "offline",
54
+ "name": "transcoder_llama_131k_mntss",
55
+ "max_latents": null,
56
+ "filter_bos": false,
57
+ "log_probs": false,
58
+ "load_in_8bit": false,
59
+ "hf_token": null,
60
+ "pipeline_num_proc": 48,
61
+ "num_gpus": 1,
62
+ "seed": 22,
63
+ "verbose": true,
64
+ "num_examples_per_scorer_prompt": 5,
65
+ "overwrite": []
66
+ }