model.safetensors.index.fp32.json 115 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266
  1. {
  2. "metadata": {
  3. "total_size": 6173962240
  4. },
  5. "weight_map": {
  6. "model.decoder.embed_positions.weight": "model.fp32-00001-of-00002.safetensors",
  7. "model.decoder.embed_tokens.weight": "model.fp32-00001-of-00002.safetensors",
  8. "model.decoder.layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  9. "model.decoder.layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  10. "model.decoder.layers.0.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  11. "model.decoder.layers.0.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  12. "model.decoder.layers.0.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  13. "model.decoder.layers.0.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  14. "model.decoder.layers.0.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  15. "model.decoder.layers.0.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  16. "model.decoder.layers.0.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  17. "model.decoder.layers.0.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  18. "model.decoder.layers.0.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  19. "model.decoder.layers.0.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  20. "model.decoder.layers.0.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  21. "model.decoder.layers.0.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  22. "model.decoder.layers.0.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  23. "model.decoder.layers.0.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  24. "model.decoder.layers.0.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  25. "model.decoder.layers.0.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  26. "model.decoder.layers.0.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  27. "model.decoder.layers.0.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  28. "model.decoder.layers.0.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  29. "model.decoder.layers.0.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  30. "model.decoder.layers.0.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  31. "model.decoder.layers.0.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  32. "model.decoder.layers.0.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  33. "model.decoder.layers.0.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  34. "model.decoder.layers.1.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  35. "model.decoder.layers.1.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  36. "model.decoder.layers.1.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  37. "model.decoder.layers.1.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  38. "model.decoder.layers.1.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  39. "model.decoder.layers.1.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  40. "model.decoder.layers.1.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  41. "model.decoder.layers.1.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  42. "model.decoder.layers.1.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  43. "model.decoder.layers.1.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  44. "model.decoder.layers.1.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  45. "model.decoder.layers.1.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  46. "model.decoder.layers.1.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  47. "model.decoder.layers.1.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  48. "model.decoder.layers.1.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  49. "model.decoder.layers.1.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  50. "model.decoder.layers.1.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  51. "model.decoder.layers.1.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  52. "model.decoder.layers.1.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  53. "model.decoder.layers.1.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  54. "model.decoder.layers.1.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  55. "model.decoder.layers.1.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  56. "model.decoder.layers.1.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  57. "model.decoder.layers.1.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  58. "model.decoder.layers.10.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  59. "model.decoder.layers.10.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  60. "model.decoder.layers.10.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  61. "model.decoder.layers.10.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  62. "model.decoder.layers.10.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  63. "model.decoder.layers.10.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  64. "model.decoder.layers.10.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  65. "model.decoder.layers.10.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  66. "model.decoder.layers.10.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  67. "model.decoder.layers.10.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  68. "model.decoder.layers.10.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  69. "model.decoder.layers.10.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  70. "model.decoder.layers.10.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  71. "model.decoder.layers.10.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  72. "model.decoder.layers.10.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  73. "model.decoder.layers.10.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  74. "model.decoder.layers.10.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  75. "model.decoder.layers.10.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  76. "model.decoder.layers.10.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  77. "model.decoder.layers.10.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  78. "model.decoder.layers.10.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  79. "model.decoder.layers.10.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  80. "model.decoder.layers.10.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  81. "model.decoder.layers.10.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  82. "model.decoder.layers.11.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  83. "model.decoder.layers.11.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  84. "model.decoder.layers.11.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  85. "model.decoder.layers.11.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  86. "model.decoder.layers.11.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  87. "model.decoder.layers.11.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  88. "model.decoder.layers.11.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  89. "model.decoder.layers.11.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  90. "model.decoder.layers.11.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  91. "model.decoder.layers.11.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  92. "model.decoder.layers.11.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  93. "model.decoder.layers.11.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  94. "model.decoder.layers.11.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  95. "model.decoder.layers.11.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  96. "model.decoder.layers.11.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  97. "model.decoder.layers.11.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  98. "model.decoder.layers.11.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  99. "model.decoder.layers.11.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  100. "model.decoder.layers.11.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  101. "model.decoder.layers.11.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  102. "model.decoder.layers.11.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  103. "model.decoder.layers.11.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  104. "model.decoder.layers.11.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  105. "model.decoder.layers.11.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  106. "model.decoder.layers.12.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  107. "model.decoder.layers.12.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  108. "model.decoder.layers.12.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  109. "model.decoder.layers.12.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  110. "model.decoder.layers.12.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  111. "model.decoder.layers.12.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  112. "model.decoder.layers.12.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  113. "model.decoder.layers.12.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  114. "model.decoder.layers.12.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  115. "model.decoder.layers.12.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  116. "model.decoder.layers.12.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  117. "model.decoder.layers.12.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  118. "model.decoder.layers.12.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  119. "model.decoder.layers.12.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  120. "model.decoder.layers.12.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  121. "model.decoder.layers.12.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  122. "model.decoder.layers.12.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  123. "model.decoder.layers.12.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  124. "model.decoder.layers.12.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  125. "model.decoder.layers.12.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  126. "model.decoder.layers.12.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  127. "model.decoder.layers.12.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  128. "model.decoder.layers.12.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  129. "model.decoder.layers.12.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  130. "model.decoder.layers.13.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  131. "model.decoder.layers.13.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  132. "model.decoder.layers.13.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  133. "model.decoder.layers.13.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  134. "model.decoder.layers.13.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  135. "model.decoder.layers.13.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  136. "model.decoder.layers.13.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  137. "model.decoder.layers.13.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  138. "model.decoder.layers.13.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  139. "model.decoder.layers.13.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  140. "model.decoder.layers.13.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  141. "model.decoder.layers.13.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  142. "model.decoder.layers.13.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  143. "model.decoder.layers.13.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  144. "model.decoder.layers.13.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  145. "model.decoder.layers.13.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  146. "model.decoder.layers.13.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  147. "model.decoder.layers.13.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  148. "model.decoder.layers.13.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  149. "model.decoder.layers.13.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  150. "model.decoder.layers.13.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  151. "model.decoder.layers.13.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  152. "model.decoder.layers.13.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  153. "model.decoder.layers.13.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  154. "model.decoder.layers.14.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  155. "model.decoder.layers.14.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  156. "model.decoder.layers.14.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  157. "model.decoder.layers.14.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  158. "model.decoder.layers.14.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  159. "model.decoder.layers.14.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  160. "model.decoder.layers.14.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  161. "model.decoder.layers.14.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  162. "model.decoder.layers.14.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  163. "model.decoder.layers.14.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  164. "model.decoder.layers.14.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  165. "model.decoder.layers.14.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  166. "model.decoder.layers.14.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  167. "model.decoder.layers.14.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  168. "model.decoder.layers.14.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  169. "model.decoder.layers.14.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  170. "model.decoder.layers.14.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  171. "model.decoder.layers.14.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  172. "model.decoder.layers.14.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  173. "model.decoder.layers.14.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  174. "model.decoder.layers.14.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  175. "model.decoder.layers.14.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  176. "model.decoder.layers.14.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  177. "model.decoder.layers.14.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  178. "model.decoder.layers.15.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  179. "model.decoder.layers.15.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  180. "model.decoder.layers.15.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  181. "model.decoder.layers.15.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  182. "model.decoder.layers.15.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  183. "model.decoder.layers.15.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  184. "model.decoder.layers.15.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  185. "model.decoder.layers.15.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  186. "model.decoder.layers.15.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  187. "model.decoder.layers.15.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  188. "model.decoder.layers.15.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  189. "model.decoder.layers.15.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  190. "model.decoder.layers.15.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  191. "model.decoder.layers.15.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  192. "model.decoder.layers.15.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  193. "model.decoder.layers.15.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  194. "model.decoder.layers.15.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  195. "model.decoder.layers.15.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  196. "model.decoder.layers.15.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  197. "model.decoder.layers.15.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  198. "model.decoder.layers.15.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  199. "model.decoder.layers.15.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  200. "model.decoder.layers.15.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  201. "model.decoder.layers.15.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  202. "model.decoder.layers.16.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  203. "model.decoder.layers.16.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  204. "model.decoder.layers.16.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  205. "model.decoder.layers.16.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  206. "model.decoder.layers.16.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  207. "model.decoder.layers.16.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  208. "model.decoder.layers.16.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  209. "model.decoder.layers.16.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  210. "model.decoder.layers.16.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  211. "model.decoder.layers.16.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  212. "model.decoder.layers.16.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  213. "model.decoder.layers.16.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  214. "model.decoder.layers.16.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  215. "model.decoder.layers.16.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  216. "model.decoder.layers.16.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  217. "model.decoder.layers.16.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  218. "model.decoder.layers.16.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  219. "model.decoder.layers.16.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  220. "model.decoder.layers.16.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  221. "model.decoder.layers.16.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  222. "model.decoder.layers.16.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  223. "model.decoder.layers.16.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  224. "model.decoder.layers.16.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  225. "model.decoder.layers.16.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  226. "model.decoder.layers.17.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  227. "model.decoder.layers.17.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  228. "model.decoder.layers.17.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  229. "model.decoder.layers.17.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  230. "model.decoder.layers.17.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  231. "model.decoder.layers.17.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  232. "model.decoder.layers.17.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  233. "model.decoder.layers.17.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  234. "model.decoder.layers.17.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  235. "model.decoder.layers.17.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  236. "model.decoder.layers.17.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  237. "model.decoder.layers.17.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  238. "model.decoder.layers.17.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  239. "model.decoder.layers.17.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  240. "model.decoder.layers.17.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  241. "model.decoder.layers.17.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  242. "model.decoder.layers.17.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  243. "model.decoder.layers.17.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  244. "model.decoder.layers.17.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  245. "model.decoder.layers.17.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  246. "model.decoder.layers.17.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  247. "model.decoder.layers.17.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  248. "model.decoder.layers.17.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  249. "model.decoder.layers.17.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  250. "model.decoder.layers.18.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  251. "model.decoder.layers.18.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  252. "model.decoder.layers.18.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  253. "model.decoder.layers.18.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  254. "model.decoder.layers.18.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  255. "model.decoder.layers.18.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  256. "model.decoder.layers.18.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  257. "model.decoder.layers.18.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  258. "model.decoder.layers.18.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  259. "model.decoder.layers.18.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  260. "model.decoder.layers.18.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  261. "model.decoder.layers.18.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  262. "model.decoder.layers.18.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  263. "model.decoder.layers.18.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  264. "model.decoder.layers.18.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  265. "model.decoder.layers.18.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  266. "model.decoder.layers.18.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  267. "model.decoder.layers.18.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  268. "model.decoder.layers.18.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  269. "model.decoder.layers.18.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  270. "model.decoder.layers.18.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  271. "model.decoder.layers.18.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  272. "model.decoder.layers.18.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  273. "model.decoder.layers.18.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  274. "model.decoder.layers.19.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  275. "model.decoder.layers.19.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  276. "model.decoder.layers.19.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  277. "model.decoder.layers.19.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  278. "model.decoder.layers.19.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  279. "model.decoder.layers.19.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  280. "model.decoder.layers.19.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  281. "model.decoder.layers.19.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  282. "model.decoder.layers.19.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  283. "model.decoder.layers.19.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  284. "model.decoder.layers.19.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  285. "model.decoder.layers.19.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  286. "model.decoder.layers.19.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  287. "model.decoder.layers.19.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  288. "model.decoder.layers.19.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  289. "model.decoder.layers.19.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  290. "model.decoder.layers.19.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  291. "model.decoder.layers.19.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  292. "model.decoder.layers.19.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  293. "model.decoder.layers.19.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  294. "model.decoder.layers.19.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  295. "model.decoder.layers.19.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  296. "model.decoder.layers.19.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  297. "model.decoder.layers.19.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  298. "model.decoder.layers.2.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  299. "model.decoder.layers.2.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  300. "model.decoder.layers.2.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  301. "model.decoder.layers.2.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  302. "model.decoder.layers.2.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  303. "model.decoder.layers.2.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  304. "model.decoder.layers.2.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  305. "model.decoder.layers.2.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  306. "model.decoder.layers.2.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  307. "model.decoder.layers.2.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  308. "model.decoder.layers.2.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  309. "model.decoder.layers.2.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  310. "model.decoder.layers.2.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  311. "model.decoder.layers.2.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  312. "model.decoder.layers.2.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  313. "model.decoder.layers.2.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  314. "model.decoder.layers.2.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  315. "model.decoder.layers.2.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  316. "model.decoder.layers.2.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  317. "model.decoder.layers.2.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  318. "model.decoder.layers.2.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  319. "model.decoder.layers.2.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  320. "model.decoder.layers.2.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  321. "model.decoder.layers.2.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  322. "model.decoder.layers.20.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  323. "model.decoder.layers.20.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  324. "model.decoder.layers.20.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  325. "model.decoder.layers.20.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  326. "model.decoder.layers.20.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  327. "model.decoder.layers.20.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  328. "model.decoder.layers.20.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  329. "model.decoder.layers.20.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  330. "model.decoder.layers.20.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  331. "model.decoder.layers.20.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  332. "model.decoder.layers.20.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  333. "model.decoder.layers.20.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  334. "model.decoder.layers.20.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  335. "model.decoder.layers.20.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  336. "model.decoder.layers.20.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  337. "model.decoder.layers.20.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  338. "model.decoder.layers.20.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  339. "model.decoder.layers.20.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  340. "model.decoder.layers.20.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  341. "model.decoder.layers.20.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  342. "model.decoder.layers.20.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  343. "model.decoder.layers.20.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  344. "model.decoder.layers.20.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  345. "model.decoder.layers.20.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  346. "model.decoder.layers.21.encoder_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  347. "model.decoder.layers.21.encoder_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  348. "model.decoder.layers.21.encoder_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  349. "model.decoder.layers.21.encoder_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  350. "model.decoder.layers.21.encoder_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  351. "model.decoder.layers.21.encoder_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  352. "model.decoder.layers.21.encoder_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  353. "model.decoder.layers.21.encoder_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  354. "model.decoder.layers.21.encoder_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  355. "model.decoder.layers.21.fc1.bias": "model.fp32-00002-of-00002.safetensors",
  356. "model.decoder.layers.21.fc1.weight": "model.fp32-00002-of-00002.safetensors",
  357. "model.decoder.layers.21.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  358. "model.decoder.layers.21.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  359. "model.decoder.layers.21.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  360. "model.decoder.layers.21.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  361. "model.decoder.layers.21.self_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  362. "model.decoder.layers.21.self_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  363. "model.decoder.layers.21.self_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  364. "model.decoder.layers.21.self_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  365. "model.decoder.layers.21.self_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  366. "model.decoder.layers.21.self_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  367. "model.decoder.layers.21.self_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  368. "model.decoder.layers.21.self_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  369. "model.decoder.layers.21.self_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  370. "model.decoder.layers.22.encoder_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  371. "model.decoder.layers.22.encoder_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  372. "model.decoder.layers.22.encoder_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  373. "model.decoder.layers.22.encoder_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  374. "model.decoder.layers.22.encoder_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  375. "model.decoder.layers.22.encoder_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  376. "model.decoder.layers.22.encoder_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  377. "model.decoder.layers.22.encoder_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  378. "model.decoder.layers.22.encoder_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  379. "model.decoder.layers.22.fc1.bias": "model.fp32-00002-of-00002.safetensors",
  380. "model.decoder.layers.22.fc1.weight": "model.fp32-00002-of-00002.safetensors",
  381. "model.decoder.layers.22.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  382. "model.decoder.layers.22.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  383. "model.decoder.layers.22.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  384. "model.decoder.layers.22.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  385. "model.decoder.layers.22.self_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  386. "model.decoder.layers.22.self_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  387. "model.decoder.layers.22.self_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  388. "model.decoder.layers.22.self_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  389. "model.decoder.layers.22.self_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  390. "model.decoder.layers.22.self_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  391. "model.decoder.layers.22.self_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  392. "model.decoder.layers.22.self_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  393. "model.decoder.layers.22.self_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  394. "model.decoder.layers.23.encoder_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  395. "model.decoder.layers.23.encoder_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  396. "model.decoder.layers.23.encoder_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  397. "model.decoder.layers.23.encoder_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  398. "model.decoder.layers.23.encoder_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  399. "model.decoder.layers.23.encoder_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  400. "model.decoder.layers.23.encoder_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  401. "model.decoder.layers.23.encoder_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  402. "model.decoder.layers.23.encoder_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  403. "model.decoder.layers.23.fc1.bias": "model.fp32-00002-of-00002.safetensors",
  404. "model.decoder.layers.23.fc1.weight": "model.fp32-00002-of-00002.safetensors",
  405. "model.decoder.layers.23.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  406. "model.decoder.layers.23.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  407. "model.decoder.layers.23.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  408. "model.decoder.layers.23.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  409. "model.decoder.layers.23.self_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  410. "model.decoder.layers.23.self_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  411. "model.decoder.layers.23.self_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  412. "model.decoder.layers.23.self_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  413. "model.decoder.layers.23.self_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  414. "model.decoder.layers.23.self_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  415. "model.decoder.layers.23.self_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  416. "model.decoder.layers.23.self_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  417. "model.decoder.layers.23.self_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  418. "model.decoder.layers.24.encoder_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  419. "model.decoder.layers.24.encoder_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  420. "model.decoder.layers.24.encoder_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  421. "model.decoder.layers.24.encoder_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  422. "model.decoder.layers.24.encoder_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  423. "model.decoder.layers.24.encoder_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  424. "model.decoder.layers.24.encoder_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  425. "model.decoder.layers.24.encoder_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  426. "model.decoder.layers.24.encoder_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  427. "model.decoder.layers.24.fc1.bias": "model.fp32-00002-of-00002.safetensors",
  428. "model.decoder.layers.24.fc1.weight": "model.fp32-00002-of-00002.safetensors",
  429. "model.decoder.layers.24.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  430. "model.decoder.layers.24.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  431. "model.decoder.layers.24.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  432. "model.decoder.layers.24.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  433. "model.decoder.layers.24.self_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  434. "model.decoder.layers.24.self_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  435. "model.decoder.layers.24.self_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  436. "model.decoder.layers.24.self_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  437. "model.decoder.layers.24.self_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  438. "model.decoder.layers.24.self_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  439. "model.decoder.layers.24.self_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  440. "model.decoder.layers.24.self_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  441. "model.decoder.layers.24.self_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  442. "model.decoder.layers.25.encoder_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  443. "model.decoder.layers.25.encoder_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  444. "model.decoder.layers.25.encoder_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  445. "model.decoder.layers.25.encoder_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  446. "model.decoder.layers.25.encoder_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  447. "model.decoder.layers.25.encoder_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  448. "model.decoder.layers.25.encoder_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  449. "model.decoder.layers.25.encoder_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  450. "model.decoder.layers.25.encoder_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  451. "model.decoder.layers.25.fc1.bias": "model.fp32-00002-of-00002.safetensors",
  452. "model.decoder.layers.25.fc1.weight": "model.fp32-00002-of-00002.safetensors",
  453. "model.decoder.layers.25.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  454. "model.decoder.layers.25.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  455. "model.decoder.layers.25.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  456. "model.decoder.layers.25.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  457. "model.decoder.layers.25.self_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  458. "model.decoder.layers.25.self_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  459. "model.decoder.layers.25.self_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  460. "model.decoder.layers.25.self_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  461. "model.decoder.layers.25.self_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  462. "model.decoder.layers.25.self_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  463. "model.decoder.layers.25.self_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  464. "model.decoder.layers.25.self_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  465. "model.decoder.layers.25.self_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  466. "model.decoder.layers.26.encoder_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  467. "model.decoder.layers.26.encoder_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  468. "model.decoder.layers.26.encoder_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  469. "model.decoder.layers.26.encoder_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  470. "model.decoder.layers.26.encoder_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  471. "model.decoder.layers.26.encoder_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  472. "model.decoder.layers.26.encoder_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  473. "model.decoder.layers.26.encoder_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  474. "model.decoder.layers.26.encoder_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  475. "model.decoder.layers.26.fc1.bias": "model.fp32-00002-of-00002.safetensors",
  476. "model.decoder.layers.26.fc1.weight": "model.fp32-00002-of-00002.safetensors",
  477. "model.decoder.layers.26.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  478. "model.decoder.layers.26.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  479. "model.decoder.layers.26.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  480. "model.decoder.layers.26.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  481. "model.decoder.layers.26.self_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  482. "model.decoder.layers.26.self_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  483. "model.decoder.layers.26.self_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  484. "model.decoder.layers.26.self_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  485. "model.decoder.layers.26.self_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  486. "model.decoder.layers.26.self_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  487. "model.decoder.layers.26.self_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  488. "model.decoder.layers.26.self_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  489. "model.decoder.layers.26.self_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  490. "model.decoder.layers.27.encoder_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  491. "model.decoder.layers.27.encoder_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  492. "model.decoder.layers.27.encoder_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  493. "model.decoder.layers.27.encoder_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  494. "model.decoder.layers.27.encoder_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  495. "model.decoder.layers.27.encoder_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  496. "model.decoder.layers.27.encoder_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  497. "model.decoder.layers.27.encoder_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  498. "model.decoder.layers.27.encoder_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  499. "model.decoder.layers.27.fc1.bias": "model.fp32-00002-of-00002.safetensors",
  500. "model.decoder.layers.27.fc1.weight": "model.fp32-00002-of-00002.safetensors",
  501. "model.decoder.layers.27.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  502. "model.decoder.layers.27.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  503. "model.decoder.layers.27.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  504. "model.decoder.layers.27.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  505. "model.decoder.layers.27.self_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  506. "model.decoder.layers.27.self_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  507. "model.decoder.layers.27.self_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  508. "model.decoder.layers.27.self_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  509. "model.decoder.layers.27.self_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  510. "model.decoder.layers.27.self_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  511. "model.decoder.layers.27.self_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  512. "model.decoder.layers.27.self_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  513. "model.decoder.layers.27.self_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  514. "model.decoder.layers.28.encoder_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  515. "model.decoder.layers.28.encoder_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  516. "model.decoder.layers.28.encoder_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  517. "model.decoder.layers.28.encoder_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  518. "model.decoder.layers.28.encoder_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  519. "model.decoder.layers.28.encoder_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  520. "model.decoder.layers.28.encoder_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  521. "model.decoder.layers.28.encoder_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  522. "model.decoder.layers.28.encoder_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  523. "model.decoder.layers.28.fc1.bias": "model.fp32-00002-of-00002.safetensors",
  524. "model.decoder.layers.28.fc1.weight": "model.fp32-00002-of-00002.safetensors",
  525. "model.decoder.layers.28.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  526. "model.decoder.layers.28.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  527. "model.decoder.layers.28.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  528. "model.decoder.layers.28.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  529. "model.decoder.layers.28.self_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  530. "model.decoder.layers.28.self_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  531. "model.decoder.layers.28.self_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  532. "model.decoder.layers.28.self_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  533. "model.decoder.layers.28.self_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  534. "model.decoder.layers.28.self_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  535. "model.decoder.layers.28.self_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  536. "model.decoder.layers.28.self_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  537. "model.decoder.layers.28.self_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  538. "model.decoder.layers.29.encoder_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  539. "model.decoder.layers.29.encoder_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  540. "model.decoder.layers.29.encoder_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  541. "model.decoder.layers.29.encoder_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  542. "model.decoder.layers.29.encoder_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  543. "model.decoder.layers.29.encoder_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  544. "model.decoder.layers.29.encoder_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  545. "model.decoder.layers.29.encoder_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  546. "model.decoder.layers.29.encoder_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  547. "model.decoder.layers.29.fc1.bias": "model.fp32-00002-of-00002.safetensors",
  548. "model.decoder.layers.29.fc1.weight": "model.fp32-00002-of-00002.safetensors",
  549. "model.decoder.layers.29.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  550. "model.decoder.layers.29.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  551. "model.decoder.layers.29.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  552. "model.decoder.layers.29.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  553. "model.decoder.layers.29.self_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  554. "model.decoder.layers.29.self_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  555. "model.decoder.layers.29.self_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  556. "model.decoder.layers.29.self_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  557. "model.decoder.layers.29.self_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  558. "model.decoder.layers.29.self_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  559. "model.decoder.layers.29.self_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  560. "model.decoder.layers.29.self_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  561. "model.decoder.layers.29.self_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  562. "model.decoder.layers.3.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  563. "model.decoder.layers.3.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  564. "model.decoder.layers.3.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  565. "model.decoder.layers.3.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  566. "model.decoder.layers.3.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  567. "model.decoder.layers.3.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  568. "model.decoder.layers.3.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  569. "model.decoder.layers.3.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  570. "model.decoder.layers.3.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  571. "model.decoder.layers.3.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  572. "model.decoder.layers.3.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  573. "model.decoder.layers.3.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  574. "model.decoder.layers.3.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  575. "model.decoder.layers.3.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  576. "model.decoder.layers.3.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  577. "model.decoder.layers.3.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  578. "model.decoder.layers.3.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  579. "model.decoder.layers.3.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  580. "model.decoder.layers.3.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  581. "model.decoder.layers.3.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  582. "model.decoder.layers.3.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  583. "model.decoder.layers.3.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  584. "model.decoder.layers.3.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  585. "model.decoder.layers.3.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  586. "model.decoder.layers.30.encoder_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  587. "model.decoder.layers.30.encoder_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  588. "model.decoder.layers.30.encoder_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  589. "model.decoder.layers.30.encoder_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  590. "model.decoder.layers.30.encoder_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  591. "model.decoder.layers.30.encoder_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  592. "model.decoder.layers.30.encoder_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  593. "model.decoder.layers.30.encoder_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  594. "model.decoder.layers.30.encoder_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  595. "model.decoder.layers.30.fc1.bias": "model.fp32-00002-of-00002.safetensors",
  596. "model.decoder.layers.30.fc1.weight": "model.fp32-00002-of-00002.safetensors",
  597. "model.decoder.layers.30.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  598. "model.decoder.layers.30.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  599. "model.decoder.layers.30.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  600. "model.decoder.layers.30.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  601. "model.decoder.layers.30.self_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  602. "model.decoder.layers.30.self_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  603. "model.decoder.layers.30.self_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  604. "model.decoder.layers.30.self_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  605. "model.decoder.layers.30.self_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  606. "model.decoder.layers.30.self_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  607. "model.decoder.layers.30.self_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  608. "model.decoder.layers.30.self_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  609. "model.decoder.layers.30.self_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  610. "model.decoder.layers.31.encoder_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  611. "model.decoder.layers.31.encoder_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  612. "model.decoder.layers.31.encoder_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  613. "model.decoder.layers.31.encoder_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  614. "model.decoder.layers.31.encoder_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  615. "model.decoder.layers.31.encoder_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  616. "model.decoder.layers.31.encoder_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  617. "model.decoder.layers.31.encoder_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  618. "model.decoder.layers.31.encoder_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  619. "model.decoder.layers.31.fc1.bias": "model.fp32-00002-of-00002.safetensors",
  620. "model.decoder.layers.31.fc1.weight": "model.fp32-00002-of-00002.safetensors",
  621. "model.decoder.layers.31.fc2.bias": "model.fp32-00002-of-00002.safetensors",
  622. "model.decoder.layers.31.fc2.weight": "model.fp32-00002-of-00002.safetensors",
  623. "model.decoder.layers.31.final_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  624. "model.decoder.layers.31.final_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  625. "model.decoder.layers.31.self_attn.k_proj.weight": "model.fp32-00002-of-00002.safetensors",
  626. "model.decoder.layers.31.self_attn.out_proj.bias": "model.fp32-00002-of-00002.safetensors",
  627. "model.decoder.layers.31.self_attn.out_proj.weight": "model.fp32-00002-of-00002.safetensors",
  628. "model.decoder.layers.31.self_attn.q_proj.bias": "model.fp32-00002-of-00002.safetensors",
  629. "model.decoder.layers.31.self_attn.q_proj.weight": "model.fp32-00002-of-00002.safetensors",
  630. "model.decoder.layers.31.self_attn.v_proj.bias": "model.fp32-00002-of-00002.safetensors",
  631. "model.decoder.layers.31.self_attn.v_proj.weight": "model.fp32-00002-of-00002.safetensors",
  632. "model.decoder.layers.31.self_attn_layer_norm.bias": "model.fp32-00002-of-00002.safetensors",
  633. "model.decoder.layers.31.self_attn_layer_norm.weight": "model.fp32-00002-of-00002.safetensors",
  634. "model.decoder.layers.4.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  635. "model.decoder.layers.4.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  636. "model.decoder.layers.4.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  637. "model.decoder.layers.4.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  638. "model.decoder.layers.4.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  639. "model.decoder.layers.4.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  640. "model.decoder.layers.4.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  641. "model.decoder.layers.4.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  642. "model.decoder.layers.4.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  643. "model.decoder.layers.4.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  644. "model.decoder.layers.4.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  645. "model.decoder.layers.4.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  646. "model.decoder.layers.4.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  647. "model.decoder.layers.4.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  648. "model.decoder.layers.4.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  649. "model.decoder.layers.4.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  650. "model.decoder.layers.4.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  651. "model.decoder.layers.4.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  652. "model.decoder.layers.4.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  653. "model.decoder.layers.4.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  654. "model.decoder.layers.4.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  655. "model.decoder.layers.4.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  656. "model.decoder.layers.4.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  657. "model.decoder.layers.4.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  658. "model.decoder.layers.5.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  659. "model.decoder.layers.5.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  660. "model.decoder.layers.5.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  661. "model.decoder.layers.5.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  662. "model.decoder.layers.5.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  663. "model.decoder.layers.5.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  664. "model.decoder.layers.5.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  665. "model.decoder.layers.5.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  666. "model.decoder.layers.5.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  667. "model.decoder.layers.5.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  668. "model.decoder.layers.5.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  669. "model.decoder.layers.5.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  670. "model.decoder.layers.5.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  671. "model.decoder.layers.5.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  672. "model.decoder.layers.5.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  673. "model.decoder.layers.5.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  674. "model.decoder.layers.5.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  675. "model.decoder.layers.5.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  676. "model.decoder.layers.5.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  677. "model.decoder.layers.5.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  678. "model.decoder.layers.5.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  679. "model.decoder.layers.5.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  680. "model.decoder.layers.5.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  681. "model.decoder.layers.5.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  682. "model.decoder.layers.6.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  683. "model.decoder.layers.6.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  684. "model.decoder.layers.6.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  685. "model.decoder.layers.6.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  686. "model.decoder.layers.6.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  687. "model.decoder.layers.6.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  688. "model.decoder.layers.6.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  689. "model.decoder.layers.6.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  690. "model.decoder.layers.6.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  691. "model.decoder.layers.6.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  692. "model.decoder.layers.6.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  693. "model.decoder.layers.6.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  694. "model.decoder.layers.6.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  695. "model.decoder.layers.6.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  696. "model.decoder.layers.6.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  697. "model.decoder.layers.6.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  698. "model.decoder.layers.6.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  699. "model.decoder.layers.6.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  700. "model.decoder.layers.6.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  701. "model.decoder.layers.6.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  702. "model.decoder.layers.6.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  703. "model.decoder.layers.6.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  704. "model.decoder.layers.6.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  705. "model.decoder.layers.6.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  706. "model.decoder.layers.7.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  707. "model.decoder.layers.7.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  708. "model.decoder.layers.7.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  709. "model.decoder.layers.7.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  710. "model.decoder.layers.7.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  711. "model.decoder.layers.7.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  712. "model.decoder.layers.7.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  713. "model.decoder.layers.7.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  714. "model.decoder.layers.7.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  715. "model.decoder.layers.7.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  716. "model.decoder.layers.7.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  717. "model.decoder.layers.7.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  718. "model.decoder.layers.7.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  719. "model.decoder.layers.7.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  720. "model.decoder.layers.7.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  721. "model.decoder.layers.7.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  722. "model.decoder.layers.7.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  723. "model.decoder.layers.7.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  724. "model.decoder.layers.7.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  725. "model.decoder.layers.7.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  726. "model.decoder.layers.7.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  727. "model.decoder.layers.7.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  728. "model.decoder.layers.7.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  729. "model.decoder.layers.7.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  730. "model.decoder.layers.8.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  731. "model.decoder.layers.8.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  732. "model.decoder.layers.8.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  733. "model.decoder.layers.8.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  734. "model.decoder.layers.8.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  735. "model.decoder.layers.8.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  736. "model.decoder.layers.8.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  737. "model.decoder.layers.8.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  738. "model.decoder.layers.8.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  739. "model.decoder.layers.8.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  740. "model.decoder.layers.8.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  741. "model.decoder.layers.8.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  742. "model.decoder.layers.8.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  743. "model.decoder.layers.8.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  744. "model.decoder.layers.8.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  745. "model.decoder.layers.8.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  746. "model.decoder.layers.8.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  747. "model.decoder.layers.8.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  748. "model.decoder.layers.8.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  749. "model.decoder.layers.8.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  750. "model.decoder.layers.8.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  751. "model.decoder.layers.8.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  752. "model.decoder.layers.8.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  753. "model.decoder.layers.8.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  754. "model.decoder.layers.9.encoder_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  755. "model.decoder.layers.9.encoder_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  756. "model.decoder.layers.9.encoder_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  757. "model.decoder.layers.9.encoder_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  758. "model.decoder.layers.9.encoder_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  759. "model.decoder.layers.9.encoder_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  760. "model.decoder.layers.9.encoder_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  761. "model.decoder.layers.9.encoder_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  762. "model.decoder.layers.9.encoder_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  763. "model.decoder.layers.9.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  764. "model.decoder.layers.9.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  765. "model.decoder.layers.9.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  766. "model.decoder.layers.9.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  767. "model.decoder.layers.9.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  768. "model.decoder.layers.9.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  769. "model.decoder.layers.9.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  770. "model.decoder.layers.9.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  771. "model.decoder.layers.9.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  772. "model.decoder.layers.9.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  773. "model.decoder.layers.9.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  774. "model.decoder.layers.9.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  775. "model.decoder.layers.9.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  776. "model.decoder.layers.9.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  777. "model.decoder.layers.9.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  778. "model.encoder.conv1.bias": "model.fp32-00001-of-00002.safetensors",
  779. "model.encoder.conv1.weight": "model.fp32-00001-of-00002.safetensors",
  780. "model.encoder.conv2.bias": "model.fp32-00001-of-00002.safetensors",
  781. "model.encoder.conv2.weight": "model.fp32-00001-of-00002.safetensors",
  782. "model.encoder.embed_positions.weight": "model.fp32-00001-of-00002.safetensors",
  783. "model.encoder.layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  784. "model.encoder.layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  785. "model.encoder.layers.0.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  786. "model.encoder.layers.0.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  787. "model.encoder.layers.0.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  788. "model.encoder.layers.0.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  789. "model.encoder.layers.0.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  790. "model.encoder.layers.0.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  791. "model.encoder.layers.0.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  792. "model.encoder.layers.0.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  793. "model.encoder.layers.0.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  794. "model.encoder.layers.0.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  795. "model.encoder.layers.0.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  796. "model.encoder.layers.0.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  797. "model.encoder.layers.0.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  798. "model.encoder.layers.0.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  799. "model.encoder.layers.0.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  800. "model.encoder.layers.1.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  801. "model.encoder.layers.1.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  802. "model.encoder.layers.1.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  803. "model.encoder.layers.1.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  804. "model.encoder.layers.1.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  805. "model.encoder.layers.1.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  806. "model.encoder.layers.1.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  807. "model.encoder.layers.1.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  808. "model.encoder.layers.1.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  809. "model.encoder.layers.1.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  810. "model.encoder.layers.1.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  811. "model.encoder.layers.1.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  812. "model.encoder.layers.1.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  813. "model.encoder.layers.1.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  814. "model.encoder.layers.1.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  815. "model.encoder.layers.10.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  816. "model.encoder.layers.10.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  817. "model.encoder.layers.10.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  818. "model.encoder.layers.10.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  819. "model.encoder.layers.10.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  820. "model.encoder.layers.10.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  821. "model.encoder.layers.10.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  822. "model.encoder.layers.10.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  823. "model.encoder.layers.10.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  824. "model.encoder.layers.10.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  825. "model.encoder.layers.10.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  826. "model.encoder.layers.10.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  827. "model.encoder.layers.10.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  828. "model.encoder.layers.10.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  829. "model.encoder.layers.10.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  830. "model.encoder.layers.11.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  831. "model.encoder.layers.11.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  832. "model.encoder.layers.11.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  833. "model.encoder.layers.11.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  834. "model.encoder.layers.11.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  835. "model.encoder.layers.11.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  836. "model.encoder.layers.11.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  837. "model.encoder.layers.11.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  838. "model.encoder.layers.11.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  839. "model.encoder.layers.11.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  840. "model.encoder.layers.11.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  841. "model.encoder.layers.11.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  842. "model.encoder.layers.11.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  843. "model.encoder.layers.11.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  844. "model.encoder.layers.11.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  845. "model.encoder.layers.12.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  846. "model.encoder.layers.12.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  847. "model.encoder.layers.12.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  848. "model.encoder.layers.12.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  849. "model.encoder.layers.12.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  850. "model.encoder.layers.12.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  851. "model.encoder.layers.12.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  852. "model.encoder.layers.12.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  853. "model.encoder.layers.12.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  854. "model.encoder.layers.12.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  855. "model.encoder.layers.12.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  856. "model.encoder.layers.12.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  857. "model.encoder.layers.12.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  858. "model.encoder.layers.12.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  859. "model.encoder.layers.12.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  860. "model.encoder.layers.13.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  861. "model.encoder.layers.13.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  862. "model.encoder.layers.13.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  863. "model.encoder.layers.13.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  864. "model.encoder.layers.13.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  865. "model.encoder.layers.13.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  866. "model.encoder.layers.13.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  867. "model.encoder.layers.13.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  868. "model.encoder.layers.13.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  869. "model.encoder.layers.13.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  870. "model.encoder.layers.13.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  871. "model.encoder.layers.13.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  872. "model.encoder.layers.13.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  873. "model.encoder.layers.13.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  874. "model.encoder.layers.13.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  875. "model.encoder.layers.14.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  876. "model.encoder.layers.14.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  877. "model.encoder.layers.14.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  878. "model.encoder.layers.14.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  879. "model.encoder.layers.14.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  880. "model.encoder.layers.14.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  881. "model.encoder.layers.14.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  882. "model.encoder.layers.14.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  883. "model.encoder.layers.14.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  884. "model.encoder.layers.14.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  885. "model.encoder.layers.14.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  886. "model.encoder.layers.14.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  887. "model.encoder.layers.14.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  888. "model.encoder.layers.14.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  889. "model.encoder.layers.14.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  890. "model.encoder.layers.15.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  891. "model.encoder.layers.15.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  892. "model.encoder.layers.15.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  893. "model.encoder.layers.15.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  894. "model.encoder.layers.15.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  895. "model.encoder.layers.15.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  896. "model.encoder.layers.15.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  897. "model.encoder.layers.15.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  898. "model.encoder.layers.15.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  899. "model.encoder.layers.15.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  900. "model.encoder.layers.15.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  901. "model.encoder.layers.15.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  902. "model.encoder.layers.15.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  903. "model.encoder.layers.15.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  904. "model.encoder.layers.15.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  905. "model.encoder.layers.16.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  906. "model.encoder.layers.16.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  907. "model.encoder.layers.16.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  908. "model.encoder.layers.16.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  909. "model.encoder.layers.16.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  910. "model.encoder.layers.16.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  911. "model.encoder.layers.16.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  912. "model.encoder.layers.16.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  913. "model.encoder.layers.16.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  914. "model.encoder.layers.16.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  915. "model.encoder.layers.16.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  916. "model.encoder.layers.16.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  917. "model.encoder.layers.16.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  918. "model.encoder.layers.16.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  919. "model.encoder.layers.16.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  920. "model.encoder.layers.17.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  921. "model.encoder.layers.17.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  922. "model.encoder.layers.17.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  923. "model.encoder.layers.17.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  924. "model.encoder.layers.17.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  925. "model.encoder.layers.17.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  926. "model.encoder.layers.17.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  927. "model.encoder.layers.17.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  928. "model.encoder.layers.17.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  929. "model.encoder.layers.17.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  930. "model.encoder.layers.17.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  931. "model.encoder.layers.17.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  932. "model.encoder.layers.17.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  933. "model.encoder.layers.17.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  934. "model.encoder.layers.17.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  935. "model.encoder.layers.18.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  936. "model.encoder.layers.18.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  937. "model.encoder.layers.18.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  938. "model.encoder.layers.18.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  939. "model.encoder.layers.18.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  940. "model.encoder.layers.18.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  941. "model.encoder.layers.18.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  942. "model.encoder.layers.18.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  943. "model.encoder.layers.18.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  944. "model.encoder.layers.18.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  945. "model.encoder.layers.18.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  946. "model.encoder.layers.18.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  947. "model.encoder.layers.18.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  948. "model.encoder.layers.18.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  949. "model.encoder.layers.18.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  950. "model.encoder.layers.19.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  951. "model.encoder.layers.19.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  952. "model.encoder.layers.19.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  953. "model.encoder.layers.19.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  954. "model.encoder.layers.19.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  955. "model.encoder.layers.19.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  956. "model.encoder.layers.19.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  957. "model.encoder.layers.19.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  958. "model.encoder.layers.19.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  959. "model.encoder.layers.19.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  960. "model.encoder.layers.19.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  961. "model.encoder.layers.19.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  962. "model.encoder.layers.19.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  963. "model.encoder.layers.19.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  964. "model.encoder.layers.19.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  965. "model.encoder.layers.2.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  966. "model.encoder.layers.2.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  967. "model.encoder.layers.2.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  968. "model.encoder.layers.2.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  969. "model.encoder.layers.2.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  970. "model.encoder.layers.2.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  971. "model.encoder.layers.2.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  972. "model.encoder.layers.2.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  973. "model.encoder.layers.2.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  974. "model.encoder.layers.2.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  975. "model.encoder.layers.2.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  976. "model.encoder.layers.2.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  977. "model.encoder.layers.2.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  978. "model.encoder.layers.2.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  979. "model.encoder.layers.2.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  980. "model.encoder.layers.20.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  981. "model.encoder.layers.20.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  982. "model.encoder.layers.20.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  983. "model.encoder.layers.20.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  984. "model.encoder.layers.20.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  985. "model.encoder.layers.20.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  986. "model.encoder.layers.20.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  987. "model.encoder.layers.20.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  988. "model.encoder.layers.20.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  989. "model.encoder.layers.20.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  990. "model.encoder.layers.20.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  991. "model.encoder.layers.20.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  992. "model.encoder.layers.20.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  993. "model.encoder.layers.20.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  994. "model.encoder.layers.20.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  995. "model.encoder.layers.21.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  996. "model.encoder.layers.21.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  997. "model.encoder.layers.21.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  998. "model.encoder.layers.21.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  999. "model.encoder.layers.21.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1000. "model.encoder.layers.21.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1001. "model.encoder.layers.21.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1002. "model.encoder.layers.21.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1003. "model.encoder.layers.21.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1004. "model.encoder.layers.21.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1005. "model.encoder.layers.21.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1006. "model.encoder.layers.21.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1007. "model.encoder.layers.21.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1008. "model.encoder.layers.21.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1009. "model.encoder.layers.21.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1010. "model.encoder.layers.22.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1011. "model.encoder.layers.22.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1012. "model.encoder.layers.22.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1013. "model.encoder.layers.22.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1014. "model.encoder.layers.22.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1015. "model.encoder.layers.22.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1016. "model.encoder.layers.22.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1017. "model.encoder.layers.22.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1018. "model.encoder.layers.22.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1019. "model.encoder.layers.22.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1020. "model.encoder.layers.22.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1021. "model.encoder.layers.22.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1022. "model.encoder.layers.22.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1023. "model.encoder.layers.22.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1024. "model.encoder.layers.22.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1025. "model.encoder.layers.23.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1026. "model.encoder.layers.23.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1027. "model.encoder.layers.23.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1028. "model.encoder.layers.23.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1029. "model.encoder.layers.23.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1030. "model.encoder.layers.23.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1031. "model.encoder.layers.23.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1032. "model.encoder.layers.23.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1033. "model.encoder.layers.23.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1034. "model.encoder.layers.23.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1035. "model.encoder.layers.23.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1036. "model.encoder.layers.23.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1037. "model.encoder.layers.23.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1038. "model.encoder.layers.23.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1039. "model.encoder.layers.23.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1040. "model.encoder.layers.24.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1041. "model.encoder.layers.24.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1042. "model.encoder.layers.24.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1043. "model.encoder.layers.24.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1044. "model.encoder.layers.24.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1045. "model.encoder.layers.24.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1046. "model.encoder.layers.24.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1047. "model.encoder.layers.24.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1048. "model.encoder.layers.24.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1049. "model.encoder.layers.24.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1050. "model.encoder.layers.24.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1051. "model.encoder.layers.24.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1052. "model.encoder.layers.24.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1053. "model.encoder.layers.24.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1054. "model.encoder.layers.24.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1055. "model.encoder.layers.25.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1056. "model.encoder.layers.25.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1057. "model.encoder.layers.25.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1058. "model.encoder.layers.25.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1059. "model.encoder.layers.25.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1060. "model.encoder.layers.25.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1061. "model.encoder.layers.25.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1062. "model.encoder.layers.25.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1063. "model.encoder.layers.25.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1064. "model.encoder.layers.25.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1065. "model.encoder.layers.25.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1066. "model.encoder.layers.25.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1067. "model.encoder.layers.25.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1068. "model.encoder.layers.25.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1069. "model.encoder.layers.25.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1070. "model.encoder.layers.26.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1071. "model.encoder.layers.26.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1072. "model.encoder.layers.26.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1073. "model.encoder.layers.26.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1074. "model.encoder.layers.26.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1075. "model.encoder.layers.26.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1076. "model.encoder.layers.26.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1077. "model.encoder.layers.26.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1078. "model.encoder.layers.26.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1079. "model.encoder.layers.26.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1080. "model.encoder.layers.26.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1081. "model.encoder.layers.26.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1082. "model.encoder.layers.26.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1083. "model.encoder.layers.26.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1084. "model.encoder.layers.26.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1085. "model.encoder.layers.27.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1086. "model.encoder.layers.27.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1087. "model.encoder.layers.27.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1088. "model.encoder.layers.27.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1089. "model.encoder.layers.27.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1090. "model.encoder.layers.27.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1091. "model.encoder.layers.27.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1092. "model.encoder.layers.27.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1093. "model.encoder.layers.27.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1094. "model.encoder.layers.27.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1095. "model.encoder.layers.27.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1096. "model.encoder.layers.27.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1097. "model.encoder.layers.27.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1098. "model.encoder.layers.27.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1099. "model.encoder.layers.27.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1100. "model.encoder.layers.28.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1101. "model.encoder.layers.28.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1102. "model.encoder.layers.28.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1103. "model.encoder.layers.28.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1104. "model.encoder.layers.28.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1105. "model.encoder.layers.28.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1106. "model.encoder.layers.28.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1107. "model.encoder.layers.28.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1108. "model.encoder.layers.28.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1109. "model.encoder.layers.28.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1110. "model.encoder.layers.28.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1111. "model.encoder.layers.28.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1112. "model.encoder.layers.28.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1113. "model.encoder.layers.28.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1114. "model.encoder.layers.28.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1115. "model.encoder.layers.29.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1116. "model.encoder.layers.29.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1117. "model.encoder.layers.29.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1118. "model.encoder.layers.29.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1119. "model.encoder.layers.29.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1120. "model.encoder.layers.29.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1121. "model.encoder.layers.29.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1122. "model.encoder.layers.29.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1123. "model.encoder.layers.29.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1124. "model.encoder.layers.29.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1125. "model.encoder.layers.29.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1126. "model.encoder.layers.29.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1127. "model.encoder.layers.29.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1128. "model.encoder.layers.29.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1129. "model.encoder.layers.29.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1130. "model.encoder.layers.3.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1131. "model.encoder.layers.3.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1132. "model.encoder.layers.3.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1133. "model.encoder.layers.3.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1134. "model.encoder.layers.3.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1135. "model.encoder.layers.3.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1136. "model.encoder.layers.3.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1137. "model.encoder.layers.3.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1138. "model.encoder.layers.3.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1139. "model.encoder.layers.3.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1140. "model.encoder.layers.3.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1141. "model.encoder.layers.3.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1142. "model.encoder.layers.3.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1143. "model.encoder.layers.3.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1144. "model.encoder.layers.3.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1145. "model.encoder.layers.30.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1146. "model.encoder.layers.30.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1147. "model.encoder.layers.30.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1148. "model.encoder.layers.30.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1149. "model.encoder.layers.30.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1150. "model.encoder.layers.30.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1151. "model.encoder.layers.30.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1152. "model.encoder.layers.30.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1153. "model.encoder.layers.30.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1154. "model.encoder.layers.30.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1155. "model.encoder.layers.30.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1156. "model.encoder.layers.30.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1157. "model.encoder.layers.30.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1158. "model.encoder.layers.30.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1159. "model.encoder.layers.30.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1160. "model.encoder.layers.31.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1161. "model.encoder.layers.31.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1162. "model.encoder.layers.31.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1163. "model.encoder.layers.31.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1164. "model.encoder.layers.31.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1165. "model.encoder.layers.31.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1166. "model.encoder.layers.31.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1167. "model.encoder.layers.31.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1168. "model.encoder.layers.31.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1169. "model.encoder.layers.31.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1170. "model.encoder.layers.31.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1171. "model.encoder.layers.31.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1172. "model.encoder.layers.31.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1173. "model.encoder.layers.31.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1174. "model.encoder.layers.31.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1175. "model.encoder.layers.4.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1176. "model.encoder.layers.4.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1177. "model.encoder.layers.4.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1178. "model.encoder.layers.4.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1179. "model.encoder.layers.4.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1180. "model.encoder.layers.4.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1181. "model.encoder.layers.4.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1182. "model.encoder.layers.4.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1183. "model.encoder.layers.4.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1184. "model.encoder.layers.4.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1185. "model.encoder.layers.4.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1186. "model.encoder.layers.4.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1187. "model.encoder.layers.4.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1188. "model.encoder.layers.4.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1189. "model.encoder.layers.4.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1190. "model.encoder.layers.5.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1191. "model.encoder.layers.5.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1192. "model.encoder.layers.5.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1193. "model.encoder.layers.5.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1194. "model.encoder.layers.5.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1195. "model.encoder.layers.5.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1196. "model.encoder.layers.5.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1197. "model.encoder.layers.5.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1198. "model.encoder.layers.5.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1199. "model.encoder.layers.5.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1200. "model.encoder.layers.5.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1201. "model.encoder.layers.5.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1202. "model.encoder.layers.5.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1203. "model.encoder.layers.5.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1204. "model.encoder.layers.5.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1205. "model.encoder.layers.6.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1206. "model.encoder.layers.6.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1207. "model.encoder.layers.6.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1208. "model.encoder.layers.6.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1209. "model.encoder.layers.6.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1210. "model.encoder.layers.6.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1211. "model.encoder.layers.6.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1212. "model.encoder.layers.6.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1213. "model.encoder.layers.6.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1214. "model.encoder.layers.6.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1215. "model.encoder.layers.6.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1216. "model.encoder.layers.6.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1217. "model.encoder.layers.6.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1218. "model.encoder.layers.6.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1219. "model.encoder.layers.6.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1220. "model.encoder.layers.7.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1221. "model.encoder.layers.7.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1222. "model.encoder.layers.7.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1223. "model.encoder.layers.7.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1224. "model.encoder.layers.7.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1225. "model.encoder.layers.7.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1226. "model.encoder.layers.7.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1227. "model.encoder.layers.7.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1228. "model.encoder.layers.7.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1229. "model.encoder.layers.7.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1230. "model.encoder.layers.7.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1231. "model.encoder.layers.7.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1232. "model.encoder.layers.7.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1233. "model.encoder.layers.7.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1234. "model.encoder.layers.7.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1235. "model.encoder.layers.8.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1236. "model.encoder.layers.8.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1237. "model.encoder.layers.8.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1238. "model.encoder.layers.8.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1239. "model.encoder.layers.8.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1240. "model.encoder.layers.8.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1241. "model.encoder.layers.8.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1242. "model.encoder.layers.8.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1243. "model.encoder.layers.8.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1244. "model.encoder.layers.8.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1245. "model.encoder.layers.8.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1246. "model.encoder.layers.8.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1247. "model.encoder.layers.8.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1248. "model.encoder.layers.8.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1249. "model.encoder.layers.8.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1250. "model.encoder.layers.9.fc1.bias": "model.fp32-00001-of-00002.safetensors",
  1251. "model.encoder.layers.9.fc1.weight": "model.fp32-00001-of-00002.safetensors",
  1252. "model.encoder.layers.9.fc2.bias": "model.fp32-00001-of-00002.safetensors",
  1253. "model.encoder.layers.9.fc2.weight": "model.fp32-00001-of-00002.safetensors",
  1254. "model.encoder.layers.9.final_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1255. "model.encoder.layers.9.final_layer_norm.weight": "model.fp32-00001-of-00002.safetensors",
  1256. "model.encoder.layers.9.self_attn.k_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1257. "model.encoder.layers.9.self_attn.out_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1258. "model.encoder.layers.9.self_attn.out_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1259. "model.encoder.layers.9.self_attn.q_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1260. "model.encoder.layers.9.self_attn.q_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1261. "model.encoder.layers.9.self_attn.v_proj.bias": "model.fp32-00001-of-00002.safetensors",
  1262. "model.encoder.layers.9.self_attn.v_proj.weight": "model.fp32-00001-of-00002.safetensors",
  1263. "model.encoder.layers.9.self_attn_layer_norm.bias": "model.fp32-00001-of-00002.safetensors",
  1264. "model.encoder.layers.9.self_attn_layer_norm.weight": "model.fp32-00001-of-00002.safetensors"
  1265. }
  1266. }