Skip to content

Instantly share code, notes, and snippets.

@cedrickchee
Last active July 23, 2024 03:58
Show Gist options
  • Save cedrickchee/2e086ccb7427a96af60da5e1ba51dda8 to your computer and use it in GitHub Desktop.
Save cedrickchee/2e086ccb7427a96af60da5e1ba51dda8 to your computer and use it in GitHub Desktop.
Llama 3.1 Leaks: SoTA Open Model 405B & What We Know So Far

Llama 3.1 Leaks: SoTA Open Model 405B & What We Know So Far

TLDR: 8B gets a big bump across the board, 70B instruct shows minor improvements, and 405B is the SoTA open model. But 405B still lags behind flagship models.

Here are the notable upgrades:

  • Every model now supports 128k context length (up from 8k)
  • Trained on a massive ~15T tokens of public data
  • Fine-tuning data includes publicly available instruction datasets and over 25M synthetically generated examples
  • Multilingual support for 7 languages in addition to English: French, German, Hindi, Italian, Portuguese, Spanish, and Thai
  • Training required a whopping 39.3M GPU hours on H100-80GB: roughly 1.5M for 8B, 7M for 70B, and 31M for 405B

Meta's benchmarks are in, but we're still waiting for the verdict.

Check out the leaked model card for yourself: https://lnkd.in/gSVt3Ex7

A Peek Into Llama 3.1 405B

A list of the base model files with their sizes:

files

405B is released as a dense model rather than a Mixture of Experts (MoE) model.

{
"architectures": [
"LlamaForCausalLM"
],
"attention_bias": false,
"attention_dropout": 0.0,
"bos_token_id": 128000,
"eos_token_id": 128001,
"hidden_act": "silu",
"hidden_size": 16384,
"initializer_range": 0.02,
"intermediate_size": 53248,
"max_position_embeddings": 131072,
"mlp_bias": false,
"model_type": "llama",
"num_attention_heads": 128,
"num_hidden_layers": 126,
"num_key_value_heads": 16,
"pretraining_tp": 1,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 500000.0,
"tie_word_embeddings": false,
"torch_dtype": "bfloat16",
"transformers_version": "4.42.3",
"use_cache": true,
"vocab_size": 128256
}
{
"_from_model_config": true,
"bos_token_id": 128000,
"eos_token_id": 128001,
"transformers_version": "4.42.3"
}
{
"metadata": {
"total_size": 820162494464
},
"weight_map": {
"lm_head.weight": "model-00191-of-00191.safetensors",
"model.embed_tokens.weight": "model-00001-of-00191.safetensors",
"model.layers.0.input_layernorm.weight": "model-00003-of-00191.safetensors",
"model.layers.0.mlp.down_proj.weight": "model-00003-of-00191.safetensors",
"model.layers.0.mlp.gate_proj.weight": "model-00002-of-00191.safetensors",
"model.layers.0.mlp.up_proj.weight": "model-00002-of-00191.safetensors",
"model.layers.0.post_attention_layernorm.weight": "model-00003-of-00191.safetensors",
"model.layers.0.self_attn.k_proj.weight": "model-00001-of-00191.safetensors",
"model.layers.0.self_attn.o_proj.weight": "model-00002-of-00191.safetensors",
"model.layers.0.self_attn.q_proj.weight": "model-00001-of-00191.safetensors",
"model.layers.0.self_attn.v_proj.weight": "model-00001-of-00191.safetensors",
"model.layers.1.input_layernorm.weight": "model-00004-of-00191.safetensors",
"model.layers.1.mlp.down_proj.weight": "model-00004-of-00191.safetensors",
"model.layers.1.mlp.gate_proj.weight": "model-00003-of-00191.safetensors",
"model.layers.1.mlp.up_proj.weight": "model-00004-of-00191.safetensors",
"model.layers.1.post_attention_layernorm.weight": "model-00004-of-00191.safetensors",
"model.layers.1.self_attn.k_proj.weight": "model-00003-of-00191.safetensors",
"model.layers.1.self_attn.o_proj.weight": "model-00003-of-00191.safetensors",
"model.layers.1.self_attn.q_proj.weight": "model-00003-of-00191.safetensors",
"model.layers.1.self_attn.v_proj.weight": "model-00003-of-00191.safetensors",
"model.layers.10.input_layernorm.weight": "model-00018-of-00191.safetensors",
"model.layers.10.mlp.down_proj.weight": "model-00018-of-00191.safetensors",
"model.layers.10.mlp.gate_proj.weight": "model-00017-of-00191.safetensors",
"model.layers.10.mlp.up_proj.weight": "model-00017-of-00191.safetensors",
"model.layers.10.post_attention_layernorm.weight": "model-00018-of-00191.safetensors",
"model.layers.10.self_attn.k_proj.weight": "model-00016-of-00191.safetensors",
"model.layers.10.self_attn.o_proj.weight": "model-00016-of-00191.safetensors",
"model.layers.10.self_attn.q_proj.weight": "model-00016-of-00191.safetensors",
"model.layers.10.self_attn.v_proj.weight": "model-00016-of-00191.safetensors",
"model.layers.100.input_layernorm.weight": "model-00153-of-00191.safetensors",
"model.layers.100.mlp.down_proj.weight": "model-00153-of-00191.safetensors",
"model.layers.100.mlp.gate_proj.weight": "model-00152-of-00191.safetensors",
"model.layers.100.mlp.up_proj.weight": "model-00152-of-00191.safetensors",
"model.layers.100.post_attention_layernorm.weight": "model-00153-of-00191.safetensors",
"model.layers.100.self_attn.k_proj.weight": "model-00151-of-00191.safetensors",
"model.layers.100.self_attn.o_proj.weight": "model-00151-of-00191.safetensors",
"model.layers.100.self_attn.q_proj.weight": "model-00151-of-00191.safetensors",
"model.layers.100.self_attn.v_proj.weight": "model-00151-of-00191.safetensors",
"model.layers.101.input_layernorm.weight": "model-00154-of-00191.safetensors",
"model.layers.101.mlp.down_proj.weight": "model-00154-of-00191.safetensors",
"model.layers.101.mlp.gate_proj.weight": "model-00153-of-00191.safetensors",
"model.layers.101.mlp.up_proj.weight": "model-00154-of-00191.safetensors",
"model.layers.101.post_attention_layernorm.weight": "model-00154-of-00191.safetensors",
"model.layers.101.self_attn.k_proj.weight": "model-00153-of-00191.safetensors",
"model.layers.101.self_attn.o_proj.weight": "model-00153-of-00191.safetensors",
"model.layers.101.self_attn.q_proj.weight": "model-00153-of-00191.safetensors",
"model.layers.101.self_attn.v_proj.weight": "model-00153-of-00191.safetensors",
"model.layers.102.input_layernorm.weight": "model-00156-of-00191.safetensors",
"model.layers.102.mlp.down_proj.weight": "model-00156-of-00191.safetensors",
"model.layers.102.mlp.gate_proj.weight": "model-00155-of-00191.safetensors",
"model.layers.102.mlp.up_proj.weight": "model-00155-of-00191.safetensors",
"model.layers.102.post_attention_layernorm.weight": "model-00156-of-00191.safetensors",
"model.layers.102.self_attn.k_proj.weight": "model-00154-of-00191.safetensors",
"model.layers.102.self_attn.o_proj.weight": "model-00154-of-00191.safetensors",
"model.layers.102.self_attn.q_proj.weight": "model-00154-of-00191.safetensors",
"model.layers.102.self_attn.v_proj.weight": "model-00154-of-00191.safetensors",
"model.layers.103.input_layernorm.weight": "model-00157-of-00191.safetensors",
"model.layers.103.mlp.down_proj.weight": "model-00157-of-00191.safetensors",
"model.layers.103.mlp.gate_proj.weight": "model-00156-of-00191.safetensors",
"model.layers.103.mlp.up_proj.weight": "model-00157-of-00191.safetensors",
"model.layers.103.post_attention_layernorm.weight": "model-00157-of-00191.safetensors",
"model.layers.103.self_attn.k_proj.weight": "model-00156-of-00191.safetensors",
"model.layers.103.self_attn.o_proj.weight": "model-00156-of-00191.safetensors",
"model.layers.103.self_attn.q_proj.weight": "model-00156-of-00191.safetensors",
"model.layers.103.self_attn.v_proj.weight": "model-00156-of-00191.safetensors",
"model.layers.104.input_layernorm.weight": "model-00159-of-00191.safetensors",
"model.layers.104.mlp.down_proj.weight": "model-00159-of-00191.safetensors",
"model.layers.104.mlp.gate_proj.weight": "model-00158-of-00191.safetensors",
"model.layers.104.mlp.up_proj.weight": "model-00158-of-00191.safetensors",
"model.layers.104.post_attention_layernorm.weight": "model-00159-of-00191.safetensors",
"model.layers.104.self_attn.k_proj.weight": "model-00157-of-00191.safetensors",
"model.layers.104.self_attn.o_proj.weight": "model-00157-of-00191.safetensors",
"model.layers.104.self_attn.q_proj.weight": "model-00157-of-00191.safetensors",
"model.layers.104.self_attn.v_proj.weight": "model-00157-of-00191.safetensors",
"model.layers.105.input_layernorm.weight": "model-00160-of-00191.safetensors",
"model.layers.105.mlp.down_proj.weight": "model-00160-of-00191.safetensors",
"model.layers.105.mlp.gate_proj.weight": "model-00159-of-00191.safetensors",
"model.layers.105.mlp.up_proj.weight": "model-00160-of-00191.safetensors",
"model.layers.105.post_attention_layernorm.weight": "model-00160-of-00191.safetensors",
"model.layers.105.self_attn.k_proj.weight": "model-00159-of-00191.safetensors",
"model.layers.105.self_attn.o_proj.weight": "model-00159-of-00191.safetensors",
"model.layers.105.self_attn.q_proj.weight": "model-00159-of-00191.safetensors",
"model.layers.105.self_attn.v_proj.weight": "model-00159-of-00191.safetensors",
"model.layers.106.input_layernorm.weight": "model-00162-of-00191.safetensors",
"model.layers.106.mlp.down_proj.weight": "model-00162-of-00191.safetensors",
"model.layers.106.mlp.gate_proj.weight": "model-00161-of-00191.safetensors",
"model.layers.106.mlp.up_proj.weight": "model-00161-of-00191.safetensors",
"model.layers.106.post_attention_layernorm.weight": "model-00162-of-00191.safetensors",
"model.layers.106.self_attn.k_proj.weight": "model-00160-of-00191.safetensors",
"model.layers.106.self_attn.o_proj.weight": "model-00160-of-00191.safetensors",
"model.layers.106.self_attn.q_proj.weight": "model-00160-of-00191.safetensors",
"model.layers.106.self_attn.v_proj.weight": "model-00160-of-00191.safetensors",
"model.layers.107.input_layernorm.weight": "model-00163-of-00191.safetensors",
"model.layers.107.mlp.down_proj.weight": "model-00163-of-00191.safetensors",
"model.layers.107.mlp.gate_proj.weight": "model-00162-of-00191.safetensors",
"model.layers.107.mlp.up_proj.weight": "model-00163-of-00191.safetensors",
"model.layers.107.post_attention_layernorm.weight": "model-00163-of-00191.safetensors",
"model.layers.107.self_attn.k_proj.weight": "model-00162-of-00191.safetensors",
"model.layers.107.self_attn.o_proj.weight": "model-00162-of-00191.safetensors",
"model.layers.107.self_attn.q_proj.weight": "model-00162-of-00191.safetensors",
"model.layers.107.self_attn.v_proj.weight": "model-00162-of-00191.safetensors",
"model.layers.108.input_layernorm.weight": "model-00165-of-00191.safetensors",
"model.layers.108.mlp.down_proj.weight": "model-00165-of-00191.safetensors",
"model.layers.108.mlp.gate_proj.weight": "model-00164-of-00191.safetensors",
"model.layers.108.mlp.up_proj.weight": "model-00164-of-00191.safetensors",
"model.layers.108.post_attention_layernorm.weight": "model-00165-of-00191.safetensors",
"model.layers.108.self_attn.k_proj.weight": "model-00163-of-00191.safetensors",
"model.layers.108.self_attn.o_proj.weight": "model-00163-of-00191.safetensors",
"model.layers.108.self_attn.q_proj.weight": "model-00163-of-00191.safetensors",
"model.layers.108.self_attn.v_proj.weight": "model-00163-of-00191.safetensors",
"model.layers.109.input_layernorm.weight": "model-00166-of-00191.safetensors",
"model.layers.109.mlp.down_proj.weight": "model-00166-of-00191.safetensors",
"model.layers.109.mlp.gate_proj.weight": "model-00165-of-00191.safetensors",
"model.layers.109.mlp.up_proj.weight": "model-00166-of-00191.safetensors",
"model.layers.109.post_attention_layernorm.weight": "model-00166-of-00191.safetensors",
"model.layers.109.self_attn.k_proj.weight": "model-00165-of-00191.safetensors",
"model.layers.109.self_attn.o_proj.weight": "model-00165-of-00191.safetensors",
"model.layers.109.self_attn.q_proj.weight": "model-00165-of-00191.safetensors",
"model.layers.109.self_attn.v_proj.weight": "model-00165-of-00191.safetensors",
"model.layers.11.input_layernorm.weight": "model-00019-of-00191.safetensors",
"model.layers.11.mlp.down_proj.weight": "model-00019-of-00191.safetensors",
"model.layers.11.mlp.gate_proj.weight": "model-00018-of-00191.safetensors",
"model.layers.11.mlp.up_proj.weight": "model-00019-of-00191.safetensors",
"model.layers.11.post_attention_layernorm.weight": "model-00019-of-00191.safetensors",
"model.layers.11.self_attn.k_proj.weight": "model-00018-of-00191.safetensors",
"model.layers.11.self_attn.o_proj.weight": "model-00018-of-00191.safetensors",
"model.layers.11.self_attn.q_proj.weight": "model-00018-of-00191.safetensors",
"model.layers.11.self_attn.v_proj.weight": "model-00018-of-00191.safetensors",
"model.layers.110.input_layernorm.weight": "model-00168-of-00191.safetensors",
"model.layers.110.mlp.down_proj.weight": "model-00168-of-00191.safetensors",
"model.layers.110.mlp.gate_proj.weight": "model-00167-of-00191.safetensors",
"model.layers.110.mlp.up_proj.weight": "model-00167-of-00191.safetensors",
"model.layers.110.post_attention_layernorm.weight": "model-00168-of-00191.safetensors",
"model.layers.110.self_attn.k_proj.weight": "model-00166-of-00191.safetensors",
"model.layers.110.self_attn.o_proj.weight": "model-00166-of-00191.safetensors",
"model.layers.110.self_attn.q_proj.weight": "model-00166-of-00191.safetensors",
"model.layers.110.self_attn.v_proj.weight": "model-00166-of-00191.safetensors",
"model.layers.111.input_layernorm.weight": "model-00169-of-00191.safetensors",
"model.layers.111.mlp.down_proj.weight": "model-00169-of-00191.safetensors",
"model.layers.111.mlp.gate_proj.weight": "model-00168-of-00191.safetensors",
"model.layers.111.mlp.up_proj.weight": "model-00169-of-00191.safetensors",
"model.layers.111.post_attention_layernorm.weight": "model-00169-of-00191.safetensors",
"model.layers.111.self_attn.k_proj.weight": "model-00168-of-00191.safetensors",
"model.layers.111.self_attn.o_proj.weight": "model-00168-of-00191.safetensors",
"model.layers.111.self_attn.q_proj.weight": "model-00168-of-00191.safetensors",
"model.layers.111.self_attn.v_proj.weight": "model-00168-of-00191.safetensors",
"model.layers.112.input_layernorm.weight": "model-00171-of-00191.safetensors",
"model.layers.112.mlp.down_proj.weight": "model-00171-of-00191.safetensors",
"model.layers.112.mlp.gate_proj.weight": "model-00170-of-00191.safetensors",
"model.layers.112.mlp.up_proj.weight": "model-00170-of-00191.safetensors",
"model.layers.112.post_attention_layernorm.weight": "model-00171-of-00191.safetensors",
"model.layers.112.self_attn.k_proj.weight": "model-00169-of-00191.safetensors",
"model.layers.112.self_attn.o_proj.weight": "model-00169-of-00191.safetensors",
"model.layers.112.self_attn.q_proj.weight": "model-00169-of-00191.safetensors",
"model.layers.112.self_attn.v_proj.weight": "model-00169-of-00191.safetensors",
"model.layers.113.input_layernorm.weight": "model-00172-of-00191.safetensors",
"model.layers.113.mlp.down_proj.weight": "model-00172-of-00191.safetensors",
"model.layers.113.mlp.gate_proj.weight": "model-00171-of-00191.safetensors",
"model.layers.113.mlp.up_proj.weight": "model-00172-of-00191.safetensors",
"model.layers.113.post_attention_layernorm.weight": "model-00172-of-00191.safetensors",
"model.layers.113.self_attn.k_proj.weight": "model-00171-of-00191.safetensors",
"model.layers.113.self_attn.o_proj.weight": "model-00171-of-00191.safetensors",
"model.layers.113.self_attn.q_proj.weight": "model-00171-of-00191.safetensors",
"model.layers.113.self_attn.v_proj.weight": "model-00171-of-00191.safetensors",
"model.layers.114.input_layernorm.weight": "model-00174-of-00191.safetensors",
"model.layers.114.mlp.down_proj.weight": "model-00174-of-00191.safetensors",
"model.layers.114.mlp.gate_proj.weight": "model-00173-of-00191.safetensors",
"model.layers.114.mlp.up_proj.weight": "model-00173-of-00191.safetensors",
"model.layers.114.post_attention_layernorm.weight": "model-00174-of-00191.safetensors",
"model.layers.114.self_attn.k_proj.weight": "model-00172-of-00191.safetensors",
"model.layers.114.self_attn.o_proj.weight": "model-00172-of-00191.safetensors",
"model.layers.114.self_attn.q_proj.weight": "model-00172-of-00191.safetensors",
"model.layers.114.self_attn.v_proj.weight": "model-00172-of-00191.safetensors",
"model.layers.115.input_layernorm.weight": "model-00175-of-00191.safetensors",
"model.layers.115.mlp.down_proj.weight": "model-00175-of-00191.safetensors",
"model.layers.115.mlp.gate_proj.weight": "model-00174-of-00191.safetensors",
"model.layers.115.mlp.up_proj.weight": "model-00175-of-00191.safetensors",
"model.layers.115.post_attention_layernorm.weight": "model-00175-of-00191.safetensors",
"model.layers.115.self_attn.k_proj.weight": "model-00174-of-00191.safetensors",
"model.layers.115.self_attn.o_proj.weight": "model-00174-of-00191.safetensors",
"model.layers.115.self_attn.q_proj.weight": "model-00174-of-00191.safetensors",
"model.layers.115.self_attn.v_proj.weight": "model-00174-of-00191.safetensors",
"model.layers.116.input_layernorm.weight": "model-00177-of-00191.safetensors",
"model.layers.116.mlp.down_proj.weight": "model-00177-of-00191.safetensors",
"model.layers.116.mlp.gate_proj.weight": "model-00176-of-00191.safetensors",
"model.layers.116.mlp.up_proj.weight": "model-00176-of-00191.safetensors",
"model.layers.116.post_attention_layernorm.weight": "model-00177-of-00191.safetensors",
"model.layers.116.self_attn.k_proj.weight": "model-00175-of-00191.safetensors",
"model.layers.116.self_attn.o_proj.weight": "model-00175-of-00191.safetensors",
"model.layers.116.self_attn.q_proj.weight": "model-00175-of-00191.safetensors",
"model.layers.116.self_attn.v_proj.weight": "model-00175-of-00191.safetensors",
"model.layers.117.input_layernorm.weight": "model-00178-of-00191.safetensors",
"model.layers.117.mlp.down_proj.weight": "model-00178-of-00191.safetensors",
"model.layers.117.mlp.gate_proj.weight": "model-00177-of-00191.safetensors",
"model.layers.117.mlp.up_proj.weight": "model-00178-of-00191.safetensors",
"model.layers.117.post_attention_layernorm.weight": "model-00178-of-00191.safetensors",
"model.layers.117.self_attn.k_proj.weight": "model-00177-of-00191.safetensors",
"model.layers.117.self_attn.o_proj.weight": "model-00177-of-00191.safetensors",
"model.layers.117.self_attn.q_proj.weight": "model-00177-of-00191.safetensors",
"model.layers.117.self_attn.v_proj.weight": "model-00177-of-00191.safetensors",
"model.layers.118.input_layernorm.weight": "model-00180-of-00191.safetensors",
"model.layers.118.mlp.down_proj.weight": "model-00180-of-00191.safetensors",
"model.layers.118.mlp.gate_proj.weight": "model-00179-of-00191.safetensors",
"model.layers.118.mlp.up_proj.weight": "model-00179-of-00191.safetensors",
"model.layers.118.post_attention_layernorm.weight": "model-00180-of-00191.safetensors",
"model.layers.118.self_attn.k_proj.weight": "model-00178-of-00191.safetensors",
"model.layers.118.self_attn.o_proj.weight": "model-00178-of-00191.safetensors",
"model.layers.118.self_attn.q_proj.weight": "model-00178-of-00191.safetensors",
"model.layers.118.self_attn.v_proj.weight": "model-00178-of-00191.safetensors",
"model.layers.119.input_layernorm.weight": "model-00181-of-00191.safetensors",
"model.layers.119.mlp.down_proj.weight": "model-00181-of-00191.safetensors",
"model.layers.119.mlp.gate_proj.weight": "model-00180-of-00191.safetensors",
"model.layers.119.mlp.up_proj.weight": "model-00181-of-00191.safetensors",
"model.layers.119.post_attention_layernorm.weight": "model-00181-of-00191.safetensors",
"model.layers.119.self_attn.k_proj.weight": "model-00180-of-00191.safetensors",
"model.layers.119.self_attn.o_proj.weight": "model-00180-of-00191.safetensors",
"model.layers.119.self_attn.q_proj.weight": "model-00180-of-00191.safetensors",
"model.layers.119.self_attn.v_proj.weight": "model-00180-of-00191.safetensors",
"model.layers.12.input_layernorm.weight": "model-00021-of-00191.safetensors",
"model.layers.12.mlp.down_proj.weight": "model-00021-of-00191.safetensors",
"model.layers.12.mlp.gate_proj.weight": "model-00020-of-00191.safetensors",
"model.layers.12.mlp.up_proj.weight": "model-00020-of-00191.safetensors",
"model.layers.12.post_attention_layernorm.weight": "model-00021-of-00191.safetensors",
"model.layers.12.self_attn.k_proj.weight": "model-00019-of-00191.safetensors",
"model.layers.12.self_attn.o_proj.weight": "model-00019-of-00191.safetensors",
"model.layers.12.self_attn.q_proj.weight": "model-00019-of-00191.safetensors",
"model.layers.12.self_attn.v_proj.weight": "model-00019-of-00191.safetensors",
"model.layers.120.input_layernorm.weight": "model-00183-of-00191.safetensors",
"model.layers.120.mlp.down_proj.weight": "model-00183-of-00191.safetensors",
"model.layers.120.mlp.gate_proj.weight": "model-00182-of-00191.safetensors",
"model.layers.120.mlp.up_proj.weight": "model-00182-of-00191.safetensors",
"model.layers.120.post_attention_layernorm.weight": "model-00183-of-00191.safetensors",
"model.layers.120.self_attn.k_proj.weight": "model-00181-of-00191.safetensors",
"model.layers.120.self_attn.o_proj.weight": "model-00181-of-00191.safetensors",
"model.layers.120.self_attn.q_proj.weight": "model-00181-of-00191.safetensors",
"model.layers.120.self_attn.v_proj.weight": "model-00181-of-00191.safetensors",
"model.layers.121.input_layernorm.weight": "model-00184-of-00191.safetensors",
"model.layers.121.mlp.down_proj.weight": "model-00184-of-00191.safetensors",
"model.layers.121.mlp.gate_proj.weight": "model-00183-of-00191.safetensors",
"model.layers.121.mlp.up_proj.weight": "model-00184-of-00191.safetensors",
"model.layers.121.post_attention_layernorm.weight": "model-00184-of-00191.safetensors",
"model.layers.121.self_attn.k_proj.weight": "model-00183-of-00191.safetensors",
"model.layers.121.self_attn.o_proj.weight": "model-00183-of-00191.safetensors",
"model.layers.121.self_attn.q_proj.weight": "model-00183-of-00191.safetensors",
"model.layers.121.self_attn.v_proj.weight": "model-00183-of-00191.safetensors",
"model.layers.122.input_layernorm.weight": "model-00186-of-00191.safetensors",
"model.layers.122.mlp.down_proj.weight": "model-00186-of-00191.safetensors",
"model.layers.122.mlp.gate_proj.weight": "model-00185-of-00191.safetensors",
"model.layers.122.mlp.up_proj.weight": "model-00185-of-00191.safetensors",
"model.layers.122.post_attention_layernorm.weight": "model-00186-of-00191.safetensors",
"model.layers.122.self_attn.k_proj.weight": "model-00184-of-00191.safetensors",
"model.layers.122.self_attn.o_proj.weight": "model-00184-of-00191.safetensors",
"model.layers.122.self_attn.q_proj.weight": "model-00184-of-00191.safetensors",
"model.layers.122.self_attn.v_proj.weight": "model-00184-of-00191.safetensors",
"model.layers.123.input_layernorm.weight": "model-00187-of-00191.safetensors",
"model.layers.123.mlp.down_proj.weight": "model-00187-of-00191.safetensors",
"model.layers.123.mlp.gate_proj.weight": "model-00186-of-00191.safetensors",
"model.layers.123.mlp.up_proj.weight": "model-00187-of-00191.safetensors",
"model.layers.123.post_attention_layernorm.weight": "model-00187-of-00191.safetensors",
"model.layers.123.self_attn.k_proj.weight": "model-00186-of-00191.safetensors",
"model.layers.123.self_attn.o_proj.weight": "model-00186-of-00191.safetensors",
"model.layers.123.self_attn.q_proj.weight": "model-00186-of-00191.safetensors",
"model.layers.123.self_attn.v_proj.weight": "model-00186-of-00191.safetensors",
"model.layers.124.input_layernorm.weight": "model-00189-of-00191.safetensors",
"model.layers.124.mlp.down_proj.weight": "model-00189-of-00191.safetensors",
"model.layers.124.mlp.gate_proj.weight": "model-00188-of-00191.safetensors",
"model.layers.124.mlp.up_proj.weight": "model-00188-of-00191.safetensors",
"model.layers.124.post_attention_layernorm.weight": "model-00189-of-00191.safetensors",
"model.layers.124.self_attn.k_proj.weight": "model-00187-of-00191.safetensors",
"model.layers.124.self_attn.o_proj.weight": "model-00187-of-00191.safetensors",
"model.layers.124.self_attn.q_proj.weight": "model-00187-of-00191.safetensors",
"model.layers.124.self_attn.v_proj.weight": "model-00187-of-00191.safetensors",
"model.layers.125.input_layernorm.weight": "model-00190-of-00191.safetensors",
"model.layers.125.mlp.down_proj.weight": "model-00190-of-00191.safetensors",
"model.layers.125.mlp.gate_proj.weight": "model-00189-of-00191.safetensors",
"model.layers.125.mlp.up_proj.weight": "model-00190-of-00191.safetensors",
"model.layers.125.post_attention_layernorm.weight": "model-00190-of-00191.safetensors",
"model.layers.125.self_attn.k_proj.weight": "model-00189-of-00191.safetensors",
"model.layers.125.self_attn.o_proj.weight": "model-00189-of-00191.safetensors",
"model.layers.125.self_attn.q_proj.weight": "model-00189-of-00191.safetensors",
"model.layers.125.self_attn.v_proj.weight": "model-00189-of-00191.safetensors",
"model.layers.13.input_layernorm.weight": "model-00022-of-00191.safetensors",
"model.layers.13.mlp.down_proj.weight": "model-00022-of-00191.safetensors",
"model.layers.13.mlp.gate_proj.weight": "model-00021-of-00191.safetensors",
"model.layers.13.mlp.up_proj.weight": "model-00022-of-00191.safetensors",
"model.layers.13.post_attention_layernorm.weight": "model-00022-of-00191.safetensors",
"model.layers.13.self_attn.k_proj.weight": "model-00021-of-00191.safetensors",
"model.layers.13.self_attn.o_proj.weight": "model-00021-of-00191.safetensors",
"model.layers.13.self_attn.q_proj.weight": "model-00021-of-00191.safetensors",
"model.layers.13.self_attn.v_proj.weight": "model-00021-of-00191.safetensors",
"model.layers.14.input_layernorm.weight": "model-00024-of-00191.safetensors",
"model.layers.14.mlp.down_proj.weight": "model-00024-of-00191.safetensors",
"model.layers.14.mlp.gate_proj.weight": "model-00023-of-00191.safetensors",
"model.layers.14.mlp.up_proj.weight": "model-00023-of-00191.safetensors",
"model.layers.14.post_attention_layernorm.weight": "model-00024-of-00191.safetensors",
"model.layers.14.self_attn.k_proj.weight": "model-00022-of-00191.safetensors",
"model.layers.14.self_attn.o_proj.weight": "model-00022-of-00191.safetensors",
"model.layers.14.self_attn.q_proj.weight": "model-00022-of-00191.safetensors",
"model.layers.14.self_attn.v_proj.weight": "model-00022-of-00191.safetensors",
"model.layers.15.input_layernorm.weight": "model-00025-of-00191.safetensors",
"model.layers.15.mlp.down_proj.weight": "model-00025-of-00191.safetensors",
"model.layers.15.mlp.gate_proj.weight": "model-00024-of-00191.safetensors",
"model.layers.15.mlp.up_proj.weight": "model-00025-of-00191.safetensors",
"model.layers.15.post_attention_layernorm.weight": "model-00025-of-00191.safetensors",
"model.layers.15.self_attn.k_proj.weight": "model-00024-of-00191.safetensors",
"model.layers.15.self_attn.o_proj.weight": "model-00024-of-00191.safetensors",
"model.layers.15.self_attn.q_proj.weight": "model-00024-of-00191.safetensors",
"model.layers.15.self_attn.v_proj.weight": "model-00024-of-00191.safetensors",
"model.layers.16.input_layernorm.weight": "model-00027-of-00191.safetensors",
"model.layers.16.mlp.down_proj.weight": "model-00027-of-00191.safetensors",
"model.layers.16.mlp.gate_proj.weight": "model-00026-of-00191.safetensors",
"model.layers.16.mlp.up_proj.weight": "model-00026-of-00191.safetensors",
"model.layers.16.post_attention_layernorm.weight": "model-00027-of-00191.safetensors",
"model.layers.16.self_attn.k_proj.weight": "model-00025-of-00191.safetensors",
"model.layers.16.self_attn.o_proj.weight": "model-00025-of-00191.safetensors",
"model.layers.16.self_attn.q_proj.weight": "model-00025-of-00191.safetensors",
"model.layers.16.self_attn.v_proj.weight": "model-00025-of-00191.safetensors",
"model.layers.17.input_layernorm.weight": "model-00028-of-00191.safetensors",
"model.layers.17.mlp.down_proj.weight": "model-00028-of-00191.safetensors",
"model.layers.17.mlp.gate_proj.weight": "model-00027-of-00191.safetensors",
"model.layers.17.mlp.up_proj.weight": "model-00028-of-00191.safetensors",
"model.layers.17.post_attention_layernorm.weight": "model-00028-of-00191.safetensors",
"model.layers.17.self_attn.k_proj.weight": "model-00027-of-00191.safetensors",
"model.layers.17.self_attn.o_proj.weight": "model-00027-of-00191.safetensors",
"model.layers.17.self_attn.q_proj.weight": "model-00027-of-00191.safetensors",
"model.layers.17.self_attn.v_proj.weight": "model-00027-of-00191.safetensors",
"model.layers.18.input_layernorm.weight": "model-00030-of-00191.safetensors",
"model.layers.18.mlp.down_proj.weight": "model-00030-of-00191.safetensors",
"model.layers.18.mlp.gate_proj.weight": "model-00029-of-00191.safetensors",
"model.layers.18.mlp.up_proj.weight": "model-00029-of-00191.safetensors",
"model.layers.18.post_attention_layernorm.weight": "model-00030-of-00191.safetensors",
"model.layers.18.self_attn.k_proj.weight": "model-00028-of-00191.safetensors",
"model.layers.18.self_attn.o_proj.weight": "model-00028-of-00191.safetensors",
"model.layers.18.self_attn.q_proj.weight": "model-00028-of-00191.safetensors",
"model.layers.18.self_attn.v_proj.weight": "model-00028-of-00191.safetensors",
"model.layers.19.input_layernorm.weight": "model-00031-of-00191.safetensors",
"model.layers.19.mlp.down_proj.weight": "model-00031-of-00191.safetensors",
"model.layers.19.mlp.gate_proj.weight": "model-00030-of-00191.safetensors",
"model.layers.19.mlp.up_proj.weight": "model-00031-of-00191.safetensors",
"model.layers.19.post_attention_layernorm.weight": "model-00031-of-00191.safetensors",
"model.layers.19.self_attn.k_proj.weight": "model-00030-of-00191.safetensors",
"model.layers.19.self_attn.o_proj.weight": "model-00030-of-00191.safetensors",
"model.layers.19.self_attn.q_proj.weight": "model-00030-of-00191.safetensors",
"model.layers.19.self_attn.v_proj.weight": "model-00030-of-00191.safetensors",
"model.layers.2.input_layernorm.weight": "model-00006-of-00191.safetensors",
"model.layers.2.mlp.down_proj.weight": "model-00006-of-00191.safetensors",
"model.layers.2.mlp.gate_proj.weight": "model-00005-of-00191.safetensors",
"model.layers.2.mlp.up_proj.weight": "model-00005-of-00191.safetensors",
"model.layers.2.post_attention_layernorm.weight": "model-00006-of-00191.safetensors",
"model.layers.2.self_attn.k_proj.weight": "model-00004-of-00191.safetensors",
"model.layers.2.self_attn.o_proj.weight": "model-00004-of-00191.safetensors",
"model.layers.2.self_attn.q_proj.weight": "model-00004-of-00191.safetensors",
"model.layers.2.self_attn.v_proj.weight": "model-00004-of-00191.safetensors",
"model.layers.20.input_layernorm.weight": "model-00033-of-00191.safetensors",
"model.layers.20.mlp.down_proj.weight": "model-00033-of-00191.safetensors",
"model.layers.20.mlp.gate_proj.weight": "model-00032-of-00191.safetensors",
"model.layers.20.mlp.up_proj.weight": "model-00032-of-00191.safetensors",
"model.layers.20.post_attention_layernorm.weight": "model-00033-of-00191.safetensors",
"model.layers.20.self_attn.k_proj.weight": "model-00031-of-00191.safetensors",
"model.layers.20.self_attn.o_proj.weight": "model-00031-of-00191.safetensors",
"model.layers.20.self_attn.q_proj.weight": "model-00031-of-00191.safetensors",
"model.layers.20.self_attn.v_proj.weight": "model-00031-of-00191.safetensors",
"model.layers.21.input_layernorm.weight": "model-00034-of-00191.safetensors",
"model.layers.21.mlp.down_proj.weight": "model-00034-of-00191.safetensors",
"model.layers.21.mlp.gate_proj.weight": "model-00033-of-00191.safetensors",
"model.layers.21.mlp.up_proj.weight": "model-00034-of-00191.safetensors",
"model.layers.21.post_attention_layernorm.weight": "model-00034-of-00191.safetensors",
"model.layers.21.self_attn.k_proj.weight": "model-00033-of-00191.safetensors",
"model.layers.21.self_attn.o_proj.weight": "model-00033-of-00191.safetensors",
"model.layers.21.self_attn.q_proj.weight": "model-00033-of-00191.safetensors",
"model.layers.21.self_attn.v_proj.weight": "model-00033-of-00191.safetensors",
"model.layers.22.input_layernorm.weight": "model-00036-of-00191.safetensors",
"model.layers.22.mlp.down_proj.weight": "model-00036-of-00191.safetensors",
"model.layers.22.mlp.gate_proj.weight": "model-00035-of-00191.safetensors",
"model.layers.22.mlp.up_proj.weight": "model-00035-of-00191.safetensors",
"model.layers.22.post_attention_layernorm.weight": "model-00036-of-00191.safetensors",
"model.layers.22.self_attn.k_proj.weight": "model-00034-of-00191.safetensors",
"model.layers.22.self_attn.o_proj.weight": "model-00034-of-00191.safetensors",
"model.layers.22.self_attn.q_proj.weight": "model-00034-of-00191.safetensors",
"model.layers.22.self_attn.v_proj.weight": "model-00034-of-00191.safetensors",
"model.layers.23.input_layernorm.weight": "model-00037-of-00191.safetensors",
"model.layers.23.mlp.down_proj.weight": "model-00037-of-00191.safetensors",
"model.layers.23.mlp.gate_proj.weight": "model-00036-of-00191.safetensors",
"model.layers.23.mlp.up_proj.weight": "model-00037-of-00191.safetensors",
"model.layers.23.post_attention_layernorm.weight": "model-00037-of-00191.safetensors",
"model.layers.23.self_attn.k_proj.weight": "model-00036-of-00191.safetensors",
"model.layers.23.self_attn.o_proj.weight": "model-00036-of-00191.safetensors",
"model.layers.23.self_attn.q_proj.weight": "model-00036-of-00191.safetensors",
"model.layers.23.self_attn.v_proj.weight": "model-00036-of-00191.safetensors",
"model.layers.24.input_layernorm.weight": "model-00039-of-00191.safetensors",
"model.layers.24.mlp.down_proj.weight": "model-00039-of-00191.safetensors",
"model.layers.24.mlp.gate_proj.weight": "model-00038-of-00191.safetensors",
"model.layers.24.mlp.up_proj.weight": "model-00038-of-00191.safetensors",
"model.layers.24.post_attention_layernorm.weight": "model-00039-of-00191.safetensors",
"model.layers.24.self_attn.k_proj.weight": "model-00037-of-00191.safetensors",
"model.layers.24.self_attn.o_proj.weight": "model-00037-of-00191.safetensors",
"model.layers.24.self_attn.q_proj.weight": "model-00037-of-00191.safetensors",
"model.layers.24.self_attn.v_proj.weight": "model-00037-of-00191.safetensors",
"model.layers.25.input_layernorm.weight": "model-00040-of-00191.safetensors",
"model.layers.25.mlp.down_proj.weight": "model-00040-of-00191.safetensors",
"model.layers.25.mlp.gate_proj.weight": "model-00039-of-00191.safetensors",
"model.layers.25.mlp.up_proj.weight": "model-00040-of-00191.safetensors",
"model.layers.25.post_attention_layernorm.weight": "model-00040-of-00191.safetensors",
"model.layers.25.self_attn.k_proj.weight": "model-00039-of-00191.safetensors",
"model.layers.25.self_attn.o_proj.weight": "model-00039-of-00191.safetensors",
"model.layers.25.self_attn.q_proj.weight": "model-00039-of-00191.safetensors",
"model.layers.25.self_attn.v_proj.weight": "model-00039-of-00191.safetensors",
"model.layers.26.input_layernorm.weight": "model-00042-of-00191.safetensors",
"model.layers.26.mlp.down_proj.weight": "model-00042-of-00191.safetensors",
"model.layers.26.mlp.gate_proj.weight": "model-00041-of-00191.safetensors",
"model.layers.26.mlp.up_proj.weight": "model-00041-of-00191.safetensors",
"model.layers.26.post_attention_layernorm.weight": "model-00042-of-00191.safetensors",
"model.layers.26.self_attn.k_proj.weight": "model-00040-of-00191.safetensors",
"model.layers.26.self_attn.o_proj.weight": "model-00040-of-00191.safetensors",
"model.layers.26.self_attn.q_proj.weight": "model-00040-of-00191.safetensors",
"model.layers.26.self_attn.v_proj.weight": "model-00040-of-00191.safetensors",
"model.layers.27.input_layernorm.weight": "model-00043-of-00191.safetensors",
"model.layers.27.mlp.down_proj.weight": "model-00043-of-00191.safetensors",
"model.layers.27.mlp.gate_proj.weight": "model-00042-of-00191.safetensors",
"model.layers.27.mlp.up_proj.weight": "model-00043-of-00191.safetensors",
"model.layers.27.post_attention_layernorm.weight": "model-00043-of-00191.safetensors",
"model.layers.27.self_attn.k_proj.weight": "model-00042-of-00191.safetensors",
"model.layers.27.self_attn.o_proj.weight": "model-00042-of-00191.safetensors",
"model.layers.27.self_attn.q_proj.weight": "model-00042-of-00191.safetensors",
"model.layers.27.self_attn.v_proj.weight": "model-00042-of-00191.safetensors",
"model.layers.28.input_layernorm.weight": "model-00045-of-00191.safetensors",
"model.layers.28.mlp.down_proj.weight": "model-00045-of-00191.safetensors",
"model.layers.28.mlp.gate_proj.weight": "model-00044-of-00191.safetensors",
"model.layers.28.mlp.up_proj.weight": "model-00044-of-00191.safetensors",
"model.layers.28.post_attention_layernorm.weight": "model-00045-of-00191.safetensors",
"model.layers.28.self_attn.k_proj.weight": "model-00043-of-00191.safetensors",
"model.layers.28.self_attn.o_proj.weight": "model-00043-of-00191.safetensors",
"model.layers.28.self_attn.q_proj.weight": "model-00043-of-00191.safetensors",
"model.layers.28.self_attn.v_proj.weight": "model-00043-of-00191.safetensors",
"model.layers.29.input_layernorm.weight": "model-00046-of-00191.safetensors",
"model.layers.29.mlp.down_proj.weight": "model-00046-of-00191.safetensors",
"model.layers.29.mlp.gate_proj.weight": "model-00045-of-00191.safetensors",
"model.layers.29.mlp.up_proj.weight": "model-00046-of-00191.safetensors",
"model.layers.29.post_attention_layernorm.weight": "model-00046-of-00191.safetensors",
"model.layers.29.self_attn.k_proj.weight": "model-00045-of-00191.safetensors",
"model.layers.29.self_attn.o_proj.weight": "model-00045-of-00191.safetensors",
"model.layers.29.self_attn.q_proj.weight": "model-00045-of-00191.safetensors",
"model.layers.29.self_attn.v_proj.weight": "model-00045-of-00191.safetensors",
"model.layers.3.input_layernorm.weight": "model-00007-of-00191.safetensors",
"model.layers.3.mlp.down_proj.weight": "model-00007-of-00191.safetensors",
"model.layers.3.mlp.gate_proj.weight": "model-00006-of-00191.safetensors",
"model.layers.3.mlp.up_proj.weight": "model-00007-of-00191.safetensors",
"model.layers.3.post_attention_layernorm.weight": "model-00007-of-00191.safetensors",
"model.layers.3.self_attn.k_proj.weight": "model-00006-of-00191.safetensors",
"model.layers.3.self_attn.o_proj.weight": "model-00006-of-00191.safetensors",
"model.layers.3.self_attn.q_proj.weight": "model-00006-of-00191.safetensors",
"model.layers.3.self_attn.v_proj.weight": "model-00006-of-00191.safetensors",
"model.layers.30.input_layernorm.weight": "model-00048-of-00191.safetensors",
"model.layers.30.mlp.down_proj.weight": "model-00048-of-00191.safetensors",
"model.layers.30.mlp.gate_proj.weight": "model-00047-of-00191.safetensors",
"model.layers.30.mlp.up_proj.weight": "model-00047-of-00191.safetensors",
"model.layers.30.post_attention_layernorm.weight": "model-00048-of-00191.safetensors",
"model.layers.30.self_attn.k_proj.weight": "model-00046-of-00191.safetensors",
"model.layers.30.self_attn.o_proj.weight": "model-00046-of-00191.safetensors",
"model.layers.30.self_attn.q_proj.weight": "model-00046-of-00191.safetensors",
"model.layers.30.self_attn.v_proj.weight": "model-00046-of-00191.safetensors",
"model.layers.31.input_layernorm.weight": "model-00049-of-00191.safetensors",
"model.layers.31.mlp.down_proj.weight": "model-00049-of-00191.safetensors",
"model.layers.31.mlp.gate_proj.weight": "model-00048-of-00191.safetensors",
"model.layers.31.mlp.up_proj.weight": "model-00049-of-00191.safetensors",
"model.layers.31.post_attention_layernorm.weight": "model-00049-of-00191.safetensors",
"model.layers.31.self_attn.k_proj.weight": "model-00048-of-00191.safetensors",
"model.layers.31.self_attn.o_proj.weight": "model-00048-of-00191.safetensors",
"model.layers.31.self_attn.q_proj.weight": "model-00048-of-00191.safetensors",
"model.layers.31.self_attn.v_proj.weight": "model-00048-of-00191.safetensors",
"model.layers.32.input_layernorm.weight": "model-00051-of-00191.safetensors",
"model.layers.32.mlp.down_proj.weight": "model-00051-of-00191.safetensors",
"model.layers.32.mlp.gate_proj.weight": "model-00050-of-00191.safetensors",
"model.layers.32.mlp.up_proj.weight": "model-00050-of-00191.safetensors",
"model.layers.32.post_attention_layernorm.weight": "model-00051-of-00191.safetensors",
"model.layers.32.self_attn.k_proj.weight": "model-00049-of-00191.safetensors",
"model.layers.32.self_attn.o_proj.weight": "model-00049-of-00191.safetensors",
"model.layers.32.self_attn.q_proj.weight": "model-00049-of-00191.safetensors",
"model.layers.32.self_attn.v_proj.weight": "model-00049-of-00191.safetensors",
"model.layers.33.input_layernorm.weight": "model-00052-of-00191.safetensors",
"model.layers.33.mlp.down_proj.weight": "model-00052-of-00191.safetensors",
"model.layers.33.mlp.gate_proj.weight": "model-00051-of-00191.safetensors",
"model.layers.33.mlp.up_proj.weight": "model-00052-of-00191.safetensors",
"model.layers.33.post_attention_layernorm.weight": "model-00052-of-00191.safetensors",
"model.layers.33.self_attn.k_proj.weight": "model-00051-of-00191.safetensors",
"model.layers.33.self_attn.o_proj.weight": "model-00051-of-00191.safetensors",
"model.layers.33.self_attn.q_proj.weight": "model-00051-of-00191.safetensors",
"model.layers.33.self_attn.v_proj.weight": "model-00051-of-00191.safetensors",
"model.layers.34.input_layernorm.weight": "model-00054-of-00191.safetensors",
"model.layers.34.mlp.down_proj.weight": "model-00054-of-00191.safetensors",
"model.layers.34.mlp.gate_proj.weight": "model-00053-of-00191.safetensors",
"model.layers.34.mlp.up_proj.weight": "model-00053-of-00191.safetensors",
"model.layers.34.post_attention_layernorm.weight": "model-00054-of-00191.safetensors",
"model.layers.34.self_attn.k_proj.weight": "model-00052-of-00191.safetensors",
"model.layers.34.self_attn.o_proj.weight": "model-00052-of-00191.safetensors",
"model.layers.34.self_attn.q_proj.weight": "model-00052-of-00191.safetensors",
"model.layers.34.self_attn.v_proj.weight": "model-00052-of-00191.safetensors",
"model.layers.35.input_layernorm.weight": "model-00055-of-00191.safetensors",
"model.layers.35.mlp.down_proj.weight": "model-00055-of-00191.safetensors",
"model.layers.35.mlp.gate_proj.weight": "model-00054-of-00191.safetensors",
"model.layers.35.mlp.up_proj.weight": "model-00055-of-00191.safetensors",
"model.layers.35.post_attention_layernorm.weight": "model-00055-of-00191.safetensors",
"model.layers.35.self_attn.k_proj.weight": "model-00054-of-00191.safetensors",
"model.layers.35.self_attn.o_proj.weight": "model-00054-of-00191.safetensors",
"model.layers.35.self_attn.q_proj.weight": "model-00054-of-00191.safetensors",
"model.layers.35.self_attn.v_proj.weight": "model-00054-of-00191.safetensors",
"model.layers.36.input_layernorm.weight": "model-00057-of-00191.safetensors",
"model.layers.36.mlp.down_proj.weight": "model-00057-of-00191.safetensors",
"model.layers.36.mlp.gate_proj.weight": "model-00056-of-00191.safetensors",
"model.layers.36.mlp.up_proj.weight": "model-00056-of-00191.safetensors",
"model.layers.36.post_attention_layernorm.weight": "model-00057-of-00191.safetensors",
"model.layers.36.self_attn.k_proj.weight": "model-00055-of-00191.safetensors",
"model.layers.36.self_attn.o_proj.weight": "model-00055-of-00191.safetensors",
"model.layers.36.self_attn.q_proj.weight": "model-00055-of-00191.safetensors",
"model.layers.36.self_attn.v_proj.weight": "model-00055-of-00191.safetensors",
"model.layers.37.input_layernorm.weight": "model-00058-of-00191.safetensors",
"model.layers.37.mlp.down_proj.weight": "model-00058-of-00191.safetensors",
"model.layers.37.mlp.gate_proj.weight": "model-00057-of-00191.safetensors",
"model.layers.37.mlp.up_proj.weight": "model-00058-of-00191.safetensors",
"model.layers.37.post_attention_layernorm.weight": "model-00058-of-00191.safetensors",
"model.layers.37.self_attn.k_proj.weight": "model-00057-of-00191.safetensors",
"model.layers.37.self_attn.o_proj.weight": "model-00057-of-00191.safetensors",
"model.layers.37.self_attn.q_proj.weight": "model-00057-of-00191.safetensors",
"model.layers.37.self_attn.v_proj.weight": "model-00057-of-00191.safetensors",
"model.layers.38.input_layernorm.weight": "model-00060-of-00191.safetensors",
"model.layers.38.mlp.down_proj.weight": "model-00060-of-00191.safetensors",
"model.layers.38.mlp.gate_proj.weight": "model-00059-of-00191.safetensors",
"model.layers.38.mlp.up_proj.weight": "model-00059-of-00191.safetensors",
"model.layers.38.post_attention_layernorm.weight": "model-00060-of-00191.safetensors",
"model.layers.38.self_attn.k_proj.weight": "model-00058-of-00191.safetensors",
"model.layers.38.self_attn.o_proj.weight": "model-00058-of-00191.safetensors",
"model.layers.38.self_attn.q_proj.weight": "model-00058-of-00191.safetensors",
"model.layers.38.self_attn.v_proj.weight": "model-00058-of-00191.safetensors",
"model.layers.39.input_layernorm.weight": "model-00061-of-00191.safetensors",
"model.layers.39.mlp.down_proj.weight": "model-00061-of-00191.safetensors",
"model.layers.39.mlp.gate_proj.weight": "model-00060-of-00191.safetensors",
"model.layers.39.mlp.up_proj.weight": "model-00061-of-00191.safetensors",
"model.layers.39.post_attention_layernorm.weight": "model-00061-of-00191.safetensors",
"model.layers.39.self_attn.k_proj.weight": "model-00060-of-00191.safetensors",
"model.layers.39.self_attn.o_proj.weight": "model-00060-of-00191.safetensors",
"model.layers.39.self_attn.q_proj.weight": "model-00060-of-00191.safetensors",
"model.layers.39.self_attn.v_proj.weight": "model-00060-of-00191.safetensors",
"model.layers.4.input_layernorm.weight": "model-00009-of-00191.safetensors",
"model.layers.4.mlp.down_proj.weight": "model-00009-of-00191.safetensors",
"model.layers.4.mlp.gate_proj.weight": "model-00008-of-00191.safetensors",
"model.layers.4.mlp.up_proj.weight": "model-00008-of-00191.safetensors",
"model.layers.4.post_attention_layernorm.weight": "model-00009-of-00191.safetensors",
"model.layers.4.self_attn.k_proj.weight": "model-00007-of-00191.safetensors",
"model.layers.4.self_attn.o_proj.weight": "model-00007-of-00191.safetensors",
"model.layers.4.self_attn.q_proj.weight": "model-00007-of-00191.safetensors",
"model.layers.4.self_attn.v_proj.weight": "model-00007-of-00191.safetensors",
"model.layers.40.input_layernorm.weight": "model-00063-of-00191.safetensors",
"model.layers.40.mlp.down_proj.weight": "model-00063-of-00191.safetensors",
"model.layers.40.mlp.gate_proj.weight": "model-00062-of-00191.safetensors",
"model.layers.40.mlp.up_proj.weight": "model-00062-of-00191.safetensors",
"model.layers.40.post_attention_layernorm.weight": "model-00063-of-00191.safetensors",
"model.layers.40.self_attn.k_proj.weight": "model-00061-of-00191.safetensors",
"model.layers.40.self_attn.o_proj.weight": "model-00061-of-00191.safetensors",
"model.layers.40.self_attn.q_proj.weight": "model-00061-of-00191.safetensors",
"model.layers.40.self_attn.v_proj.weight": "model-00061-of-00191.safetensors",
"model.layers.41.input_layernorm.weight": "model-00064-of-00191.safetensors",
"model.layers.41.mlp.down_proj.weight": "model-00064-of-00191.safetensors",
"model.layers.41.mlp.gate_proj.weight": "model-00063-of-00191.safetensors",
"model.layers.41.mlp.up_proj.weight": "model-00064-of-00191.safetensors",
"model.layers.41.post_attention_layernorm.weight": "model-00064-of-00191.safetensors",
"model.layers.41.self_attn.k_proj.weight": "model-00063-of-00191.safetensors",
"model.layers.41.self_attn.o_proj.weight": "model-00063-of-00191.safetensors",
"model.layers.41.self_attn.q_proj.weight": "model-00063-of-00191.safetensors",
"model.layers.41.self_attn.v_proj.weight": "model-00063-of-00191.safetensors",
"model.layers.42.input_layernorm.weight": "model-00066-of-00191.safetensors",
"model.layers.42.mlp.down_proj.weight": "model-00066-of-00191.safetensors",
"model.layers.42.mlp.gate_proj.weight": "model-00065-of-00191.safetensors",
"model.layers.42.mlp.up_proj.weight": "model-00065-of-00191.safetensors",
"model.layers.42.post_attention_layernorm.weight": "model-00066-of-00191.safetensors",
"model.layers.42.self_attn.k_proj.weight": "model-00064-of-00191.safetensors",
"model.layers.42.self_attn.o_proj.weight": "model-00064-of-00191.safetensors",
"model.layers.42.self_attn.q_proj.weight": "model-00064-of-00191.safetensors",
"model.layers.42.self_attn.v_proj.weight": "model-00064-of-00191.safetensors",
"model.layers.43.input_layernorm.weight": "model-00067-of-00191.safetensors",
"model.layers.43.mlp.down_proj.weight": "model-00067-of-00191.safetensors",
"model.layers.43.mlp.gate_proj.weight": "model-00066-of-00191.safetensors",
"model.layers.43.mlp.up_proj.weight": "model-00067-of-00191.safetensors",
"model.layers.43.post_attention_layernorm.weight": "model-00067-of-00191.safetensors",
"model.layers.43.self_attn.k_proj.weight": "model-00066-of-00191.safetensors",
"model.layers.43.self_attn.o_proj.weight": "model-00066-of-00191.safetensors",
"model.layers.43.self_attn.q_proj.weight": "model-00066-of-00191.safetensors",
"model.layers.43.self_attn.v_proj.weight": "model-00066-of-00191.safetensors",
"model.layers.44.input_layernorm.weight": "model-00069-of-00191.safetensors",
"model.layers.44.mlp.down_proj.weight": "model-00069-of-00191.safetensors",
"model.layers.44.mlp.gate_proj.weight": "model-00068-of-00191.safetensors",
"model.layers.44.mlp.up_proj.weight": "model-00068-of-00191.safetensors",
"model.layers.44.post_attention_layernorm.weight": "model-00069-of-00191.safetensors",
"model.layers.44.self_attn.k_proj.weight": "model-00067-of-00191.safetensors",
"model.layers.44.self_attn.o_proj.weight": "model-00067-of-00191.safetensors",
"model.layers.44.self_attn.q_proj.weight": "model-00067-of-00191.safetensors",
"model.layers.44.self_attn.v_proj.weight": "model-00067-of-00191.safetensors",
"model.layers.45.input_layernorm.weight": "model-00070-of-00191.safetensors",
"model.layers.45.mlp.down_proj.weight": "model-00070-of-00191.safetensors",
"model.layers.45.mlp.gate_proj.weight": "model-00069-of-00191.safetensors",
"model.layers.45.mlp.up_proj.weight": "model-00070-of-00191.safetensors",
"model.layers.45.post_attention_layernorm.weight": "model-00070-of-00191.safetensors",
"model.layers.45.self_attn.k_proj.weight": "model-00069-of-00191.safetensors",
"model.layers.45.self_attn.o_proj.weight": "model-00069-of-00191.safetensors",
"model.layers.45.self_attn.q_proj.weight": "model-00069-of-00191.safetensors",
"model.layers.45.self_attn.v_proj.weight": "model-00069-of-00191.safetensors",
"model.layers.46.input_layernorm.weight": "model-00072-of-00191.safetensors",
"model.layers.46.mlp.down_proj.weight": "model-00072-of-00191.safetensors",
"model.layers.46.mlp.gate_proj.weight": "model-00071-of-00191.safetensors",
"model.layers.46.mlp.up_proj.weight": "model-00071-of-00191.safetensors",
"model.layers.46.post_attention_layernorm.weight": "model-00072-of-00191.safetensors",
"model.layers.46.self_attn.k_proj.weight": "model-00070-of-00191.safetensors",
"model.layers.46.self_attn.o_proj.weight": "model-00070-of-00191.safetensors",
"model.layers.46.self_attn.q_proj.weight": "model-00070-of-00191.safetensors",
"model.layers.46.self_attn.v_proj.weight": "model-00070-of-00191.safetensors",
"model.layers.47.input_layernorm.weight": "model-00073-of-00191.safetensors",
"model.layers.47.mlp.down_proj.weight": "model-00073-of-00191.safetensors",
"model.layers.47.mlp.gate_proj.weight": "model-00072-of-00191.safetensors",
"model.layers.47.mlp.up_proj.weight": "model-00073-of-00191.safetensors",
"model.layers.47.post_attention_layernorm.weight": "model-00073-of-00191.safetensors",
"model.layers.47.self_attn.k_proj.weight": "model-00072-of-00191.safetensors",
"model.layers.47.self_attn.o_proj.weight": "model-00072-of-00191.safetensors",
"model.layers.47.self_attn.q_proj.weight": "model-00072-of-00191.safetensors",
"model.layers.47.self_attn.v_proj.weight": "model-00072-of-00191.safetensors",
"model.layers.48.input_layernorm.weight": "model-00075-of-00191.safetensors",
"model.layers.48.mlp.down_proj.weight": "model-00075-of-00191.safetensors",
"model.layers.48.mlp.gate_proj.weight": "model-00074-of-00191.safetensors",
"model.layers.48.mlp.up_proj.weight": "model-00074-of-00191.safetensors",
"model.layers.48.post_attention_layernorm.weight": "model-00075-of-00191.safetensors",
"model.layers.48.self_attn.k_proj.weight": "model-00073-of-00191.safetensors",
"model.layers.48.self_attn.o_proj.weight": "model-00073-of-00191.safetensors",
"model.layers.48.self_attn.q_proj.weight": "model-00073-of-00191.safetensors",
"model.layers.48.self_attn.v_proj.weight": "model-00073-of-00191.safetensors",
"model.layers.49.input_layernorm.weight": "model-00076-of-00191.safetensors",
"model.layers.49.mlp.down_proj.weight": "model-00076-of-00191.safetensors",
"model.layers.49.mlp.gate_proj.weight": "model-00075-of-00191.safetensors",
"model.layers.49.mlp.up_proj.weight": "model-00076-of-00191.safetensors",
"model.layers.49.post_attention_layernorm.weight": "model-00076-of-00191.safetensors",
"model.layers.49.self_attn.k_proj.weight": "model-00075-of-00191.safetensors",
"model.layers.49.self_attn.o_proj.weight": "model-00075-of-00191.safetensors",
"model.layers.49.self_attn.q_proj.weight": "model-00075-of-00191.safetensors",
"model.layers.49.self_attn.v_proj.weight": "model-00075-of-00191.safetensors",
"model.layers.5.input_layernorm.weight": "model-00010-of-00191.safetensors",
"model.layers.5.mlp.down_proj.weight": "model-00010-of-00191.safetensors",
"model.layers.5.mlp.gate_proj.weight": "model-00009-of-00191.safetensors",
"model.layers.5.mlp.up_proj.weight": "model-00010-of-00191.safetensors",
"model.layers.5.post_attention_layernorm.weight": "model-00010-of-00191.safetensors",
"model.layers.5.self_attn.k_proj.weight": "model-00009-of-00191.safetensors",
"model.layers.5.self_attn.o_proj.weight": "model-00009-of-00191.safetensors",
"model.layers.5.self_attn.q_proj.weight": "model-00009-of-00191.safetensors",
"model.layers.5.self_attn.v_proj.weight": "model-00009-of-00191.safetensors",
"model.layers.50.input_layernorm.weight": "model-00078-of-00191.safetensors",
"model.layers.50.mlp.down_proj.weight": "model-00078-of-00191.safetensors",
"model.layers.50.mlp.gate_proj.weight": "model-00077-of-00191.safetensors",
"model.layers.50.mlp.up_proj.weight": "model-00077-of-00191.safetensors",
"model.layers.50.post_attention_layernorm.weight": "model-00078-of-00191.safetensors",
"model.layers.50.self_attn.k_proj.weight": "model-00076-of-00191.safetensors",
"model.layers.50.self_attn.o_proj.weight": "model-00076-of-00191.safetensors",
"model.layers.50.self_attn.q_proj.weight": "model-00076-of-00191.safetensors",
"model.layers.50.self_attn.v_proj.weight": "model-00076-of-00191.safetensors",
"model.layers.51.input_layernorm.weight": "model-00079-of-00191.safetensors",
"model.layers.51.mlp.down_proj.weight": "model-00079-of-00191.safetensors",
"model.layers.51.mlp.gate_proj.weight": "model-00078-of-00191.safetensors",
"model.layers.51.mlp.up_proj.weight": "model-00079-of-00191.safetensors",
"model.layers.51.post_attention_layernorm.weight": "model-00079-of-00191.safetensors",
"model.layers.51.self_attn.k_proj.weight": "model-00078-of-00191.safetensors",
"model.layers.51.self_attn.o_proj.weight": "model-00078-of-00191.safetensors",
"model.layers.51.self_attn.q_proj.weight": "model-00078-of-00191.safetensors",
"model.layers.51.self_attn.v_proj.weight": "model-00078-of-00191.safetensors",
"model.layers.52.input_layernorm.weight": "model-00081-of-00191.safetensors",
"model.layers.52.mlp.down_proj.weight": "model-00081-of-00191.safetensors",
"model.layers.52.mlp.gate_proj.weight": "model-00080-of-00191.safetensors",
"model.layers.52.mlp.up_proj.weight": "model-00080-of-00191.safetensors",
"model.layers.52.post_attention_layernorm.weight": "model-00081-of-00191.safetensors",
"model.layers.52.self_attn.k_proj.weight": "model-00079-of-00191.safetensors",
"model.layers.52.self_attn.o_proj.weight": "model-00079-of-00191.safetensors",
"model.layers.52.self_attn.q_proj.weight": "model-00079-of-00191.safetensors",
"model.layers.52.self_attn.v_proj.weight": "model-00079-of-00191.safetensors",
"model.layers.53.input_layernorm.weight": "model-00082-of-00191.safetensors",
"model.layers.53.mlp.down_proj.weight": "model-00082-of-00191.safetensors",
"model.layers.53.mlp.gate_proj.weight": "model-00081-of-00191.safetensors",
"model.layers.53.mlp.up_proj.weight": "model-00082-of-00191.safetensors",
"model.layers.53.post_attention_layernorm.weight": "model-00082-of-00191.safetensors",
"model.layers.53.self_attn.k_proj.weight": "model-00081-of-00191.safetensors",
"model.layers.53.self_attn.o_proj.weight": "model-00081-of-00191.safetensors",
"model.layers.53.self_attn.q_proj.weight": "model-00081-of-00191.safetensors",
"model.layers.53.self_attn.v_proj.weight": "model-00081-of-00191.safetensors",
"model.layers.54.input_layernorm.weight": "model-00084-of-00191.safetensors",
"model.layers.54.mlp.down_proj.weight": "model-00084-of-00191.safetensors",
"model.layers.54.mlp.gate_proj.weight": "model-00083-of-00191.safetensors",
"model.layers.54.mlp.up_proj.weight": "model-00083-of-00191.safetensors",
"model.layers.54.post_attention_layernorm.weight": "model-00084-of-00191.safetensors",
"model.layers.54.self_attn.k_proj.weight": "model-00082-of-00191.safetensors",
"model.layers.54.self_attn.o_proj.weight": "model-00082-of-00191.safetensors",
"model.layers.54.self_attn.q_proj.weight": "model-00082-of-00191.safetensors",
"model.layers.54.self_attn.v_proj.weight": "model-00082-of-00191.safetensors",
"model.layers.55.input_layernorm.weight": "model-00085-of-00191.safetensors",
"model.layers.55.mlp.down_proj.weight": "model-00085-of-00191.safetensors",
"model.layers.55.mlp.gate_proj.weight": "model-00084-of-00191.safetensors",
"model.layers.55.mlp.up_proj.weight": "model-00085-of-00191.safetensors",
"model.layers.55.post_attention_layernorm.weight": "model-00085-of-00191.safetensors",
"model.layers.55.self_attn.k_proj.weight": "model-00084-of-00191.safetensors",
"model.layers.55.self_attn.o_proj.weight": "model-00084-of-00191.safetensors",
"model.layers.55.self_attn.q_proj.weight": "model-00084-of-00191.safetensors",
"model.layers.55.self_attn.v_proj.weight": "model-00084-of-00191.safetensors",
"model.layers.56.input_layernorm.weight": "model-00087-of-00191.safetensors",
"model.layers.56.mlp.down_proj.weight": "model-00087-of-00191.safetensors",
"model.layers.56.mlp.gate_proj.weight": "model-00086-of-00191.safetensors",
"model.layers.56.mlp.up_proj.weight": "model-00086-of-00191.safetensors",
"model.layers.56.post_attention_layernorm.weight": "model-00087-of-00191.safetensors",
"model.layers.56.self_attn.k_proj.weight": "model-00085-of-00191.safetensors",
"model.layers.56.self_attn.o_proj.weight": "model-00085-of-00191.safetensors",
"model.layers.56.self_attn.q_proj.weight": "model-00085-of-00191.safetensors",
"model.layers.56.self_attn.v_proj.weight": "model-00085-of-00191.safetensors",
"model.layers.57.input_layernorm.weight": "model-00088-of-00191.safetensors",
"model.layers.57.mlp.down_proj.weight": "model-00088-of-00191.safetensors",
"model.layers.57.mlp.gate_proj.weight": "model-00087-of-00191.safetensors",
"model.layers.57.mlp.up_proj.weight": "model-00088-of-00191.safetensors",
"model.layers.57.post_attention_layernorm.weight": "model-00088-of-00191.safetensors",
"model.layers.57.self_attn.k_proj.weight": "model-00087-of-00191.safetensors",
"model.layers.57.self_attn.o_proj.weight": "model-00087-of-00191.safetensors",
"model.layers.57.self_attn.q_proj.weight": "model-00087-of-00191.safetensors",
"model.layers.57.self_attn.v_proj.weight": "model-00087-of-00191.safetensors",
"model.layers.58.input_layernorm.weight": "model-00090-of-00191.safetensors",
"model.layers.58.mlp.down_proj.weight": "model-00090-of-00191.safetensors",
"model.layers.58.mlp.gate_proj.weight": "model-00089-of-00191.safetensors",
"model.layers.58.mlp.up_proj.weight": "model-00089-of-00191.safetensors",
"model.layers.58.post_attention_layernorm.weight": "model-00090-of-00191.safetensors",
"model.layers.58.self_attn.k_proj.weight": "model-00088-of-00191.safetensors",
"model.layers.58.self_attn.o_proj.weight": "model-00088-of-00191.safetensors",
"model.layers.58.self_attn.q_proj.weight": "model-00088-of-00191.safetensors",
"model.layers.58.self_attn.v_proj.weight": "model-00088-of-00191.safetensors",
"model.layers.59.input_layernorm.weight": "model-00091-of-00191.safetensors",
"model.layers.59.mlp.down_proj.weight": "model-00091-of-00191.safetensors",
"model.layers.59.mlp.gate_proj.weight": "model-00090-of-00191.safetensors",
"model.layers.59.mlp.up_proj.weight": "model-00091-of-00191.safetensors",
"model.layers.59.post_attention_layernorm.weight": "model-00091-of-00191.safetensors",
"model.layers.59.self_attn.k_proj.weight": "model-00090-of-00191.safetensors",
"model.layers.59.self_attn.o_proj.weight": "model-00090-of-00191.safetensors",
"model.layers.59.self_attn.q_proj.weight": "model-00090-of-00191.safetensors",
"model.layers.59.self_attn.v_proj.weight": "model-00090-of-00191.safetensors",
"model.layers.6.input_layernorm.weight": "model-00012-of-00191.safetensors",
"model.layers.6.mlp.down_proj.weight": "model-00012-of-00191.safetensors",
"model.layers.6.mlp.gate_proj.weight": "model-00011-of-00191.safetensors",
"model.layers.6.mlp.up_proj.weight": "model-00011-of-00191.safetensors",
"model.layers.6.post_attention_layernorm.weight": "model-00012-of-00191.safetensors",
"model.layers.6.self_attn.k_proj.weight": "model-00010-of-00191.safetensors",
"model.layers.6.self_attn.o_proj.weight": "model-00010-of-00191.safetensors",
"model.layers.6.self_attn.q_proj.weight": "model-00010-of-00191.safetensors",
"model.layers.6.self_attn.v_proj.weight": "model-00010-of-00191.safetensors",
"model.layers.60.input_layernorm.weight": "model-00093-of-00191.safetensors",
"model.layers.60.mlp.down_proj.weight": "model-00093-of-00191.safetensors",
"model.layers.60.mlp.gate_proj.weight": "model-00092-of-00191.safetensors",
"model.layers.60.mlp.up_proj.weight": "model-00092-of-00191.safetensors",
"model.layers.60.post_attention_layernorm.weight": "model-00093-of-00191.safetensors",
"model.layers.60.self_attn.k_proj.weight": "model-00091-of-00191.safetensors",
"model.layers.60.self_attn.o_proj.weight": "model-00091-of-00191.safetensors",
"model.layers.60.self_attn.q_proj.weight": "model-00091-of-00191.safetensors",
"model.layers.60.self_attn.v_proj.weight": "model-00091-of-00191.safetensors",
"model.layers.61.input_layernorm.weight": "model-00094-of-00191.safetensors",
"model.layers.61.mlp.down_proj.weight": "model-00094-of-00191.safetensors",
"model.layers.61.mlp.gate_proj.weight": "model-00093-of-00191.safetensors",
"model.layers.61.mlp.up_proj.weight": "model-00094-of-00191.safetensors",
"model.layers.61.post_attention_layernorm.weight": "model-00094-of-00191.safetensors",
"model.layers.61.self_attn.k_proj.weight": "model-00093-of-00191.safetensors",
"model.layers.61.self_attn.o_proj.weight": "model-00093-of-00191.safetensors",
"model.layers.61.self_attn.q_proj.weight": "model-00093-of-00191.safetensors",
"model.layers.61.self_attn.v_proj.weight": "model-00093-of-00191.safetensors",
"model.layers.62.input_layernorm.weight": "model-00096-of-00191.safetensors",
"model.layers.62.mlp.down_proj.weight": "model-00096-of-00191.safetensors",
"model.layers.62.mlp.gate_proj.weight": "model-00095-of-00191.safetensors",
"model.layers.62.mlp.up_proj.weight": "model-00095-of-00191.safetensors",
"model.layers.62.post_attention_layernorm.weight": "model-00096-of-00191.safetensors",
"model.layers.62.self_attn.k_proj.weight": "model-00094-of-00191.safetensors",
"model.layers.62.self_attn.o_proj.weight": "model-00094-of-00191.safetensors",
"model.layers.62.self_attn.q_proj.weight": "model-00094-of-00191.safetensors",
"model.layers.62.self_attn.v_proj.weight": "model-00094-of-00191.safetensors",
"model.layers.63.input_layernorm.weight": "model-00097-of-00191.safetensors",
"model.layers.63.mlp.down_proj.weight": "model-00097-of-00191.safetensors",
"model.layers.63.mlp.gate_proj.weight": "model-00096-of-00191.safetensors",
"model.layers.63.mlp.up_proj.weight": "model-00097-of-00191.safetensors",
"model.layers.63.post_attention_layernorm.weight": "model-00097-of-00191.safetensors",
"model.layers.63.self_attn.k_proj.weight": "model-00096-of-00191.safetensors",
"model.layers.63.self_attn.o_proj.weight": "model-00096-of-00191.safetensors",
"model.layers.63.self_attn.q_proj.weight": "model-00096-of-00191.safetensors",
"model.layers.63.self_attn.v_proj.weight": "model-00096-of-00191.safetensors",
"model.layers.64.input_layernorm.weight": "model-00099-of-00191.safetensors",
"model.layers.64.mlp.down_proj.weight": "model-00099-of-00191.safetensors",
"model.layers.64.mlp.gate_proj.weight": "model-00098-of-00191.safetensors",
"model.layers.64.mlp.up_proj.weight": "model-00098-of-00191.safetensors",
"model.layers.64.post_attention_layernorm.weight": "model-00099-of-00191.safetensors",
"model.layers.64.self_attn.k_proj.weight": "model-00097-of-00191.safetensors",
"model.layers.64.self_attn.o_proj.weight": "model-00097-of-00191.safetensors",
"model.layers.64.self_attn.q_proj.weight": "model-00097-of-00191.safetensors",
"model.layers.64.self_attn.v_proj.weight": "model-00097-of-00191.safetensors",
"model.layers.65.input_layernorm.weight": "model-00100-of-00191.safetensors",
"model.layers.65.mlp.down_proj.weight": "model-00100-of-00191.safetensors",
"model.layers.65.mlp.gate_proj.weight": "model-00099-of-00191.safetensors",
"model.layers.65.mlp.up_proj.weight": "model-00100-of-00191.safetensors",
"model.layers.65.post_attention_layernorm.weight": "model-00100-of-00191.safetensors",
"model.layers.65.self_attn.k_proj.weight": "model-00099-of-00191.safetensors",
"model.layers.65.self_attn.o_proj.weight": "model-00099-of-00191.safetensors",
"model.layers.65.self_attn.q_proj.weight": "model-00099-of-00191.safetensors",
"model.layers.65.self_attn.v_proj.weight": "model-00099-of-00191.safetensors",
"model.layers.66.input_layernorm.weight": "model-00102-of-00191.safetensors",
"model.layers.66.mlp.down_proj.weight": "model-00102-of-00191.safetensors",
"model.layers.66.mlp.gate_proj.weight": "model-00101-of-00191.safetensors",
"model.layers.66.mlp.up_proj.weight": "model-00101-of-00191.safetensors",
"model.layers.66.post_attention_layernorm.weight": "model-00102-of-00191.safetensors",
"model.layers.66.self_attn.k_proj.weight": "model-00100-of-00191.safetensors",
"model.layers.66.self_attn.o_proj.weight": "model-00100-of-00191.safetensors",
"model.layers.66.self_attn.q_proj.weight": "model-00100-of-00191.safetensors",
"model.layers.66.self_attn.v_proj.weight": "model-00100-of-00191.safetensors",
"model.layers.67.input_layernorm.weight": "model-00103-of-00191.safetensors",
"model.layers.67.mlp.down_proj.weight": "model-00103-of-00191.safetensors",
"model.layers.67.mlp.gate_proj.weight": "model-00102-of-00191.safetensors",
"model.layers.67.mlp.up_proj.weight": "model-00103-of-00191.safetensors",
"model.layers.67.post_attention_layernorm.weight": "model-00103-of-00191.safetensors",
"model.layers.67.self_attn.k_proj.weight": "model-00102-of-00191.safetensors",
"model.layers.67.self_attn.o_proj.weight": "model-00102-of-00191.safetensors",
"model.layers.67.self_attn.q_proj.weight": "model-00102-of-00191.safetensors",
"model.layers.67.self_attn.v_proj.weight": "model-00102-of-00191.safetensors",
"model.layers.68.input_layernorm.weight": "model-00105-of-00191.safetensors",
"model.layers.68.mlp.down_proj.weight": "model-00105-of-00191.safetensors",
"model.layers.68.mlp.gate_proj.weight": "model-00104-of-00191.safetensors",
"model.layers.68.mlp.up_proj.weight": "model-00104-of-00191.safetensors",
"model.layers.68.post_attention_layernorm.weight": "model-00105-of-00191.safetensors",
"model.layers.68.self_attn.k_proj.weight": "model-00103-of-00191.safetensors",
"model.layers.68.self_attn.o_proj.weight": "model-00103-of-00191.safetensors",
"model.layers.68.self_attn.q_proj.weight": "model-00103-of-00191.safetensors",
"model.layers.68.self_attn.v_proj.weight": "model-00103-of-00191.safetensors",
"model.layers.69.input_layernorm.weight": "model-00106-of-00191.safetensors",
"model.layers.69.mlp.down_proj.weight": "model-00106-of-00191.safetensors",
"model.layers.69.mlp.gate_proj.weight": "model-00105-of-00191.safetensors",
"model.layers.69.mlp.up_proj.weight": "model-00106-of-00191.safetensors",
"model.layers.69.post_attention_layernorm.weight": "model-00106-of-00191.safetensors",
"model.layers.69.self_attn.k_proj.weight": "model-00105-of-00191.safetensors",
"model.layers.69.self_attn.o_proj.weight": "model-00105-of-00191.safetensors",
"model.layers.69.self_attn.q_proj.weight": "model-00105-of-00191.safetensors",
"model.layers.69.self_attn.v_proj.weight": "model-00105-of-00191.safetensors",
"model.layers.7.input_layernorm.weight": "model-00013-of-00191.safetensors",
"model.layers.7.mlp.down_proj.weight": "model-00013-of-00191.safetensors",
"model.layers.7.mlp.gate_proj.weight": "model-00012-of-00191.safetensors",
"model.layers.7.mlp.up_proj.weight": "model-00013-of-00191.safetensors",
"model.layers.7.post_attention_layernorm.weight": "model-00013-of-00191.safetensors",
"model.layers.7.self_attn.k_proj.weight": "model-00012-of-00191.safetensors",
"model.layers.7.self_attn.o_proj.weight": "model-00012-of-00191.safetensors",
"model.layers.7.self_attn.q_proj.weight": "model-00012-of-00191.safetensors",
"model.layers.7.self_attn.v_proj.weight": "model-00012-of-00191.safetensors",
"model.layers.70.input_layernorm.weight": "model-00108-of-00191.safetensors",
"model.layers.70.mlp.down_proj.weight": "model-00108-of-00191.safetensors",
"model.layers.70.mlp.gate_proj.weight": "model-00107-of-00191.safetensors",
"model.layers.70.mlp.up_proj.weight": "model-00107-of-00191.safetensors",
"model.layers.70.post_attention_layernorm.weight": "model-00108-of-00191.safetensors",
"model.layers.70.self_attn.k_proj.weight": "model-00106-of-00191.safetensors",
"model.layers.70.self_attn.o_proj.weight": "model-00106-of-00191.safetensors",
"model.layers.70.self_attn.q_proj.weight": "model-00106-of-00191.safetensors",
"model.layers.70.self_attn.v_proj.weight": "model-00106-of-00191.safetensors",
"model.layers.71.input_layernorm.weight": "model-00109-of-00191.safetensors",
"model.layers.71.mlp.down_proj.weight": "model-00109-of-00191.safetensors",
"model.layers.71.mlp.gate_proj.weight": "model-00108-of-00191.safetensors",
"model.layers.71.mlp.up_proj.weight": "model-00109-of-00191.safetensors",
"model.layers.71.post_attention_layernorm.weight": "model-00109-of-00191.safetensors",
"model.layers.71.self_attn.k_proj.weight": "model-00108-of-00191.safetensors",
"model.layers.71.self_attn.o_proj.weight": "model-00108-of-00191.safetensors",
"model.layers.71.self_attn.q_proj.weight": "model-00108-of-00191.safetensors",
"model.layers.71.self_attn.v_proj.weight": "model-00108-of-00191.safetensors",
"model.layers.72.input_layernorm.weight": "model-00111-of-00191.safetensors",
"model.layers.72.mlp.down_proj.weight": "model-00111-of-00191.safetensors",
"model.layers.72.mlp.gate_proj.weight": "model-00110-of-00191.safetensors",
"model.layers.72.mlp.up_proj.weight": "model-00110-of-00191.safetensors",
"model.layers.72.post_attention_layernorm.weight": "model-00111-of-00191.safetensors",
"model.layers.72.self_attn.k_proj.weight": "model-00109-of-00191.safetensors",
"model.layers.72.self_attn.o_proj.weight": "model-00109-of-00191.safetensors",
"model.layers.72.self_attn.q_proj.weight": "model-00109-of-00191.safetensors",
"model.layers.72.self_attn.v_proj.weight": "model-00109-of-00191.safetensors",
"model.layers.73.input_layernorm.weight": "model-00112-of-00191.safetensors",
"model.layers.73.mlp.down_proj.weight": "model-00112-of-00191.safetensors",
"model.layers.73.mlp.gate_proj.weight": "model-00111-of-00191.safetensors",
"model.layers.73.mlp.up_proj.weight": "model-00112-of-00191.safetensors",
"model.layers.73.post_attention_layernorm.weight": "model-00112-of-00191.safetensors",
"model.layers.73.self_attn.k_proj.weight": "model-00111-of-00191.safetensors",
"model.layers.73.self_attn.o_proj.weight": "model-00111-of-00191.safetensors",
"model.layers.73.self_attn.q_proj.weight": "model-00111-of-00191.safetensors",
"model.layers.73.self_attn.v_proj.weight": "model-00111-of-00191.safetensors",
"model.layers.74.input_layernorm.weight": "model-00114-of-00191.safetensors",
"model.layers.74.mlp.down_proj.weight": "model-00114-of-00191.safetensors",
"model.layers.74.mlp.gate_proj.weight": "model-00113-of-00191.safetensors",
"model.layers.74.mlp.up_proj.weight": "model-00113-of-00191.safetensors",
"model.layers.74.post_attention_layernorm.weight": "model-00114-of-00191.safetensors",
"model.layers.74.self_attn.k_proj.weight": "model-00112-of-00191.safetensors",
"model.layers.74.self_attn.o_proj.weight": "model-00112-of-00191.safetensors",
"model.layers.74.self_attn.q_proj.weight": "model-00112-of-00191.safetensors",
"model.layers.74.self_attn.v_proj.weight": "model-00112-of-00191.safetensors",
"model.layers.75.input_layernorm.weight": "model-00115-of-00191.safetensors",
"model.layers.75.mlp.down_proj.weight": "model-00115-of-00191.safetensors",
"model.layers.75.mlp.gate_proj.weight": "model-00114-of-00191.safetensors",
"model.layers.75.mlp.up_proj.weight": "model-00115-of-00191.safetensors",
"model.layers.75.post_attention_layernorm.weight": "model-00115-of-00191.safetensors",
"model.layers.75.self_attn.k_proj.weight": "model-00114-of-00191.safetensors",
"model.layers.75.self_attn.o_proj.weight": "model-00114-of-00191.safetensors",
"model.layers.75.self_attn.q_proj.weight": "model-00114-of-00191.safetensors",
"model.layers.75.self_attn.v_proj.weight": "model-00114-of-00191.safetensors",
"model.layers.76.input_layernorm.weight": "model-00117-of-00191.safetensors",
"model.layers.76.mlp.down_proj.weight": "model-00117-of-00191.safetensors",
"model.layers.76.mlp.gate_proj.weight": "model-00116-of-00191.safetensors",
"model.layers.76.mlp.up_proj.weight": "model-00116-of-00191.safetensors",
"model.layers.76.post_attention_layernorm.weight": "model-00117-of-00191.safetensors",
"model.layers.76.self_attn.k_proj.weight": "model-00115-of-00191.safetensors",
"model.layers.76.self_attn.o_proj.weight": "model-00115-of-00191.safetensors",
"model.layers.76.self_attn.q_proj.weight": "model-00115-of-00191.safetensors",
"model.layers.76.self_attn.v_proj.weight": "model-00115-of-00191.safetensors",
"model.layers.77.input_layernorm.weight": "model-00118-of-00191.safetensors",
"model.layers.77.mlp.down_proj.weight": "model-00118-of-00191.safetensors",
"model.layers.77.mlp.gate_proj.weight": "model-00117-of-00191.safetensors",
"model.layers.77.mlp.up_proj.weight": "model-00118-of-00191.safetensors",
"model.layers.77.post_attention_layernorm.weight": "model-00118-of-00191.safetensors",
"model.layers.77.self_attn.k_proj.weight": "model-00117-of-00191.safetensors",
"model.layers.77.self_attn.o_proj.weight": "model-00117-of-00191.safetensors",
"model.layers.77.self_attn.q_proj.weight": "model-00117-of-00191.safetensors",
"model.layers.77.self_attn.v_proj.weight": "model-00117-of-00191.safetensors",
"model.layers.78.input_layernorm.weight": "model-00120-of-00191.safetensors",
"model.layers.78.mlp.down_proj.weight": "model-00120-of-00191.safetensors",
"model.layers.78.mlp.gate_proj.weight": "model-00119-of-00191.safetensors",
"model.layers.78.mlp.up_proj.weight": "model-00119-of-00191.safetensors",
"model.layers.78.post_attention_layernorm.weight": "model-00120-of-00191.safetensors",
"model.layers.78.self_attn.k_proj.weight": "model-00118-of-00191.safetensors",
"model.layers.78.self_attn.o_proj.weight": "model-00118-of-00191.safetensors",
"model.layers.78.self_attn.q_proj.weight": "model-00118-of-00191.safetensors",
"model.layers.78.self_attn.v_proj.weight": "model-00118-of-00191.safetensors",
"model.layers.79.input_layernorm.weight": "model-00121-of-00191.safetensors",
"model.layers.79.mlp.down_proj.weight": "model-00121-of-00191.safetensors",
"model.layers.79.mlp.gate_proj.weight": "model-00120-of-00191.safetensors",
"model.layers.79.mlp.up_proj.weight": "model-00121-of-00191.safetensors",
"model.layers.79.post_attention_layernorm.weight": "model-00121-of-00191.safetensors",
"model.layers.79.self_attn.k_proj.weight": "model-00120-of-00191.safetensors",
"model.layers.79.self_attn.o_proj.weight": "model-00120-of-00191.safetensors",
"model.layers.79.self_attn.q_proj.weight": "model-00120-of-00191.safetensors",
"model.layers.79.self_attn.v_proj.weight": "model-00120-of-00191.safetensors",
"model.layers.8.input_layernorm.weight": "model-00015-of-00191.safetensors",
"model.layers.8.mlp.down_proj.weight": "model-00015-of-00191.safetensors",
"model.layers.8.mlp.gate_proj.weight": "model-00014-of-00191.safetensors",
"model.layers.8.mlp.up_proj.weight": "model-00014-of-00191.safetensors",
"model.layers.8.post_attention_layernorm.weight": "model-00015-of-00191.safetensors",
"model.layers.8.self_attn.k_proj.weight": "model-00013-of-00191.safetensors",
"model.layers.8.self_attn.o_proj.weight": "model-00013-of-00191.safetensors",
"model.layers.8.self_attn.q_proj.weight": "model-00013-of-00191.safetensors",
"model.layers.8.self_attn.v_proj.weight": "model-00013-of-00191.safetensors",
"model.layers.80.input_layernorm.weight": "model-00123-of-00191.safetensors",
"model.layers.80.mlp.down_proj.weight": "model-00123-of-00191.safetensors",
"model.layers.80.mlp.gate_proj.weight": "model-00122-of-00191.safetensors",
"model.layers.80.mlp.up_proj.weight": "model-00122-of-00191.safetensors",
"model.layers.80.post_attention_layernorm.weight": "model-00123-of-00191.safetensors",
"model.layers.80.self_attn.k_proj.weight": "model-00121-of-00191.safetensors",
"model.layers.80.self_attn.o_proj.weight": "model-00121-of-00191.safetensors",
"model.layers.80.self_attn.q_proj.weight": "model-00121-of-00191.safetensors",
"model.layers.80.self_attn.v_proj.weight": "model-00121-of-00191.safetensors",
"model.layers.81.input_layernorm.weight": "model-00124-of-00191.safetensors",
"model.layers.81.mlp.down_proj.weight": "model-00124-of-00191.safetensors",
"model.layers.81.mlp.gate_proj.weight": "model-00123-of-00191.safetensors",
"model.layers.81.mlp.up_proj.weight": "model-00124-of-00191.safetensors",
"model.layers.81.post_attention_layernorm.weight": "model-00124-of-00191.safetensors",
"model.layers.81.self_attn.k_proj.weight": "model-00123-of-00191.safetensors",
"model.layers.81.self_attn.o_proj.weight": "model-00123-of-00191.safetensors",
"model.layers.81.self_attn.q_proj.weight": "model-00123-of-00191.safetensors",
"model.layers.81.self_attn.v_proj.weight": "model-00123-of-00191.safetensors",
"model.layers.82.input_layernorm.weight": "model-00126-of-00191.safetensors",
"model.layers.82.mlp.down_proj.weight": "model-00126-of-00191.safetensors",
"model.layers.82.mlp.gate_proj.weight": "model-00125-of-00191.safetensors",
"model.layers.82.mlp.up_proj.weight": "model-00125-of-00191.safetensors",
"model.layers.82.post_attention_layernorm.weight": "model-00126-of-00191.safetensors",
"model.layers.82.self_attn.k_proj.weight": "model-00124-of-00191.safetensors",
"model.layers.82.self_attn.o_proj.weight": "model-00124-of-00191.safetensors",
"model.layers.82.self_attn.q_proj.weight": "model-00124-of-00191.safetensors",
"model.layers.82.self_attn.v_proj.weight": "model-00124-of-00191.safetensors",
"model.layers.83.input_layernorm.weight": "model-00127-of-00191.safetensors",
"model.layers.83.mlp.down_proj.weight": "model-00127-of-00191.safetensors",
"model.layers.83.mlp.gate_proj.weight": "model-00126-of-00191.safetensors",
"model.layers.83.mlp.up_proj.weight": "model-00127-of-00191.safetensors",
"model.layers.83.post_attention_layernorm.weight": "model-00127-of-00191.safetensors",
"model.layers.83.self_attn.k_proj.weight": "model-00126-of-00191.safetensors",
"model.layers.83.self_attn.o_proj.weight": "model-00126-of-00191.safetensors",
"model.layers.83.self_attn.q_proj.weight": "model-00126-of-00191.safetensors",
"model.layers.83.self_attn.v_proj.weight": "model-00126-of-00191.safetensors",
"model.layers.84.input_layernorm.weight": "model-00129-of-00191.safetensors",
"model.layers.84.mlp.down_proj.weight": "model-00129-of-00191.safetensors",
"model.layers.84.mlp.gate_proj.weight": "model-00128-of-00191.safetensors",
"model.layers.84.mlp.up_proj.weight": "model-00128-of-00191.safetensors",
"model.layers.84.post_attention_layernorm.weight": "model-00129-of-00191.safetensors",
"model.layers.84.self_attn.k_proj.weight": "model-00127-of-00191.safetensors",
"model.layers.84.self_attn.o_proj.weight": "model-00127-of-00191.safetensors",
"model.layers.84.self_attn.q_proj.weight": "model-00127-of-00191.safetensors",
"model.layers.84.self_attn.v_proj.weight": "model-00127-of-00191.safetensors",
"model.layers.85.input_layernorm.weight": "model-00130-of-00191.safetensors",
"model.layers.85.mlp.down_proj.weight": "model-00130-of-00191.safetensors",
"model.layers.85.mlp.gate_proj.weight": "model-00129-of-00191.safetensors",
"model.layers.85.mlp.up_proj.weight": "model-00130-of-00191.safetensors",
"model.layers.85.post_attention_layernorm.weight": "model-00130-of-00191.safetensors",
"model.layers.85.self_attn.k_proj.weight": "model-00129-of-00191.safetensors",
"model.layers.85.self_attn.o_proj.weight": "model-00129-of-00191.safetensors",
"model.layers.85.self_attn.q_proj.weight": "model-00129-of-00191.safetensors",
"model.layers.85.self_attn.v_proj.weight": "model-00129-of-00191.safetensors",
"model.layers.86.input_layernorm.weight": "model-00132-of-00191.safetensors",
"model.layers.86.mlp.down_proj.weight": "model-00132-of-00191.safetensors",
"model.layers.86.mlp.gate_proj.weight": "model-00131-of-00191.safetensors",
"model.layers.86.mlp.up_proj.weight": "model-00131-of-00191.safetensors",
"model.layers.86.post_attention_layernorm.weight": "model-00132-of-00191.safetensors",
"model.layers.86.self_attn.k_proj.weight": "model-00130-of-00191.safetensors",
"model.layers.86.self_attn.o_proj.weight": "model-00130-of-00191.safetensors",
"model.layers.86.self_attn.q_proj.weight": "model-00130-of-00191.safetensors",
"model.layers.86.self_attn.v_proj.weight": "model-00130-of-00191.safetensors",
"model.layers.87.input_layernorm.weight": "model-00133-of-00191.safetensors",
"model.layers.87.mlp.down_proj.weight": "model-00133-of-00191.safetensors",
"model.layers.87.mlp.gate_proj.weight": "model-00132-of-00191.safetensors",
"model.layers.87.mlp.up_proj.weight": "model-00133-of-00191.safetensors",
"model.layers.87.post_attention_layernorm.weight": "model-00133-of-00191.safetensors",
"model.layers.87.self_attn.k_proj.weight": "model-00132-of-00191.safetensors",
"model.layers.87.self_attn.o_proj.weight": "model-00132-of-00191.safetensors",
"model.layers.87.self_attn.q_proj.weight": "model-00132-of-00191.safetensors",
"model.layers.87.self_attn.v_proj.weight": "model-00132-of-00191.safetensors",
"model.layers.88.input_layernorm.weight": "model-00135-of-00191.safetensors",
"model.layers.88.mlp.down_proj.weight": "model-00135-of-00191.safetensors",
"model.layers.88.mlp.gate_proj.weight": "model-00134-of-00191.safetensors",
"model.layers.88.mlp.up_proj.weight": "model-00134-of-00191.safetensors",
"model.layers.88.post_attention_layernorm.weight": "model-00135-of-00191.safetensors",
"model.layers.88.self_attn.k_proj.weight": "model-00133-of-00191.safetensors",
"model.layers.88.self_attn.o_proj.weight": "model-00133-of-00191.safetensors",
"model.layers.88.self_attn.q_proj.weight": "model-00133-of-00191.safetensors",
"model.layers.88.self_attn.v_proj.weight": "model-00133-of-00191.safetensors",
"model.layers.89.input_layernorm.weight": "model-00136-of-00191.safetensors",
"model.layers.89.mlp.down_proj.weight": "model-00136-of-00191.safetensors",
"model.layers.89.mlp.gate_proj.weight": "model-00135-of-00191.safetensors",
"model.layers.89.mlp.up_proj.weight": "model-00136-of-00191.safetensors",
"model.layers.89.post_attention_layernorm.weight": "model-00136-of-00191.safetensors",
"model.layers.89.self_attn.k_proj.weight": "model-00135-of-00191.safetensors",
"model.layers.89.self_attn.o_proj.weight": "model-00135-of-00191.safetensors",
"model.layers.89.self_attn.q_proj.weight": "model-00135-of-00191.safetensors",
"model.layers.89.self_attn.v_proj.weight": "model-00135-of-00191.safetensors",
"model.layers.9.input_layernorm.weight": "model-00016-of-00191.safetensors",
"model.layers.9.mlp.down_proj.weight": "model-00016-of-00191.safetensors",
"model.layers.9.mlp.gate_proj.weight": "model-00015-of-00191.safetensors",
"model.layers.9.mlp.up_proj.weight": "model-00016-of-00191.safetensors",
"model.layers.9.post_attention_layernorm.weight": "model-00016-of-00191.safetensors",
"model.layers.9.self_attn.k_proj.weight": "model-00015-of-00191.safetensors",
"model.layers.9.self_attn.o_proj.weight": "model-00015-of-00191.safetensors",
"model.layers.9.self_attn.q_proj.weight": "model-00015-of-00191.safetensors",
"model.layers.9.self_attn.v_proj.weight": "model-00015-of-00191.safetensors",
"model.layers.90.input_layernorm.weight": "model-00138-of-00191.safetensors",
"model.layers.90.mlp.down_proj.weight": "model-00138-of-00191.safetensors",
"model.layers.90.mlp.gate_proj.weight": "model-00137-of-00191.safetensors",
"model.layers.90.mlp.up_proj.weight": "model-00137-of-00191.safetensors",
"model.layers.90.post_attention_layernorm.weight": "model-00138-of-00191.safetensors",
"model.layers.90.self_attn.k_proj.weight": "model-00136-of-00191.safetensors",
"model.layers.90.self_attn.o_proj.weight": "model-00136-of-00191.safetensors",
"model.layers.90.self_attn.q_proj.weight": "model-00136-of-00191.safetensors",
"model.layers.90.self_attn.v_proj.weight": "model-00136-of-00191.safetensors",
"model.layers.91.input_layernorm.weight": "model-00139-of-00191.safetensors",
"model.layers.91.mlp.down_proj.weight": "model-00139-of-00191.safetensors",
"model.layers.91.mlp.gate_proj.weight": "model-00138-of-00191.safetensors",
"model.layers.91.mlp.up_proj.weight": "model-00139-of-00191.safetensors",
"model.layers.91.post_attention_layernorm.weight": "model-00139-of-00191.safetensors",
"model.layers.91.self_attn.k_proj.weight": "model-00138-of-00191.safetensors",
"model.layers.91.self_attn.o_proj.weight": "model-00138-of-00191.safetensors",
"model.layers.91.self_attn.q_proj.weight": "model-00138-of-00191.safetensors",
"model.layers.91.self_attn.v_proj.weight": "model-00138-of-00191.safetensors",
"model.layers.92.input_layernorm.weight": "model-00141-of-00191.safetensors",
"model.layers.92.mlp.down_proj.weight": "model-00141-of-00191.safetensors",
"model.layers.92.mlp.gate_proj.weight": "model-00140-of-00191.safetensors",
"model.layers.92.mlp.up_proj.weight": "model-00140-of-00191.safetensors",
"model.layers.92.post_attention_layernorm.weight": "model-00141-of-00191.safetensors",
"model.layers.92.self_attn.k_proj.weight": "model-00139-of-00191.safetensors",
"model.layers.92.self_attn.o_proj.weight": "model-00139-of-00191.safetensors",
"model.layers.92.self_attn.q_proj.weight": "model-00139-of-00191.safetensors",
"model.layers.92.self_attn.v_proj.weight": "model-00139-of-00191.safetensors",
"model.layers.93.input_layernorm.weight": "model-00142-of-00191.safetensors",
"model.layers.93.mlp.down_proj.weight": "model-00142-of-00191.safetensors",
"model.layers.93.mlp.gate_proj.weight": "model-00141-of-00191.safetensors",
"model.layers.93.mlp.up_proj.weight": "model-00142-of-00191.safetensors",
"model.layers.93.post_attention_layernorm.weight": "model-00142-of-00191.safetensors",
"model.layers.93.self_attn.k_proj.weight": "model-00141-of-00191.safetensors",
"model.layers.93.self_attn.o_proj.weight": "model-00141-of-00191.safetensors",
"model.layers.93.self_attn.q_proj.weight": "model-00141-of-00191.safetensors",
"model.layers.93.self_attn.v_proj.weight": "model-00141-of-00191.safetensors",
"model.layers.94.input_layernorm.weight": "model-00144-of-00191.safetensors",
"model.layers.94.mlp.down_proj.weight": "model-00144-of-00191.safetensors",
"model.layers.94.mlp.gate_proj.weight": "model-00143-of-00191.safetensors",
"model.layers.94.mlp.up_proj.weight": "model-00143-of-00191.safetensors",
"model.layers.94.post_attention_layernorm.weight": "model-00144-of-00191.safetensors",
"model.layers.94.self_attn.k_proj.weight": "model-00142-of-00191.safetensors",
"model.layers.94.self_attn.o_proj.weight": "model-00142-of-00191.safetensors",
"model.layers.94.self_attn.q_proj.weight": "model-00142-of-00191.safetensors",
"model.layers.94.self_attn.v_proj.weight": "model-00142-of-00191.safetensors",
"model.layers.95.input_layernorm.weight": "model-00145-of-00191.safetensors",
"model.layers.95.mlp.down_proj.weight": "model-00145-of-00191.safetensors",
"model.layers.95.mlp.gate_proj.weight": "model-00144-of-00191.safetensors",
"model.layers.95.mlp.up_proj.weight": "model-00145-of-00191.safetensors",
"model.layers.95.post_attention_layernorm.weight": "model-00145-of-00191.safetensors",
"model.layers.95.self_attn.k_proj.weight": "model-00144-of-00191.safetensors",
"model.layers.95.self_attn.o_proj.weight": "model-00144-of-00191.safetensors",
"model.layers.95.self_attn.q_proj.weight": "model-00144-of-00191.safetensors",
"model.layers.95.self_attn.v_proj.weight": "model-00144-of-00191.safetensors",
"model.layers.96.input_layernorm.weight": "model-00147-of-00191.safetensors",
"model.layers.96.mlp.down_proj.weight": "model-00147-of-00191.safetensors",
"model.layers.96.mlp.gate_proj.weight": "model-00146-of-00191.safetensors",
"model.layers.96.mlp.up_proj.weight": "model-00146-of-00191.safetensors",
"model.layers.96.post_attention_layernorm.weight": "model-00147-of-00191.safetensors",
"model.layers.96.self_attn.k_proj.weight": "model-00145-of-00191.safetensors",
"model.layers.96.self_attn.o_proj.weight": "model-00145-of-00191.safetensors",
"model.layers.96.self_attn.q_proj.weight": "model-00145-of-00191.safetensors",
"model.layers.96.self_attn.v_proj.weight": "model-00145-of-00191.safetensors",
"model.layers.97.input_layernorm.weight": "model-00148-of-00191.safetensors",
"model.layers.97.mlp.down_proj.weight": "model-00148-of-00191.safetensors",
"model.layers.97.mlp.gate_proj.weight": "model-00147-of-00191.safetensors",
"model.layers.97.mlp.up_proj.weight": "model-00148-of-00191.safetensors",
"model.layers.97.post_attention_layernorm.weight": "model-00148-of-00191.safetensors",
"model.layers.97.self_attn.k_proj.weight": "model-00147-of-00191.safetensors",
"model.layers.97.self_attn.o_proj.weight": "model-00147-of-00191.safetensors",
"model.layers.97.self_attn.q_proj.weight": "model-00147-of-00191.safetensors",
"model.layers.97.self_attn.v_proj.weight": "model-00147-of-00191.safetensors",
"model.layers.98.input_layernorm.weight": "model-00150-of-00191.safetensors",
"model.layers.98.mlp.down_proj.weight": "model-00150-of-00191.safetensors",
"model.layers.98.mlp.gate_proj.weight": "model-00149-of-00191.safetensors",
"model.layers.98.mlp.up_proj.weight": "model-00149-of-00191.safetensors",
"model.layers.98.post_attention_layernorm.weight": "model-00150-of-00191.safetensors",
"model.layers.98.self_attn.k_proj.weight": "model-00148-of-00191.safetensors",
"model.layers.98.self_attn.o_proj.weight": "model-00148-of-00191.safetensors",
"model.layers.98.self_attn.q_proj.weight": "model-00148-of-00191.safetensors",
"model.layers.98.self_attn.v_proj.weight": "model-00148-of-00191.safetensors",
"model.layers.99.input_layernorm.weight": "model-00151-of-00191.safetensors",
"model.layers.99.mlp.down_proj.weight": "model-00151-of-00191.safetensors",
"model.layers.99.mlp.gate_proj.weight": "model-00150-of-00191.safetensors",
"model.layers.99.mlp.up_proj.weight": "model-00151-of-00191.safetensors",
"model.layers.99.post_attention_layernorm.weight": "model-00151-of-00191.safetensors",
"model.layers.99.self_attn.k_proj.weight": "model-00150-of-00191.safetensors",
"model.layers.99.self_attn.o_proj.weight": "model-00150-of-00191.safetensors",
"model.layers.99.self_attn.q_proj.weight": "model-00150-of-00191.safetensors",
"model.layers.99.self_attn.v_proj.weight": "model-00150-of-00191.safetensors",
"model.norm.weight": "model-00190-of-00191.safetensors"
}
}

Original README

⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣀⣠⣴⣶⡀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠘⢻⣿⣿⣿⣷⡀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣿⣿⣿⣿⣿⡄⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣀⣀⣀⠀⠀⠀⠀⠀⠀⠀⠘⣿⣿⣿⣿⣿⣶⣶⡶⢶⣶⣶⣦⣤⣄⣀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢀⣠⣤⠶⠶⠛⠛⠉⠉⠉⠉⠛⠛⠳⢶⣤⣄⠀⠀⠹⣿⣿⣿⣿⣿⣿⣾⡱⢆⡲⢤⠉⡍⢛⠻⠷⣦⣄⡀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢀⣴⣤⣤⣀⣀⡀⠀⠀⠀⠀⠀⠀⠀⣀⣠⣤⡶⠶⢻⠛⠛⠋⢉⠀⠠⠀⠄⠠⠐⠀⠂⠀⠄⢀⠀⡀⢈⠙⡻⣷⣤⣿⣿⣿⣿⣿⣿⣿⣿⣯⣖⡣⡝⡰⢃⠎⡴⢈⡙⠻⢷⣤⣀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢸⣿⣿⡿⠛⠛⠿⠿⣷⣶⣦⣤⠶⠟⢋⡉⢄⠢⡑⢢⢉⡔⢣⠎⠬⠣⠜⠲⠄⠢⠁⠤⠁⡄⢂⠰⢠⠡⠌⡐⠌⡹⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣷⣹⣕⢫⡜⡰⢃⠬⡑⢢⡘⡙⢳⣦⣀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣿⣿⣿⠇⠀⠀⠀⠀⣠⣿⠟⣋⡔⣩⢒⡜⡢⢇⡙⢂⠡⢈⠀⡀⠂⠀⠄⡀⠄⠐⠀⠄⠐⠀⠈⠁⡁⢂⠐⡀⢂⠁⢚⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣾⣿⣾⣱⣋⢖⡉⢆⠰⡁⠆⣈⠙⢷⣦⡀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢸⣿⣿⣿⣷⣾⣿⣶⡾⡟⠧⠛⠤⠙⡄⢋⡌⣁⠂⡐⠄⡃⠆⢡⢀⠃⠌⡀⠄⡐⠈⡀⠂⢈⠀⠡⠐⠀⠠⠐⠀⠂⠌⠠⡘⣿⣿⣿⣿⣿⣿⣿⣿⡉⠛⠛⠿⠿⣿⣿⣮⣽⣊⢦⠁⢆⠠⢈⠀⡈⠻⢦⣄⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣼⣿⣿⣿⣿⣿⡿⢋⡁⢒⠠⢣⢌⠳⡌⢇⡒⡄⢆⡱⢌⡰⢉⠢⡘⢌⠢⡑⠢⢄⠡⡐⢈⠀⡐⠀⠂⠁⠄⠂⠁⠌⠠⠁⡔⠩⢿⣿⣿⣿⣿⣿⣿⣇⠀⠀⠀⠀⠀⠀⠉⠙⠻⣷⣏⠦⡘⢄⠂⠄⡀⠂⠙⢧⡄⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢠⣿⣿⣿⣿⡟⢣⠜⡤⢓⡌⣎⠵⣊⠷⣘⢦⢳⡘⢦⡑⢎⡔⣡⢂⠐⡀⢂⠁⠣⢌⠢⣁⠣⡘⣀⠂⡁⠌⠀⠌⠐⡀⢁⠂⠠⠑⡌⢛⣿⣿⣿⣿⣿⣿⣆⠀⠀⠀⠀⠀⠀⠀⠀⠈⠻⣶⣍⠢⠜⠠⠐⠀⠡⠀⠻⣦⡀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣸⣿⣿⣿⠧⡜⣡⠚⣔⢣⡞⡬⢣⣙⢮⣓⢮⡱⢎⡇⡞⣡⠚⡔⣊⠖⡰⠀⠌⢀⠂⠐⡀⠆⣁⠢⠑⡄⢂⠡⠐⢀⠐⠠⢀⠁⢂⠘⠤⡹⣿⣿⣿⣿⣿⣿⠆⠀⠀⠀⠀⠀⠀⠀⠀⠀⠈⠻⣷⡌⠱⡈⠄⠡⠐⢀⠈⢷⣄⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣿⣿⣿⢏⡴⠣⡍⢶⣙⢮⠳⡡⢎⡝⣾⡹⣌⠧⣊⠵⣑⢋⠖⣡⢋⡔⣃⠒⠤⡈⢀⠂⢁⠠⠉⠄⢂⠁⠎⡰⢀⠌⠠⠀⠌⠐⡈⠐⡠⢃⢿⣿⣿⡿⠟⠋⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠻⣷⣆⠱⡀⢂⠠⠈⡀⠈⢿⣆⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢸⣿⣿⢏⠖⣡⠓⣜⢣⣞⡉⢲⠡⣏⡜⢧⡻⣌⡳⣜⢢⡑⠎⡜⠤⢃⠲⢌⡩⢆⠱⢠⠐⠀⡀⠂⢈⠠⢈⠐⢠⠃⠎⡄⢈⠠⠁⠰⣁⠰⢈⠚⣿⣿⡀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠙⢿⣦⠑⢄⡀⢂⠀⡁⠀⠹⣦⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣾⣿⣿⡾⠁⢧⠹⣜⢯⢖⡩⢆⡝⢤⣋⠷⣹⠶⣱⢎⢷⣸⠱⣌⠊⡅⢣⠘⡰⢈⠆⡡⠊⠔⡀⠐⠀⡀⠄⠈⠂⠌⠒⡌⢲⡀⠌⠐⢠⠃⡬⢘⡹⣿⣷⡀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠈⢻⣏⣆⠐⠠⢀⠐⠈⢀⠘⣧⡀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠙⢿⣿⢃⡍⢶⡙⣮⣿⢌⠳⡌⡜⢦⡩⢞⡽⣟⢦⣋⠞⣜⡻⢶⣭⣐⠂⢆⠁⠢⠘⡠⠑⠂⠌⠤⣁⠀⠠⠀⠁⠠⠑⡈⠦⡑⢎⡀⠂⠱⢌⠣⡜⣹⣿⣿⡄⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣠⣿⣿⣿⡦⠀⡐⠈⠀⠄⠘⣷⡀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣿⣿⢣⡜⣣⢝⣺⣿⣎⠵⡘⡜⢦⠱⣋⡼⣿⣧⢏⡞⣥⢛⢧⣛⢿⣿⣦⣌⠀⠡⢀⠡⠘⡐⠂⠄⠚⢤⡐⠈⢀⠐⠀⠡⢉⠖⡱⡌⡑⢪⠱⡌⡽⣿⣿⣿⣦⣄⣀⠀⠀⠀⠀⠀⠀⠀⠀⢠⡆⠀⢰⡿⠛⣿⣿⣟⠀⠄⡈⠄⢈⠀⡘⣧⡀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢸⣿⣏⠶⣹⢆⡏⣶⣿⣿⢢⡙⠜⣢⠓⡬⢒⣿⣿⣿⡜⣧⢫⠖⡭⢞⡼⣛⡿⣷⣦⣄⠀⢂⠠⠁⠎⡐⢂⠘⢢⠀⠄⡈⠐⠈⢎⠵⢣⠜⣠⠛⣜⡹⣿⣿⣿⣿⣿⣿⠃⠀⠀⠀⠀⠀⠀⠀⢰⣇⠀⣾⠃⠀⣼⣿⡃⢌⠠⢀⠐⠀⠄⠠⠘⣷⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣾⣿⡎⣽⠲⣍⠞⣶⢻⣿⣧⡘⠜⣠⠙⠴⡉⢖⣿⣿⣿⣾⣧⣿⣘⢧⡚⣥⢫⡝⡻⢿⣿⣦⣀⠂⠄⠡⠈⡜⠠⢍⢢⠐⠈⡀⢊⠜⣱⢚⠤⡛⡴⡹⣿⣿⣿⣿⢋⣿⠀⠀⠀⠀⠀⠀⠀⠀⢸⣿⣾⠏⢀⡿⠀⢻⣿⠴⣦⡄⠂⢁⠐⠀⡁⢹⣧⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢠⣿⣿⣜⠲⣏⠼⣹⣾⣏⡿⣿⣎⠒⠤⢉⠆⡉⠎⡴⢻⣿⣿⣉⠛⠛⠿⣷⣶⣧⣞⣭⢓⢮⡛⣿⣿⣴⣂⠡⡐⡉⢆⢢⡙⡔⢠⠂⡘⢥⣋⠶⣡⢳⡹⣿⡿⢉⣿⣿⣿⠀⠀⠀⠀⠀⠀⠀⠀⣼⢻⡟⠀⢨⠃⠀⢈⡟⠀⢘⣿⡄⠂⠠⠁⠠⠀⢻⣆⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢸⣿⣿⣎⠷⡸⡑⢮⣿⡾⣝⡿⣿⣏⠦⡁⢎⡐⢁⠂⠧⢻⣿⡆⠄⠀⠀⠀⠈⠉⠛⠻⠿⣶⣿⣴⣭⣛⣿⣷⣼⡰⣌⢢⠱⢌⢣⡜⠤⣃⢮⠳⡥⢎⣳⣿⣷⣿⣿⣿⡇⠀⠀⠀⠀⠀⠀⠀⠀⣿⣸⠇⠀⠀⠀⠀⣌⣷⣴⡿⠛⠁⠠⠁⠠⠁⡐⠈⣿⡄⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢸⣿⣿⣿⡚⣥⠃⣞⣿⣿⡽⣞⣿⣿⣷⣑⠂⡌⠤⢈⠐⠡⢚⣿⣆⠀⠀⠀⠀⠀⠀⠀⣠⡾⠋⠉⠙⣻⣿⣿⣿⣿⣾⣧⣗⢮⡱⢎⡳⣌⢎⠷⣙⢮⣿⣿⣿⣿⣿⣿⠇⠀⠀⠀⠀⠀⠀⠀⢰⡏⡌⠀⠀⠀⢀⣴⠋⢻⣯⠠⠁⠌⠐⡀⠁⡐⠀⡐⠘⣷⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢸⣿⣿⣿⣟⠴⣃⠸⣿⣿⣿⣟⣾⣿⡿⠿⣷⣮⡐⡡⢌⠂⡅⠚⣿⣧⠀⠀⠀⠀⠰⠞⠋⠀⢀⣠⣾⣿⠟⠉⠀⠉⠙⠻⢿⣿⣿⣭⣷⣹⣎⢯⡳⢾⣿⣿⣿⣿⡿⠋⠀⠀⠀⠀⠀⠀⠀⠀⣾⠁⠀⠀⠀⣴⠟⠁⠀⢸⣿⠠⢉⠐⠠⢀⠁⡀⠂⠄⡈⢽⡆⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣾⣿⣿⣿⣿⣽⢢⡝⣽⣿⣿⣿⣿⣿⣿⣅⡀⠙⠿⣷⣌⣒⢌⡱⢂⠿⣷⣀⠀⠀⠀⠀⢀⣴⣾⠿⠋⠀⠀⠀⠀⠀⠀⠀⣼⣿⡿⢿⣿⣷⣯⣷⣻⣿⣿⣿⡿⠛⠀⠀⠀⠀⠀⠀⠀⠀⠀⢸⠇⠀⠀⣠⡾⠁⠀⠀⠀⢸⣿⠐⠂⠌⡐⠀⠄⠐⡀⠂⠄⠘⣷⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢰⣿⣿⣿⣿⣿⣿⣗⡞⣜⣻⢿⣿⣿⣿⡙⠿⠿⣷⣶⣬⣙⣿⢷⣮⣇⣎⡹⢿⣆⠀⠀⠀⣿⣿⣷⣶⣶⣶⣶⣶⣶⣾⡿⠉⠀⣿⡟⡽⣹⣿⢿⣿⣷⣿⡿⠋⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢀⡿⠀⠀⣰⠋⠀⠀⠀⠀⠀⢨⣿⢈⡁⠆⢠⠁⠌⢀⠐⠠⢈⠐⢿⡆⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢀⣾⣿⣿⣿⣿⣿⣿⣿⣿⡬⢏⡿⣽⣻⣿⣿⣄⠄⠀⠈⠙⢛⣿⣿⣯⠙⠛⠻⠿⠿⠛⠀⠀⠀⠉⠁⠉⠈⠀⠁⠀⡀⠄⡐⢂⠲⣿⣯⢳⣽⡇⠀⠹⡟⠁⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣼⠃⢀⡼⠁⠀⠀⠀⠀⠀⠀⠰⣿⠠⡐⠈⠤⡈⠄⠂⢈⠐⠠⡈⢼⣇⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣼⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣝⡾⣱⣟⣿⣿⣿⡶⣬⣶⣿⣿⠿⠋⠁⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠰⣏⡐⢠⠂⠁⣿⣿⣳⣿⣿⣶⣾⠆⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣰⠏⢀⡾⠁⠀⠀⠀⠀⠀⠀⠀⢸⣿⠠⢁⠜⣀⠒⡈⠐⡀⠌⠠⠁⠆⣿⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⣰⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣳⣻⢾⣿⣿⣿⡟⣿⣉⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢀⣀⠀⠀⠀⠀⠀⠀⠉⠉⠁⠀⣠⡿⢻⡟⠁⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢀⣀⣤⣤⣤⣰⡟⠀⡞⠁⠀⠀⠀⠀⠀⠀⠀⠀⣸⣏⠐⠌⡰⢀⠣⡐⢁⠠⠈⠄⠃⡌⢿⡇
⠀⠀⠀⠀⠀⠀⠀⠀⢠⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣯⣟⣿⣿⣿⣿⣞⢻⣧⠀⠀⠀⠀⢀⣤⣤⡴⡶⠶⠛⢏⡙⢻⣦⡀⠀⠀⠀⠀⠀⠀⣰⣿⡀⠛⠁⠀⠀⠀⠀⠀⠀⢀⣀⣤⣶⣿⣿⣿⠟⠉⠿⠇⠀⠘⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣿⡇⠌⢢⠑⡌⢢⠑⡂⠄⡈⠄⡃⠜⣸⡇
⠀⠀⠀⠀⠀⠀⠀⣠⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣧⠿⣦⣀⠀⠀⠈⢿⣇⡲⢄⠣⡉⢆⠸⢠⠹⣷⠀⠀⠀⣠⣴⣿⣿⣿⣿⣷⣤⣀⣤⣠⣤⣴⣾⣿⣿⣿⣿⣿⣿⣿⣦⠄⠀⠀⠀⢀⡀⠀⠀⠀⠀⠀⠀⠀⠀⣸⣿⢂⡑⢢⠱⡨⢅⡊⠔⠠⠐⡈⠔⣩⢸⡇
⠀⠀⠀⠀⠀⠀⣰⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣻⣿⡿⠿⣿⡇⠀⠉⢻⣦⣤⣈⠛⠿⣿⣶⣭⣦⢿⠶⢉⣡⣤⣶⣿⣿⠿⣹⣿⡿⣧⠩⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⡿⠀⠀⠀⠀⠀⠀⣧⠀⠀⠀⠀⠀⠀⠀⢀⣿⢇⠢⡘⢤⢣⡑⢎⠴⣉⢂⠐⢄⠣⢆⣻⡇
⠀⠀⠀⠀⠀⣼⣿⣿⣟⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⡷⣯⣿⡇⠀⠈⠙⠀⣠⠟⠇⠉⠹⢿⣷⣶⣴⣶⣶⣶⣾⣿⣿⣿⡝⣲⣬⣾⣟⣿⣯⡑⠘⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⡤⡄⣀⡀⢀⣼⡟⠀⠀⠀⠀⠀⠀⢀⣾⠟⡄⢣⠘⣆⢣⢜⣊⠖⡰⡈⠔⡨⣘⠢⣿⠇
⠀⠀⠀⢀⣾⣿⣟⣷⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣟⣷⣿⣇⡀⠀⠀⣠⡟⠄⠶⣤⣄⣸⣿⣿⣷⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⡟⠁⢻⣿⡅⢢⡽⠿⠿⢿⣿⣿⣿⣿⣿⣿⣿⣿⣿⡏⠀⠀⣼⣶⣿⡿⠁⠀⠀⠀⠀⠀⢠⣾⠏⡜⢄⠣⣍⠲⣍⠶⣩⠞⣡⠱⡈⠴⢠⠣⣿⠀
⠀⠀⢀⣾⣿⣻⣾⢿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣟⣾⣿⣿⣿⣿⣿⣿⣿⣿⣦⣤⣼⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⠀⠀⠘⣿⣿⣹⡇⠀⠀⠀⠀⠀⠀⠀⠉⠉⠙⠛⠋⠀⠀⠰⠿⠟⠋⠀⠀⠀⠀⠀⠀⣴⣿⠏⡜⡰⢊⠵⣨⠳⣬⢓⢧⡛⣤⢣⢡⢋⠦⣹⡟⠀
⠀⠀⣾⣿⣳⣯⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣻⣾⡿⠏⠁⠀⠈⠻⣿⣿⣿⣿⣿⣿⡿⠋⠉⣿⣿⣿⣿⣿⣿⣿⣿⣇⠀⠸⣿⡀⠀⠀⣿⣿⣿⣧⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣠⣾⣟⢣⢛⡴⢡⣋⠶⣡⢟⡲⢏⡮⡵⣊⢆⠣⢎⠖⣽⠇⠀
⠀⣼⣿⣿⣳⣿⢿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣷⣿⣿⠁⠀⠀⠀⠀⠀⢈⠉⣿⣿⡟⠉⠀⠀⠀⠈⢿⣿⣿⣿⣟⢾⣻⣿⡀⠀⠈⠉⣉⣤⣿⠿⣿⣿⡄⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢀⣠⣾⡿⣏⡜⣣⢳⣜⣳⢬⠳⣍⠾⣭⢻⡼⣱⢣⢎⡱⢎⢾⡟⠀⠀
⢠⣿⣟⣾⣿⣽⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣷⣿⣿⣦⡀⠀⠀⠀⠀⣠⣶⣿⠃⠀⠀⠀⠀⠀⠀⢸⡷⣿⣿⢎⡷⣹⣿⡇⠈⠉⠛⠉⠁⠀⠀⢹⠟⣿⡄⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣀⣤⣶⣿⡟⣯⢵⡺⣜⣷⣻⣾⣟⢮⡝⢮⡝⣮⣳⡝⣧⢋⠶⣩⢞⣿⠁⠀⠀
⢸⣿⣿⣻⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⡾⣿⣿⣿⣿⣷⣤⣴⣿⣿⠟⠁⠀⠀⠀⠀⠀⠀⠀⣾⢇⣿⣟⡞⣴⢣⣿⣿⠀⠀⠀⠀⠀⠀⠀⠀⠀⠸⣿⣧⣀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠈⠉⠛⠿⣿⠿⠿⢿⣿⣿⣿⣿⣛⢮⣜⢧⣛⣶⢻⡼⣣⢏⡞⣥⡿⠃⠀⠀⠀
⢹⣿⣿⣿⡟⢿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⢿⣽⣿⣿⠟⠻⠟⠛⠋⠁⠀⠀⠀⠀⠀⠀⠀⠀⢸⣿⠀⣿⡿⣜⡖⣏⣿⣿⡀⠄⢈⠀⠀⠀⠀⠀⠀⠀⠹⣿⣿⢷⣤⣀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢀⣼⣿⣿⣿⣽⡹⣞⡼⣏⣷⢫⣿⣱⠳⣎⣾⡟⠁⠀⠀⠀⠀
⢸⣿⣿⡿⠀⠈⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⡾⣿⣿⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢀⣾⢿⡎⣿⣿⣳⢞⡵⣺⣿⡇⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠻⣿⣎⣝⣻⣷⣤⡀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣠⣿⣿⣿⣿⣳⢏⣷⣹⢾⡽⣞⣯⢖⣯⣿⡾⠋⠀⠀⠀⠀⠀⠀
⠀⢻⣿⡇⠀⠀⠘⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣽⣿⣿⣿⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢠⡟⠁⠻⣿⣿⣿⣿⣯⡞⡵⣿⣷⠀⠀⡀⣠⣤⣤⡠⠜⠻⣅⠂⢈⣿⣿⣿⣿⣯⠁⠀⠀⠀⠀⠀⠀⠀⠀⠀⢠⣼⣿⣿⣿⣻⢾⣝⡾⣣⣟⣯⣟⢷⣮⣿⠾⠃⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠻⣇⠀⠀⠀⠙⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣰⠏⠀⠀⣾⣿⣿⣿⣿⡿⣽⡹⣿⣿⣶⣡⠛⣝⣻⣿⣿⣦⡥⢌⣳⡿⣿⣿⢹⣾⣿⣷⣦⡀⠀⠀⠀⠀⠀⢀⣴⣿⣿⡿⣯⢷⣻⡟⣮⢷⣻⣞⣷⣾⠿⠋⠁⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠈⠀⠀⠀⠀⠘⣿⣿⣿⣿⣿⣿⣿⣿⣿⣾⣿⡿⠟⠋⠀⠹⣿⣿⣆⠀⠀⠀⠀⠀⠀⠀⠀⠀⢀⣿⡀⠀⠘⠑⣿⣿⣿⣿⠽⣶⣹⢿⣿⣏⠻⣿⣌⢿⣽⣿⣿⣽⣿⣩⣾⣯⣽⣿⣿⣿⣿⣿⣿⣷⣄⠀⣠⣾⣿⣿⣿⣯⣿⣯⣿⣧⣿⡿⠿⠛⠋⠁⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠈⢿⣿⣿⣿⣿⣿⣿⠿⠛⠁⠀⠀⠀⠀⠀⠈⠙⠻⠂⠀⠀⠀⠀⠀⠀⠀⠀⢀⣼⣷⣴⣁⣶⡿⣿⣿⣭⣟⡶⣯⣿⣿⣿⣷⣌⣻⣿⣾⣿⢿⣿⡍⣿⣿⣿⣿⣿⣿⣿⣿⣿⡿⠁⠹⣿⠛⠛⠛⠛⠛⠛⠉⠉⠉⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠘⢿⣿⣿⣿⡿⠋⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢠⣾⣿⣿⣿⣿⣏⣵⣿⣿⣿⣽⣷⣿⣿⣿⣿⣿⣿⣯⣿⣿⣯⡌⣿⣷⣿⣿⡿⣏⠙⢻⣿⣿⡟⠁⠀⠀⣿⡀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠹⣿⡿⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢠⣤⣿⣿⣿⡟⢻⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣧⣾⣿⣿⣿⣿⣿⣿⣿⣿⣼⣿⣿⣿⣟⣶⣾⣿⡿⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠈⠃⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠈⠛⠿⣿⣿⢀⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⡏⠁⠀⠈⠉⠛⠛⠛⠋⠁⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠈⢻⣹⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣏⣭⣿⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢀⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⠟⠛⠛⠛⠙⣿⣿⣿⣿⣿⣿⣿⣿⡏⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢸⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⣿⡇⠀⠀⠀⠀⣿⣿⣿⣿⣿⣿⣿⣿⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠈⢻⣿⣿⣿⣿⣿⣿⠿⠿⢿⡿⠃⠀⠀⠀⠀⣿⣿⣿⣿⣿⣿⣿⡏⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠉⠛⠛⠛⠉⠁⠀⠀⠀⠀⠀⠀⠀⠀⠀⣿⣿⣿⣿⣿⣿⣿⠁⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢸⣿⣿⣿⣿⣿⣿⡏⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢠⣿⣿⣿⣿⣿⣿⡟⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⣾⣿⣿⣿⣽⣿⡿⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠙⠉⠛⠛⠉⠉⠁⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
diff --git a/src/transformers/models/llama/modeling_llama.py b/src/transformers/models/llama/modeling_llama.py
index 5c0c57f3e..f94a4cb37 100644
--- a/src/transformers/models/llama/modeling_llama.py
+++ b/src/transformers/models/llama/modeling_llama.py
@@ -73,6 +73,29 @@ class LlamaRMSNorm(nn.Module):
 
 ALL_LAYERNORM_LAYERS.append(LlamaRMSNorm)
 
+def apply_scaling(freqs: torch.Tensor):  # rescales each frequency in `freqs` by wavelength band and returns a new tensor
+    # Values obtained from grid search
+    scale_factor = 8  # divisor applied to frequencies that fall in the long-wavelength band
+    low_freq_factor = 1  # old_context_len / low_freq_factor is the wavelength above which full scaling applies
+    high_freq_factor = 4  # old_context_len / high_freq_factor is the wavelength below which no scaling applies
+    old_context_len = 8192  # original llama3 length
+
+    low_freq_wavelen = old_context_len / low_freq_factor  # upper wavelength threshold
+    high_freq_wavelen = old_context_len / high_freq_factor  # lower wavelength threshold
+    new_freqs = []
+    for freq in freqs:  # Python-level loop; the visible caller passes the 1-D inv_freq tensor
+        wavelen = 2 * math.pi / freq
+        if wavelen < high_freq_wavelen:  # short wavelength: keep the frequency unchanged
+            new_freqs.append(freq)
+        elif wavelen > low_freq_wavelen:  # long wavelength: divide the frequency by scale_factor
+            new_freqs.append(freq / scale_factor)
+        else:  # wavelength between the two thresholds: blend scaled and unscaled frequency
+            assert low_freq_wavelen != high_freq_wavelen  # equal thresholds would make the denominator below zero
+            smooth = (old_context_len / wavelen - low_freq_factor) / (  # 0 at low_freq_wavelen, 1 at high_freq_wavelen
+                high_freq_factor - low_freq_factor
+            )
+            new_freqs.append((1 - smooth) * freq / scale_factor + smooth * freq)  # linear interpolation weighted by smooth
+    return torch.tensor(new_freqs, dtype=freqs.dtype, device=freqs.device)  # result keeps the input's dtype and device
 
 class LlamaRotaryEmbedding(nn.Module):
     def __init__(self, dim, max_position_embeddings=2048, base=10000, device=None, scaling_factor=1.0):
@@ -82,6 +105,7 @@ class LlamaRotaryEmbedding(nn.Module):
         self.max_position_embeddings = max_position_embeddings
         self.base = base
         inv_freq = 1.0 / (self.base ** (torch.arange(0, self.dim, 2, dtype=torch.int64).float().to(device) / self.dim))
+        inv_freq = apply_scaling(inv_freq)
         self.register_buffer("inv_freq", inv_freq, persistent=False)
         # For BC we register cos and sin cached
         self.max_seq_len_cached = max_position_embeddings
{
"bos_token": {
"content": "<|begin_of_text|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false
},
"eos_token": {
"content": "<|end_of_text|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false
}
}
{
"version": "1.0",
"truncation": null,
"padding": null,
"added_tokens": [
{
"id": 128000,
"content": "<|begin_of_text|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128001,
"content": "<|end_of_text|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128002,
"content": "<|reserved_special_token_0|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128003,
"content": "<|reserved_special_token_1|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128004,
"content": "<|finetune_right_pad_id|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128005,
"content": "<|reserved_special_token_2|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128006,
"content": "<|start_header_id|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128007,
"content": "<|end_header_id|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128008,
"content": "<|eom_id|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128009,
"content": "<|eot_id|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128010,
"content": "<|python_tag|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128011,
"content": "<|reserved_special_token_3|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128012,
"content": "<|reserved_special_token_4|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128013,
"content": "<|reserved_special_token_5|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128014,
"content": "<|reserved_special_token_6|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128015,
"content": "<|reserved_special_token_7|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128016,
"content": "<|reserved_special_token_8|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128017,
"content": "<|reserved_special_token_9|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128018,
"content": "<|reserved_special_token_10|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128019,
"content": "<|reserved_special_token_11|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128020,
"content": "<|reserved_special_token_12|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128021,
"content": "<|reserved_special_token_13|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128022,
"content": "<|reserved_special_token_14|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128023,
"content": "<|reserved_special_token_15|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128024,
"content": "<|reserved_special_token_16|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128025,
"content": "<|reserved_special_token_17|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128026,
"content": "<|reserved_special_token_18|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128027,
"content": "<|reserved_special_token_19|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128028,
"content": "<|reserved_special_token_20|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128029,
"content": "<|reserved_special_token_21|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128030,
"content": "<|reserved_special_token_22|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128031,
"content": "<|reserved_special_token_23|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128032,
"content": "<|reserved_special_token_24|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128033,
"content": "<|reserved_special_token_25|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128034,
"content": "<|reserved_special_token_26|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128035,
"content": "<|reserved_special_token_27|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128036,
"content": "<|reserved_special_token_28|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128037,
"content": "<|reserved_special_token_29|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128038,
"content": "<|reserved_special_token_30|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128039,
"content": "<|reserved_special_token_31|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128040,
"content": "<|reserved_special_token_32|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128041,
"content": "<|reserved_special_token_33|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128042,
"content": "<|reserved_special_token_34|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128043,
"content": "<|reserved_special_token_35|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128044,
"content": "<|reserved_special_token_36|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128045,
"content": "<|reserved_special_token_37|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128046,
"content": "<|reserved_special_token_38|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128047,
"content": "<|reserved_special_token_39|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128048,
"content": "<|reserved_special_token_40|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128049,
"content": "<|reserved_special_token_41|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128050,
"content": "<|reserved_special_token_42|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128051,
"content": "<|reserved_special_token_43|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128052,
"content": "<|reserved_special_token_44|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128053,
"content": "<|reserved_special_token_45|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128054,
"content": "<|reserved_special_token_46|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128055,
"content": "<|reserved_special_token_47|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128056,
"content": "<|reserved_special_token_48|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128057,
"content": "<|reserved_special_token_49|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128058,
"content": "<|reserved_special_token_50|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128059,
"content": "<|reserved_special_token_51|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128060,
"content": "<|reserved_special_token_52|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128061,
"content": "<|reserved_special_token_53|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128062,
"content": "<|reserved_special_token_54|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128063,
"content": "<|reserved_special_token_55|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128064,
"content": "<|reserved_special_token_56|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128065,
"content": "<|reserved_special_token_57|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128066,
"content": "<|reserved_special_token_58|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128067,
"content": "<|reserved_special_token_59|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128068,
"content": "<|reserved_special_token_60|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128069,
"content": "<|reserved_special_token_61|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128070,
"content": "<|reserved_special_token_62|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128071,
"content": "<|reserved_special_token_63|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128072,
"content": "<|reserved_special_token_64|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128073,
"content": "<|reserved_special_token_65|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128074,
"content": "<|reserved_special_token_66|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128075,
"content": "<|reserved_special_token_67|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128076,
"content": "<|reserved_special_token_68|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128077,
"content": "<|reserved_special_token_69|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128078,
"content": "<|reserved_special_token_70|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128079,
"content": "<|reserved_special_token_71|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128080,
"content": "<|reserved_special_token_72|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128081,
"content": "<|reserved_special_token_73|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128082,
"content": "<|reserved_special_token_74|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128083,
"content": "<|reserved_special_token_75|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128084,
"content": "<|reserved_special_token_76|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128085,
"content": "<|reserved_special_token_77|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128086,
"content": "<|reserved_special_token_78|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128087,
"content": "<|reserved_special_token_79|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128088,
"content": "<|reserved_special_token_80|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128089,
"content": "<|reserved_special_token_81|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128090,
"content": "<|reserved_special_token_82|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128091,
"content": "<|reserved_special_token_83|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128092,
"content": "<|reserved_special_token_84|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128093,
"content": "<|reserved_special_token_85|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128094,
"content": "<|reserved_special_token_86|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128095,
"content": "<|reserved_special_token_87|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128096,
"content": "<|reserved_special_token_88|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128097,
"content": "<|reserved_special_token_89|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128098,
"content": "<|reserved_special_token_90|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128099,
"content": "<|reserved_special_token_91|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128100,
"content": "<|reserved_special_token_92|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128101,
"content": "<|reserved_special_token_93|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128102,
"content": "<|reserved_special_token_94|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128103,
"content": "<|reserved_special_token_95|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128104,
"content": "<|reserved_special_token_96|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128105,
"content": "<|reserved_special_token_97|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128106,
"content": "<|reserved_special_token_98|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128107,
"content": "<|reserved_special_token_99|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128108,
"content": "<|reserved_special_token_100|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128109,
"content": "<|reserved_special_token_101|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128110,
"content": "<|reserved_special_token_102|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128111,
"content": "<|reserved_special_token_103|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128112,
"content": "<|reserved_special_token_104|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128113,
"content": "<|reserved_special_token_105|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128114,
"content": "<|reserved_special_token_106|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128115,
"content": "<|reserved_special_token_107|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128116,
"content": "<|reserved_special_token_108|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128117,
"content": "<|reserved_special_token_109|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128118,
"content": "<|reserved_special_token_110|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128119,
"content": "<|reserved_special_token_111|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128120,
"content": "<|reserved_special_token_112|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128121,
"content": "<|reserved_special_token_113|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128122,
"content": "<|reserved_special_token_114|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128123,
"content": "<|reserved_special_token_115|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128124,
"content": "<|reserved_special_token_116|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128125,
"content": "<|reserved_special_token_117|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128126,
"content": "<|reserved_special_token_118|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128127,
"content": "<|reserved_special_token_119|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128128,
"content": "<|reserved_special_token_120|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128129,
"content": "<|reserved_special_token_121|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128130,
"content": "<|reserved_special_token_122|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128131,
"content": "<|reserved_special_token_123|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128132,
"content": "<|reserved_special_token_124|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128133,
"content": "<|reserved_special_token_125|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128134,
"content": "<|reserved_special_token_126|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128135,
"content": "<|reserved_special_token_127|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128136,
"content": "<|reserved_special_token_128|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128137,
"content": "<|reserved_special_token_129|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128138,
"content": "<|reserved_special_token_130|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128139,
"content": "<|reserved_special_token_131|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128140,
"content": "<|reserved_special_token_132|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128141,
"content": "<|reserved_special_token_133|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128142,
"content": "<|reserved_special_token_134|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128143,
"content": "<|reserved_special_token_135|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128144,
"content": "<|reserved_special_token_136|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128145,
"content": "<|reserved_special_token_137|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128146,
"content": "<|reserved_special_token_138|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128147,
"content": "<|reserved_special_token_139|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128148,
"content": "<|reserved_special_token_140|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128149,
"content": "<|reserved_special_token_141|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128150,
"content": "<|reserved_special_token_142|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128151,
"content": "<|reserved_special_token_143|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128152,
"content": "<|reserved_special_token_144|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128153,
"content": "<|reserved_special_token_145|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128154,
"content": "<|reserved_special_token_146|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128155,
"content": "<|reserved_special_token_147|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128156,
"content": "<|reserved_special_token_148|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128157,
"content": "<|reserved_special_token_149|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128158,
"content": "<|reserved_special_token_150|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128159,
"content": "<|reserved_special_token_151|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128160,
"content": "<|reserved_special_token_152|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128161,
"content": "<|reserved_special_token_153|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128162,
"content": "<|reserved_special_token_154|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128163,
"content": "<|reserved_special_token_155|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128164,
"content": "<|reserved_special_token_156|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128165,
"content": "<|reserved_special_token_157|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128166,
"content": "<|reserved_special_token_158|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128167,
"content": "<|reserved_special_token_159|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128168,
"content": "<|reserved_special_token_160|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128169,
"content": "<|reserved_special_token_161|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128170,
"content": "<|reserved_special_token_162|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128171,
"content": "<|reserved_special_token_163|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128172,
"content": "<|reserved_special_token_164|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128173,
"content": "<|reserved_special_token_165|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128174,
"content": "<|reserved_special_token_166|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128175,
"content": "<|reserved_special_token_167|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128176,
"content": "<|reserved_special_token_168|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128177,
"content": "<|reserved_special_token_169|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128178,
"content": "<|reserved_special_token_170|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128179,
"content": "<|reserved_special_token_171|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128180,
"content": "<|reserved_special_token_172|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128181,
"content": "<|reserved_special_token_173|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128182,
"content": "<|reserved_special_token_174|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128183,
"content": "<|reserved_special_token_175|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128184,
"content": "<|reserved_special_token_176|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128185,
"content": "<|reserved_special_token_177|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128186,
"content": "<|reserved_special_token_178|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128187,
"content": "<|reserved_special_token_179|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128188,
"content": "<|reserved_special_token_180|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128189,
"content": "<|reserved_special_token_181|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128190,
"content": "<|reserved_special_token_182|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128191,
"content": "<|reserved_special_token_183|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128192,
"content": "<|reserved_special_token_184|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128193,
"content": "<|reserved_special_token_185|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128194,
"content": "<|reserved_special_token_186|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128195,
"content": "<|reserved_special_token_187|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128196,
"content": "<|reserved_special_token_188|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128197,
"content": "<|reserved_special_token_189|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128198,
"content": "<|reserved_special_token_190|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128199,
"content": "<|reserved_special_token_191|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128200,
"content": "<|reserved_special_token_192|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128201,
"content": "<|reserved_special_token_193|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128202,
"content": "<|reserved_special_token_194|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128203,
"content": "<|reserved_special_token_195|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128204,
"content": "<|reserved_special_token_196|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128205,
"content": "<|reserved_special_token_197|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128206,
"content": "<|reserved_special_token_198|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128207,
"content": "<|reserved_special_token_199|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128208,
"content": "<|reserved_special_token_200|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128209,
"content": "<|reserved_special_token_201|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128210,
"content": "<|reserved_special_token_202|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128211,
"content": "<|reserved_special_token_203|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128212,
"content": "<|reserved_special_token_204|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128213,
"content": "<|reserved_special_token_205|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128214,
"content": "<|reserved_special_token_206|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128215,
"content": "<|reserved_special_token_207|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128216,
"content": "<|reserved_special_token_208|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128217,
"content": "<|reserved_special_token_209|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128218,
"content": "<|reserved_special_token_210|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128219,
"content": "<|reserved_special_token_211|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128220,
"content": "<|reserved_special_token_212|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128221,
"content": "<|reserved_special_token_213|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128222,
"content": "<|reserved_special_token_214|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128223,
"content": "<|reserved_special_token_215|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128224,
"content": "<|reserved_special_token_216|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128225,
"content": "<|reserved_special_token_217|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128226,
"content": "<|reserved_special_token_218|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128227,
"content": "<|reserved_special_token_219|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128228,
"content": "<|reserved_special_token_220|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128229,
"content": "<|reserved_special_token_221|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128230,
"content": "<|reserved_special_token_222|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128231,
"content": "<|reserved_special_token_223|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128232,
"content": "<|reserved_special_token_224|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128233,
"content": "<|reserved_special_token_225|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128234,
"content": "<|reserved_special_token_226|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128235,
"content": "<|reserved_special_token_227|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128236,
"content": "<|reserved_special_token_228|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128237,
"content": "<|reserved_special_token_229|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128238,
"content": "<|reserved_special_token_230|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128239,
"content": "<|reserved_special_token_231|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128240,
"content": "<|reserved_special_token_232|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128241,
"content": "<|reserved_special_token_233|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128242,
"content": "<|reserved_special_token_234|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128243,
"content": "<|reserved_special_token_235|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128244,
"content": "<|reserved_special_token_236|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128245,
"content": "<|reserved_special_token_237|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128246,
"content": "<|reserved_special_token_238|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128247,
"content": "<|reserved_special_token_239|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128248,
"content": "<|reserved_special_token_240|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128249,
"content": "<|reserved_special_token_241|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128250,
"content": "<|reserved_special_token_242|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128251,
"content": "<|reserved_special_token_243|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128252,
"content": "<|reserved_special_token_244|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128253,
"content": "<|reserved_special_token_245|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128254,
"content": "<|reserved_special_token_246|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 128255,
"content": "<|reserved_special_token_247|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
}
],
"normalizer": null,
"pre_tokenizer": {
"type": "Sequence",
"pretokenizers": [
{
"type": "Split",
"pattern": {
"Regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?\\p{L}+|\\p{N}{1,3}| ?[^\\s\\p{L}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+"
},
"behavior": "Isolated",
"invert": false
},
{
"type": "ByteLevel",
"add_prefix_space": false,
"trim_offsets": true,
"use_regex": false
}
]
},
"post_processor": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": false,
"use_regex": true
},
"decoder": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": true,
"use_regex": true
},
"model": {
"type": "BPE",
"dropout": null,
"unk_token": null,
"continuing_subword_prefix": null,
"end_of_word_suffix": null,
"fuse_unk": false,
"byte_fallback": false,
"ignore_merges": true,
"vocab": {
"!": 0,
"\"": 1,
"#": 2,
"$": 3,
"%": 4,
"&": 5,
"'": 6,
"(": 7,
")": 8,
"*": 9,
"+": 10,
",": 11,
"-": 12,
".": 13,
"/": 14,
"0": 15,
"1": 16,
"2": 17,
"3": 18,
"4": 19,
"5": 20,
"6": 21,
"7": 22,
"8": 23,
"9": 24,
":": 25,
";": 26,
"<": 27,
"=": 28,
">": 29,
"?": 30,
"@": 31,
"A": 32,
"B": 33,
"C": 34,
"D": 35,
"E": 36,
"F": 37,
"G": 38,
"H": 39,
"I": 40,
"J": 41,
"K": 42,
"L": 43,
"M": 44,
"N": 45,
"O": 46,
"P": 47,
"Q": 48,
"R": 49,
"S": 50,
"T": 51,
"U": 52,
"V": 53,
"W": 54,
"X": 55,
"Y": 56,
"Z": 57,
"[": 58,
"\\": 59,
"]": 60,
"^": 61,
"_": 62,
"`": 63,
"a": 64,
"b": 65,
"c": 66,
"d": 67,
"e": 68,
"f": 69,
"g": 70,
"h": 71,
"i": 72,
"j": 73,
"k": 74,
"l": 75,
"m": 76,
"n": 77,
"o": 78,
"p": 79,
"q": 80,
"r": 81,
"s": 82,
"t": 83,
"u": 84,
"v": 85,
"w": 86,
"x": 87,
"y": 88,
"z": 89,
"{": 90,
"|": 91,
"}": 92,
"~": 93,
"¡": 94,
"¢": 95,
"£": 96,
"¤": 97,
"¥": 98,
"¦": 99,
"§": 100,
"¨": 101,
"©": 102,
"ª": 103,
"«": 104,
"¬": 105,
"®": 106,
"¯": 107,
"°": 108,
"±": 109,
"²": 110,
"³": 111,
"´": 112,
"µ": 113,
"¶": 114,
"·": 115,
"¸": 116,
"¹": 117,
"º": 118,
"»": 119,
"¼": 120,
"½": 121,
"¾": 122,
"¿": 123,
"À": 124,
"Á": 125,
"Â": 126,
"Ã": 127,
"Ä": 128,
"Å": 129,
"Æ": 130,
"Ç": 131,
"È": 132,
"É": 133,
"Ê": 134,
"Ë": 135,
"Ì": 136,
"Í": 137,
"Î": 138,
"Ï": 139,
"Ð": 140,
"Ñ": 141,
"Ò": 142,
"Ó": 143,
"Ô": 144,
"Õ": 145,
"Ö": 146,
"×": 147,
"Ø": 148,
"Ù": 149,
"Ú": 150,
"Û": 151,
"Ü": 152,
"Ý": 153,
"Þ": 154,
"ß": 155,
"à": 156,
"á": 157,
"â": 158,
"ã": 159,
"ä": 160,
"å": 161,
"æ": 162,
"ç": 163,
"è": 164,
"é": 165,
"ê": 166,
"ë": 167,
"ì": 168,
"í": 169,
"î": 170,
"ï": 171,
"ð": 172,
"ñ": 173,
"ò": 174,
"ó": 175,
"ô": 176,
"õ": 177,
"ö": 178,
"÷": 179,
"ø": 180,
"ù": 181,
"ú": 182,
"û": 183,
"ü": 184,
"ý": 185,
"þ": 186,
"ÿ": 187,
"Ā": 188,
"ā": 189,
"Ă": 190,
"ă": 191,
"Ą": 192,
"ą": 193,
"Ć": 194,
"ć": 195,
"Ĉ": 196,
"ĉ": 197,
"Ċ": 198,
"ċ": 199,
"Č": 200,
"č": 201,
"Ď": 202,
"ď": 203,
"Đ": 204,
"đ": 205,
"Ē": 206,
"ē": 207,
"Ĕ": 208,
"ĕ": 209,
"Ė": 210,
"ė": 211,
"Ę": 212,
"ę": 213,
"Ě": 214,
"ě": 215,
"Ĝ": 216,
"ĝ": 217,
"Ğ": 218,
"ğ": 219,
"Ġ": 220,
"ġ": 221,
"Ģ": 222,
"ģ": 223,
"Ĥ": 224,
"ĥ": 225,
"Ħ": 226,
"ħ": 227,
"Ĩ": 228,
"ĩ": 229,
"Ī": 230,
"ī": 231,
"Ĭ": 232,
"ĭ": 233,
"Į": 234,
"į": 235,
"İ": 236,
"ı": 237,
"Ĳ": 238,
"ĳ": 239,
"Ĵ": 240,
"ĵ": 241,
"Ķ": 242,
"ķ": 243,
"ĸ": 244,
"Ĺ": 245,
"ĺ": 246,
"Ļ": 247,
"ļ": 248,
"Ľ": 249,
"ľ": 250,
"Ŀ": 251,
"ŀ": 252,
"Ł": 253,
"ł": 254,
"Ń": 255,
"ĠĠ": 256,
"ĠĠĠĠ": 257,
"in": 258,
"Ġt": 259,
"ĠĠĠĠĠĠĠĠ": 260,
"er": 261,
"ĠĠĠ": 262,
"on": 263,
"Ġa": 264,
"re": 265,
"at": 266,
"st": 267,
"en": 268,
"or": 269,
"Ġth": 270,
"ĊĊ": 271,
"Ġc": 272,
"le": 273,
"Ġs": 274,
"it": 275,
"an": 276,
"ar": 277,
"al": 278,
"Ġthe": 279,
";Ċ": 280,
"Ġp": 281,
"Ġf": 282,
"ou": 283,
"Ġ=": 284,
"is": 285,
"ĠĠĠĠĠĠĠ": 286,
"ing": 287,
"es": 288,
"Ġw": 289,
"ion": 290,
"ed": 291,
"ic": 292,
"Ġb": 293,
"Ġd": 294,
"et": 295,
"Ġm": 296,
"Ġo": 297,
"ĉĉ": 298,
"ro": 299,
"as": 300,
"el": 301,
"ct": 302,
"nd": 303,
"Ġin": 304,
"Ġh": 305,
"ent": 306,
"id": 307,
"Ġn": 308,
"am": 309,
"ĠĠĠĠĠĠĠĠĠĠĠ": 310,
"Ġto": 311,
"Ġre": 312,
"--": 313,
"Ġ{": 314,
"Ġof": 315,
"om": 316,
");Ċ": 317,
"im": 318,
"čĊ": 319,
"Ġ(": 320,
"il": 321,
"//": 322,
"Ġand": 323,
"ur": 324,
"se": 325,
"Ġl": 326,
"ex": 327,
"ĠS": 328,
"ad": 329,
"Ġ\"": 330,
"ch": 331,
"ut": 332,
"if": 333,
"**": 334,
"Ġ}": 335,
"em": 336,
"ol": 337,
"ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 338,
"th": 339,
")Ċ": 340,
"Ġ{Ċ": 341,
"Ġg": 342,
"ig": 343,
"iv": 344,
",Ċ": 345,
"ce": 346,
"od": 347,
"Ġv": 348,
"ate": 349,
"ĠT": 350,
"ag": 351,
"ay": 352,
"Ġ*": 353,
"ot": 354,
"us": 355,
"ĠC": 356,
"Ġst": 357,
"ĠI": 358,
"un": 359,
"ul": 360,
"ue": 361,
"ĠA": 362,
"ow": 363,
"Ġ'": 364,
"ew": 365,
"Ġ<": 366,
"ation": 367,
"()": 368,
"Ġfor": 369,
"ab": 370,
"ort": 371,
"um": 372,
"ame": 373,
"Ġis": 374,
"pe": 375,
"tr": 376,
"ck": 377,
"âĢ": 378,
"Ġy": 379,
"ist": 380,
"----": 381,
".ĊĊ": 382,
"he": 383,
"Ġe": 384,
"lo": 385,
"ĠM": 386,
"Ġbe": 387,
"ers": 388,
"Ġon": 389,
"Ġcon": 390,
"ap": 391,
"ub": 392,
"ĠP": 393,
"ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 394,
"ass": 395,
"int": 396,
">Ċ": 397,
"ly": 398,
"urn": 399,
"Ġ$": 400,
";ĊĊ": 401,
"av": 402,
"port": 403,
"ir": 404,
"->": 405,
"nt": 406,
"ction": 407,
"end": 408,
"Ġde": 409,
"00": 410,
"ith": 411,
"out": 412,
"turn": 413,
"our": 414,
"ĠĠĠĠĠ": 415,
"lic": 416,
"res": 417,
"pt": 418,
"==": 419,
"Ġthis": 420,
"Ġwh": 421,
"Ġif": 422,
"ĠD": 423,
"ver": 424,
"age": 425,
"ĠB": 426,
"ht": 427,
"ext": 428,
"=\"": 429,
"Ġthat": 430,
"****": 431,
"ĠR": 432,
"Ġit": 433,
"ess": 434,
"ĠF": 435,
"Ġr": 436,
"os": 437,
"and": 438,
"Ġas": 439,
"ect": 440,
"ke": 441,
"rom": 442,
"Ġ//": 443,
"con": 444,
"ĠL": 445,
"(\"": 446,
"qu": 447,
"lass": 448,
"Ġwith": 449,
"iz": 450,
"de": 451,
"ĠN": 452,
"Ġal": 453,
"op": 454,
"up": 455,
"get": 456,
"Ġ}Ċ": 457,
"ile": 458,
"Ġan": 459,
"ata": 460,
"ore": 461,
"ri": 462,
"Ġpro": 463,
";čĊ": 464,
"ĉĉĉĉ": 465,
"ter": 466,
"ain": 467,
"ĠW": 468,
"ĠE": 469,
"Ġcom": 470,
"Ġreturn": 471,
"art": 472,
"ĠH": 473,
"ack": 474,
"import": 475,
"ublic": 476,
"Ġor": 477,
"est": 478,
"ment": 479,
"ĠG": 480,
"able": 481,
"Ġ-": 482,
"ine": 483,
"ill": 484,
"ind": 485,
"ere": 486,
"::": 487,
"ity": 488,
"Ġ+": 489,
"Ġtr": 490,
"elf": 491,
"ight": 492,
"('": 493,
"orm": 494,
"ult": 495,
"str": 496,
"..": 497,
"\",": 498,
"Ġyou": 499,
"ype": 500,
"pl": 501,
"Ġnew": 502,
"Ġj": 503,
"ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 504,
"Ġfrom": 505,
"Ġex": 506,
"ĠO": 507,
"20": 508,
"ld": 509,
"Ġ[": 510,
"oc": 511,
":Ċ": 512,
"Ġse": 513,
"Ġle": 514,
"--------": 515,
".s": 516,
"{Ċ": 517,
"',": 518,
"ant": 519,
"Ġat": 520,
"ase": 521,
".c": 522,
"Ġch": 523,
"</": 524,
"ave": 525,
"ang": 526,
"Ġare": 527,
"Ġint": 528,
"âĢĻ": 529,
"_t": 530,
"ert": 531,
"ial": 532,
"act": 533,
"}Ċ": 534,
"ive": 535,
"ode": 536,
"ost": 537,
"Ġclass": 538,
"Ġnot": 539,
"og": 540,
"ord": 541,
"alue": 542,
"all": 543,
"ff": 544,
"();Ċ": 545,
"ont": 546,
"ime": 547,
"are": 548,
"ĠU": 549,
"Ġpr": 550,
"Ġ:": 551,
"ies": 552,
"ize": 553,
"ure": 554,
"Ġby": 555,
"ire": 556,
"Ġ}ĊĊ": 557,
".p": 558,
"Ġsh": 559,
"ice": 560,
"ast": 561,
"ption": 562,
"tring": 563,
"ok": 564,
"__": 565,
"cl": 566,
"##": 567,
"Ġhe": 568,
"ard": 569,
").": 570,
"Ġ@": 571,
"iew": 572,
"ĉĉĉ": 573,
"Ġwas": 574,
"ip": 575,
"this": 576,
"Ġu": 577,
"ĠThe": 578,
"ide": 579,
"ace": 580,
"ib": 581,
"ac": 582,
"rou": 583,
"Ġwe": 584,
"ject": 585,
"Ġpublic": 586,
"ak": 587,
"ve": 588,
"ath": 589,
"oid": 590,
"Ġ=>": 591,
"ust": 592,
"que": 593,
"Ġres": 594,
"))": 595,
"'s": 596,
"Ġk": 597,
"ans": 598,
"yst": 599,
"unction": 600,
"********": 601,
"Ġi": 602,
"Ġus": 603,
"pp": 604,
"10": 605,
"one": 606,
"ail": 607,
"====": 608,
"name": 609,
"Ġstr": 610,
"Ġ/": 611,
"Ġ&": 612,
"ach": 613,
"div": 614,
"ystem": 615,
"ell": 616,
"Ġhave": 617,
"err": 618,
"ould": 619,
"ull": 620,
"pon": 621,
"ĠJ": 622,
"_p": 623,
"Ġ==": 624,
"ign": 625,
"St": 626,
".Ċ": 627,
"Ġpl": 628,
");ĊĊ": 629,
"form": 630,
"put": 631,
"ount": 632,
"}ĊĊ": 633,
"dd": 634,
"ite": 635,
"Ġget": 636,
"rr": 637,
"ome": 638,
"ĠâĢ": 639,
"aram": 640,
"cc": 641,
"Ġ*/": 642,
"ER": 643,
"In": 644,
"les": 645,
"_s": 646,
"ong": 647,
"ie": 648,
"Ġcan": 649,
"ĠV": 650,
"erv": 651,
"pr": 652,
"Ġun": 653,
"row": 654,
"ber": 655,
"Ġdo": 656,
"ll": 657,
"Ġel": 658,
"Ġself": 659,
"ated": 660,
"ary": 661,
"Ġ.": 662,
"']": 663,
"ud": 664,
"Ġen": 665,
"ĠTh": 666,
"ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 667,
"te": 668,
"_c": 669,
"uct": 670,
"Ġab": 671,
"ork": 672,
".get": 673,
"Ġ#": 674,
"aw": 675,
"ress": 676,
"ob": 677,
"Name": 678,
"201": 679,
"app": 680,
"['": 681,
"Ġall": 682,
"ory": 683,
"ition": 684,
"ance": 685,
"ear": 686,
"Ġcont": 687,
"vent": 688,
"ia": 689,
"Ġwill": 690,
"IN": 691,
"ĠĠĠĠĠĠĠĠĠ": 692,
"return": 693,
"Ġ</": 694,
"data": 695,
")ĊĊ": 696,
"Re": 697,
"ple": 698,
"ild": 699,
"ther": 700,
"Ġyour": 701,
"\"Ċ": 702,
"($": 703,
"Ġout": 704,
"),": 705,
"Ġhas": 706,
"String": 707,
"so": 708,
"Ġup": 709,
"ax": 710,
"Ġdef": 711,
"Ġbo": 712,
"ge": 713,
"alse": 714,
"ON": 715,
"per": 716,
"12": 717,
"ich": 718,
"Ġbut": 719,
"ĠĊ": 720,
"Ġ_": 721,
"_m": 722,
"add": 723,
"quest": 724,
"odel": 725,
"self": 726,
"ery": 727,
"ft": 728,
"ens": 729,
"////": 730,
"ake": 731,
".C": 732,
"Ġgo": 733,
"Ġfunction": 734,
"ĠK": 735,
"ivate": 736,
"Ġim": 737,
"Ġconst": 738,
".t": 739,
"Ġ*/Ċ": 740,
");čĊ": 741,
"Ġvoid": 742,
"Ġset": 743,
"ĠSystem": 744,
"cri": 745,
"()Ċ": 746,
"li": 747,
"ĉif": 748,
".m": 749,
"ally": 750,
"set": 751,
"ep": 752,
"âĢĻs": 753,
"bo": 754,
"def": 755,
"',Ċ": 756,
"Ġme": 757,
"Ġ!": 758,
"atch": 759,
"\">": 760,
"\",Ċ": 761,
"ec": 762,
"ĠIn": 763,
"ph": 764,
"Ġ|": 765,
"_f": 766,
"Ġvar": 767,
"ence": 768,
"Id": 769,
"ree": 770,
"ink": 771,
"lect": 772,
"ug": 773,
"eth": 774,
"Ġelse": 775,
"----------------": 776,
"19": 777,
"cont": 778,
"Ġso": 779,
"atic": 780,
"Ġlo": 781,
"pro": 782,
"ton": 783,
"ss": 784,
"own": 785,
"abel": 786,
"oint": 787,
"ous": 788,
"eld": 789,
"ST": 790,
"The": 791,
"ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 792,
"RE": 793,
"\":": 794,
"olor": 795,
"tp": 796,
"eg": 797,
"key": 798,
"ude": 799,
"ĠSt": 800,
"ound": 801,
"Ġar": 802,
"\");Ċ": 803,
"ener": 804,
"ser": 805,
"11": 806,
"bject": 807,
"essage": 808,
"fer": 809,
"Ġmore": 810,
"ations": 811,
"ents": 812,
"Ġhis": 813,
"Ġthey": 814,
".S": 815,
"ĠY": 816,
"use": 817,
"ne": 818,
"ish": 819,
"old": 820,
"_d": 821,
"io": 822,
"ield": 823,
"Ġper": 824,
"Cont": 825,
"ings": 826,
"####": 827,
"Ġdata": 828,
"Ġsa": 829,
"ef": 830,
"fo": 831,
"Ġone": 832,
"eng": 833,
"Ġdis": 834,
"AT": 835,
"Ġname": 836,
"Ġtrue": 837,
"val": 838,
"led": 839,
".f": 840,
"Ġne": 841,
"Ġend": 842,
"32": 843,
".T": 844,
"16": 845,
"cre": 846,
"ark": 847,
"log": 848,
"Ex": 849,
"error": 850,
"_id": 851,
"urre": 852,
"ange": 853,
"Ġnull": 854,
"rray": 855,
"Ġmy": 856,
"pan": 857,
"ict": 858,
"ator": 859,
"View": 860,
"List": 861,
"ĉreturn": 862,
"âĢĿ": 863,
"Ġpre": 864,
"Ġx": 865,
"clude": 866,
"arg": 867,
"15": 868,
"ov": 869,
".h": 870,
"Ġ>": 871,
"Ġtheir": 872,
"')": 873,
"irst": 874,
"ick": 875,
"gh": 876,
"LE": 877,
"OR": 878,
"Ġprivate": 879,
"tem": 880,
"čĊčĊ": 881,
"user": 882,
"Ġ)": 883,
"com": 884,
".A": 885,
"\";Ċ": 886,
"Ġid": 887,
"read": 888,
"Ġwho": 889,
"_b": 890,
"\">Ċ": 891,
"Ġtime": 892,
"Ġman": 893,
"ry": 894,
"========": 895,
"roup": 896,
"rop": 897,
"public": 898,
"vel": 899,
"umber": 900,
"ble": 901,
"Ġwhich": 902,
"****************": 903,
"Ġany": 904,
"Ġfalse": 905,
"we": 906,
"Ġvalue": 907,
"Ġli": 908,
"\")": 909,
"nder": 910,
"gr": 911,
"Ġno": 912,
"param": 913,
"25": 914,
"fig": 915,
".com": 916,
"Ġapp": 917,
"_l": 918,
"ions": 919,
".D": 920,
"ĠCh": 921,
"Ġabout": 922,
"Ġadd": 923,
"Ġsu": 924,
"Ġstring": 925,
"ID": 926,
"Ġover": 927,
"string": 928,
".l": 929,
"ource": 930,
"000": 931,
"_C": 932,
"]Ċ": 933,
"Ġqu": 934,
"ĠString": 935,
"ca": 936,
"SE": 937,
"Ġro": 938,
"sh": 939,
"ual": 940,
"Type": 941,
"son": 942,
"new": 943,
"ern": 944,
"Ġag": 945,
"AR": 946,
"];Ċ": 947,
"].": 948,
"Ġ?": 949,
"ical": 950,
"Ġdes": 951,
"uth": 952,
"ix": 953,
"ays": 954,
"Ġtype": 955,
"'t": 956,
"ault": 957,
"Ġinter": 958,
"var": 959,
".b": 960,
"Ġpart": 961,
".d": 962,
"urrent": 963,
"IT": 964,
"EN": 965,
"30": 966,
"enc": 967,
"(f": 968,
"ra": 969,
"value": 970,
"cho": 971,
"18": 972,
"utton": 973,
"ose": 974,
"14": 975,
"Ġ!=": 976,
"ater": 977,
"Ã©": 978,
"reate": 979,
"oll": 980,
"pos": 981,
"yle": 982,
"ng": 983,
"AL": 984,
"using": 985,
"ames": 986,
"Ġ{čĊ": 987,
"ates": 988,
"ely": 989,
"Ġwork": 990,
"Ġem": 991,
"inal": 992,
"Ġsp": 993,
"Ġwhen": 994,
".set": 995,
"ĠĠĠĠĠĠ": 996,
"):Ċ": 997,
"to": 998,
"quire": 999,
"indow": 1000,
"..................................................": -999,
"ãĥ¼ãĥ¼": 127998,
"éĶ¦": 127999
},
"merges": [
"Ġ Ġ",
"Ġ ĠĠĠ",
"ĠĠ ĠĠ",
"ĠĠĠ Ġ",
"i n",
"Ġ t",
"Ġ ĠĠĠĠĠĠĠ",
"ĠĠ ĠĠĠĠĠĠ",
"ĠĠĠĠ ĠĠĠĠ",
"ĠĠĠ ĠĠĠĠĠ",
"ĠĠĠĠĠĠĠ Ġ",
"ĠĠĠĠĠ ĠĠĠ",
"ĠĠĠĠĠĠ ĠĠ",
"e r",
"Ġ ĠĠ",
"ĠĠ Ġ",
"o n",
"Ġ a",
"r e",
"a t",
"s t",
"e n",
"o r",
"Ġ th",
"Ġt h",
"Ċ Ċ",
"Ġ c",
"l e",
"Ġ s",
"i t",
"a n",
"a r",
"a l",
"Ġ the",
"............................................................................................................",
"ĠвÑĭÑģок ой",
"ãĥ¼ ãĥ¼",
"ãĥ¼ãĥ ¼",
"éĶ ¦"
]
}
}
{
"added_tokens_decoder": {
"128000": {
"content": "<|begin_of_text|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128001": {
"content": "<|end_of_text|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128002": {
"content": "<|reserved_special_token_0|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128003": {
"content": "<|reserved_special_token_1|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128004": {
"content": "<|finetune_right_pad_id|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128005": {
"content": "<|reserved_special_token_2|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128006": {
"content": "<|start_header_id|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128007": {
"content": "<|end_header_id|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128008": {
"content": "<|eom_id|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128009": {
"content": "<|eot_id|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128010": {
"content": "<|python_tag|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128011": {
"content": "<|reserved_special_token_3|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128012": {
"content": "<|reserved_special_token_4|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128013": {
"content": "<|reserved_special_token_5|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128014": {
"content": "<|reserved_special_token_6|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128015": {
"content": "<|reserved_special_token_7|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128016": {
"content": "<|reserved_special_token_8|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128017": {
"content": "<|reserved_special_token_9|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128018": {
"content": "<|reserved_special_token_10|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128019": {
"content": "<|reserved_special_token_11|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128020": {
"content": "<|reserved_special_token_12|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128021": {
"content": "<|reserved_special_token_13|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128022": {
"content": "<|reserved_special_token_14|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128023": {
"content": "<|reserved_special_token_15|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128024": {
"content": "<|reserved_special_token_16|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128025": {
"content": "<|reserved_special_token_17|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128026": {
"content": "<|reserved_special_token_18|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128027": {
"content": "<|reserved_special_token_19|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128028": {
"content": "<|reserved_special_token_20|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128029": {
"content": "<|reserved_special_token_21|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128030": {
"content": "<|reserved_special_token_22|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128031": {
"content": "<|reserved_special_token_23|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128032": {
"content": "<|reserved_special_token_24|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128033": {
"content": "<|reserved_special_token_25|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128034": {
"content": "<|reserved_special_token_26|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128035": {
"content": "<|reserved_special_token_27|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128036": {
"content": "<|reserved_special_token_28|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128037": {
"content": "<|reserved_special_token_29|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128038": {
"content": "<|reserved_special_token_30|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128039": {
"content": "<|reserved_special_token_31|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128040": {
"content": "<|reserved_special_token_32|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128041": {
"content": "<|reserved_special_token_33|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128042": {
"content": "<|reserved_special_token_34|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128043": {
"content": "<|reserved_special_token_35|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128044": {
"content": "<|reserved_special_token_36|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128045": {
"content": "<|reserved_special_token_37|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128046": {
"content": "<|reserved_special_token_38|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128047": {
"content": "<|reserved_special_token_39|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128048": {
"content": "<|reserved_special_token_40|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128049": {
"content": "<|reserved_special_token_41|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128050": {
"content": "<|reserved_special_token_42|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128051": {
"content": "<|reserved_special_token_43|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128052": {
"content": "<|reserved_special_token_44|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128053": {
"content": "<|reserved_special_token_45|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128054": {
"content": "<|reserved_special_token_46|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128055": {
"content": "<|reserved_special_token_47|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128056": {
"content": "<|reserved_special_token_48|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128057": {
"content": "<|reserved_special_token_49|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128058": {
"content": "<|reserved_special_token_50|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128059": {
"content": "<|reserved_special_token_51|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128060": {
"content": "<|reserved_special_token_52|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128061": {
"content": "<|reserved_special_token_53|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128062": {
"content": "<|reserved_special_token_54|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128063": {
"content": "<|reserved_special_token_55|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128064": {
"content": "<|reserved_special_token_56|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128065": {
"content": "<|reserved_special_token_57|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128066": {
"content": "<|reserved_special_token_58|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128067": {
"content": "<|reserved_special_token_59|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128068": {
"content": "<|reserved_special_token_60|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128069": {
"content": "<|reserved_special_token_61|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128070": {
"content": "<|reserved_special_token_62|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128071": {
"content": "<|reserved_special_token_63|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128072": {
"content": "<|reserved_special_token_64|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128073": {
"content": "<|reserved_special_token_65|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128074": {
"content": "<|reserved_special_token_66|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128075": {
"content": "<|reserved_special_token_67|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128076": {
"content": "<|reserved_special_token_68|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128077": {
"content": "<|reserved_special_token_69|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128078": {
"content": "<|reserved_special_token_70|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128079": {
"content": "<|reserved_special_token_71|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128080": {
"content": "<|reserved_special_token_72|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128081": {
"content": "<|reserved_special_token_73|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128082": {
"content": "<|reserved_special_token_74|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128083": {
"content": "<|reserved_special_token_75|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128084": {
"content": "<|reserved_special_token_76|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128085": {
"content": "<|reserved_special_token_77|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128086": {
"content": "<|reserved_special_token_78|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128087": {
"content": "<|reserved_special_token_79|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128088": {
"content": "<|reserved_special_token_80|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128089": {
"content": "<|reserved_special_token_81|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128090": {
"content": "<|reserved_special_token_82|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128091": {
"content": "<|reserved_special_token_83|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128092": {
"content": "<|reserved_special_token_84|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128093": {
"content": "<|reserved_special_token_85|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128094": {
"content": "<|reserved_special_token_86|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128095": {
"content": "<|reserved_special_token_87|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128096": {
"content": "<|reserved_special_token_88|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128097": {
"content": "<|reserved_special_token_89|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128098": {
"content": "<|reserved_special_token_90|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128099": {
"content": "<|reserved_special_token_91|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128100": {
"content": "<|reserved_special_token_92|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128101": {
"content": "<|reserved_special_token_93|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128102": {
"content": "<|reserved_special_token_94|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128103": {
"content": "<|reserved_special_token_95|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128104": {
"content": "<|reserved_special_token_96|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128105": {
"content": "<|reserved_special_token_97|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128106": {
"content": "<|reserved_special_token_98|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128107": {
"content": "<|reserved_special_token_99|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128108": {
"content": "<|reserved_special_token_100|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128109": {
"content": "<|reserved_special_token_101|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128110": {
"content": "<|reserved_special_token_102|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128111": {
"content": "<|reserved_special_token_103|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128112": {
"content": "<|reserved_special_token_104|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128113": {
"content": "<|reserved_special_token_105|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128114": {
"content": "<|reserved_special_token_106|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128115": {
"content": "<|reserved_special_token_107|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128116": {
"content": "<|reserved_special_token_108|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128117": {
"content": "<|reserved_special_token_109|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128118": {
"content": "<|reserved_special_token_110|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128119": {
"content": "<|reserved_special_token_111|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128120": {
"content": "<|reserved_special_token_112|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128121": {
"content": "<|reserved_special_token_113|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128122": {
"content": "<|reserved_special_token_114|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128123": {
"content": "<|reserved_special_token_115|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128124": {
"content": "<|reserved_special_token_116|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128125": {
"content": "<|reserved_special_token_117|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128126": {
"content": "<|reserved_special_token_118|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128127": {
"content": "<|reserved_special_token_119|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128128": {
"content": "<|reserved_special_token_120|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128129": {
"content": "<|reserved_special_token_121|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128130": {
"content": "<|reserved_special_token_122|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128131": {
"content": "<|reserved_special_token_123|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128132": {
"content": "<|reserved_special_token_124|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128133": {
"content": "<|reserved_special_token_125|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128134": {
"content": "<|reserved_special_token_126|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128135": {
"content": "<|reserved_special_token_127|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128136": {
"content": "<|reserved_special_token_128|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128137": {
"content": "<|reserved_special_token_129|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128138": {
"content": "<|reserved_special_token_130|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128139": {
"content": "<|reserved_special_token_131|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128140": {
"content": "<|reserved_special_token_132|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128141": {
"content": "<|reserved_special_token_133|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128142": {
"content": "<|reserved_special_token_134|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128143": {
"content": "<|reserved_special_token_135|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128144": {
"content": "<|reserved_special_token_136|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128145": {
"content": "<|reserved_special_token_137|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128146": {
"content": "<|reserved_special_token_138|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128147": {
"content": "<|reserved_special_token_139|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128148": {
"content": "<|reserved_special_token_140|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128149": {
"content": "<|reserved_special_token_141|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128150": {
"content": "<|reserved_special_token_142|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128151": {
"content": "<|reserved_special_token_143|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128152": {
"content": "<|reserved_special_token_144|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128153": {
"content": "<|reserved_special_token_145|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128154": {
"content": "<|reserved_special_token_146|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128155": {
"content": "<|reserved_special_token_147|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128156": {
"content": "<|reserved_special_token_148|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128157": {
"content": "<|reserved_special_token_149|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128158": {
"content": "<|reserved_special_token_150|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128159": {
"content": "<|reserved_special_token_151|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128160": {
"content": "<|reserved_special_token_152|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128161": {
"content": "<|reserved_special_token_153|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128162": {
"content": "<|reserved_special_token_154|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128163": {
"content": "<|reserved_special_token_155|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128164": {
"content": "<|reserved_special_token_156|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128165": {
"content": "<|reserved_special_token_157|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128166": {
"content": "<|reserved_special_token_158|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128167": {
"content": "<|reserved_special_token_159|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128168": {
"content": "<|reserved_special_token_160|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128169": {
"content": "<|reserved_special_token_161|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128170": {
"content": "<|reserved_special_token_162|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128171": {
"content": "<|reserved_special_token_163|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128172": {
"content": "<|reserved_special_token_164|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128173": {
"content": "<|reserved_special_token_165|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128174": {
"content": "<|reserved_special_token_166|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128175": {
"content": "<|reserved_special_token_167|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128176": {
"content": "<|reserved_special_token_168|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128177": {
"content": "<|reserved_special_token_169|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128178": {
"content": "<|reserved_special_token_170|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128179": {
"content": "<|reserved_special_token_171|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128180": {
"content": "<|reserved_special_token_172|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128181": {
"content": "<|reserved_special_token_173|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128182": {
"content": "<|reserved_special_token_174|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128183": {
"content": "<|reserved_special_token_175|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128184": {
"content": "<|reserved_special_token_176|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128185": {
"content": "<|reserved_special_token_177|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128186": {
"content": "<|reserved_special_token_178|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128187": {
"content": "<|reserved_special_token_179|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128188": {
"content": "<|reserved_special_token_180|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128189": {
"content": "<|reserved_special_token_181|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128190": {
"content": "<|reserved_special_token_182|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128191": {
"content": "<|reserved_special_token_183|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128192": {
"content": "<|reserved_special_token_184|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128193": {
"content": "<|reserved_special_token_185|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128194": {
"content": "<|reserved_special_token_186|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128195": {
"content": "<|reserved_special_token_187|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128196": {
"content": "<|reserved_special_token_188|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128197": {
"content": "<|reserved_special_token_189|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128198": {
"content": "<|reserved_special_token_190|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128199": {
"content": "<|reserved_special_token_191|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128200": {
"content": "<|reserved_special_token_192|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128201": {
"content": "<|reserved_special_token_193|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128202": {
"content": "<|reserved_special_token_194|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128203": {
"content": "<|reserved_special_token_195|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128204": {
"content": "<|reserved_special_token_196|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128205": {
"content": "<|reserved_special_token_197|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128206": {
"content": "<|reserved_special_token_198|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128207": {
"content": "<|reserved_special_token_199|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128208": {
"content": "<|reserved_special_token_200|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128209": {
"content": "<|reserved_special_token_201|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128210": {
"content": "<|reserved_special_token_202|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128211": {
"content": "<|reserved_special_token_203|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128212": {
"content": "<|reserved_special_token_204|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128213": {
"content": "<|reserved_special_token_205|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128214": {
"content": "<|reserved_special_token_206|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128215": {
"content": "<|reserved_special_token_207|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128216": {
"content": "<|reserved_special_token_208|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128217": {
"content": "<|reserved_special_token_209|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128218": {
"content": "<|reserved_special_token_210|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128219": {
"content": "<|reserved_special_token_211|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128220": {
"content": "<|reserved_special_token_212|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128221": {
"content": "<|reserved_special_token_213|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128222": {
"content": "<|reserved_special_token_214|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128223": {
"content": "<|reserved_special_token_215|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128224": {
"content": "<|reserved_special_token_216|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128225": {
"content": "<|reserved_special_token_217|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128226": {
"content": "<|reserved_special_token_218|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128227": {
"content": "<|reserved_special_token_219|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128228": {
"content": "<|reserved_special_token_220|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128229": {
"content": "<|reserved_special_token_221|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128230": {
"content": "<|reserved_special_token_222|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128231": {
"content": "<|reserved_special_token_223|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128232": {
"content": "<|reserved_special_token_224|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128233": {
"content": "<|reserved_special_token_225|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128234": {
"content": "<|reserved_special_token_226|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128235": {
"content": "<|reserved_special_token_227|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128236": {
"content": "<|reserved_special_token_228|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128237": {
"content": "<|reserved_special_token_229|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128238": {
"content": "<|reserved_special_token_230|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128239": {
"content": "<|reserved_special_token_231|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128240": {
"content": "<|reserved_special_token_232|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128241": {
"content": "<|reserved_special_token_233|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128242": {
"content": "<|reserved_special_token_234|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128243": {
"content": "<|reserved_special_token_235|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128244": {
"content": "<|reserved_special_token_236|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128245": {
"content": "<|reserved_special_token_237|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128246": {
"content": "<|reserved_special_token_238|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128247": {
"content": "<|reserved_special_token_239|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128248": {
"content": "<|reserved_special_token_240|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128249": {
"content": "<|reserved_special_token_241|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128250": {
"content": "<|reserved_special_token_242|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128251": {
"content": "<|reserved_special_token_243|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128252": {
"content": "<|reserved_special_token_244|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128253": {
"content": "<|reserved_special_token_245|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128254": {
"content": "<|reserved_special_token_246|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"128255": {
"content": "<|reserved_special_token_247|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
}
},
"bos_token": "<|begin_of_text|>",
"clean_up_tokenization_spaces": true,
"eos_token": "<|end_of_text|>",
"model_input_names": [
"input_ids",
"attention_mask"
],
"model_max_length": 131072,
"tokenizer_class": "PreTrainedTokenizerFast"
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment