# gpt-oss-20b / .gitattributes
# erfanzar's picture
# Upload tokenizer
# a394781 verified
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
model/model/embed_tokens/embedding/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/embed_tokens/embedding/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/embed_tokens/embedding/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/embed_tokens/embedding/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/21/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/13/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/1/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/3/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/4/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/5/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/20/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/18/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/17/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/19/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/10/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/8/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/16/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/11/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/14/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/6/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/23/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/2/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/9/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/22/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/15/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/7/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/0/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/v_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/v_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/v_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/v_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/q_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/q_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/q_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/q_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/o_proj/kernel/1.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/o_proj/kernel/3.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/o_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/o_proj/kernel/2.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/k_proj/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/k_proj/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/k_proj/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/self_attn/k_proj/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/mlp/experts/gate_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/mlp/experts/gate_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/mlp/experts/up_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/mlp/experts/up_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/mlp/experts/down_proj/kernel/0.0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/mlp/experts/down_proj/bias/0.0 filter=lfs diff=lfs merge=lfs -text
model/model/layers/12/mlp/router/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/lm_head/kernel/0.1 filter=lfs diff=lfs merge=lfs -text
model/lm_head/kernel/0.3 filter=lfs diff=lfs merge=lfs -text
model/lm_head/kernel/0.0 filter=lfs diff=lfs merge=lfs -text
model/lm_head/kernel/0.2 filter=lfs diff=lfs merge=lfs -text
tokenizer.json filter=lfs diff=lfs merge=lfs -text