tabby/testdata/gptneox/models/fastertransformer/1/1-gpu
Meng Zhang f177fab951
Add docker compose (#3)
* Add docker-compose.yaml

* Update docker-compose
2023-03-22 02:42:47 +08:00
..
config.ini Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.final_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.final_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.0.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.1.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.2.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.3.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.4.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.5.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.6.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.7.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.8.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.9.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.10.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.attention.dense.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.attention.dense.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.attention.query_key_value.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.attention.query_key_value.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.input_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.input_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.mlp.dense_4h_to_h.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.mlp.dense_4h_to_h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.mlp.dense_h_to_4h.bias.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.mlp.dense_h_to_4h.weight.0.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.post_attention_layernorm.bias.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.layers.11.post_attention_layernorm.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.lm_head.weight.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00
model.wte.bin Add docker compose (#3) 2023-03-22 02:42:47 +08:00