diff --git a/README.md b/README.md
index 10792c5..5aa3441 100644
--- a/README.md
+++ b/README.md
@@ -6,5 +6,6 @@
 > This repository is undering heavy construction, everything changes fast.
 
 ## Contents
+* [`tabformer`](./tabformer): *NOT RELEASED* Distributed trainer for tabby models.
 * [`preprocess`](./preprocess): Preprocess files into [datasets](https://huggingface.co/docs/datasets)
 * [`converter`](./converter): Converts a [transformers](https://huggingface.co/docs/transformers) causal LM model into TensorRT / FasterTransformer serving formats.
diff --git a/converter/.gitattributes b/converter/.gitattributes
new file mode 100644
index 0000000..4edd5ac
--- /dev/null
+++ b/converter/.gitattributes
@@ -0,0 +1 @@
+*.bin filter=lfs diff=lfs merge=lfs -text
diff --git a/converter/huggingface_gptj_convert.py b/converter/huggingface_gptj_convert.py
new file mode 100644
index 0000000..c435819
--- /dev/null
+++ b/converter/huggingface_gptj_convert.py
@@ -0,0 +1,253 @@
+# Copyright (c) 2021-2022, NVIDIA CORPORATION.  All rights reserved.
+# Modified by Brendan Dolan-Gavitt, 2022
+# Modified by Meng Zhang, 2023
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import argparse
+import configparser
+import multiprocessing
+import os
+import sys
+from pathlib import Path
+
+import numpy as np
+import torch
+from transformers import GPTJForCausalLM
+
+dir_path = os.path.dirname(os.path.realpath(__file__))  # directory of this script, symlinks resolved
+sys.path.append(dir_path + "/../../../..")  # NOTE(review): four levels up; presumably kept from the upstream repo layout - confirm it is still needed
+sys.path.append(dir_path)  # make modules that sit next to this script importable
+
+
+def get_weight_data_type(data_type):
+    """Return the numpy dtype for "fp32" or "fp16"; raise ValueError otherwise."""
+    dtypes = {"fp32": np.float32, "fp16": np.float16}
+    if data_type not in dtypes:
+        # A bare ``assert False`` is stripped under ``python -O``; raise instead.
+        raise ValueError(f"Invalid weight data type {data_type}")
+    return dtypes[data_type]
+
+
+def split_and_convert_process(i, saved_dir, factor, key, val):
+    """Write one converted tensor into ``saved_dir``, sharding it if needed.
+
+    ``key`` selects the layout: replicated tensors are written once, by rank
+    ``i == 0``, to ``model.<key>.bin``; every other known tensor is cut into
+    ``factor`` pieces with ``np.split`` and piece ``j`` is written to
+    ``model.<key>.<i * factor + j>.bin``. Unknown keys are only reported.
+    """
+    replicated_tags = (
+        "input_layernorm.weight",
+        "input_layernorm.bias",
+        "attention.dense.bias",
+        "post_attention_layernorm.weight",
+        "post_attention_layernorm.bias",
+        "mlp.dense_4h_to_h.bias",
+        "final_layernorm.weight",
+        "final_layernorm.bias",
+    )
+    first_axis_tags = ("attention.dense.weight", "mlp.dense_4h_to_h.weight")
+    last_axis_tags = (
+        "mlp.dense_h_to_4h.weight",
+        "mlp.dense_h_to_4h.bias",
+        "attention.query_key_value.weight",
+    )
+
+    def matches(tags):
+        return any(tag in key for tag in tags)
+
+    if matches(replicated_tags):
+        # shared weights, only need to convert the weights of rank 0
+        if i == 0:
+            val.tofile(saved_dir + "/model." + key + ".bin")
+        return
+
+    if matches(first_axis_tags):
+        split_axis = 0
+    elif matches(last_axis_tags):
+        split_axis = -1
+    else:
+        print("[ERROR] cannot find key '{}'".format(key))
+        return
+
+    for j, piece in enumerate(np.split(val, factor, axis=split_axis)):
+        shard_path = saved_dir + "/model." + key + ".%d.bin" % (i * factor + j)
+        piece.tofile(shard_path)
+
+
+def split_and_convert(args):
+    """Convert a HuggingFace GPT-J checkpoint into per-tensor ``.bin`` files.
+
+    Loads ``args.in_file`` with ``GPTJForCausalLM.from_pretrained`` and writes
+    ``config.ini`` plus one raw file per tensor (cast to the dtype named by
+    ``args.weight_data_type``) into ``<args.saved_dir>/<infer_gpu_num>-gpu/``.
+
+    Args:
+        args: parsed command-line namespace providing ``saved_dir``,
+            ``in_file``, ``trained_gpu_num``, ``infer_gpu_num``,
+            ``processes`` and ``weight_data_type``.
+
+    Raises:
+        ValueError: if ``infer_gpu_num`` is not a multiple of
+            ``trained_gpu_num``.
+    """
+    saved_dir = args.saved_dir + "/%d-gpu/" % args.infer_gpu_num
+    # exist_ok avoids the check-then-create race of the exists()/makedirs() pair
+    os.makedirs(saved_dir, exist_ok=True)
+
+    t_gpu_num = args.trained_gpu_num
+    i_gpu_num = args.infer_gpu_num
+    if i_gpu_num % t_gpu_num != 0:
+        # raised explicitly: an ``assert`` would vanish under ``python -O``
+        raise ValueError(
+            f"infer_gpu_num ({i_gpu_num}) must be a multiple of "
+            f"trained_gpu_num ({t_gpu_num})"
+        )
+    factor = i_gpu_num // t_gpu_num
+
+    model = GPTJForCausalLM.from_pretrained(args.in_file)
+
+    # Saving the config is best-effort; a failure is reported, not fatal.
+    try:
+        config = configparser.ConfigParser()
+        config["gpt"] = {}
+        for key, value in vars(args).items():
+            config["gpt"][key] = f"{value}"
+        for k, v in vars(model.config).items():
+            config["gpt"][k] = f"{v}"
+        config["gpt"]["weight_data_type"] = args.weight_data_type
+        with open((Path(saved_dir) / "config.ini").as_posix(), "w") as configfile:
+            config.write(configfile)
+    except Exception as err:
+        print(f"Fail to save the config in config.ini: {err}")
+    np_weight_data_type = get_weight_data_type(args.weight_data_type)
+
+    # HuggingFace parameter-name fragment -> converted (FT) name fragment.
+    name_map = {
+        "ln_1.bias": "input_layernorm.bias",
+        "ln_1.weight": "input_layernorm.weight",
+        "attn.q_proj.weight": "attention.query_key_value.weight",
+        "attn.out_proj.weight": "attention.dense.weight",
+        "mlp.fc_in.bias": "mlp.dense_h_to_4h.bias",
+        "mlp.fc_in.weight": "mlp.dense_h_to_4h.weight",
+        "mlp.fc_out.bias": "mlp.dense_4h_to_h.bias",
+        "mlp.fc_out.weight": "mlp.dense_4h_to_h.weight",
+    }
+    # Parameters written whole, under a fixed file name.
+    whole_tensor_files = {
+        "transformer.wte.weight": "model.wte.bin",
+        "transformer.ln_f.bias": "model.final_layernorm.bias.bin",
+        "transformer.ln_f.weight": "model.final_layernorm.weight.bin",
+        "lm_head.weight": "model.lm_head.weight.bin",
+        "lm_head.bias": "model.lm_head.bias.bin",
+    }
+    # Weights that are transposed before being written.
+    transposed = ("mlp.fc_in.weight", "mlp.fc_out.weight", "attn.out_proj.weight")
+
+    def to_numpy(tensor):
+        return tensor.detach().cpu().numpy().astype(np_weight_data_type)
+
+    # Built once: rebuilding the state dict for every layer is wasted work.
+    state = model.state_dict()
+
+    torch.multiprocessing.set_start_method("spawn")
+    pool = multiprocessing.Pool(args.processes)
+    try:
+        for name, param in model.named_parameters():
+            if "weight" not in name and "bias" not in name:
+                continue
+            print(name)
+            if name in whole_tensor_files:
+                to_numpy(param).tofile(saved_dir + whole_tensor_files[name])
+                continue
+            for hf_fragment, ft_fragment in name_map.items():
+                if hf_fragment not in name:
+                    continue
+                if "attn.q_proj.weight" in name:
+                    # Special case for QKV weights: Q, K and V are stacked
+                    # into one tensor (k_proj / v_proj match no fragment of
+                    # their own, so they are only handled here).
+                    layer = name.split(".")[2]
+                    base_k = f"transformer.h.{layer}."
+                    QKV_w = torch.stack(
+                        [
+                            state[base_k + "attn.q_proj.weight"],
+                            state[base_k + "attn.k_proj.weight"],
+                            state[base_k + "attn.v_proj.weight"],
+                        ]
+                    )  # [qkv, n_heads * dim_head, latent_space]
+                    weights = to_numpy(QKV_w.permute(2, 0, 1))
+                else:
+                    weights = to_numpy(param)
+                if any(fragment in name for fragment in transposed):
+                    weights = weights.T
+
+                new_name = name.replace("transformer.h.", "layers.").replace(
+                    hf_fragment, ft_fragment
+                )
+                # starmap blocks until the worker has written the file(s)
+                pool.starmap(
+                    split_and_convert_process,
+                    [(0, saved_dir, factor, new_name, weights)],
+                )
+    finally:
+        # always release the worker processes, even if conversion fails
+        pool.close()
+        pool.join()
+
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(formatter_class=argparse.RawTextHelpFormatter)
+    parser.add_argument(
+        "-saved_dir", "-o", type=str, help="output directory", required=True
+    )
+    parser.add_argument(
+        "-in_file", "-i", type=str, help="HF model name or directory", required=True
+    )
+    parser.add_argument(
+        "-trained_gpu_num",
+        "-t_g",
+        type=int,
+        help="How many gpus for training",
+        default=1,
+    )
+    parser.add_argument(
+        "-infer_gpu_num",
+        "-i_g",
+        type=int,
+        help="How many gpus for inference",
+        required=True,
+    )
+    parser.add_argument(
+        "-processes",
+        "-p",
+        type=int,
+        help="How many processes to spawn for conversion (default: 4)",
+        default=4,
+    )
+    parser.add_argument(
+        "-weight_data_type",
+        type=str,
+        default="fp32",
+        choices=["fp32", "fp16"],
+        help="output weight data type",
+    )
+    # Parse the options and echo them before starting the conversion.
+    args = parser.parse_args()
+    print("\n=============== Argument ===============")
+    for key, value in vars(args).items():
+        print(f"{key}: {value}")
+    print("========================================")
+
+    split_and_convert(args)
diff --git a/converter/testdata/1-gpu/config.ini b/converter/testdata/1-gpu/config.ini
new file mode 100644
index 0000000..975a385
--- /dev/null
+++ b/converter/testdata/1-gpu/config.ini
@@ -0,0 +1,86 @@
+[gpt]
+saved_dir = out
+in_file = hf-internal-testing/tiny-random-gptj
+trained_gpu_num = 1
+infer_gpu_num = 1
+processes = 4
+weight_data_type = fp32
+vocab_size = 1000
+n_positions = 512
+n_embd = 32
+n_layer = 5
+n_head = 4
+n_inner = None
+rotary_dim = 4
+activation_function = gelu_new
+resid_pdrop = 0.0
+embd_pdrop = 0.0
+attn_pdrop = 0.0
+layer_norm_epsilon = 1e-05
+initializer_range = 0.02
+use_cache = True
+bos_token_id = 98
+eos_token_id = 98
+return_dict = True
+output_hidden_states = False
+output_attentions = False
+torchscript = False
+torch_dtype = None
+use_bfloat16 = False
+tf_legacy_loss = False
+pruned_heads = {}
+tie_word_embeddings = False
+is_encoder_decoder = False
+is_decoder = False
+cross_attention_hidden_size = None
+add_cross_attention = False
+tie_encoder_decoder = False
+max_length = 20
+min_length = 0
+do_sample = False
+early_stopping = False
+num_beams = 1
+num_beam_groups = 1
+diversity_penalty = 0.0
+temperature = 1.0
+top_k = 50
+top_p = 1.0
+typical_p = 1.0
+repetition_penalty = 1.0
+length_penalty = 1.0
+no_repeat_ngram_size = 0
+encoder_no_repeat_ngram_size = 0
+bad_words_ids = None
+num_return_sequences = 1
+chunk_size_feed_forward = 0
+output_scores = False
+return_dict_in_generate = False
+forced_bos_token_id = None
+forced_eos_token_id = None
+remove_invalid_values = False
+exponential_decay_length_penalty = None
+suppress_tokens = None
+begin_suppress_tokens = None
+architectures = None
+finetuning_task = None
+id2label = {0: 'LABEL_0', 1: 'LABEL_1'}
+label2id = {'LABEL_0': 0, 'LABEL_1': 1}
+tokenizer_class = None
+prefix = None
+pad_token_id = 98
+sep_token_id = None
+decoder_start_token_id = None
+task_specific_params = None
+problem_type = None
+_name_or_path = hf-internal-testing/tiny-random-gptj
+_commit_hash = b96595a4bcdeb272096214589efa0314259853a0
+transformers_version = 4.11.0.dev0
+attention_probs_dropout_prob = 0.0
+gradient_checkpointing = False
+hidden_act = gelu
+hidden_dropout_prob = 0.0
+intermediate_size = 37
+model_type = gptj
+n_ctx = 512
+scale_attn_weights = True
+type_vocab_size = 16
diff --git a/converter/testdata/1-gpu/model.final_layernorm.bias.bin b/converter/testdata/1-gpu/model.final_layernorm.bias.bin
new file mode 100644
index 0000000..67415c7
--- /dev/null
+++ b/converter/testdata/1-gpu/model.final_layernorm.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38723a2e5e8a17aa7950dc008209944e898f69a7bd10a23c839d341e935fd5ca
+size 128
diff --git a/converter/testdata/1-gpu/model.final_layernorm.weight.bin b/converter/testdata/1-gpu/model.final_layernorm.weight.bin
new file mode 100644
index 0000000..d0c1df9
--- /dev/null
+++ b/converter/testdata/1-gpu/model.final_layernorm.weight.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b638277a8690e175a9137feff1e43c067f9faf4e2f600caf468fb05b0403b717
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.0.attention.dense.weight.0.bin b/converter/testdata/1-gpu/model.layers.0.attention.dense.weight.0.bin
new file mode 100644
index 0000000..48a4419
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.0.attention.dense.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:125bd07dc5e7a5c6444f7689ba78df0f4c7959b6dcfbaf7c89edd0634a147ea0
+size 4096
diff --git a/converter/testdata/1-gpu/model.layers.0.attention.query_key_value.weight.0.bin b/converter/testdata/1-gpu/model.layers.0.attention.query_key_value.weight.0.bin
new file mode 100644
index 0000000..33c2eca
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.0.attention.query_key_value.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:11fd52f2b94fad5fe54e2e03c5848050703ec4d798a43a4c1813f109a6703883
+size 12288
diff --git a/converter/testdata/1-gpu/model.layers.0.input_layernorm.bias.bin b/converter/testdata/1-gpu/model.layers.0.input_layernorm.bias.bin
new file mode 100644
index 0000000..67415c7
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.0.input_layernorm.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38723a2e5e8a17aa7950dc008209944e898f69a7bd10a23c839d341e935fd5ca
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.0.input_layernorm.weight.bin b/converter/testdata/1-gpu/model.layers.0.input_layernorm.weight.bin
new file mode 100644
index 0000000..d0c1df9
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.0.input_layernorm.weight.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b638277a8690e175a9137feff1e43c067f9faf4e2f600caf468fb05b0403b717
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.0.mlp.dense_4h_to_h.bias.bin b/converter/testdata/1-gpu/model.layers.0.mlp.dense_4h_to_h.bias.bin
new file mode 100644
index 0000000..67415c7
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.0.mlp.dense_4h_to_h.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38723a2e5e8a17aa7950dc008209944e898f69a7bd10a23c839d341e935fd5ca
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.0.mlp.dense_4h_to_h.weight.0.bin b/converter/testdata/1-gpu/model.layers.0.mlp.dense_4h_to_h.weight.0.bin
new file mode 100644
index 0000000..4da1133
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.0.mlp.dense_4h_to_h.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c7459667751237cef87ba33e5faf46e82ea33f7f53aaae7bf95a8667b6f9e639
+size 16384
diff --git a/converter/testdata/1-gpu/model.layers.0.mlp.dense_h_to_4h.bias.0.bin b/converter/testdata/1-gpu/model.layers.0.mlp.dense_h_to_4h.bias.0.bin
new file mode 100644
index 0000000..c30ec76
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.0.mlp.dense_h_to_4h.bias.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:076a27c79e5ace2a3d47f9dd2e83e4ff6ea8872b3c2218f66c92b89b55f36560
+size 512
diff --git a/converter/testdata/1-gpu/model.layers.0.mlp.dense_h_to_4h.weight.0.bin b/converter/testdata/1-gpu/model.layers.0.mlp.dense_h_to_4h.weight.0.bin
new file mode 100644
index 0000000..668eaee
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.0.mlp.dense_h_to_4h.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:55de52e2d73e7e92962bc02673a7dce6123d77e486ac4f8ce7bead1a6727d227
+size 16384
diff --git a/converter/testdata/1-gpu/model.layers.1.attention.dense.weight.0.bin b/converter/testdata/1-gpu/model.layers.1.attention.dense.weight.0.bin
new file mode 100644
index 0000000..97a8f58
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.1.attention.dense.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ec12f3d7c73cbc440b476ad66bb4a1ef43881c4d740e8114dc1578bb0197a17e
+size 4096
diff --git a/converter/testdata/1-gpu/model.layers.1.attention.query_key_value.weight.0.bin b/converter/testdata/1-gpu/model.layers.1.attention.query_key_value.weight.0.bin
new file mode 100644
index 0000000..33b977e
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.1.attention.query_key_value.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:86d3c23c240260084ac27bd98d52524f0b3559d8106839d85bc927b44750bd81
+size 12288
diff --git a/converter/testdata/1-gpu/model.layers.1.input_layernorm.bias.bin b/converter/testdata/1-gpu/model.layers.1.input_layernorm.bias.bin
new file mode 100644
index 0000000..67415c7
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.1.input_layernorm.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38723a2e5e8a17aa7950dc008209944e898f69a7bd10a23c839d341e935fd5ca
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.1.input_layernorm.weight.bin b/converter/testdata/1-gpu/model.layers.1.input_layernorm.weight.bin
new file mode 100644
index 0000000..d0c1df9
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.1.input_layernorm.weight.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b638277a8690e175a9137feff1e43c067f9faf4e2f600caf468fb05b0403b717
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.1.mlp.dense_4h_to_h.bias.bin b/converter/testdata/1-gpu/model.layers.1.mlp.dense_4h_to_h.bias.bin
new file mode 100644
index 0000000..67415c7
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.1.mlp.dense_4h_to_h.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38723a2e5e8a17aa7950dc008209944e898f69a7bd10a23c839d341e935fd5ca
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.1.mlp.dense_4h_to_h.weight.0.bin b/converter/testdata/1-gpu/model.layers.1.mlp.dense_4h_to_h.weight.0.bin
new file mode 100644
index 0000000..d6e7188
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.1.mlp.dense_4h_to_h.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:75338924b49fb652d556c260013520b58ca70c8bd782bf59732c5ca8d1de111d
+size 16384
diff --git a/converter/testdata/1-gpu/model.layers.1.mlp.dense_h_to_4h.bias.0.bin b/converter/testdata/1-gpu/model.layers.1.mlp.dense_h_to_4h.bias.0.bin
new file mode 100644
index 0000000..c30ec76
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.1.mlp.dense_h_to_4h.bias.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:076a27c79e5ace2a3d47f9dd2e83e4ff6ea8872b3c2218f66c92b89b55f36560
+size 512
diff --git a/converter/testdata/1-gpu/model.layers.1.mlp.dense_h_to_4h.weight.0.bin b/converter/testdata/1-gpu/model.layers.1.mlp.dense_h_to_4h.weight.0.bin
new file mode 100644
index 0000000..622a346
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.1.mlp.dense_h_to_4h.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be97681ddf43d42ee25d0439c6958edac3549b0edda8a4e3e8bce4275916bb7c
+size 16384
diff --git a/converter/testdata/1-gpu/model.layers.2.attention.dense.weight.0.bin b/converter/testdata/1-gpu/model.layers.2.attention.dense.weight.0.bin
new file mode 100644
index 0000000..9fef556
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.2.attention.dense.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:52bfbb09f85dba050a997ddd1869ae74aa8e76a70a63fd4b7c047531128bec07
+size 4096
diff --git a/converter/testdata/1-gpu/model.layers.2.attention.query_key_value.weight.0.bin b/converter/testdata/1-gpu/model.layers.2.attention.query_key_value.weight.0.bin
new file mode 100644
index 0000000..f84cc8b
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.2.attention.query_key_value.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:869b24c7a494832730ba41e0286966b23e700e4239d39198e78551a7ef5e8d7f
+size 12288
diff --git a/converter/testdata/1-gpu/model.layers.2.input_layernorm.bias.bin b/converter/testdata/1-gpu/model.layers.2.input_layernorm.bias.bin
new file mode 100644
index 0000000..67415c7
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.2.input_layernorm.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38723a2e5e8a17aa7950dc008209944e898f69a7bd10a23c839d341e935fd5ca
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.2.input_layernorm.weight.bin b/converter/testdata/1-gpu/model.layers.2.input_layernorm.weight.bin
new file mode 100644
index 0000000..d0c1df9
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.2.input_layernorm.weight.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b638277a8690e175a9137feff1e43c067f9faf4e2f600caf468fb05b0403b717
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.2.mlp.dense_4h_to_h.bias.bin b/converter/testdata/1-gpu/model.layers.2.mlp.dense_4h_to_h.bias.bin
new file mode 100644
index 0000000..67415c7
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.2.mlp.dense_4h_to_h.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38723a2e5e8a17aa7950dc008209944e898f69a7bd10a23c839d341e935fd5ca
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.2.mlp.dense_4h_to_h.weight.0.bin b/converter/testdata/1-gpu/model.layers.2.mlp.dense_4h_to_h.weight.0.bin
new file mode 100644
index 0000000..a71148a
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.2.mlp.dense_4h_to_h.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:029775363050d9e4c232301274a8085474ca7992a42cabc1112ff46938c5a178
+size 16384
diff --git a/converter/testdata/1-gpu/model.layers.2.mlp.dense_h_to_4h.bias.0.bin b/converter/testdata/1-gpu/model.layers.2.mlp.dense_h_to_4h.bias.0.bin
new file mode 100644
index 0000000..c30ec76
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.2.mlp.dense_h_to_4h.bias.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:076a27c79e5ace2a3d47f9dd2e83e4ff6ea8872b3c2218f66c92b89b55f36560
+size 512
diff --git a/converter/testdata/1-gpu/model.layers.2.mlp.dense_h_to_4h.weight.0.bin b/converter/testdata/1-gpu/model.layers.2.mlp.dense_h_to_4h.weight.0.bin
new file mode 100644
index 0000000..63df77d
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.2.mlp.dense_h_to_4h.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:95beee5255e9d3d5d255ebc6d3f18465e1ab005b7e33e3d0d6495eb7a6178eed
+size 16384
diff --git a/converter/testdata/1-gpu/model.layers.3.attention.dense.weight.0.bin b/converter/testdata/1-gpu/model.layers.3.attention.dense.weight.0.bin
new file mode 100644
index 0000000..dfc1df1
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.3.attention.dense.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7af1303e224fc1185c5d936ca8fb3ab336e46f1bd09c94f1e749936d0b023713
+size 4096
diff --git a/converter/testdata/1-gpu/model.layers.3.attention.query_key_value.weight.0.bin b/converter/testdata/1-gpu/model.layers.3.attention.query_key_value.weight.0.bin
new file mode 100644
index 0000000..2603376
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.3.attention.query_key_value.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:55961585790611913b727f6043af3589274c4b2350ea68bcacf25009e750cc37
+size 12288
diff --git a/converter/testdata/1-gpu/model.layers.3.input_layernorm.bias.bin b/converter/testdata/1-gpu/model.layers.3.input_layernorm.bias.bin
new file mode 100644
index 0000000..67415c7
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.3.input_layernorm.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38723a2e5e8a17aa7950dc008209944e898f69a7bd10a23c839d341e935fd5ca
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.3.input_layernorm.weight.bin b/converter/testdata/1-gpu/model.layers.3.input_layernorm.weight.bin
new file mode 100644
index 0000000..d0c1df9
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.3.input_layernorm.weight.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b638277a8690e175a9137feff1e43c067f9faf4e2f600caf468fb05b0403b717
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.3.mlp.dense_4h_to_h.bias.bin b/converter/testdata/1-gpu/model.layers.3.mlp.dense_4h_to_h.bias.bin
new file mode 100644
index 0000000..67415c7
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.3.mlp.dense_4h_to_h.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38723a2e5e8a17aa7950dc008209944e898f69a7bd10a23c839d341e935fd5ca
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.3.mlp.dense_4h_to_h.weight.0.bin b/converter/testdata/1-gpu/model.layers.3.mlp.dense_4h_to_h.weight.0.bin
new file mode 100644
index 0000000..01f32ad
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.3.mlp.dense_4h_to_h.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9f37f3e28a6e716d08d29d02126854bd6e6248763b9a30af2f2e1dcf7b8fd9a5
+size 16384
diff --git a/converter/testdata/1-gpu/model.layers.3.mlp.dense_h_to_4h.bias.0.bin b/converter/testdata/1-gpu/model.layers.3.mlp.dense_h_to_4h.bias.0.bin
new file mode 100644
index 0000000..c30ec76
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.3.mlp.dense_h_to_4h.bias.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:076a27c79e5ace2a3d47f9dd2e83e4ff6ea8872b3c2218f66c92b89b55f36560
+size 512
diff --git a/converter/testdata/1-gpu/model.layers.3.mlp.dense_h_to_4h.weight.0.bin b/converter/testdata/1-gpu/model.layers.3.mlp.dense_h_to_4h.weight.0.bin
new file mode 100644
index 0000000..10fcdeb
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.3.mlp.dense_h_to_4h.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d903dfb50cce4eae673a2d96a7814353ac1436c0c4d65490bb3ed7d8f8cfc586
+size 16384
diff --git a/converter/testdata/1-gpu/model.layers.4.attention.dense.weight.0.bin b/converter/testdata/1-gpu/model.layers.4.attention.dense.weight.0.bin
new file mode 100644
index 0000000..2d07ce1
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.4.attention.dense.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb76390eda7af1d23d5b162446b4c5da0b791ec337d20d9a643b9716377ae514
+size 4096
diff --git a/converter/testdata/1-gpu/model.layers.4.attention.query_key_value.weight.0.bin b/converter/testdata/1-gpu/model.layers.4.attention.query_key_value.weight.0.bin
new file mode 100644
index 0000000..b0008a0
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.4.attention.query_key_value.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f54ff65f519de2db6343ec257da92091162381082fbb5dba04df50d8e12a158
+size 12288
diff --git a/converter/testdata/1-gpu/model.layers.4.input_layernorm.bias.bin b/converter/testdata/1-gpu/model.layers.4.input_layernorm.bias.bin
new file mode 100644
index 0000000..67415c7
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.4.input_layernorm.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38723a2e5e8a17aa7950dc008209944e898f69a7bd10a23c839d341e935fd5ca
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.4.input_layernorm.weight.bin b/converter/testdata/1-gpu/model.layers.4.input_layernorm.weight.bin
new file mode 100644
index 0000000..d0c1df9
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.4.input_layernorm.weight.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b638277a8690e175a9137feff1e43c067f9faf4e2f600caf468fb05b0403b717
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.4.mlp.dense_4h_to_h.bias.bin b/converter/testdata/1-gpu/model.layers.4.mlp.dense_4h_to_h.bias.bin
new file mode 100644
index 0000000..67415c7
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.4.mlp.dense_4h_to_h.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38723a2e5e8a17aa7950dc008209944e898f69a7bd10a23c839d341e935fd5ca
+size 128
diff --git a/converter/testdata/1-gpu/model.layers.4.mlp.dense_4h_to_h.weight.0.bin b/converter/testdata/1-gpu/model.layers.4.mlp.dense_4h_to_h.weight.0.bin
new file mode 100644
index 0000000..41b7c12
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.4.mlp.dense_4h_to_h.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:67e7225a2de28f7e21a72b7ea1cab517071744c53d13f4c6964cbc27f4d261e4
+size 16384
diff --git a/converter/testdata/1-gpu/model.layers.4.mlp.dense_h_to_4h.bias.0.bin b/converter/testdata/1-gpu/model.layers.4.mlp.dense_h_to_4h.bias.0.bin
new file mode 100644
index 0000000..c30ec76
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.4.mlp.dense_h_to_4h.bias.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:076a27c79e5ace2a3d47f9dd2e83e4ff6ea8872b3c2218f66c92b89b55f36560
+size 512
diff --git a/converter/testdata/1-gpu/model.layers.4.mlp.dense_h_to_4h.weight.0.bin b/converter/testdata/1-gpu/model.layers.4.mlp.dense_h_to_4h.weight.0.bin
new file mode 100644
index 0000000..975aa56
--- /dev/null
+++ b/converter/testdata/1-gpu/model.layers.4.mlp.dense_h_to_4h.weight.0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb7582613a3b40b73ac166af2e6b9773511cf6fba7bec12f340119f588c8ea48
+size 16384
diff --git a/converter/testdata/1-gpu/model.lm_head.bias.bin b/converter/testdata/1-gpu/model.lm_head.bias.bin
new file mode 100644
index 0000000..fb155d8
--- /dev/null
+++ b/converter/testdata/1-gpu/model.lm_head.bias.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fc19b1997119425765295aeab72d76faa6927d4f83985d328c26f20468d6cc76
+size 4000
diff --git a/converter/testdata/1-gpu/model.lm_head.weight.bin b/converter/testdata/1-gpu/model.lm_head.weight.bin
new file mode 100644
index 0000000..530ff0d
--- /dev/null
+++ b/converter/testdata/1-gpu/model.lm_head.weight.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:884fae8e52776e900d3800048825503048c95ab2850c38c1a595c6da962d3286
+size 128000
diff --git a/converter/testdata/1-gpu/model.wte.bin b/converter/testdata/1-gpu/model.wte.bin
new file mode 100644
index 0000000..c815f00
--- /dev/null
+++ b/converter/testdata/1-gpu/model.wte.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d0d0fec061d1987d0f19acbd319c3471037691cebecd5aa2b00cedcdc2c6177c
+size 128000
diff --git a/poetry.lock b/poetry.lock
index 5a5384d..e7b41bd 100644
--- a/poetry.lock
+++ b/poetry.lock
@@ -264,6 +264,36 @@ files = [
     {file = "charset_normalizer-3.1.0-py3-none-any.whl", hash = "sha256:3d9098b479e78c85080c98e1e35ff40b4a31d8953102bb0fd7d1b6f8a2111a3d"},
 ]
 
+[[package]]
+name = "cmake"
+version = "3.26.0"
+description = "CMake is an open-source, cross-platform family of tools designed to build, test and package software"
+category = "main"
+optional = false
+python-versions = "*"
+files = [
+    {file = "cmake-3.26.0-py2.py3-none-macosx_10_10_universal2.macosx_10_10_x86_64.macosx_11_0_arm64.macosx_11_0_universal2.whl", hash = "sha256:4881727389325af84e39f1ec646b7249d8910b4ed637205bee6d589cb2b2ebd2"},
+    {file = "cmake-3.26.0-py2.py3-none-manylinux2010_i686.manylinux_2_12_i686.whl", hash = "sha256:babd1e38c85d38a4bf4164c3126ec8cf4cd8d374072e2a4a181e52e953007f8c"},
+    {file = "cmake-3.26.0-py2.py3-none-manylinux2010_x86_64.manylinux_2_12_x86_64.whl", hash = "sha256:1851be29d79bb39505954165e934d31994268d49f566ead6fff840a5092e444d"},
+    {file = "cmake-3.26.0-py2.py3-none-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:483aaaeb9535deaa2657c928af5d9f0da9329f89bc249f494923495745a03677"},
+    {file = "cmake-3.26.0-py2.py3-none-manylinux2014_i686.manylinux_2_17_i686.whl", hash = "sha256:2f78c6194f224d462333e08d3acd571c553b58d04935971b87efbe76f241353c"},
+    {file = "cmake-3.26.0-py2.py3-none-manylinux2014_ppc64le.manylinux_2_17_ppc64le.whl", hash = "sha256:cf129c8b71f1344975f179f30287baa8804c4c61ff1b13003244b4157b676e13"},
+    {file = "cmake-3.26.0-py2.py3-none-manylinux2014_s390x.manylinux_2_17_s390x.whl", hash = "sha256:fabb82c69223eda27e673c5c6bb02985d60cf0baa631a2e4932eed87e8229928"},
+    {file = "cmake-3.26.0-py2.py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:502cbed2335557920b88687c6f3ff4ce433bd416204c928ad489e399e76149f5"},
+    {file = "cmake-3.26.0-py2.py3-none-musllinux_1_1_aarch64.whl", hash = "sha256:b81c7775b125786c1696232078e9ceb0c9c66d26fb0a2259f40e33983170f924"},
+    {file = "cmake-3.26.0-py2.py3-none-musllinux_1_1_i686.whl", hash = "sha256:f4cc1dde7613cc813d15fd840a33e18cd07a443aa67205d74b9b05f55f08a459"},
+    {file = "cmake-3.26.0-py2.py3-none-musllinux_1_1_ppc64le.whl", hash = "sha256:ac6ca9d9ff58900138bbbebc55857647fb99f1c40b84d8a232f23b0d27d7f48a"},
+    {file = "cmake-3.26.0-py2.py3-none-musllinux_1_1_s390x.whl", hash = "sha256:85e0bad5aeb3a82919ed7d78b76a0462eafe2f918076a1823a09c6f37910f3e0"},
+    {file = "cmake-3.26.0-py2.py3-none-musllinux_1_1_x86_64.whl", hash = "sha256:5523b9701be367572155e77294bf8aa3ac9aa0d73c50dcd6c57903d12bcb308e"},
+    {file = "cmake-3.26.0-py2.py3-none-win32.whl", hash = "sha256:96f0e887260255eeb83bcf3465d51bc6c94078251c9312fa142dce6d3e80acac"},
+    {file = "cmake-3.26.0-py2.py3-none-win_amd64.whl", hash = "sha256:a0719a6f79cdc4d7b16caf757b8ae13eae1c6ce5a08d594cc09774afe129515d"},
+    {file = "cmake-3.26.0-py2.py3-none-win_arm64.whl", hash = "sha256:11159c9b64c6473d84361ab44ef2c85e1bd2db7a2b1b798ce8bf5988f32adf43"},
+    {file = "cmake-3.26.0.tar.gz", hash = "sha256:c18185c9cc147d0fa1e9228962aa37901b37866bd5d617e9efa23dfe706f7321"},
+]
+
+[package.extras]
+test = ["codecov (>=2.0.5)", "coverage (>=4.2)", "flake8 (>=3.0.4)", "path.py (>=11.5.0)", "pytest (>=3.0.3)", "pytest-cov (>=2.4.0)", "pytest-runner (>=2.9)", "pytest-virtualenv (>=1.7.0)", "scikit-build (>=0.10.0)", "setuptools (>=28.0.0)", "virtualenv (>=15.0.3)", "wheel"]
+
 [[package]]
 name = "colorama"
 version = "0.4.6"
@@ -543,6 +573,113 @@ files = [
     {file = "idna-3.4.tar.gz", hash = "sha256:814f528e8dead7d329833b91c5faa87d60bf71824cd12a7530b5526063d02cb4"},
 ]
 
+[[package]]
+name = "jinja2"
+version = "3.1.2"
+description = "A very fast and expressive template engine."
+category = "main"
+optional = false
+python-versions = ">=3.7"
+files = [
+    {file = "Jinja2-3.1.2-py3-none-any.whl", hash = "sha256:6088930bfe239f0e6710546ab9c19c9ef35e29792895fed6e6e31a023a182a61"},
+    {file = "Jinja2-3.1.2.tar.gz", hash = "sha256:31351a702a408a9e7595a8fc6150fc3f43bb6bf7e319770cbc0db9df9437e852"},
+]
+
+[package.dependencies]
+MarkupSafe = ">=2.0"
+
+[package.extras]
+i18n = ["Babel (>=2.7)"]
+
+[[package]]
+name = "lit"
+version = "15.0.7"
+description = "A Software Testing Tool"
+category = "main"
+optional = false
+python-versions = "*"
+files = [
+    {file = "lit-15.0.7.tar.gz", hash = "sha256:ed08ac55afe714a193653df293ae8a6ee6c45d6fb11eeca72ce347d99b88ecc8"},
+]
+
+[[package]]
+name = "markupsafe"
+version = "2.1.2"
+description = "Safely add untrusted strings to HTML/XML markup."
+category = "main"
+optional = false
+python-versions = ">=3.7"
+files = [
+    {file = "MarkupSafe-2.1.2-cp310-cp310-macosx_10_9_universal2.whl", hash = "sha256:665a36ae6f8f20a4676b53224e33d456a6f5a72657d9c83c2aa00765072f31f7"},
+    {file = "MarkupSafe-2.1.2-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:340bea174e9761308703ae988e982005aedf427de816d1afe98147668cc03036"},
+    {file = "MarkupSafe-2.1.2-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:22152d00bf4a9c7c83960521fc558f55a1adbc0631fbb00a9471e097b19d72e1"},
+    {file = "MarkupSafe-2.1.2-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:28057e985dace2f478e042eaa15606c7efccb700797660629da387eb289b9323"},
+    {file = "MarkupSafe-2.1.2-cp310-cp310-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:ca244fa73f50a800cf8c3ebf7fd93149ec37f5cb9596aa8873ae2c1d23498601"},
+    {file = "MarkupSafe-2.1.2-cp310-cp310-musllinux_1_1_aarch64.whl", hash = "sha256:d9d971ec1e79906046aa3ca266de79eac42f1dbf3612a05dc9368125952bd1a1"},
+    {file = "MarkupSafe-2.1.2-cp310-cp310-musllinux_1_1_i686.whl", hash = "sha256:7e007132af78ea9df29495dbf7b5824cb71648d7133cf7848a2a5dd00d36f9ff"},
+    {file = "MarkupSafe-2.1.2-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:7313ce6a199651c4ed9d7e4cfb4aa56fe923b1adf9af3b420ee14e6d9a73df65"},
+    {file = "MarkupSafe-2.1.2-cp310-cp310-win32.whl", hash = "sha256:c4a549890a45f57f1ebf99c067a4ad0cb423a05544accaf2b065246827ed9603"},
+    {file = "MarkupSafe-2.1.2-cp310-cp310-win_amd64.whl", hash = "sha256:835fb5e38fd89328e9c81067fd642b3593c33e1e17e2fdbf77f5676abb14a156"},
+    {file = "MarkupSafe-2.1.2-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:2ec4f2d48ae59bbb9d1f9d7efb9236ab81429a764dedca114f5fdabbc3788013"},
+    {file = "MarkupSafe-2.1.2-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:608e7073dfa9e38a85d38474c082d4281f4ce276ac0010224eaba11e929dd53a"},
+    {file = "MarkupSafe-2.1.2-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:65608c35bfb8a76763f37036547f7adfd09270fbdbf96608be2bead319728fcd"},
+    {file = "MarkupSafe-2.1.2-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:f2bfb563d0211ce16b63c7cb9395d2c682a23187f54c3d79bfec33e6705473c6"},
+    {file = "MarkupSafe-2.1.2-cp311-cp311-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:da25303d91526aac3672ee6d49a2f3db2d9502a4a60b55519feb1a4c7714e07d"},
+    {file = "MarkupSafe-2.1.2-cp311-cp311-musllinux_1_1_aarch64.whl", hash = "sha256:9cad97ab29dfc3f0249b483412c85c8ef4766d96cdf9dcf5a1e3caa3f3661cf1"},
+    {file = "MarkupSafe-2.1.2-cp311-cp311-musllinux_1_1_i686.whl", hash = "sha256:085fd3201e7b12809f9e6e9bc1e5c96a368c8523fad5afb02afe3c051ae4afcc"},
+    {file = "MarkupSafe-2.1.2-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:1bea30e9bf331f3fef67e0a3877b2288593c98a21ccb2cf29b74c581a4eb3af0"},
+    {file = "MarkupSafe-2.1.2-cp311-cp311-win32.whl", hash = "sha256:7df70907e00c970c60b9ef2938d894a9381f38e6b9db73c5be35e59d92e06625"},
+    {file = "MarkupSafe-2.1.2-cp311-cp311-win_amd64.whl", hash = "sha256:e55e40ff0cc8cc5c07996915ad367fa47da6b3fc091fdadca7f5403239c5fec3"},
+    {file = "MarkupSafe-2.1.2-cp37-cp37m-macosx_10_9_x86_64.whl", hash = "sha256:a6e40afa7f45939ca356f348c8e23048e02cb109ced1eb8420961b2f40fb373a"},
+    {file = "MarkupSafe-2.1.2-cp37-cp37m-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:cf877ab4ed6e302ec1d04952ca358b381a882fbd9d1b07cccbfd61783561f98a"},
+    {file = "MarkupSafe-2.1.2-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:63ba06c9941e46fa389d389644e2d8225e0e3e5ebcc4ff1ea8506dce646f8c8a"},
+    {file = "MarkupSafe-2.1.2-cp37-cp37m-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:f1cd098434e83e656abf198f103a8207a8187c0fc110306691a2e94a78d0abb2"},
+    {file = "MarkupSafe-2.1.2-cp37-cp37m-musllinux_1_1_aarch64.whl", hash = "sha256:55f44b440d491028addb3b88f72207d71eeebfb7b5dbf0643f7c023ae1fba619"},
+    {file = "MarkupSafe-2.1.2-cp37-cp37m-musllinux_1_1_i686.whl", hash = "sha256:a6f2fcca746e8d5910e18782f976489939d54a91f9411c32051b4aab2bd7c513"},
+    {file = "MarkupSafe-2.1.2-cp37-cp37m-musllinux_1_1_x86_64.whl", hash = "sha256:0b462104ba25f1ac006fdab8b6a01ebbfbce9ed37fd37fd4acd70c67c973e460"},
+    {file = "MarkupSafe-2.1.2-cp37-cp37m-win32.whl", hash = "sha256:7668b52e102d0ed87cb082380a7e2e1e78737ddecdde129acadb0eccc5423859"},
+    {file = "MarkupSafe-2.1.2-cp37-cp37m-win_amd64.whl", hash = "sha256:6d6607f98fcf17e534162f0709aaad3ab7a96032723d8ac8750ffe17ae5a0666"},
+    {file = "MarkupSafe-2.1.2-cp38-cp38-macosx_10_9_universal2.whl", hash = "sha256:a806db027852538d2ad7555b203300173dd1b77ba116de92da9afbc3a3be3eed"},
+    {file = "MarkupSafe-2.1.2-cp38-cp38-macosx_10_9_x86_64.whl", hash = "sha256:a4abaec6ca3ad8660690236d11bfe28dfd707778e2442b45addd2f086d6ef094"},
+    {file = "MarkupSafe-2.1.2-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:f03a532d7dee1bed20bc4884194a16160a2de9ffc6354b3878ec9682bb623c54"},
+    {file = "MarkupSafe-2.1.2-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:4cf06cdc1dda95223e9d2d3c58d3b178aa5dacb35ee7e3bbac10e4e1faacb419"},
+    {file = "MarkupSafe-2.1.2-cp38-cp38-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:22731d79ed2eb25059ae3df1dfc9cb1546691cc41f4e3130fe6bfbc3ecbbecfa"},
+    {file = "MarkupSafe-2.1.2-cp38-cp38-musllinux_1_1_aarch64.whl", hash = "sha256:f8ffb705ffcf5ddd0e80b65ddf7bed7ee4f5a441ea7d3419e861a12eaf41af58"},
+    {file = "MarkupSafe-2.1.2-cp38-cp38-musllinux_1_1_i686.whl", hash = "sha256:8db032bf0ce9022a8e41a22598eefc802314e81b879ae093f36ce9ddf39ab1ba"},
+    {file = "MarkupSafe-2.1.2-cp38-cp38-musllinux_1_1_x86_64.whl", hash = "sha256:2298c859cfc5463f1b64bd55cb3e602528db6fa0f3cfd568d3605c50678f8f03"},
+    {file = "MarkupSafe-2.1.2-cp38-cp38-win32.whl", hash = "sha256:50c42830a633fa0cf9e7d27664637532791bfc31c731a87b202d2d8ac40c3ea2"},
+    {file = "MarkupSafe-2.1.2-cp38-cp38-win_amd64.whl", hash = "sha256:bb06feb762bade6bf3c8b844462274db0c76acc95c52abe8dbed28ae3d44a147"},
+    {file = "MarkupSafe-2.1.2-cp39-cp39-macosx_10_9_universal2.whl", hash = "sha256:99625a92da8229df6d44335e6fcc558a5037dd0a760e11d84be2260e6f37002f"},
+    {file = "MarkupSafe-2.1.2-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:8bca7e26c1dd751236cfb0c6c72d4ad61d986e9a41bbf76cb445f69488b2a2bd"},
+    {file = "MarkupSafe-2.1.2-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:40627dcf047dadb22cd25ea7ecfe9cbf3bbbad0482ee5920b582f3809c97654f"},
+    {file = "MarkupSafe-2.1.2-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:40dfd3fefbef579ee058f139733ac336312663c6706d1163b82b3003fb1925c4"},
+    {file = "MarkupSafe-2.1.2-cp39-cp39-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:090376d812fb6ac5f171e5938e82e7f2d7adc2b629101cec0db8b267815c85e2"},
+    {file = "MarkupSafe-2.1.2-cp39-cp39-musllinux_1_1_aarch64.whl", hash = "sha256:2e7821bffe00aa6bd07a23913b7f4e01328c3d5cc0b40b36c0bd81d362faeb65"},
+    {file = "MarkupSafe-2.1.2-cp39-cp39-musllinux_1_1_i686.whl", hash = "sha256:c0a33bc9f02c2b17c3ea382f91b4db0e6cde90b63b296422a939886a7a80de1c"},
+    {file = "MarkupSafe-2.1.2-cp39-cp39-musllinux_1_1_x86_64.whl", hash = "sha256:b8526c6d437855442cdd3d87eede9c425c4445ea011ca38d937db299382e6fa3"},
+    {file = "MarkupSafe-2.1.2-cp39-cp39-win32.whl", hash = "sha256:137678c63c977754abe9086a3ec011e8fd985ab90631145dfb9294ad09c102a7"},
+    {file = "MarkupSafe-2.1.2-cp39-cp39-win_amd64.whl", hash = "sha256:0576fe974b40a400449768941d5d0858cc624e3249dfd1e0c33674e5c7ca7aed"},
+    {file = "MarkupSafe-2.1.2.tar.gz", hash = "sha256:abcabc8c2b26036d62d4c746381a6f7cf60aafcc653198ad678306986b09450d"},
+]
+
+[[package]]
+name = "mpmath"
+version = "1.3.0"
+description = "Python library for arbitrary-precision floating-point arithmetic"
+category = "main"
+optional = false
+python-versions = "*"
+files = [
+    {file = "mpmath-1.3.0-py3-none-any.whl", hash = "sha256:a0b2b9fe80bbcd81a6647ff13108738cfb482d481d826cc0e02f5b35e5c88d2c"},
+    {file = "mpmath-1.3.0.tar.gz", hash = "sha256:7a28eb2a9774d00c7bc92411c19a89209d5da7c4c9a9e227be8330a23a25b91f"},
+]
+
+[package.extras]
+develop = ["codecov", "pycodestyle", "pytest (>=4.6)", "pytest-cov", "wheel"]
+docs = ["sphinx"]
+gmpy = ["gmpy2 (>=2.1.0a4)"]
+tests = ["pytest (>=4.6)"]
+
 [[package]]
 name = "multidict"
 version = "6.0.4"
@@ -654,6 +791,25 @@ files = [
 [package.dependencies]
 dill = ">=0.3.6"
 
+[[package]]
+name = "networkx"
+version = "3.0"
+description = "Python package for creating and manipulating graphs and networks"
+category = "main"
+optional = false
+python-versions = ">=3.8"
+files = [
+    {file = "networkx-3.0-py3-none-any.whl", hash = "sha256:58058d66b1818043527244fab9d41a51fcd7dcc271748015f3c181b8a90c8e2e"},
+    {file = "networkx-3.0.tar.gz", hash = "sha256:9a9992345353618ae98339c2b63d8201c381c2944f38a2ab49cb45a4c667e412"},
+]
+
+[package.extras]
+default = ["matplotlib (>=3.4)", "numpy (>=1.20)", "pandas (>=1.3)", "scipy (>=1.8)"]
+developer = ["mypy (>=0.991)", "pre-commit (>=2.20)"]
+doc = ["nb2plots (>=0.6)", "numpydoc (>=1.5)", "pillow (>=9.2)", "pydata-sphinx-theme (>=0.11)", "sphinx (==5.2.3)", "sphinx-gallery (>=0.11)", "texext (>=0.6.7)"]
+extra = ["lxml (>=4.6)", "pydot (>=1.4.2)", "pygraphviz (>=1.10)", "sympy (>=1.10)"]
+test = ["codecov (>=2.1)", "pytest (>=7.2)", "pytest-cov (>=4.0)"]
+
 [[package]]
 name = "nodeenv"
 version = "1.7.0"
@@ -707,6 +863,175 @@ files = [
     {file = "numpy-1.24.2.tar.gz", hash = "sha256:003a9f530e880cb2cd177cba1af7220b9aa42def9c4afc2a2fc3ee6be7eb2b22"},
 ]
 
+[[package]]
+name = "nvidia-cublas-cu11"
+version = "11.10.3.66"
+description = "CUBLAS native runtime libraries"
+category = "main"
+optional = false
+python-versions = ">=3"
+files = [
+    {file = "nvidia_cublas_cu11-11.10.3.66-py3-none-manylinux1_x86_64.whl", hash = "sha256:d32e4d75f94ddfb93ea0a5dda08389bcc65d8916a25cb9f37ac89edaeed3bded"},
+    {file = "nvidia_cublas_cu11-11.10.3.66-py3-none-win_amd64.whl", hash = "sha256:8ac17ba6ade3ed56ab898a036f9ae0756f1e81052a317bf98f8c6d18dc3ae49e"},
+]
+
+[package.dependencies]
+setuptools = "*"
+wheel = "*"
+
+[[package]]
+name = "nvidia-cuda-cupti-cu11"
+version = "11.7.101"
+description = "CUDA profiling tools runtime libs."
+category = "main"
+optional = false
+python-versions = ">=3"
+files = [
+    {file = "nvidia_cuda_cupti_cu11-11.7.101-py3-none-manylinux1_x86_64.whl", hash = "sha256:e0cfd9854e1f2edaa36ca20d21cd0bdd5dcfca4e3b9e130a082e05b33b6c5895"},
+    {file = "nvidia_cuda_cupti_cu11-11.7.101-py3-none-win_amd64.whl", hash = "sha256:7cc5b8f91ae5e1389c3c0ad8866b3b016a175e827ea8f162a672990a402ab2b0"},
+]
+
+[package.dependencies]
+setuptools = "*"
+wheel = "*"
+
+[[package]]
+name = "nvidia-cuda-nvrtc-cu11"
+version = "11.7.99"
+description = "NVRTC native runtime libraries"
+category = "main"
+optional = false
+python-versions = ">=3"
+files = [
+    {file = "nvidia_cuda_nvrtc_cu11-11.7.99-2-py3-none-manylinux1_x86_64.whl", hash = "sha256:9f1562822ea264b7e34ed5930567e89242d266448e936b85bc97a3370feabb03"},
+    {file = "nvidia_cuda_nvrtc_cu11-11.7.99-py3-none-manylinux1_x86_64.whl", hash = "sha256:f7d9610d9b7c331fa0da2d1b2858a4a8315e6d49765091d28711c8946e7425e7"},
+    {file = "nvidia_cuda_nvrtc_cu11-11.7.99-py3-none-win_amd64.whl", hash = "sha256:f2effeb1309bdd1b3854fc9b17eaf997808f8b25968ce0c7070945c4265d64a3"},
+]
+
+[package.dependencies]
+setuptools = "*"
+wheel = "*"
+
+[[package]]
+name = "nvidia-cuda-runtime-cu11"
+version = "11.7.99"
+description = "CUDA Runtime native Libraries"
+category = "main"
+optional = false
+python-versions = ">=3"
+files = [
+    {file = "nvidia_cuda_runtime_cu11-11.7.99-py3-none-manylinux1_x86_64.whl", hash = "sha256:cc768314ae58d2641f07eac350f40f99dcb35719c4faff4bc458a7cd2b119e31"},
+    {file = "nvidia_cuda_runtime_cu11-11.7.99-py3-none-win_amd64.whl", hash = "sha256:bc77fa59a7679310df9d5c70ab13c4e34c64ae2124dd1efd7e5474b71be125c7"},
+]
+
+[package.dependencies]
+setuptools = "*"
+wheel = "*"
+
+[[package]]
+name = "nvidia-cudnn-cu11"
+version = "8.5.0.96"
+description = "cuDNN runtime libraries"
+category = "main"
+optional = false
+python-versions = ">=3"
+files = [
+    {file = "nvidia_cudnn_cu11-8.5.0.96-2-py3-none-manylinux1_x86_64.whl", hash = "sha256:402f40adfc6f418f9dae9ab402e773cfed9beae52333f6d86ae3107a1b9527e7"},
+    {file = "nvidia_cudnn_cu11-8.5.0.96-py3-none-manylinux1_x86_64.whl", hash = "sha256:71f8111eb830879ff2836db3cccf03bbd735df9b0d17cd93761732ac50a8a108"},
+]
+
+[package.dependencies]
+setuptools = "*"
+wheel = "*"
+
+[[package]]
+name = "nvidia-cufft-cu11"
+version = "10.9.0.58"
+description = "CUFFT native runtime libraries"
+category = "main"
+optional = false
+python-versions = ">=3"
+files = [
+    {file = "nvidia_cufft_cu11-10.9.0.58-py3-none-manylinux1_x86_64.whl", hash = "sha256:222f9da70c80384632fd6035e4c3f16762d64ea7a843829cb278f98b3cb7dd81"},
+    {file = "nvidia_cufft_cu11-10.9.0.58-py3-none-win_amd64.whl", hash = "sha256:c4d316f17c745ec9c728e30409612eaf77a8404c3733cdf6c9c1569634d1ca03"},
+]
+
+[[package]]
+name = "nvidia-curand-cu11"
+version = "10.2.10.91"
+description = "CURAND native runtime libraries"
+category = "main"
+optional = false
+python-versions = ">=3"
+files = [
+    {file = "nvidia_curand_cu11-10.2.10.91-py3-none-manylinux1_x86_64.whl", hash = "sha256:eecb269c970fa599a2660c9232fa46aaccbf90d9170b96c462e13bcb4d129e2c"},
+    {file = "nvidia_curand_cu11-10.2.10.91-py3-none-win_amd64.whl", hash = "sha256:f742052af0e1e75523bde18895a9ed016ecf1e5aa0ecddfcc3658fd11a1ff417"},
+]
+
+[package.dependencies]
+setuptools = "*"
+wheel = "*"
+
+[[package]]
+name = "nvidia-cusolver-cu11"
+version = "11.4.0.1"
+description = "CUDA solver native runtime libraries"
+category = "main"
+optional = false
+python-versions = ">=3"
+files = [
+    {file = "nvidia_cusolver_cu11-11.4.0.1-2-py3-none-manylinux1_x86_64.whl", hash = "sha256:72fa7261d755ed55c0074960df5904b65e2326f7adce364cbe4945063c1be412"},
+    {file = "nvidia_cusolver_cu11-11.4.0.1-py3-none-manylinux1_x86_64.whl", hash = "sha256:700b781bfefd57d161443aff9ace1878584b93e0b2cfef3d6e9296d96febbf99"},
+    {file = "nvidia_cusolver_cu11-11.4.0.1-py3-none-win_amd64.whl", hash = "sha256:00f70b256add65f8c1eb3b6a65308795a93e7740f6df9e273eccbba770d370c4"},
+]
+
+[package.dependencies]
+setuptools = "*"
+wheel = "*"
+
+[[package]]
+name = "nvidia-cusparse-cu11"
+version = "11.7.4.91"
+description = "CUSPARSE native runtime libraries"
+category = "main"
+optional = false
+python-versions = ">=3"
+files = [
+    {file = "nvidia_cusparse_cu11-11.7.4.91-py3-none-manylinux1_x86_64.whl", hash = "sha256:a3389de714db63321aa11fbec3919271f415ef19fda58aed7f2ede488c32733d"},
+    {file = "nvidia_cusparse_cu11-11.7.4.91-py3-none-win_amd64.whl", hash = "sha256:304a01599534f5186a8ed1c3756879282c72c118bc77dd890dc1ff868cad25b9"},
+]
+
+[package.dependencies]
+setuptools = "*"
+wheel = "*"
+
+[[package]]
+name = "nvidia-nccl-cu11"
+version = "2.14.3"
+description = "NVIDIA Collective Communication Library (NCCL) Runtime"
+category = "main"
+optional = false
+python-versions = ">=3"
+files = [
+    {file = "nvidia_nccl_cu11-2.14.3-py3-none-manylinux1_x86_64.whl", hash = "sha256:5e5534257d1284b8e825bc3a182c6f06acd6eb405e9f89d49340e98cd8f136eb"},
+]
+
+[[package]]
+name = "nvidia-nvtx-cu11"
+version = "11.7.91"
+description = "NVIDIA Tools Extension"
+category = "main"
+optional = false
+python-versions = ">=3"
+files = [
+    {file = "nvidia_nvtx_cu11-11.7.91-py3-none-manylinux1_x86_64.whl", hash = "sha256:b22c64eee426a62fc00952b507d6d29cf62b4c9df7a480fcc417e540e05fd5ac"},
+    {file = "nvidia_nvtx_cu11-11.7.91-py3-none-win_amd64.whl", hash = "sha256:dfd7fcb2a91742513027d63a26b757f38dd8b07fecac282c4d132a9d373ff064"},
+]
+
+[package.dependencies]
+setuptools = "*"
+wheel = "*"
+
 [[package]]
 name = "packaging"
 version = "23.0"
@@ -1060,7 +1385,7 @@ tests = ["coverage (>=6.0.0)", "flake8", "mypy", "pytest (>=4.6)", "pytest-cov",
 name = "setuptools"
 version = "67.6.0"
 description = "Easily download, build, install, upgrade, and uninstall Python packages"
-category = "dev"
+category = "main"
 optional = false
 python-versions = ">=3.7"
 files = [
@@ -1085,6 +1410,21 @@ files = [
     {file = "six-1.16.0.tar.gz", hash = "sha256:1e61c37477a1626458e36f7b1d82aa5c9b094fa4802892072e49de9c60c4c926"},
 ]
 
+[[package]]
+name = "sympy"
+version = "1.11.1"
+description = "Computer algebra system (CAS) in Python"
+category = "main"
+optional = false
+python-versions = ">=3.8"
+files = [
+    {file = "sympy-1.11.1-py3-none-any.whl", hash = "sha256:938f984ee2b1e8eae8a07b884c8b7a1146010040fccddc6539c54f401c8f6fcf"},
+    {file = "sympy-1.11.1.tar.gz", hash = "sha256:e32380dce63cb7c0108ed525570092fd45168bdae2faa17e528221ef72e88658"},
+]
+
+[package.dependencies]
+mpmath = ">=0.19"
+
 [[package]]
 name = "tokenizers"
 version = "0.13.2"
@@ -1140,6 +1480,58 @@ dev = ["black (==22.3)", "datasets", "numpy", "pytest", "requests"]
 docs = ["setuptools-rust", "sphinx", "sphinx-rtd-theme"]
 testing = ["black (==22.3)", "datasets", "numpy", "pytest", "requests"]
 
+[[package]]
+name = "torch"
+version = "2.0.0"
+description = "Tensors and Dynamic neural networks in Python with strong GPU acceleration"
+category = "main"
+optional = false
+python-versions = ">=3.8.0"
+files = [
+    {file = "torch-2.0.0-cp310-cp310-manylinux1_x86_64.whl", hash = "sha256:7a9319a67294ef02459a19738bbfa8727bb5307b822dadd708bc2ccf6c901aca"},
+    {file = "torch-2.0.0-cp310-cp310-manylinux2014_aarch64.whl", hash = "sha256:9f01fe1f6263f31bd04e1757946fd63ad531ae37f28bb2dbf66f5c826ee089f4"},
+    {file = "torch-2.0.0-cp310-cp310-win_amd64.whl", hash = "sha256:527f4ae68df7b8301ee6b1158ca56350282ea633686537b30dbb5d7b4a52622a"},
+    {file = "torch-2.0.0-cp310-none-macosx_10_9_x86_64.whl", hash = "sha256:ce9b5a49bd513dff7950a5a07d6e26594dd51989cee05ba388b03e8e366fd5d5"},
+    {file = "torch-2.0.0-cp310-none-macosx_11_0_arm64.whl", hash = "sha256:53e1c33c6896583cdb9a583693e22e99266444c4a43392dddc562640d39e542b"},
+    {file = "torch-2.0.0-cp311-cp311-manylinux1_x86_64.whl", hash = "sha256:09651bff72e439d004c991f15add0c397c66f98ab36fe60d5514b44e4da722e8"},
+    {file = "torch-2.0.0-cp311-cp311-manylinux2014_aarch64.whl", hash = "sha256:d439aec349c98f12819e8564b8c54008e4613dd4428582af0e6e14c24ca85870"},
+    {file = "torch-2.0.0-cp311-cp311-win_amd64.whl", hash = "sha256:2802f84f021907deee7e9470ed10c0e78af7457ac9a08a6cd7d55adef835fede"},
+    {file = "torch-2.0.0-cp311-none-macosx_10_9_x86_64.whl", hash = "sha256:01858620f25f25e7a9ec4b547ff38e5e27c92d38ec4ccba9cfbfb31d7071ed9c"},
+    {file = "torch-2.0.0-cp311-none-macosx_11_0_arm64.whl", hash = "sha256:9a2e53b5783ef5896a6af338b36d782f28e83c8ddfc2ac44b67b066d9d76f498"},
+    {file = "torch-2.0.0-cp38-cp38-manylinux1_x86_64.whl", hash = "sha256:ec5fff2447663e369682838ff0f82187b4d846057ef4d119a8dea7772a0b17dd"},
+    {file = "torch-2.0.0-cp38-cp38-manylinux2014_aarch64.whl", hash = "sha256:11b0384fe3c18c01b8fc5992e70fc519cde65e44c51cc87be1838c1803daf42f"},
+    {file = "torch-2.0.0-cp38-cp38-win_amd64.whl", hash = "sha256:e54846aa63855298cfb1195487f032e413e7ac9cbfa978fda32354cc39551475"},
+    {file = "torch-2.0.0-cp38-none-macosx_10_9_x86_64.whl", hash = "sha256:cc788cbbbbc6eb4c90e52c550efd067586c2693092cf367c135b34893a64ae78"},
+    {file = "torch-2.0.0-cp38-none-macosx_11_0_arm64.whl", hash = "sha256:d292640f0fd72b7a31b2a6e3b635eb5065fcbedd4478f9cad1a1e7a9ec861d35"},
+    {file = "torch-2.0.0-cp39-cp39-manylinux1_x86_64.whl", hash = "sha256:6befaad784004b7af357e3d87fa0863c1f642866291f12a4c2af2de435e8ac5c"},
+    {file = "torch-2.0.0-cp39-cp39-manylinux2014_aarch64.whl", hash = "sha256:a83b26bd6ae36fbf5fee3d56973d9816e2002e8a3b7d9205531167c28aaa38a7"},
+    {file = "torch-2.0.0-cp39-cp39-win_amd64.whl", hash = "sha256:c7e67195e1c3e33da53954b026e89a8e1ff3bc1aeb9eb32b677172d4a9b5dcbf"},
+    {file = "torch-2.0.0-cp39-none-macosx_10_9_x86_64.whl", hash = "sha256:6e0b97beb037a165669c312591f242382e9109a240e20054d5a5782d9236cad0"},
+    {file = "torch-2.0.0-cp39-none-macosx_11_0_arm64.whl", hash = "sha256:297a4919aff1c0f98a58ebe969200f71350a1d4d4f986dbfd60c02ffce780e99"},
+]
+
+[package.dependencies]
+filelock = "*"
+jinja2 = "*"
+networkx = "*"
+nvidia-cublas-cu11 = {version = "11.10.3.66", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+nvidia-cuda-cupti-cu11 = {version = "11.7.101", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+nvidia-cuda-nvrtc-cu11 = {version = "11.7.99", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+nvidia-cuda-runtime-cu11 = {version = "11.7.99", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+nvidia-cudnn-cu11 = {version = "8.5.0.96", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+nvidia-cufft-cu11 = {version = "10.9.0.58", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+nvidia-curand-cu11 = {version = "10.2.10.91", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+nvidia-cusolver-cu11 = {version = "11.4.0.1", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+nvidia-cusparse-cu11 = {version = "11.7.4.91", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+nvidia-nccl-cu11 = {version = "2.14.3", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+nvidia-nvtx-cu11 = {version = "11.7.91", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+sympy = "*"
+triton = {version = "2.0.0", markers = "platform_system == \"Linux\" and platform_machine == \"x86_64\""}
+typing-extensions = "*"
+
+[package.extras]
+opt-einsum = ["opt-einsum (>=3.3)"]
+
 [[package]]
 name = "tqdm"
 version = "4.65.0"
@@ -1229,6 +1621,35 @@ torchhub = ["filelock", "huggingface-hub (>=0.11.0,<1.0)", "importlib-metadata",
 video = ["av (==9.2.0)", "decord (==0.6.0)"]
 vision = ["Pillow"]
 
+[[package]]
+name = "triton"
+version = "2.0.0"
+description = "A language and compiler for custom Deep Learning operations"
+category = "main"
+optional = false
+python-versions = "*"
+files = [
+    {file = "triton-2.0.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:8f05a7e64e4ca0565535e3d5d3405d7e49f9d308505bb7773d21fb26a4c008c2"},
+    {file = "triton-2.0.0-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:bb4b99ca3c6844066e516658541d876c28a5f6e3a852286bbc97ad57134827fd"},
+    {file = "triton-2.0.0-cp36-cp36m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:47b4d70dc92fb40af553b4460492c31dc7d3a114a979ffb7a5cdedb7eb546c08"},
+    {file = "triton-2.0.0-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:fedce6a381901b1547e0e7e1f2546e4f65dca6d91e2d8a7305a2d1f5551895be"},
+    {file = "triton-2.0.0-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:75834f27926eab6c7f00ce73aaf1ab5bfb9bec6eb57ab7c0bfc0a23fac803b4c"},
+    {file = "triton-2.0.0-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:0117722f8c2b579cd429e0bee80f7731ae05f63fe8e9414acd9a679885fcbf42"},
+    {file = "triton-2.0.0-pp37-pypy37_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:bcd9be5d0c2e45d2b7e6ddc6da20112b6862d69741576f9c3dbaf941d745ecae"},
+    {file = "triton-2.0.0-pp38-pypy38_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:42a0d2c3fc2eab4ba71384f2e785fbfd47aa41ae05fa58bf12cb31dcbd0aeceb"},
+    {file = "triton-2.0.0-pp39-pypy39_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:52c47b72c72693198163ece9d90a721299e4fb3b8e24fd13141e384ad952724f"},
+]
+
+[package.dependencies]
+cmake = "*"
+filelock = "*"
+lit = "*"
+torch = "*"
+
+[package.extras]
+tests = ["autopep8", "flake8", "isort", "numpy", "pytest", "scipy (>=1.7.1)"]
+tutorials = ["matplotlib", "pandas", "tabulate"]
+
 [[package]]
 name = "typing-extensions"
 version = "4.5.0"
@@ -1279,6 +1700,21 @@ platformdirs = ">=2.4,<4"
 docs = ["furo (>=2022.12.7)", "proselint (>=0.13)", "sphinx (>=6.1.3)", "sphinx-argparse (>=0.4)", "sphinxcontrib-towncrier (>=0.2.1a0)", "towncrier (>=22.12)"]
 test = ["covdefaults (>=2.2.2)", "coverage (>=7.1)", "coverage-enable-subprocess (>=1)", "flaky (>=3.7)", "packaging (>=23)", "pytest (>=7.2.1)", "pytest-env (>=0.8.1)", "pytest-freezegun (>=0.4.2)", "pytest-mock (>=3.10)", "pytest-randomly (>=3.12)", "pytest-timeout (>=2.1)"]
 
+[[package]]
+name = "wheel"
+version = "0.40.0"
+description = "A built-package format for Python"
+category = "main"
+optional = false
+python-versions = ">=3.7"
+files = [
+    {file = "wheel-0.40.0-py3-none-any.whl", hash = "sha256:d236b20e7cb522daf2390fa84c55eea81c5c30190f90f29ae2ca1ad8355bf247"},
+    {file = "wheel-0.40.0.tar.gz", hash = "sha256:cd1196f3faee2b31968d626e1731c94f99cbdb67cf5a46e4f5656cbee7738873"},
+]
+
+[package.extras]
+test = ["pytest (>=6.0.0)"]
+
 [[package]]
 name = "xxhash"
 version = "3.2.0"
@@ -1478,4 +1914,4 @@ multidict = ">=4.0"
 [metadata]
 lock-version = "2.0"
 python-versions = "^3.10"
-content-hash = "26132a5fe81992d452faef8d696a8ceeb39e4c9584fb5b3e4d92800abe12d76f"
+content-hash = "3b1bc0ebb3617354aa8c19bb84aeb08e74a5976bfdcd6ddb110d23c3e892cf7d"
diff --git a/pyproject.toml b/pyproject.toml
index b6a6aea..609c406 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -10,6 +10,7 @@ readme = "README.md"
 python = "^3.10"
 datasets = "^2.10.1"
 transformers = "^4.27.1"
+torch = "^2.0.0"
 
 
 [tool.poetry.group.dev.dependencies]