diff --git a/src/llamacpp_utils.py b/src/llamacpp_utils.py
deleted file mode 100644
index 2026a9dd..00000000
--- a/src/llamacpp_utils.py
+++ /dev/null
@@ -1,31 +0,0 @@
-from llama_cpp import Llama
-
-
-def tokenize(llama, prompt):
-    return llama.tokenize(bytes(prompt, "utf-8"))
-
-def count_tokens(llama,prompt):
-    return len(tokenize(llama,prompt)) + 5
-
-def clip_history(llama, prompt, history, n_ctx, max_tokens):
-    prompt_len = count_tokens(llama, prompt)
-    history_len = sum([count_tokens(llama, x["content"]) for x in history])
-    input_len = prompt_len + history_len
-    print(input_len)
-    while input_len >= n_ctx-max_tokens:
-        print("Clipping")
-        history.pop(1)
-        history_len = sum([count_tokens(llama, x["content"]) for x in history])
-        input_len = history_len + prompt_len
-        print(input_len)
-    return history
-
-def chunk_tokens(llm, prompt, chunk_size):
-    tokens = tokenize(llm, prompt)
-    num_tokens = count_tokens(llm, prompt)
-    chunks = []
-    for i in range((num_tokens//chunk_size)+1):
-        chunk = str(llm.detokenize(tokens[:chunk_size]),"utf-8")
-        chunks.append(chunk)
-        tokens = tokens[chunk_size:]
-    return chunks
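
Note: if the chunking helper is still needed elsewhere, below is a minimal sketch of a replacement, not the project's own code. It sizes the loop from the actual token list instead of count_tokens, whose +5 padding made the chunk count disagree with the real token length and could emit a trailing empty chunk. It assumes the llama-cpp-python API (Llama.tokenize takes bytes, Llama.detokenize returns bytes) and is untested against this repo.

from llama_cpp import Llama


def chunk_tokens(llama: Llama, text: str, chunk_size: int) -> list[str]:
    # llama-cpp-python tokenizes bytes, not str.
    tokens = llama.tokenize(text.encode("utf-8"))
    chunks = []
    for i in range(0, len(tokens), chunk_size):
        # detokenize returns bytes; a chunk boundary can split a multi-byte
        # UTF-8 sequence, so decode defensively rather than raising.
        piece = llama.detokenize(tokens[i : i + chunk_size])
        chunks.append(piece.decode("utf-8", errors="replace"))
    return chunks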