-
Notifications
You must be signed in to change notification settings - Fork 4.1k
/
tests.py
32 lines (23 loc) · 902 Bytes
/
tests.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
# Copyright (c) Sebastian Raschka under Apache License 2.0 (see LICENSE.txt).
# Source for "Build a Large Language Model From Scratch"
# - https://www.manning.com/books/build-a-large-language-model-from-scratch
# Code: https://github.com/rasbt/LLMs-from-scratch
# File for internal use (unit tests)
import os
import subprocess
import sys
from pathlib import Path
def test_pretraining():
    """Smoke-test ``pretraining_simple.py`` in debug mode.

    Steps:
      1. Write a small synthetic text file (the string "a b c d" repeated
         1000 times, with no separator between repetitions) to
         ``gutenberg/data/repeated_sequence.txt``. The path is relative to
         the current working directory.
      2. Run ``pretraining_simple.py --debug true`` as a subprocess with the
         same interpreter that is executing this test.
      3. Assert that the script's stdout contains
         "Maximum GPU memory allocated".

    NOTE(review): the data file is presumably what the script trains on;
    that is not visible from this file -- confirm against the script.
    """
    sequence = "a b c d"
    repetitions = 1000
    content = sequence * repetitions

    folder_path = Path("gutenberg") / "data"
    file_name = "repeated_sequence.txt"

    os.makedirs(folder_path, exist_ok=True)
    with open(folder_path / file_name, "w", encoding="utf-8") as file:
        file.write(content)

    # sys.executable guarantees the child runs under the same interpreter
    # (and therefore the same virtualenv) as the test runner; a bare
    # "python" may resolve to another installation or not exist at all.
    result = subprocess.run(
        [sys.executable, "pretraining_simple.py", "--debug", "true"],
        capture_output=True, text=True
    )
    print(result.stdout)

    # stderr is captured above, so surface it on failure; otherwise a crash
    # in the script shows up only as a missing substring.
    assert "Maximum GPU memory allocated" in result.stdout, (
        f"expected marker not found in stdout "
        f"(exit code {result.returncode}); stderr:\n{result.stderr}"
    )