From 0fe5014b1ff4562fe2da062b536d481da336010f Mon Sep 17 00:00:00 2001
From: Kirill <iam@python273.pw>
Date: Sat, 18 Mar 2023 23:49:21 +0300
Subject: [PATCH] Use pathlib (#711)

* Use pathlib in llama

* Use pathlib in stablediffusion
---
 examples/llama.py            | 23 ++++++++++-------------
 examples/stable_diffusion.py |  6 +++---
 2 files changed, 13 insertions(+), 16 deletions(-)

diff --git a/examples/llama.py b/examples/llama.py
index 52a8a49bc8..e55a7e5ae6 100755
--- a/examples/llama.py
+++ b/examples/llama.py
@@ -3,7 +3,7 @@
 #import typeguard.importhook
 #typeguard.importhook.install_import_hook('tinygrad')
 
-import os
+from pathlib import Path
 import sys, argparse, math, platform
 import numpy as np
 from tqdm import tqdm
@@ -165,18 +165,19 @@ class Transformer:
 
 # **** files and arguments ****
 
-TOKENIZER_FILENAME = os.path.join(os.path.dirname(os.path.abspath(__file__)), "../weights/LLaMA/tokenizer.model")
+WEIGHTS_DIR = Path(__file__).parent.parent / "weights/LLaMA/"
+TOKENIZER_FILENAME = WEIGHTS_DIR / "tokenizer.model"
 VOCAB_SIZE = 32000
 
 args_small = {"dim": 512, "multiple_of": 256, "n_heads": 8, "n_layers": 8, "norm_eps": 1e-05, "vocab_size": VOCAB_SIZE}
 
 args_7B = {"dim": 4096, "multiple_of": 256, "n_heads": 32, "n_layers": 32, "norm_eps": 1e-06, "vocab_size": VOCAB_SIZE}
-WEIGHTS_FILENAME = os.path.join(os.path.dirname(os.path.abspath(__file__)), "../weights/LLaMA/7B/consolidated.00.pth")
+WEIGHTS_7B_FILENAME = WEIGHTS_DIR / "7B/consolidated.00.pth"
 
 # TODO: make this model work
 args_13B = {"dim": 5120, "multiple_of": 256, "n_heads": 40, "n_layers": 40, "norm_eps": 1e-06, "vocab_size": VOCAB_SIZE}
-WEIGHTS0_FILENAME = os.path.join(os.path.dirname(os.path.abspath(__file__)), "../weights/LLaMA/13B/consolidated.00.pth")
-WEIGHTS1_FILENAME = os.path.join(os.path.dirname(os.path.abspath(__file__)), "../weights/LLaMA/13B/consolidated.01.pth")
+WEIGHTS_13B_0_FILENAME = WEIGHTS_DIR / "13B/consolidated.00.pth"
+WEIGHTS_13B_1_FILENAME = WEIGHTS_DIR / "13B/consolidated.01.pth"
 
 # **** helper functions ****
 
@@ -199,10 +200,9 @@ def sample(logits, temperature):
 
 if __name__ == "__main__":
   Tensor.no_grad = True
-
   print(f"using {Device.DEFAULT} backend")
   from sentencepiece import SentencePieceProcessor
-  sp_model = SentencePieceProcessor(model_file=TOKENIZER_FILENAME)
+  sp_model = SentencePieceProcessor(model_file=str(TOKENIZER_FILENAME))
   assert sp_model.vocab_size() == VOCAB_SIZE
 
   parser = argparse.ArgumentParser(description='Run LLaMA 7B in tinygrad', formatter_class=argparse.ArgumentDefaultsHelpFormatter)
@@ -225,8 +225,8 @@ if __name__ == "__main__":
   if args.large:
     model = Transformer(**args_13B)
     with Timing("loaded weights in ", lambda et_ns: f", {GlobalCounters.mem_used/1e9:.2f} GB loaded at {GlobalCounters.mem_used/et_ns:.2f} GB/s"):
-      weights0 = fake_torch_load_zipped(open(WEIGHTS0_FILENAME, "rb"), load_weights=getenv("WEIGHTS", 1))
-      weights1 = fake_torch_load_zipped(open(WEIGHTS1_FILENAME, "rb"), load_weights=getenv("WEIGHTS", 1))
+      weights0 = fake_torch_load_zipped(open(WEIGHTS_13B_0_FILENAME, "rb"), load_weights=getenv("WEIGHTS", 1))
+      weights1 = fake_torch_load_zipped(open(WEIGHTS_13B_1_FILENAME, "rb"), load_weights=getenv("WEIGHTS", 1))
     # eww, this makes a copy
     print("concatenating weights")
     from tqdm import tqdm
@@ -259,10 +259,7 @@ if __name__ == "__main__":
   else:
     model = Transformer(**args_7B)
     with Timing("loaded weights in ", lambda et_ns: f", {GlobalCounters.mem_used/1e9:.2f} GB loaded at {GlobalCounters.mem_used/et_ns:.2f} GB/s"):
-      weights = fake_torch_load_zipped(open(WEIGHTS_FILENAME, "rb"), load_weights=getenv("WEIGHTS", 1))
-
-    #from tinygrad.nn.optim import get_state_dict
-    #state_dict = get_state_dict(model)
+      weights = fake_torch_load_zipped(open(WEIGHTS_7B_FILENAME, "rb"), load_weights=getenv("WEIGHTS", 1))
 
     # assign weights (should be free)
     for k,v in weights.items():
diff --git a/examples/stable_diffusion.py b/examples/stable_diffusion.py
index 82d8faca59..d7fed82a33 100644
--- a/examples/stable_diffusion.py
+++ b/examples/stable_diffusion.py
@@ -1,7 +1,7 @@
 # https://arxiv.org/pdf/2112.10752.pdf
 # https://github.com/ekagra-ranjan/huggingface-blog/blob/main/stable_diffusion.md
 
-import os
+from pathlib import Path
 import gzip
 import argparse
 import math
@@ -466,7 +466,7 @@ class CLIPTextTransformer:
 # Clip tokenizer, taken from https://github.com/openai/CLIP/blob/main/clip/simple_tokenizer.py (MIT license)
 @lru_cache()
 def default_bpe():
-  return os.path.join(os.path.dirname(os.path.abspath(__file__)), "../weights/bpe_simple_vocab_16e6.txt.gz")
+  return Path(__file__).parent.parent / "weights/bpe_simple_vocab_16e6.txt.gz"
 
 def get_pairs(word):
   """Return set of symbol pairs in a word.
@@ -600,7 +600,7 @@ class StableDiffusion:
 # this is sd-v1-4.ckpt
 #FILENAME = "/Users/kafka/fun/mps/stable-diffusion/models/ldm/stable-diffusion-v1/model.ckpt"
 #FILENAME = "/home/kafka/model.ckpt"
-FILENAME = os.path.join(os.path.dirname(os.path.abspath(__file__)), "../weights/sd-v1-4.ckpt")
+FILENAME = Path(__file__).parent.parent / "weights/sd-v1-4.ckpt"
 
 if __name__ == "__main__":
   parser = argparse.ArgumentParser(description='Run Stable Diffusion', formatter_class=argparse.ArgumentDefaultsHelpFormatter)