Add tools to profile model forward passes to see what to turn into kernels

(cherry picked from commit 6db5b126b6)
2026-04-21 13:37:39 +00:00 · 2024-02-12 22:31:05 +00:00 · 2024-02-12 22:31:05 +00:00 · 12898b5bef
commit 12898b5bef
parent 3ab282fd40
1 changed files with 27 additions and 0 deletions
--- a/tests/profiles/profile_phi2.py
+++ b/tests/profiles/profile_phi2.py
@ -0,0 +1,27 @@
+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
+
+from unsloth.kernels.utils import profile_generate_method
+
+torch.set_default_device("cuda")
+
+model = AutoModelForCausalLM.from_pretrained("microsoft/phi-2", torch_dtype="auto", trust_remote_code=True)
+tokenizer = AutoTokenizer.from_pretrained("microsoft/phi-2", trust_remote_code=True)
+
+inputs = tokenizer('''def print_prime(n):
+   """
+   Print all primes between 1 and n
+   """''', return_tensors="pt", return_attention_mask=False)
+
+# Arguments handed to profile_generate_method together with the model.
+generate_args = {
+    **inputs,  # unpack the tokenizer output (requested above without an attention mask)
+    "max_new_tokens": 100,
+    "do_sample": True
+}
+
+# The model and tokenizer used here are the ones loaded at the top of this script.
+
+# Run profile_generate_method on the model with generate_args; the result is kept in `prof`.
+prof = profile_generate_method(model, generate_args)
+