ibm-granite/granitelib-core-r1.0

@@ -27,7 +27,8 @@ from transformers import AutoTokenizer, AutoModelForCausalLM
 from peft import PeftModel
 BASE_NAME = "ibm-granite/granite-4.0-micro"
-LORA_NAME = "path/to/uncertainty/lora/adapter"
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # Load model
@@ -35,7 +36,8 @@ tokenizer = AutoTokenizer.from_pretrained(BASE_NAME, padding_side="left", trust_
 model_base = AutoModelForCausalLM.from_pretrained(BASE_NAME, device_map="auto", torch_dtype=torch.bfloat16)
 model_uq = PeftModel.from_pretrained(
     AutoModelForCausalLM.from_pretrained(BASE_NAME, device_map="auto", torch_dtype=torch.bfloat16),
-    LORA_NAME,
 )
 question = "What is IBM Research?"

 from peft import PeftModel
 BASE_NAME = "ibm-granite/granite-4.0-micro"
+LORA_REPO = "ibm-granite/granitelib-core-r1.0"
+LORA_SUBFOLDER = "uncertainty/granite-4.0-micro/lora"
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # Load model
 model_base = AutoModelForCausalLM.from_pretrained(BASE_NAME, device_map="auto", torch_dtype=torch.bfloat16)
 model_uq = PeftModel.from_pretrained(
     AutoModelForCausalLM.from_pretrained(BASE_NAME, device_map="auto", torch_dtype=torch.bfloat16),
+    LORA_REPO,
+    subfolder=LORA_SUBFOLDER,
 )
 question = "What is IBM Research?"