"""Helpers for loading a causal language model and generating text from a prompt."""

from transformers import AutoTokenizer, AutoModelForCausalLM
import torch


def load_model(model_name: str = "bigcode/starcoder"):
    """Load a tokenizer and causal LM and place the model on a device.

    Args:
        model_name: Identifier passed to ``from_pretrained`` for both the
            tokenizer and the model. Defaults to ``"bigcode/starcoder"``.

    Returns:
        A ``(tokenizer, model, device)`` tuple, where ``device`` is the string
        ``"cuda"`` when ``torch.cuda.is_available()`` is true and ``"cpu"``
        otherwise.
    """
    tokenizer = AutoTokenizer.from_pretrained(model_name)
    # NOTE(review): trust_remote_code=True allows code shipped with the
    # checkpoint to run locally -- confirm this is required for the model used.
    model = AutoModelForCausalLM.from_pretrained(
        model_name, trust_remote_code=True
    )
    model.eval()

    device = "cuda" if torch.cuda.is_available() else "cpu"
    model.to(device)
    return tokenizer, model, device


def generate_explanation(
    prompt,
    tokenizer,
    model,
    device,
    *,
    max_new_tokens: int = 512,
    temperature: float = 0.7,
):
    """Generate text from ``prompt`` and return it decoded as a string.

    Args:
        prompt: Text to tokenize and feed to the model.
        tokenizer: Tokenizer used to encode the prompt and decode the output.
        model: Model exposing ``generate``.
        device: Device the encoded inputs are moved to; it should match the
            device the model lives on.
        max_new_tokens: Upper bound on newly generated tokens.
        temperature: Sampling temperature. When it is a positive number,
            sampling is enabled explicitly so the value takes effect; when it
            is ``None`` or not positive, no sampling arguments are passed and
            the library's default decoding is used.

    Returns:
        The first generated sequence decoded with special tokens skipped.
        Presumably this includes the prompt text, since the full output
        sequence is decoded -- verify against the model in use.
    """
    inputs = tokenizer(prompt, return_tensors="pt").to(device)

    generation_kwargs = {"max_new_tokens": max_new_tokens}
    if temperature is not None and temperature > 0:
        # temperature only influences decoding when sampling is switched on;
        # without do_sample=True the value is ignored by generate().
        generation_kwargs["do_sample"] = True
        generation_kwargs["temperature"] = temperature

    output = model.generate(**inputs, **generation_kwargs)
    return tokenizer.decode(output[0], skip_special_tokens=True)