Addressed review comments: get_model in tools/llm/run_llm.py now returns the model without calling .cuda()

cehongwang · cehongwang · commit 92f62f8a58ce · 2025-10-07T21:01:57.000Z
diff --git a/tools/llm/run_llm.py b/tools/llm/run_llm.py
@@ -71,7 +71,7 @@ def get_model(args):
     else:
         model = model.to(torch.float32)
 
-    return model.cuda()
+    return model
 
 
 def compile_torchtrt(model, input_ids, args):