Fixed the comments: get_model() now returns the model without calling .cuda()

cehongwang · cehongwang · commit 049b810f3260 · 2025-10-08T23:11:50.000Z
diff --git a/tools/llm/run_llm.py b/tools/llm/run_llm.py
@@ -68,7 +68,7 @@ def get_model(args):
     else:
         model = model.to(torch.float32)
 
-    return model.cuda()
+    return model
 
 
 def compile_torchtrt(model, input_ids, args):