Imran1
/

Qwen2.5-72B-Instruct-FP8

Model card · Files and versions

Update inference.py

#6

by FINGU-AI - opened Oct 9, 2024

base: refs/heads/main

←

from: refs/pr/6

Discussion Files changed

Files changed (1) hide show

inference.py +11 -1

inference.py CHANGED Viewed

@@ -1,9 +1,19 @@
 import os
 import json
 import torch
 from vllm import LLM, SamplingParams
 from vllm.utils import random_uuid
-from typing import List, Dict
 # Function to format chat messages using Qwen's chat template
 def format_chat(messages: List[Dict[str, str]]) -> str:

 import os
 import json
+import subprocess
+import sys
 import torch
+from typing import List, Dict
+# Ensure vllm is installed
+try:
+    import vllm
+except ImportError:
+    subprocess.check_call([sys.executable, "-m", "pip", "install", "vllm"])
+# Import the necessary modules after installation
 from vllm import LLM, SamplingParams
 from vllm.utils import random_uuid
 # Function to format chat messages using Qwen's chat template
 def format_chat(messages: List[Dict[str, str]]) -> str: