Offline Inference Classification

Offline Inference Classification#

Source: examples/offline_inference_classification.py.

 1from vllm import LLM
 2
 3# Sample prompts.
 4prompts = [
 5    "Hello, my name is",
 6    "The president of the United States is",
 7    "The capital of France is",
 8    "The future of AI is",
 9]
10
11# Create an LLM.
12# You should pass task="classify" for classification models
13model = LLM(
14    model="jason9693/Qwen2.5-1.5B-apeach",
15    task="classify",
16    enforce_eager=True,
17)
18
19# Generate logits. The output is a list of ClassificationRequestOutputs.
20outputs = model.classify(prompts)
21
22# Print the outputs.
23for prompt, output in zip(prompts, outputs):
24    probs = output.outputs.probs
25    probs_trimmed = ((str(probs[:16])[:-1] +
26                      ", ...]") if len(probs) > 16 else probs)
27    print(f"Prompt: {prompt!r} | "
28          f"Class Probabilities: {probs_trimmed} (size={len(probs)})")