[Bugfix] Set enable_prefix_caching=True in prefix caching example (#3703)

This commit is contained in:
Woosuk Kwon
2024-03-28 16:26:30 -07:00
committed by GitHub
parent cb40b3ab6b
commit c0935c96d3

View File

@@ -22,7 +22,7 @@ prompts = [
 sampling_params = SamplingParams(temperature=0.0)
 # Create an LLM.
-llm = LLM(model="facebook/opt-125m")
+llm = LLM(model="facebook/opt-125m", enable_prefix_caching=True)
 generating_prompts = [prefix + prompt for prompt in prompts]