From cfe1baaa24e6154b9c8162f6bbce71da91c02079 Mon Sep 17 00:00:00 2001
From: Michael Goin
Date: Fri, 12 Apr 2024 12:18:57 -0600
Subject: [PATCH] Update README.md

---
 src/deepsparse/transformers/README.md | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/src/deepsparse/transformers/README.md b/src/deepsparse/transformers/README.md
index f1e38aee85..9630086df9 100644
--- a/src/deepsparse/transformers/README.md
+++ b/src/deepsparse/transformers/README.md
@@ -151,9 +151,12 @@ https://sparsezoo.neuralmagic.com/?useCase=text_generation)
 ```python
 from deepsparse import Pipeline
 
-opt_pipeline = Pipeline.create(task="opt", model_path="zoo:opt-1.3b-opt_pretrain-quantW8A8")
+llama_pipeline = Pipeline.create(
+    task="text-generation",
+    model_path="zoo:llama2-7b-ultrachat200k_llama2_pretrain-pruned50_quantized"
+)
 
-inference = opt_pipeline("Who is the president of the United States?")
+inference = llama_pipeline("Who is the president of the United States?")
 >> 'The president of the United States is the head of the executive branch of government...'
 ```
 
@@ -163,7 +166,7 @@ Spinning up:
 ```bash
 deepsparse.server \
     --task text-generation \
-    --model_path zoo:opt-1.3b-opt_pretrain-pruned50_quantW8A8
+    --model_path zoo:llama2-7b-ultrachat200k_llama2_pretrain-pruned50_quantized
 ```
 
 Making a request: