Intel
/

DeepSeek-R1-0528-Qwen3-8B-int4-AutoRound

4-bit precision

Model card · Files and versions

wenhuach committed on Jul 25

Commit

7dc248b

·

verified ·

1 Parent(s): 1b14e5b

Update README.md

Files changed (1) hide show

README.md +2 -2

README.md CHANGED Viewed

@@ -21,7 +21,7 @@ Please follow the license of the original model.
 ~~~python
 from transformers import AutoModelForCausalLM, AutoTokenizer
-quantized_model_dir = "Intel/DeepSeek-R1-0528-Qwen3-8B-int4-AutoRound-gptq-inc"
 model = AutoModelForCausalLM.from_pretrained(
     quantized_model_dir,
@@ -211,7 +211,7 @@ prompts = [
     "Hello, my name is",
 ]
 sampling_params = SamplingParams(temperature=0.8, top_p=0.95)  ##change this to match official usage
-model_name = "Intel/DeepSeek-R1-0528-Qwen3-8B-int4-AutoRound-gptq-inc"
 llm = LLM(model=model_name, tensor_parallel_size=1)
 outputs = llm.generate(prompts, sampling_params)

 ~~~python
 from transformers import AutoModelForCausalLM, AutoTokenizer
+quantized_model_dir = "Intel/DeepSeek-R1-0528-Qwen3-8B-int4-AutoRound"
 model = AutoModelForCausalLM.from_pretrained(
     quantized_model_dir,
     "Hello, my name is",
 ]
 sampling_params = SamplingParams(temperature=0.8, top_p=0.95)  ##change this to match official usage
+model_name = "Intel/DeepSeek-R1-0528-Qwen3-8B-int4-AutoRound"
 llm = LLM(model=model_name, tensor_parallel_size=1)
 outputs = llm.generate(prompts, sampling_params)