
Commit bc14a70

[Convert] Fix DeepSeek-R1 convert issue. (#145)
1 parent: 83f531b

File tree: 3 files changed, +3 −2 lines


README.md (1 addition, 1 deletion)

````diff
@@ -171,7 +171,7 @@ xFasterTransformer supports a different model format from Huggingface, but it's
 1. Download the huggingface format model firstly.
 2. After that, convert the model into xFasterTransformer format by using model convert module in xfastertransformer. If output directory is not provided, converted model will be placed into `${HF_DATASET_DIR}-xft`.
 ```
-python -c 'import xfastertransformer as xft; xft.LlamaConvert().convert("${HF_DATASET_DIR}","${OUTPUT_DIR}")'
+python -c "import xfastertransformer as xft; xft.DeepSeekR1Convert().convert('${HF_DATASET_DIR}', '${OUTPUT_DIR}')"
 ```
 ***PS: Due to the potential compatibility issues between the model file and the `transformers` version, please select the appropriate `transformers` version.***
````
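Besides swapping `LlamaConvert` for `DeepSeekR1Convert`, the new command also inverts the outer quoting: with single outer quotes, a POSIX shell never expands `${HF_DATASET_DIR}`, so Python would receive the literal text rather than a path. A minimal sketch of that shell behavior via `subprocess` (the path `/data/model` is a made-up stand-in, not from the commit):

```python
import os
import subprocess

# Hypothetical dataset path, purely for illustration.
env = dict(os.environ, HF_DATASET_DIR="/data/model")

# Old form: single outer quotes keep the shell from expanding the variable,
# so Python receives the literal text "${HF_DATASET_DIR}".
old = subprocess.run(
    """python3 -c 'print("${HF_DATASET_DIR}")'""",
    shell=True, env=env, capture_output=True, text=True,
).stdout.strip()

# New form: double outer quotes let the shell expand the variable before
# Python ever sees the string.
new = subprocess.run(
    '''python3 -c "print('${HF_DATASET_DIR}')"''',
    shell=True, env=env, capture_output=True, text=True,
).stdout.strip()

print(old)  # ${HF_DATASET_DIR}
print(new)  # /data/model
```

The inner/outer quote characters must differ either way; the fix simply puts the shell-expandable double quotes on the outside.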

README_CN.md (1 addition, 1 deletion)

````diff
@@ -172,7 +172,7 @@ xFasterTransformer supports a model format different from Huggingface's, but compatible with Fa
 1. First, download the model in huggingface format.
 2. Then, convert the model into xFasterTransformer format using the model convert module in xfastertransformer. If no output directory is provided, the converted model is placed into `${HF_DATASET_DIR}-xft` by default.
 ```
-python -c 'import xfastertransformer as xft; xft.LlamaConvert().convert("${HF_DATASET_DIR}","${OUTPUT_DIR}")'
+python -c "import xfastertransformer as xft; xft.DeepSeekR1Convert().convert('${HF_DATASET_DIR}', '${OUTPUT_DIR}')"
 ```
 ***PS: Due to potential compatibility issues between the model file and the `transformers` version, please select the appropriate `transformers` version.***
````

src/xfastertransformer/tools/convert.py (1 addition, 0 deletions)

```diff
@@ -102,6 +102,7 @@ def map_np_dtype_to_torch(dtype: np.dtype):
         np.float32: [torch.float32, torch.float32],
         np.float16: [torch.float16, torch.float16],
         np.uint16: [torch.bfloat16, torch.uint16],
+        np.uint8: [torch.float8_e4m3fn, torch.uint8],
     }
     if dtype in MAPPING:
         return MAPPING[dtype]
```
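The hunk above extends a lookup table that pairs each NumPy storage dtype with target torch dtypes; since NumPy has no native bfloat16 or float8 dtype, those tensors arrive as raw `uint16`/`uint8` bytes. A hedged sketch of that mapping, with the torch dtypes written as strings purely so it runs without torch installed (the real code uses `torch.bfloat16`, `torch.float8_e4m3fn`, etc. directly):

```python
import numpy as np

# Each NumPy storage dtype maps to a pair [target torch dtype, view dtype].
MAPPING = {
    np.float32: ["torch.float32", "torch.float32"],
    np.float16: ["torch.float16", "torch.float16"],
    # bfloat16 has no native NumPy dtype, so it arrives as raw uint16 bytes.
    np.uint16: ["torch.bfloat16", "torch.uint16"],
    # The commit's addition: DeepSeek-R1 FP8 weights arrive as raw uint8 bytes.
    np.uint8: ["torch.float8_e4m3fn", "torch.uint8"],
}

def map_np_dtype_to_torch(dtype):
    if dtype in MAPPING:
        return MAPPING[dtype]
    raise ValueError(f"Unsupported numpy dtype: {dtype}")

print(map_np_dtype_to_torch(np.uint8))  # ['torch.float8_e4m3fn', 'torch.uint8']
```

Without the `np.uint8` entry, converting DeepSeek-R1 checkpoints (whose weights are stored in FP8 `e4m3` format) would fall through to the unsupported-dtype branch, which is the failure this commit fixes.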
