{"id":68776,"date":"2026-01-30T18:09:13","date_gmt":"2026-01-30T10:09:13","guid":{"rendered":"https:\/\/www.wsisp.com\/helps\/68776.html"},"modified":"2026-01-30T18:09:13","modified_gmt":"2026-01-30T10:09:13","slug":"%e3%80%90%e4%bf%a1%e5%88%9b%e3%80%91%e5%8d%8e%e4%b8%ba%e6%98%87%e8%85%be%e5%a4%a7%e6%a8%a1%e5%9e%8b%e9%83%a8%e7%bd%b2","status":"publish","type":"post","link":"https:\/\/www.wsisp.com\/helps\/68776.html","title":{"rendered":"\u3010\u4fe1\u521b\u3011\u534e\u4e3a\u6607\u817e\u5927\u6a21\u578b\u90e8\u7f72"},"content":{"rendered":"<p><img decoding=\"async\" src=\"https:\/\/www.wsisp.com\/helps\/wp-content\/uploads\/2026\/01\/20260130100912-697c83481549d.png\" alt=\"\u5728\u8fd9\u91cc\u63d2\u5165\u56fe\u7247\u63cf\u8ff0\" \/><\/p>\n<h3>\u4e00\u3001\u7cfb\u7edf\u4e0e\u786c\u4ef6\u73af\u5883\u8bf4\u660e<\/h3>\n<table>\n<tr>\u6a21\u5757\u8bf4\u660e<\/tr>\n<tbody>\n<tr>\n<td>CPU<\/td>\n<td>\u9cb2\u9e4f 920 \/ 930 \u7cfb\u5217&#xff08;ARM64\u67b6\u6784&#xff09;<\/td>\n<\/tr>\n<tr>\n<td>GPU\/NPU<\/td>\n<td>\u534e\u4e3a\u6607\u817e 910B2 \u00d7 2&#xff08;\u652f\u6301BF16\u3001INT8\u91cf\u5316&#xff09;<\/td>\n<\/tr>\n<tr>\n<td>\u5185\u5b58<\/td>\n<td>\u2265 256GB<\/td>\n<\/tr>\n<tr>\n<td>\u5b58\u50a8<\/td>\n<td>\u2265 2TB SSD<\/td>\n<\/tr>\n<tr>\n<td>\u64cd\u4f5c\u7cfb\u7edf<\/td>\n<td>openEuler \/ \u9e92\u9e9f \/ \u7edf\u4fe1UOS&#xff08;\u56fd\u4ea7\u4fe1\u521bOS&#xff09;<\/td>\n<\/tr>\n<tr>\n<td>\u9a71\u52a8<\/td>\n<td>CANN \u2265 8.0&#xff1b;Ascend Toolkit \u2265 8.0<\/td>\n<\/tr>\n<tr>\n<td>\u6846\u67b6\u73af\u5883<\/td>\n<td>MindSpore \u2265 2.3&#xff1b;torch-npu \u2265 2.1&#xff08;\u517c\u5bb9PyTorch 2.1&#xff09;<\/td>\n<\/tr>\n<tr>\n<td>\u90e8\u7f72\u5de5\u5177<\/td>\n<td>XInference \u2265 0.12&#xff0c;Ascend ATC \u5de5\u5177<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<h3>\u4e8c\u3001\u6a21\u578b\u6765\u6e90\u4e0e\u57fa\u672c\u7ed3\u6784<\/h3>\n<table>\n<tr>\u6a21\u578b\u540d\u79f0\u6765\u6e90\u53c2\u6570\u91cf\u6846\u67b6\u5f53\u524d\u683c\u5f0f\u91cf\u5316\u7c7b\u578b\u7528\u9014<\/tr>\n<tbody>\n<tr>\n<td>Qwen3-32B-Base<\/td>\n<td>\u4ece\u963f\u91cc\u5df4\u5df4\u5b98\u65b9 \/ Hugging Face \u4e0b\u8f7d<\/td>\n<td>32B<\/td>\n<td>PyTorch<\/td>\n<td>.bin \/ .safetensors<\/td>\n<td>FP16 \/ BF16<\/td>\n<td>\u539f\u59cb\u9884\u8bad\u7ec3\u6a21\u578b<\/td>\n<\/tr>\n<tr>\n<td>Qwen3-32B-Finetuned<\/td>\n<td>\u5728\u6607\u817e910B2\u4e0a\u8fdb\u884c\u5fae\u8c03&#xff08;\u4f7f\u7528MindSpore\u6846\u67b6&#xff09;<\/td>\n<td>32B<\/td>\n<td>MindSpore<\/td>\n<td>.ckpt<\/td>\n<td>INT8 \/ BF16<\/td>\n<td>\u884c\u4e1a\u5b9a\u5236\u5fae\u8c03\u6a21\u578b<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<h3>\u4e09\u3001\u6a21\u578b\u683c\u5f0f\u8f6c\u6362\u6d41\u7a0b<\/h3>\n<p>\u6a21\u578b\u90e8\u7f72\u524d\u9700\u7edf\u4e00\u683c\u5f0f&#xff0c;\u6607\u817e\u5e73\u53f0\u63a8\u8350\u4f7f\u7528 MindIR \u6216 OM \u683c\u5f0f\u3002<\/p>\n<h4>1\ufe0f\u20e3 \u4ece PyTorch \u683c\u5f0f\u8f6c\u6362\u5230 MindIR \u683c\u5f0f<\/h4>\n<h5>\u65b9\u6cd5 1&#xff1a;\u901a\u8fc7 MindConverter<\/h5>\n<p>MindConverter \u662f\u6607\u817e\u5b98\u65b9\u63d0\u4f9b\u7684\u8de8\u6846\u67b6\u6a21\u578b\u8f6c\u6362\u5de5\u5177\u3002<\/p>\n<p>mindconverter &#8211;in_framework pytorch <span class=\"token punctuation\">\\\\<\/span><br \/>\n              &#8211;model_file \/models\/qwen32b\/pytorch_model.bin <span class=\"token punctuation\">\\\\<\/span><br \/>\n              &#8211;input_shape <span class=\"token string\">&#039;[1,1024]&#039;<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n              &#8211;output_file \/models\/qwen32b\/qwen32b.mindir<\/p>\n<h5>\u65b9\u6cd5 2&#xff1a;\u901a\u8fc7 ONNX \u4e2d\u8f6c<\/h5>\n<p>\u5982\u679cMindConverter\u8f6c\u6362\u5931\u8d25&#xff0c;\u53ef\u901a\u8fc7ONNX\u4f5c\u4e3a\u4e2d\u95f4\u5c42&#xff1a;<\/p>\n<p><span class=\"token comment\"># PyTorch -&gt; ONNX<\/span><br \/>\n<span class=\"token keyword\">import<\/span> torch<br \/>\ndummy_input <span class=\"token operator\">&#061;<\/span> torch<span class=\"token punctuation\">.<\/span>ones<span class=\"token punctuation\">(<\/span><span class=\"token number\">1<\/span><span class=\"token punctuation\">,<\/span> <span class=\"token number\">1024<\/span><span class=\"token punctuation\">,<\/span> dtype<span class=\"token operator\">&#061;<\/span>torch<span class=\"token punctuation\">.<\/span>int64<span class=\"token punctuation\">)<\/span><br \/>\ntorch<span class=\"token punctuation\">.<\/span>onnx<span class=\"token punctuation\">.<\/span>export<span class=\"token punctuation\">(<\/span>model<span class=\"token punctuation\">,<\/span> dummy_input<span class=\"token punctuation\">,<\/span> <span class=\"token string\">&#034;qwen32b.onnx&#034;<\/span><span class=\"token punctuation\">,<\/span> opset_version<span class=\"token operator\">&#061;<\/span><span class=\"token number\">17<\/span><span class=\"token punctuation\">)<\/span><\/p>\n<p><span class=\"token comment\"># ONNX -&gt; MindIR<\/span><br \/>\natc &#8211;model<span class=\"token operator\">&#061;<\/span>qwen32b.onnx <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;framework<span class=\"token operator\">&#061;<\/span><span class=\"token number\">5<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;output<span class=\"token operator\">&#061;<\/span>qwen32b_mindir <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;soc_version<span class=\"token operator\">&#061;<\/span>Ascend910B2<\/p>\n<h4>2\ufe0f\u20e3 MindIR \u2192 OM&#xff08;\u90e8\u7f72\u4f18\u5316\u683c\u5f0f&#xff09;<\/h4>\n<p>OM&#xff08;Offline Model&#xff09;\u662f\u6607\u817e\u82af\u7247\u7684\u79bb\u7ebf\u6267\u884c\u4f18\u5316\u683c\u5f0f&#xff0c;\u90e8\u7f72\u65f6\u52a0\u8f7d\u6027\u80fd\u66f4\u4f18\u3002<\/p>\n<p>atc &#8211;model<span class=\"token operator\">&#061;<\/span>qwen32b.mindir <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;framework<span class=\"token operator\">&#061;<\/span><span class=\"token number\">1<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;output<span class=\"token operator\">&#061;<\/span>qwen32b_om <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;input_format<span class=\"token operator\">&#061;<\/span>ND <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;input_shape<span class=\"token operator\">&#061;<\/span><span class=\"token string\">&#034;input_ids:1,1024&#034;<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;soc_version<span class=\"token operator\">&#061;<\/span>Ascend910B2 <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;precision_mode<span class=\"token operator\">&#061;<\/span>allow_mix_precision<\/p>\n<p>\u2699\ufe0f \u6ce8\u610f&#xff1a;<\/p>\n<ul>\n<li>soc_version \u5fc5\u987b\u4e0e\u6607\u817e\u82af\u7247\u578b\u53f7\u4e00\u81f4\u3002<\/li>\n<li>MindIR \u683c\u5f0f\u652f\u6301\u8bad\u7ec3\u548c\u90e8\u7f72&#xff1b;OM \u683c\u5f0f\u4ec5\u652f\u6301\u63a8\u7406\u3002<\/li>\n<\/ul>\n<h3>\u56db\u3001\u6a21\u578b\u90e8\u7f72\u65b9\u5f0f<\/h3>\n<p>\u6211\u4eec\u5e0c\u671b\u90e8\u7f72\u4e24\u4e2a\u6a21\u578b&#xff08;Base \u4e0e Finetuned&#xff09;&#xff0c;\u5e76\u53ef\u5728 XInference \u4e2d\u52a8\u6001\u5207\u6362\u3002<\/p>\n<h4>1\ufe0f\u20e3 \u73af\u5883\u76ee\u5f55\u7ed3\u6784<\/h4>\n<p>\/models\/<br \/>\n\u2502<br \/>\n\u251c\u2500\u2500 qwen32b_base\/<br \/>\n\u2502   \u251c\u2500\u2500 qwen32b_om.om<br \/>\n\u2502   \u2514\u2500\u2500 config.json<br \/>\n\u2502<br \/>\n\u2514\u2500\u2500 qwen32b_finetune\/<br \/>\n    \u251c\u2500\u2500 qwen32b_finetune_om.om<br \/>\n    \u2514\u2500\u2500 config.json<\/p>\n<h4>2\ufe0f\u20e3 \u542f\u52a8 XInference \u670d\u52a1<\/h4>\n<p><span class=\"token comment\"># \u542f\u52a8 Base \u6a21\u578b<\/span><br \/>\nxinf start &#8211;model Qwen3-32B-Base <span class=\"token punctuation\">\\\\<\/span><br \/>\n           &#8211;model-path \/models\/qwen32b_base <span class=\"token punctuation\">\\\\<\/span><br \/>\n           &#8211;device ascend <span class=\"token punctuation\">\\\\<\/span><br \/>\n           &#8211;precision bf16 <span class=\"token punctuation\">\\\\<\/span><br \/>\n           &#8211;port <span class=\"token number\">8081<\/span><\/p>\n<p><span class=\"token comment\"># \u542f\u52a8 Finetuned \u6a21\u578b<\/span><br \/>\nxinf start &#8211;model Qwen3-32B-Finetuned <span class=\"token punctuation\">\\\\<\/span><br \/>\n           &#8211;model-path \/models\/qwen32b_finetune <span class=\"token punctuation\">\\\\<\/span><br \/>\n           &#8211;device ascend <span class=\"token punctuation\">\\\\<\/span><br \/>\n           &#8211;precision int8 <span class=\"token punctuation\">\\\\<\/span><br \/>\n           &#8211;port <span class=\"token number\">8082<\/span><\/p>\n<p>\u2705 \u652f\u6301\u4f7f\u7528 Docker \u5bb9\u5668\u5316\u90e8\u7f72&#xff08;xinf ascend-runtime \u5b98\u65b9\u955c\u50cf&#xff09;<\/p>\n<h4>3\ufe0f\u20e3 \u6a21\u578b\u6ce8\u518c\u914d\u7f6e&#xff08;xinf.json&#xff09;<\/h4>\n<p><span class=\"token punctuation\">{<\/span><br \/>\n  <span class=\"token string-property property\">&#034;models&#034;<\/span><span class=\"token operator\">:<\/span> <span class=\"token punctuation\">[<\/span><br \/>\n    <span class=\"token punctuation\">{<\/span><br \/>\n      <span class=\"token string-property property\">&#034;name&#034;<\/span><span class=\"token operator\">:<\/span> <span class=\"token string\">&#034;Qwen3-32B-Base&#034;<\/span><span class=\"token punctuation\">,<\/span><br \/>\n      <span class=\"token string-property property\">&#034;path&#034;<\/span><span class=\"token operator\">:<\/span> <span class=\"token string\">&#034;\/models\/qwen32b_base\/qwen32b_om.om&#034;<\/span><span class=\"token punctuation\">,<\/span><br \/>\n      <span class=\"token string-property property\">&#034;device&#034;<\/span><span class=\"token operator\">:<\/span> <span class=\"token string\">&#034;ascend&#034;<\/span><span class=\"token punctuation\">,<\/span><br \/>\n      <span class=\"token string-property property\">&#034;port&#034;<\/span><span class=\"token operator\">:<\/span> <span class=\"token number\">8081<\/span><span class=\"token punctuation\">,<\/span><br \/>\n      <span class=\"token string-property property\">&#034;precision&#034;<\/span><span class=\"token operator\">:<\/span> <span class=\"token string\">&#034;bf16&#034;<\/span><br \/>\n    <span class=\"token punctuation\">}<\/span><span class=\"token punctuation\">,<\/span><br \/>\n    <span class=\"token punctuation\">{<\/span><br \/>\n      <span class=\"token string-property property\">&#034;name&#034;<\/span><span class=\"token operator\">:<\/span> <span class=\"token string\">&#034;Qwen3-32B-Finetuned&#034;<\/span><span class=\"token punctuation\">,<\/span><br \/>\n      <span class=\"token string-property property\">&#034;path&#034;<\/span><span class=\"token operator\">:<\/span> <span class=\"token string\">&#034;\/models\/qwen32b_finetune\/qwen32b_finetune_om.om&#034;<\/span><span class=\"token punctuation\">,<\/span><br \/>\n      <span class=\"token string-property property\">&#034;device&#034;<\/span><span class=\"token operator\">:<\/span> <span class=\"token string\">&#034;ascend&#034;<\/span><span class=\"token punctuation\">,<\/span><br \/>\n      <span class=\"token string-property property\">&#034;port&#034;<\/span><span class=\"token operator\">:<\/span> <span class=\"token number\">8082<\/span><span class=\"token punctuation\">,<\/span><br \/>\n      <span class=\"token string-property property\">&#034;precision&#034;<\/span><span class=\"token operator\">:<\/span> <span class=\"token string\">&#034;int8&#034;<\/span><br \/>\n    <span class=\"token punctuation\">}<\/span><br \/>\n  <span class=\"token punctuation\">]<\/span><br \/>\n<span class=\"token punctuation\">}<\/span><\/p>\n<h3>\u4e94\u3001XInference \u6a21\u578b\u5207\u6362\u4e0e\u8c03\u7528<\/h3>\n<h4>1\ufe0f\u20e3 \u6a21\u578b\u52a8\u6001\u5207\u6362&#xff08;REST API&#xff09;<\/h4>\n<p><span class=\"token function\">curl<\/span> -X POST http:\/\/localhost:8000\/api\/models\/select <span class=\"token punctuation\">\\\\<\/span><br \/>\n     -H <span class=\"token string\">&#034;Content-Type: application\/json&#034;<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n     -d <span class=\"token string\">&#039;{&#034;model_name&#034;: &#034;Qwen3-32B-Finetuned&#034;}&#039;<\/span><\/p>\n<p>\u5207\u6362\u56de\u539f\u59cb\u6a21\u578b&#xff1a;<\/p>\n<p><span class=\"token function\">curl<\/span> -X POST http:\/\/localhost:8000\/api\/models\/select <span class=\"token punctuation\">\\\\<\/span><br \/>\n     -d <span class=\"token string\">&#039;{&#034;model_name&#034;: &#034;Qwen3-32B-Base&#034;}&#039;<\/span><\/p>\n<h4>2\ufe0f\u20e3 \u63a8\u7406\u8c03\u7528\u793a\u4f8b&#xff08;Python&#xff09;<\/h4>\n<p><span class=\"token keyword\">import<\/span> requests<\/p>\n<p><span class=\"token keyword\">def<\/span> <span class=\"token function\">query_model<\/span><span class=\"token punctuation\">(<\/span>port<span class=\"token punctuation\">,<\/span> prompt<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n    url <span class=\"token operator\">&#061;<\/span> <span class=\"token string-interpolation\"><span class=\"token string\">f&#034;http:\/\/localhost:<\/span><span class=\"token interpolation\"><span class=\"token punctuation\">{<\/span>port<span class=\"token punctuation\">}<\/span><\/span><span class=\"token string\">\/v1\/completions&#034;<\/span><\/span><br \/>\n    payload <span class=\"token operator\">&#061;<\/span> <span class=\"token punctuation\">{<\/span><br \/>\n        <span class=\"token string\">&#034;prompt&#034;<\/span><span class=\"token punctuation\">:<\/span> prompt<span class=\"token punctuation\">,<\/span><br \/>\n        <span class=\"token string\">&#034;max_tokens&#034;<\/span><span class=\"token punctuation\">:<\/span> <span class=\"token number\">256<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        <span class=\"token string\">&#034;temperature&#034;<\/span><span class=\"token punctuation\">:<\/span> <span class=\"token number\">0.8<\/span><br \/>\n    <span class=\"token punctuation\">}<\/span><br \/>\n    headers <span class=\"token operator\">&#061;<\/span> <span class=\"token punctuation\">{<\/span><span class=\"token string\">&#034;Content-Type&#034;<\/span><span class=\"token punctuation\">:<\/span> <span class=\"token string\">&#034;application\/json&#034;<\/span><span class=\"token punctuation\">}<\/span><br \/>\n    response <span class=\"token operator\">&#061;<\/span> requests<span class=\"token punctuation\">.<\/span>post<span class=\"token punctuation\">(<\/span>url<span class=\"token punctuation\">,<\/span> headers<span class=\"token operator\">&#061;<\/span>headers<span class=\"token punctuation\">,<\/span> json<span class=\"token operator\">&#061;<\/span>payload<span class=\"token punctuation\">)<\/span><br \/>\n    <span class=\"token keyword\">return<\/span> response<span class=\"token punctuation\">.<\/span>json<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">[<\/span><span class=\"token string\">&#034;choices&#034;<\/span><span class=\"token punctuation\">]<\/span><span class=\"token punctuation\">[<\/span><span class=\"token number\">0<\/span><span class=\"token punctuation\">]<\/span><span class=\"token punctuation\">[<\/span><span class=\"token string\">&#034;text&#034;<\/span><span class=\"token punctuation\">]<\/span><\/p>\n<p><span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;Base\u6a21\u578b\u56de\u7b54&#xff1a;&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n<span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span>query_model<span class=\"token punctuation\">(<\/span><span class=\"token number\">8081<\/span><span class=\"token punctuation\">,<\/span> <span class=\"token string\">&#034;\u4ecb\u7ecd\u4e00\u4e0b\u9cb2\u9e4f920\u7684CPU\u67b6\u6784\u4f18\u52bf&#034;<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">)<\/span><\/p>\n<p><span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;\\\\nFinetuned\u6a21\u578b\u56de\u7b54&#xff1a;&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n<span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span>query_model<span class=\"token punctuation\">(<\/span><span class=\"token number\">8082<\/span><span class=\"token punctuation\">,<\/span> <span class=\"token string\">&#034;\u89e3\u91ca\u4e00\u4e0b\u4fe1\u521b\u751f\u6001\u4e0bAI\u7b97\u6cd5\u7684\u4f18\u52bf&#034;<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">)<\/span><\/p>\n<h3>\u516d\u3001\u6a21\u578b\u63a8\u7406\u6027\u80fd\u4e0e\u4f18\u5316<\/h3>\n<table>\n<tr>\u4f18\u5316\u624b\u6bb5\u8bf4\u660e\u6548\u679c<\/tr>\n<tbody>\n<tr>\n<td>INT8\u91cf\u5316<\/td>\n<td>\u5fae\u8c03\u6a21\u578b\u5728\u5bfc\u51fa\u65f6\u4f7f\u7528\u91cf\u5316\u611f\u77e5\u8bad\u7ec3&#xff08;QAT&#xff09;<\/td>\n<td>\u663e\u5b58\u964d\u4f4e\u7ea6 50%&#xff0c;\u901f\u5ea6\u63d0\u5347\u7ea6 1.6\u00d7<\/td>\n<\/tr>\n<tr>\n<td>\u53cc\u5361\u5e76\u884c\u63a8\u7406<\/td>\n<td>\u4f7f\u7528\u4e24\u5f20910B2\u5361\u5206\u522b\u90e8\u7f72\u4e24\u4e2a\u6a21\u578b<\/td>\n<td>\u5b9e\u73b0\u6a21\u578b\u5e76\u884c\u8c03\u7528<\/td>\n<\/tr>\n<tr>\n<td>Pipeline\u5207\u5206<\/td>\n<td>\u6a21\u578b\u524d\u5411\u4f20\u64ad\u5206\u6bb5\u6267\u884c<\/td>\n<td>\u9002\u5408\u663e\u5b58\u4e0d\u8db3\u60c5\u51b5<\/td>\n<\/tr>\n<tr>\n<td>XInference\u5f02\u6b65\u961f\u5217<\/td>\n<td>\u652f\u6301\u591a\u8bf7\u6c42\u5e76\u53d1\u5206\u53d1<\/td>\n<td>\u63d0\u5347\u541e\u5410\u91cf 2~3\u500d<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<h3>\u4e03\u3001\u5e38\u89c1\u95ee\u9898\u4e0e\u89e3\u51b3\u5efa\u8bae<\/h3>\n<table>\n<tr>\u95ee\u9898\u53ef\u80fd\u539f\u56e0\u89e3\u51b3\u65b9\u6848<\/tr>\n<tbody>\n<tr>\n<td>CANN\u4e0d\u652f\u6301\u8be5\u7b97\u5b50<\/td>\n<td>\u8f6c\u6362\u65f6ONNX\u7b97\u5b50\u4e0d\u517c\u5bb9<\/td>\n<td>\u5728atc\u547d\u4ee4\u4e2d\u52a0&#8211;customize_op \u6216\u4f7f\u7528MindSpore\u539f\u751f\u6a21\u578b<\/td>\n<\/tr>\n<tr>\n<td>\u5185\u5b58\u4e0d\u8db3<\/td>\n<td>\u6a21\u578b\u663e\u5b58\u5f00\u9500\u5927<\/td>\n<td>\u5f00\u542fINT8\u91cf\u5316\u6216\u5206\u5c42\u52a0\u8f7d<\/td>\n<\/tr>\n<tr>\n<td>XInference\u65e0\u6cd5\u52a0\u8f7d<\/td>\n<td>\u6a21\u578b\u8def\u5f84\u6216\u683c\u5f0f\u4e0d\u5339\u914d<\/td>\n<td>\u786e\u8ba4.om\u6587\u4ef6\u8def\u5f84\u4e0e\u914d\u7f6e\u6587\u4ef6\u4e00\u81f4<\/td>\n<\/tr>\n<tr>\n<td>\u8bf7\u6c42\u5ef6\u8fdf\u9ad8<\/td>\n<td>\u540c\u6b65\u963b\u585e<\/td>\n<td>\u4f7f\u7528\u5f02\u6b65\u8c03\u7528API\u6216\u591a\u8fdb\u7a0b\u90e8\u7f72<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<h3>\u516b\u3001\u603b\u7ed3<\/h3>\n<table>\n<tr>\u9879\u76ee\u63a8\u8350\u65b9\u6848\u8bf4\u660e<\/tr>\n<tbody>\n<tr>\n<td>\u6a21\u578b\u8bad\u7ec3\u6846\u67b6<\/td>\n<td>MindSpore&#xff08;\u6607\u817e\u539f\u751f&#xff09;<\/td>\n<td>\u5fae\u8c03\u9636\u6bb5\u6548\u7387\u9ad8<\/td>\n<\/tr>\n<tr>\n<td>\u6a21\u578b\u90e8\u7f72\u683c\u5f0f<\/td>\n<td>MindIR \/ OM<\/td>\n<td>\u539f\u751f\u652f\u6301\u6607\u817e\u63a8\u7406<\/td>\n<\/tr>\n<tr>\n<td>\u591a\u6a21\u578b\u8c03\u7528<\/td>\n<td>XInference \u52a8\u6001\u6ce8\u518c\u5207\u6362<\/td>\n<td>\u5feb\u901f\u5728Base\u4e0eFinetune\u6a21\u578b\u95f4\u5207\u6362<\/td>\n<\/tr>\n<tr>\n<td>\u6027\u80fd\u4f18\u5316<\/td>\n<td>INT8\u91cf\u5316 &#043; \u53cc\u5361\u5e76\u53d1 &#043; \u5f02\u6b65\u63a8\u7406<\/td>\n<td>\u6ee1\u8db3\u4fe1\u521b\u786c\u4ef6\u7ea6\u675f<\/td>\n<\/tr>\n<tr>\n<td>\u517c\u5bb9\u6027<\/td>\n<td>\u652f\u6301PyTorch\u3001MindSpore\u3001ONNX\u7edf\u4e00\u90e8\u7f72<\/td>\n<td>\u9002\u914d\u7075\u6d3b<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n","protected":false},"excerpt":{"rendered":"<p>\u4e00\u3001\u7cfb\u7edf\u4e0e\u786c\u4ef6\u73af\u5883\u8bf4\u660e\u6a21\u5757\u8bf4\u660eCPU\u9cb2\u9e4f 920 \/ 930 \u7cfb\u5217&#xff08;ARM64\u67b6\u6784&#xff09;GPU\/NPU\u534e\u4e3a\u6607\u817e 910B2 \u00d7 2&#xff08;\u652f\u6301BF16\u3001INT8\u91cf\u5316&#xff09;\u5185\u5b58\u2265 256GB\u5b58\u50a8\u2265 2TB SSD\u64cd\u4f5c\u7cfb\u7edfopenEuler \/ \u9e92\u9e9f \/ \u7edf\u4fe1UOS&#xff08;\u56fd\u4ea7\u4fe1\u521bOS&#xff09;\u9a71\u52a8CANN \u2265 8.0&#xff1b;Ascend Toolkit \u2265 8.0\u6846\u67b6\u73af\u5883MindSpore \u2265 2.3&amp;#xff1b<\/p>\n","protected":false},"author":2,"featured_media":68775,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1],"tags":[50,67,207,427],"topic":[],"class_list":["post-68776","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-server","tag-50","tag-67","tag-207","tag-427"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v20.3 - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>\u3010\u4fe1\u521b\u3011\u534e\u4e3a\u6607\u817e\u5927\u6a21\u578b\u90e8\u7f72 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.wsisp.com\/helps\/68776.html\" \/>\n<meta property=\"og:locale\" content=\"zh_CN\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"\u3010\u4fe1\u521b\u3011\u534e\u4e3a\u6607\u817e\u5927\u6a21\u578b\u90e8\u7f72 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\" \/>\n<meta property=\"og:description\" content=\"\u4e00\u3001\u7cfb\u7edf\u4e0e\u786c\u4ef6\u73af\u5883\u8bf4\u660e\u6a21\u5757\u8bf4\u660eCPU\u9cb2\u9e4f 920 \/ 930 \u7cfb\u5217&#xff08;ARM64\u67b6\u6784&#xff09;GPU\/NPU\u534e\u4e3a\u6607\u817e 910B2 \u00d7 2&#xff08;\u652f\u6301BF16\u3001INT8\u91cf\u5316&#xff09;\u5185\u5b58\u2265 256GB\u5b58\u50a8\u2265 2TB SSD\u64cd\u4f5c\u7cfb\u7edfopenEuler \/ \u9e92\u9e9f \/ \u7edf\u4fe1UOS&#xff08;\u56fd\u4ea7\u4fe1\u521bOS&#xff09;\u9a71\u52a8CANN \u2265 8.0&#xff1b;Ascend Toolkit \u2265 8.0\u6846\u67b6\u73af\u5883MindSpore \u2265 2.3&amp;#xff1b\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.wsisp.com\/helps\/68776.html\" \/>\n<meta property=\"og:site_name\" content=\"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\" \/>\n<meta property=\"article:published_time\" content=\"2026-01-30T10:09:13+00:00\" \/>\n<meta property=\"og:image\" content=\"https:\/\/www.wsisp.com\/helps\/wp-content\/uploads\/2026\/01\/20260130100912-697c83481549d.png\" \/>\n<meta name=\"author\" content=\"admin\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"\u4f5c\u8005\" \/>\n\t<meta name=\"twitter:data1\" content=\"admin\" \/>\n\t<meta name=\"twitter:label2\" content=\"\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4\" \/>\n\t<meta name=\"twitter:data2\" content=\"2 \u5206\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/68776.html\",\"url\":\"https:\/\/www.wsisp.com\/helps\/68776.html\",\"name\":\"\u3010\u4fe1\u521b\u3011\u534e\u4e3a\u6607\u817e\u5927\u6a21\u578b\u90e8\u7f72 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\",\"isPartOf\":{\"@id\":\"https:\/\/www.wsisp.com\/helps\/#website\"},\"datePublished\":\"2026-01-30T10:09:13+00:00\",\"dateModified\":\"2026-01-30T10:09:13+00:00\",\"author\":{\"@id\":\"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41\"},\"breadcrumb\":{\"@id\":\"https:\/\/www.wsisp.com\/helps\/68776.html#breadcrumb\"},\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/www.wsisp.com\/helps\/68776.html\"]}]},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/68776.html#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"\u9996\u9875\",\"item\":\"https:\/\/www.wsisp.com\/helps\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"\u3010\u4fe1\u521b\u3011\u534e\u4e3a\u6607\u817e\u5927\u6a21\u578b\u90e8\u7f72\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/#website\",\"url\":\"https:\/\/www.wsisp.com\/helps\/\",\"name\":\"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\",\"description\":\"\u9999\u6e2f\u670d\u52a1\u5668_\u9999\u6e2f\u4e91\u670d\u52a1\u5668\u8d44\u8baf_\u670d\u52a1\u5668\u5e2e\u52a9\u6587\u6863_\u670d\u52a1\u5668\u6559\u7a0b\",\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/www.wsisp.com\/helps\/?s={search_term_string}\"},\"query-input\":\"required name=search_term_string\"}],\"inLanguage\":\"zh-Hans\"},{\"@type\":\"Person\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41\",\"name\":\"admin\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/image\/\",\"url\":\"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery\",\"contentUrl\":\"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery\",\"caption\":\"admin\"},\"sameAs\":[\"http:\/\/wp.wsisp.com\"],\"url\":\"https:\/\/www.wsisp.com\/helps\/author\/admin\"}]}<\/script>\n<!-- \/ Yoast SEO plugin. -->","yoast_head_json":{"title":"\u3010\u4fe1\u521b\u3011\u534e\u4e3a\u6607\u817e\u5927\u6a21\u578b\u90e8\u7f72 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.wsisp.com\/helps\/68776.html","og_locale":"zh_CN","og_type":"article","og_title":"\u3010\u4fe1\u521b\u3011\u534e\u4e3a\u6607\u817e\u5927\u6a21\u578b\u90e8\u7f72 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","og_description":"\u4e00\u3001\u7cfb\u7edf\u4e0e\u786c\u4ef6\u73af\u5883\u8bf4\u660e\u6a21\u5757\u8bf4\u660eCPU\u9cb2\u9e4f 920 \/ 930 \u7cfb\u5217&#xff08;ARM64\u67b6\u6784&#xff09;GPU\/NPU\u534e\u4e3a\u6607\u817e 910B2 \u00d7 2&#xff08;\u652f\u6301BF16\u3001INT8\u91cf\u5316&#xff09;\u5185\u5b58\u2265 256GB\u5b58\u50a8\u2265 2TB SSD\u64cd\u4f5c\u7cfb\u7edfopenEuler \/ \u9e92\u9e9f \/ \u7edf\u4fe1UOS&#xff08;\u56fd\u4ea7\u4fe1\u521bOS&#xff09;\u9a71\u52a8CANN \u2265 8.0&#xff1b;Ascend Toolkit \u2265 8.0\u6846\u67b6\u73af\u5883MindSpore \u2265 2.3&amp;#xff1b","og_url":"https:\/\/www.wsisp.com\/helps\/68776.html","og_site_name":"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","article_published_time":"2026-01-30T10:09:13+00:00","og_image":[{"url":"https:\/\/www.wsisp.com\/helps\/wp-content\/uploads\/2026\/01\/20260130100912-697c83481549d.png"}],"author":"admin","twitter_card":"summary_large_image","twitter_misc":{"\u4f5c\u8005":"admin","\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4":"2 \u5206"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.wsisp.com\/helps\/68776.html","url":"https:\/\/www.wsisp.com\/helps\/68776.html","name":"\u3010\u4fe1\u521b\u3011\u534e\u4e3a\u6607\u817e\u5927\u6a21\u578b\u90e8\u7f72 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","isPartOf":{"@id":"https:\/\/www.wsisp.com\/helps\/#website"},"datePublished":"2026-01-30T10:09:13+00:00","dateModified":"2026-01-30T10:09:13+00:00","author":{"@id":"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41"},"breadcrumb":{"@id":"https:\/\/www.wsisp.com\/helps\/68776.html#breadcrumb"},"inLanguage":"zh-Hans","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.wsisp.com\/helps\/68776.html"]}]},{"@type":"BreadcrumbList","@id":"https:\/\/www.wsisp.com\/helps\/68776.html#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"\u9996\u9875","item":"https:\/\/www.wsisp.com\/helps"},{"@type":"ListItem","position":2,"name":"\u3010\u4fe1\u521b\u3011\u534e\u4e3a\u6607\u817e\u5927\u6a21\u578b\u90e8\u7f72"}]},{"@type":"WebSite","@id":"https:\/\/www.wsisp.com\/helps\/#website","url":"https:\/\/www.wsisp.com\/helps\/","name":"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","description":"\u9999\u6e2f\u670d\u52a1\u5668_\u9999\u6e2f\u4e91\u670d\u52a1\u5668\u8d44\u8baf_\u670d\u52a1\u5668\u5e2e\u52a9\u6587\u6863_\u670d\u52a1\u5668\u6559\u7a0b","potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/www.wsisp.com\/helps\/?s={search_term_string}"},"query-input":"required name=search_term_string"}],"inLanguage":"zh-Hans"},{"@type":"Person","@id":"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41","name":"admin","image":{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/image\/","url":"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery","contentUrl":"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery","caption":"admin"},"sameAs":["http:\/\/wp.wsisp.com"],"url":"https:\/\/www.wsisp.com\/helps\/author\/admin"}]}},"_links":{"self":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/posts\/68776","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/users\/2"}],"replies":[{"embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/comments?post=68776"}],"version-history":[{"count":0,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/posts\/68776\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/media\/68775"}],"wp:attachment":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/media?parent=68776"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/categories?post=68776"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/tags?post=68776"},{"taxonomy":"topic","embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/topic?post=68776"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}