{"id":64644,"date":"2026-01-23T20:56:42","date_gmt":"2026-01-23T12:56:42","guid":{"rendered":"https:\/\/www.wsisp.com\/helps\/64644.html"},"modified":"2026-01-23T20:56:42","modified_gmt":"2026-01-23T12:56:42","slug":"pd%e5%88%86%e7%a6%bb%e9%83%a8%e7%bd%b2%ef%bc%9a%e5%9f%ba%e4%ba%8eatlas-800t-a3%e6%9c%8d%e5%8a%a1%e5%99%a8sglang-1p2d%e9%83%a8%e7%bd%b2qwen3-235b%e6%8c%87%e5%8d%97","status":"publish","type":"post","link":"https:\/\/www.wsisp.com\/helps\/64644.html","title":{"rendered":"PD\u5206\u79bb\u90e8\u7f72\uff1a\u57fa\u4e8eAtlas 800T A3\u670d\u52a1\u5668+SGLang 1P2D\u90e8\u7f72Qwen3-235B\u6307\u5357"},"content":{"rendered":"<p>\u4f5c\u8005&#xff1a;\u6607\u817e\u5b9e\u6218\u6d3e Sglang\u77e5\u8bc6\u5730\u56fe&#xff1a; https:\/\/blog.csdn.net\/weixin_41406651\/article\/details\/156754353?spm&#061;1001.2014.3001.5502<\/p>\n<h3>\u80cc\u666f\u6982\u8ff0<\/h3>\n<p>Qwen3-235B\u6a21\u578b\u7528Atlas 800I A3\u6216Atlas 800T A3\u5747\u53ef\u90e8\u7f72&#xff0c;\u672c\u6587\u6863\u4ee5Atlas 800T A3\u4e3a\u4f8b&#xff0c;\u8bb0\u5f55\u4e86\u4f7f\u7528SGLang\u6846\u67b6\u90e8\u7f72Qwen3-235B\u6a21\u578b\u76841P2D&#xff08;\u4e00\u4e2aPrefill\u8282\u70b9\u548c\u4e24\u4e2aDecode\u8282\u70b9&#xff09;\u914d\u7f6e\u65b9\u6848\u3002\u8be5\u914d\u7f6e\u9488\u5bf9\u5927\u89c4\u6a21\u8bed\u8a00\u6a21\u578b\u63a8\u7406\u573a\u666f\u8fdb\u884c\u4e86\u4f18\u5316&#xff0c;\u7279\u522b\u9002\u7528\u4e8e\u9700\u8981\u9ad8\u541e\u5410\u91cf\u7684\u751f\u4ea7\u73af\u5883\u3002<\/p>\n<h3>1. 
\u7248\u672c\u4e0e\u73af\u5883\u914d\u7f6e<\/h3>\n<ul>\n<li>\u673a\u5668\u578b\u53f7&#xff1a; Atlas 800T A3 <img decoding=\"async\" src=\"https:\/\/www.wsisp.com\/helps\/wp-content\/uploads\/2026\/01\/20260123125641-697370096aad5.png\" alt=\"\u5728\u8fd9\u91cc\u63d2\u5165\u56fe\u7247\u63cf\u8ff0\" \/><\/li>\n<li>Cann\u7248\u672c&#xff1a; <img decoding=\"async\" src=\"https:\/\/www.wsisp.com\/helps\/wp-content\/uploads\/2026\/01\/20260123125641-6973700978d1e.png\" alt=\"\u5728\u8fd9\u91cc\u63d2\u5165\u56fe\u7247\u63cf\u8ff0\" \/> 8.2.RC1<\/li>\n<li>Sglang\u5206\u652f&#xff08;\u6b64\u5206\u652f\u6709\u522b\u4e8e\u4e3b\u5e72&#xff0c;\u662f\u5f00\u53d1\u4e2d\u7684\u5206\u652f\u6682\u672a\u5408\u5165 &amp; \u53ea\u6709\u5bf9qwen\u7cfb\u5217\u7684\u4f18\u5316&#xff09;<br \/>\n<span class=\"token function\">git<\/span> clone https:\/\/github.com\/ping1jing2\/sglang.git<br \/>\n<span class=\"token builtin class-name\">cd<\/span> sglang<br \/>\n<span class=\"token function\">git<\/span> checkout -b main_qwen origin\/main_qwen\n <\/li>\n<li>Docker\u955c\u50cf\u7248\u672c&#xff1a;<br \/>\n <span class=\"token comment\"># docker.io<\/span><br \/>\n <span class=\"token function\">docker<\/span> pull lmsysorg\/sglang:main-cann8.3.rc1-910b  <span class=\"token comment\"># a2<\/span><br \/>\n <span class=\"token function\">docker<\/span> pull lmsysorg\/sglang:main-cann8.3.rc1-a3  <span class=\"token comment\"># a3<\/span><br \/>\n <span class=\"token comment\"># \u56fd\u5185\u955c\u50cf\u7ad9<\/span><br \/>\n <span class=\"token function\">docker<\/span> pull swr.cn-southwest-2.myhuaweicloud.com\/base_image\/dockerhub\/lmsysorg\/sglang:main-cann8.3.rc1-910b  <span class=\"token comment\"># a2<\/span><br \/>\n <span class=\"token function\">docker<\/span> pull swr.cn-southwest-2.myhuaweicloud.com\/base_image\/dockerhub\/lmsysorg\/sglang:main-cann8.3.rc1-a3  <span class=\"token comment\"># a3<\/span><br \/>\n <\/li>\n<li>triton-ascend &amp; 
torch_npu\u66f4\u65b0&#xff1a;https:\/\/wiki.huawei.com\/domains\/119266\/wiki\/243400\/WIKI202511259151404?title&#061;_fde87425<\/li>\n<li>sgl-kernel-npu\u9700\u8981\u624b\u52a8\u7f16\u8bd1&#xff1a;<br \/>\n<span class=\"token function\">git<\/span> clone https:\/\/github.com\/sgl-project\/sgl-kernel-npu<br \/>\n<span class=\"token builtin class-name\">cd<\/span> sgl-kernel-npu<br \/>\n<span class=\"token function\">bash<\/span> build.sh<br \/>\npip <span class=\"token function\">install<\/span> output\/sgl_kernel_npu*.whl\n <\/li>\n<li>set_env.sh \u6ce8\u610f&#xff1a;\u542f\u52a8router\u65f6&#xff0c;\u64cd\u4f5c\u524d\u624b\u52a8 source \/usr\/local\/Ascend\/ascend-toolkit\/set_env.sh<br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">LD_LIBRARY_PATH<\/span><span class=\"token operator\">&#061;<\/span>\/usr\/local\/Ascend\/driver\/lib64:\/usr\/local\/Ascend\/driver\/lib64\/common:\/usr\/local\/Ascend\/driver\/lib64\/driver:<span class=\"token variable\">$LD_LIBRARY_PATH<\/span><br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">ASCEND_TOOLKIT_HOME<\/span><span class=\"token operator\">&#061;<\/span>\/usr\/local\/Ascend\/ascend-toolkit\/latest<br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">LD_LIBRARY_PATH<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/lib64:<span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/lib64\/plugin\/opskernel:<span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/lib64\/plugin\/nnengine:<span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/opp\/built-in\/op_impl\/ai_core\/tbe\/op_tiling\/lib\/linux\/<span class=\"token variable\"><span class=\"token variable\">$(<\/span>arch<span class=\"token variable\">)<\/span><\/span><span class=\"token builtin class-name\">:<\/span><span class=\"token 
variable\">$LD_LIBRARY_PATH<\/span><br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">LD_LIBRARY_PATH<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/tools\/aml\/lib64:<span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/tools\/aml\/lib64\/plugin:<span class=\"token variable\">$LD_LIBRARY_PATH<\/span><br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">PYTHONPATH<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/python\/site-packages:<span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/opp\/built-in\/op_impl\/ai_core\/tbe:<span class=\"token variable\">$PYTHONPATH<\/span><br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\"><span class=\"token environment constant\">PATH<\/span><\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/bin:<span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/compiler\/ccec_compiler\/bin:<span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/tools\/ccec_compiler\/bin:<span class=\"token environment constant\">$PATH<\/span><br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">ASCEND_AICPU_PATH<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span><br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">ASCEND_OPP_PATH<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/opp<br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">TOOLCHAIN_HOME<\/span><span class=\"token 
operator\">&#061;<\/span><span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\/toolkit<br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">ASCEND_HOME_PATH<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\">${ASCEND_TOOLKIT_HOME}<\/span>\u200b\n <\/li>\n<\/ul>\n<h3>2 \u670d\u52a1\u542f\u52a8\u811a\u672c<\/h3>\n<h4>\u670d\u52a1\u542f\u52a8\u914d\u7f6e<\/h4>\n<p>\u4ee5\u4e0b\u811a\u672c\u652f\u6301P\u8282\u70b9\u3001D\u8282\u70b9\u548csgl-router\u5171\u7528&#xff0c;\u53ea\u9700\u4fee\u6539P\u8282\u70b9\u3001D\u8282\u70b9\u76f8\u5173\u53c2\u6570\u5373\u53ef\u3002<\/p>\n<p><span class=\"token comment\"># 235b_run.sh<\/span><br \/>\n<span class=\"token comment\"># docker exec -it sglang_perf_b150 bash<\/span><br \/>\n<span class=\"token function\">pkill<\/span> -9 python <span class=\"token operator\">|<\/span> <span class=\"token function\">pkill<\/span> -9 sglang<br \/>\n<span class=\"token function\">pkill<\/span> -9 sglang<br \/>\n<span class=\"token builtin class-name\">echo<\/span> performance <span class=\"token operator\">|<\/span> <span class=\"token function\">tee<\/span> \/sys\/devices\/system\/cpu\/cpu*\/cpufreq\/scaling_governor<br \/>\nsysctl -w vm.swappiness<span class=\"token operator\">&#061;<\/span><span class=\"token number\">0<\/span><br \/>\nsysctl -w kernel.numa_balancing<span class=\"token operator\">&#061;<\/span><span class=\"token number\">0<\/span><br \/>\nsysctl -w kernel.sched_migration_cost_ns<span class=\"token operator\">&#061;<\/span><span class=\"token number\">50000<\/span><\/p>\n<p><span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">SGLANG_SET_CPU_AFFINITY<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">1<\/span><br \/>\n<span class=\"token comment\"># \u8bbe\u7f6ePYTHONPATH<\/span><\/p>\n<p><span class=\"token builtin class-name\">cd<\/span> 
\/home\/sglang_ascend<br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">PYTHONPATH<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\">${<span class=\"token environment constant\">PWD<\/span>}<\/span>\/python:<span class=\"token variable\">$PYTHONPATH<\/span><br \/>\n<span class=\"token builtin class-name\">unset<\/span> https_proxy<br \/>\n<span class=\"token builtin class-name\">unset<\/span> http_proxy<br \/>\n<span class=\"token builtin class-name\">unset<\/span> HTTPS_PROXY<br \/>\n<span class=\"token builtin class-name\">unset<\/span> HTTP_PROXY<br \/>\n<span class=\"token builtin class-name\">unset<\/span> ASCEND_LAUNCH_BLOCKING<\/p>\n<p><span class=\"token builtin class-name\">source<\/span> \/usr\/local\/Ascend\/ascend-toolkit\/latest\/opp\/vendors\/customize\/bin\/set_env.bash<br \/>\n<span class=\"token comment\">#export SGLANG_EXPERT_DISTRIBUTION_RECORDER_DIR&#061;\/home\/\/\/sglang_ascend_1111\/sglang_ascend\/hot_map<\/span><br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">PYTORCH_NPU_ALLOC_CONF<\/span><span class=\"token operator\">&#061;<\/span>expandable_segments:True<\/p>\n<p><span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">SGLANG_DEEPEP_NUM_MAX_DISPATCH_TOKENS_PER_RANK<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">16<\/span><\/p>\n<p><span class=\"token assign-left variable\">MODEL_PATH<\/span><span class=\"token operator\">&#061;<\/span>\/mnt\/share\/weights\/Qwen3-235B-A22B-W8A8<br \/>\n<span class=\"token comment\"># pd\u4f20\u8f93, IP\u8bbe\u7f6e\u4e3ap\u8282\u70b9\u9996\u8282\u70b9<\/span><br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">ASCEND_MF_STORE_URL<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token 
string\">&#034;tcp:\/\/x.x.x.x:24667&#034;<\/span><br \/>\n<span class=\"token comment\"># p\u8282\u70b9IP<\/span><br \/>\n<span class=\"token assign-left variable\">P_IP<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token punctuation\">(<\/span><span class=\"token string\">&#039;x.x.x.x&#039;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n<span class=\"token comment\"># D\u8282\u70b9IP<\/span><br \/>\n<span class=\"token comment\">#D_IP&#061;(&#039;x.x.x.x&#039;)<\/span><br \/>\n<span class=\"token assign-left variable\">D_IP<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token punctuation\">(<\/span><span class=\"token string\">&#039;x.x.x.x&#039;<\/span> <span class=\"token string\">&#039;x.x.x.x&#039;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n<span class=\"token comment\">#export SGLANG_ENABLE_TORCH_COMPILE&#061;1<\/span><br \/>\n<span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">SGLANG_DISAGGREGATION_BOOTSTRAP_TIMEOUT<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">600<\/span><\/p>\n<p><span class=\"token assign-left variable\">LOCAL_HOST1<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\"><span class=\"token variable\">&#096;<\/span><span class=\"token function\">hostname<\/span> -I<span class=\"token operator\">|<\/span><span class=\"token function\">awk<\/span> -F <span class=\"token string\">&#034; &#034;<\/span> <span class=\"token string\">&#039;{print$1}&#039;<\/span><span class=\"token variable\">&#096;<\/span><\/span><br \/>\n<span class=\"token assign-left variable\">LOCAL_HOST2<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\"><span class=\"token variable\">&#096;<\/span><span class=\"token function\">hostname<\/span> -I<span class=\"token operator\">|<\/span><span class=\"token function\">awk<\/span> -F <span class=\"token string\">&#034; 
&#034;<\/span> <span class=\"token string\">&#039;{print$2}&#039;<\/span><span class=\"token variable\">&#096;<\/span><\/span><\/p>\n<p><span class=\"token builtin class-name\">echo<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">${LOCAL_HOST1}<\/span>&#034;<\/span><br \/>\n<span class=\"token builtin class-name\">echo<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">${LOCAL_HOST2}<\/span>&#034;<\/span><\/p>\n<p><span class=\"token keyword\">for<\/span> <span class=\"token for-or-select variable\">i<\/span> <span class=\"token keyword\">in<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">${<span class=\"token operator\">!<\/span>P_IP<span class=\"token punctuation\">[<\/span>&#064;<span class=\"token punctuation\">]<\/span>}<\/span>&#034;<\/span><span class=\"token punctuation\">;<\/span><br \/>\n<span class=\"token keyword\">do<\/span><br \/>\n    <span class=\"token keyword\">if<\/span> <span class=\"token punctuation\">[<\/span><span class=\"token punctuation\">[<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">$LOCAL_HOST1<\/span>&#034;<\/span> <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">${P_IP<span class=\"token punctuation\">[<\/span>$i<span class=\"token punctuation\">]<\/span>}<\/span>&#034;<\/span> <span class=\"token operator\">||<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">$LOCAL_HOST2<\/span>&#034;<\/span> <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">${P_IP<span class=\"token punctuation\">[<\/span>$i<span class=\"token punctuation\">]<\/span>}<\/span>&#034;<\/span> <span class=\"token punctuation\">]<\/span><span class=\"token punctuation\">]<\/span><span class=\"token punctuation\">;<\/span><br \/>\n    <span class=\"token keyword\">then<\/span><br \/>\n        <span 
class=\"token builtin class-name\">echo<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">${P_IP<span class=\"token punctuation\">[<\/span>$i<span class=\"token punctuation\">]<\/span>}<\/span>&#034;<\/span><br \/>\n        <span class=\"token builtin class-name\">source<\/span> \/usr\/local\/Ascend\/ascend-toolkit\/set_env.sh<br \/>\n        <span class=\"token builtin class-name\">source<\/span> \/usr\/local\/Ascend\/nnal\/atb\/set_env.sh<br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">HCCL_BUFFSIZE<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">3000<\/span><br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">TASK_QUEUE_ENABLE<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">2<\/span><br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">HCCL_SOCKET_IFNAME<\/span><span class=\"token operator\">&#061;<\/span>lo<br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">GLOO_SOCKET_IFNAME<\/span><span class=\"token operator\">&#061;<\/span>lo<br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">STREAMS_PER_DEVICE<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">32<\/span><br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">ENABLE_ASCEND_MOE_NZ<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">1<\/span><br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">DEEP_NORMAL_MODE_USE_INT8_QUANT<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">1<\/span><br \/>\n<span 
class=\"token comment\">#        export ENABLE_PROFILING&#061;1<\/span><\/p>\n<p>        <span class=\"token comment\"># P\u8282\u70b9<\/span><br \/>\n        python -m sglang.launch_server &#8211;model-path <span class=\"token variable\">${MODEL_PATH}<\/span> &#8211;disaggregation-mode prefill <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;host <span class=\"token variable\">${P_IP<span class=\"token punctuation\">[<\/span>$i<span class=\"token punctuation\">]<\/span>}<\/span> &#8211;port <span class=\"token number\">8000<\/span> &#8211;disaggregation-bootstrap-port <span class=\"token number\">8995<\/span> &#8211;trust-remote-code <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;nnodes <span class=\"token number\">1<\/span> &#8211;node-rank <span class=\"token variable\">$i<\/span> &#8211;tp-size <span class=\"token number\">16<\/span> &#8211;dp-size <span class=\"token number\">8<\/span> &#8211;mem-fraction-static <span class=\"token number\">0.6<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;disable-radix-cache <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;ep-dispatch-algorithm static &#8211;init-expert-location \/home\/sglang_ascend\/hot_map\/expert_distribution_recorder_1763480391.7582676.pt <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;attention-backend ascend &#8211;device npu &#8211;quantization w8a8_int8 &#8211;disaggregation-transfer-backend ascend <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;max-running-requests <span class=\"token number\">128<\/span> &#8211;chunked-prefill-size <span class=\"token number\">114688<\/span> &#8211;max-prefill-tokens <span class=\"token number\">458880<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;disable-overlap-schedule  &#8211;enable-dp-attention &#8211;tokenizer-worker-num <span class=\"token number\">4<\/span> <span class=\"token 
punctuation\">\\\\<\/span><br \/>\n        &#8211;moe-a2a-backend deepep &#8211;deepep-mode normal &#8211;dtype bfloat16<br \/>\n        <span class=\"token assign-left variable\">NODE_RANK<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\">$i<\/span><br \/>\n        <span class=\"token builtin class-name\">break<\/span><br \/>\n    <span class=\"token keyword\">fi<\/span><br \/>\n<span class=\"token keyword\">done<\/span><\/p>\n<p><span class=\"token keyword\">for<\/span> <span class=\"token for-or-select variable\">i<\/span> <span class=\"token keyword\">in<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">${<span class=\"token operator\">!<\/span>D_IP<span class=\"token punctuation\">[<\/span>&#064;<span class=\"token punctuation\">]<\/span>}<\/span>&#034;<\/span><span class=\"token punctuation\">;<\/span><br \/>\n<span class=\"token keyword\">do<\/span><br \/>\n    <span class=\"token keyword\">if<\/span> <span class=\"token punctuation\">[<\/span><span class=\"token punctuation\">[<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">$LOCAL_HOST1<\/span>&#034;<\/span> <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">${D_IP<span class=\"token punctuation\">[<\/span>$i<span class=\"token punctuation\">]<\/span>}<\/span>&#034;<\/span> <span class=\"token operator\">||<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">$LOCAL_HOST2<\/span>&#034;<\/span> <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">${D_IP<span class=\"token punctuation\">[<\/span>$i<span class=\"token punctuation\">]<\/span>}<\/span>&#034;<\/span> <span class=\"token punctuation\">]<\/span><span class=\"token punctuation\">]<\/span><span class=\"token punctuation\">;<\/span><br \/>\n    <span class=\"token keyword\">then<\/span><br \/>\n        <span 
class=\"token builtin class-name\">echo<\/span> <span class=\"token string\">&#034;<span class=\"token variable\">${D_IP<span class=\"token punctuation\">[<\/span>$i<span class=\"token punctuation\">]<\/span>}<\/span>&#034;<\/span><br \/>\n        <span class=\"token builtin class-name\">source<\/span> \/usr\/local\/Ascend\/ascend-toolkit\/set_env.sh<br \/>\n        <span class=\"token builtin class-name\">source<\/span> \/usr\/local\/Ascend\/nnal\/atb\/set_env.sh<br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">DP_ROUND_ROBIN<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">1<\/span><br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">SGLANG_DEEPEP_NUM_MAX_DISPATCH_TOKENS_PER_RANK<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">60<\/span><br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">HCCL_BUFFSIZE<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">512<\/span><br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">HCCL_SOCKET_IFNAME<\/span><span class=\"token operator\">&#061;<\/span>data0.3001<br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">GLOO_SOCKET_IFNAME<\/span><span class=\"token operator\">&#061;<\/span>data0.3001<br \/>\n        <span class=\"token builtin class-name\">export<\/span> <span class=\"token assign-left variable\">STREAMS_PER_DEVICE<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token number\">32<\/span><\/p>\n<p><span class=\"token comment\">#        export ENABLE_ASCEND_MOE_NZ&#061;1<\/span><br \/>\n<span class=\"token comment\">#        export ENABLE_PROFILING&#061;1<\/span><br \/>\n        <span class=\"token 
comment\"># D\u8282\u70b9<\/span><br \/>\n        python -m sglang.launch_server &#8211;model-path <span class=\"token variable\">${MODEL_PATH}<\/span> &#8211;disaggregation-mode decode <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;host <span class=\"token variable\">${D_IP<span class=\"token punctuation\">[<\/span>$i<span class=\"token punctuation\">]<\/span>}<\/span> &#8211;port <span class=\"token number\">8001<\/span> &#8211;trust-remote-code <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;nnodes <span class=\"token number\">2<\/span> &#8211;node-rank <span class=\"token variable\">$i<\/span> &#8211;tp-size <span class=\"token number\">32<\/span> &#8211;dp-size <span class=\"token number\">16<\/span> &#8211;mem-fraction-static <span class=\"token number\">0.83<\/span> &#8211;max-running-requests <span class=\"token number\">960<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;attention-backend ascend &#8211;device npu &#8211;quantization w8a8_int8 &#8211;enable-dp-attention <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;moe-a2a-backend ascend_fuseep &#8211;cuda-graph-bs <span class=\"token number\">6<\/span> <span class=\"token number\">8<\/span> <span class=\"token number\">12<\/span> <span class=\"token number\">15<\/span> <span class=\"token number\">18<\/span> <span class=\"token number\">20<\/span> <span class=\"token number\">22<\/span> <span class=\"token number\">24<\/span> <span class=\"token number\">30<\/span> <span class=\"token number\">36<\/span> <span class=\"token number\">42<\/span> <span class=\"token number\">48<\/span> <span class=\"token number\">54<\/span> <span class=\"token number\">56<\/span> <span class=\"token number\">58<\/span> <span class=\"token number\">60<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;dist-init-addr <span class=\"token number\">172.27<\/span>.1.143:5000 <span class=\"token 
punctuation\">\\\\<\/span><br \/>\n        &#8211;disaggregation-transfer-backend ascend &#8211;watchdog-timeout <span class=\"token number\">9000<\/span> &#8211;context-length <span class=\"token number\">8192<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n        &#8211;prefill-round-robin-balance &#8211;enable-dp-lm-head &#8211;tokenizer-worker-num <span class=\"token number\">4<\/span> &#8211;dtype bfloat16<br \/>\n        <span class=\"token assign-left variable\">NODE_RANK<\/span><span class=\"token operator\">&#061;<\/span><span class=\"token variable\">$i<\/span><br \/>\n        <span class=\"token builtin class-name\">break<\/span><br \/>\n    <span class=\"token keyword\">fi<\/span><br \/>\n<span class=\"token keyword\">done<\/span><\/p>\n<p><span class=\"token builtin class-name\">exit<\/span> <span class=\"token number\">1<\/span><br \/>\npython -m sglang_router.launch_router <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;pd-disaggregation <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;policy cache_aware <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;prefill http:\/\/x.x.x.x:8000 <span class=\"token number\">8995<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;decode http:\/\/x.x.x.x:8001 <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;host <span class=\"token number\">127.0<\/span>.0.1 <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;port <span class=\"token number\">6688<\/span> <span class=\"token punctuation\">\\\\<\/span><br \/>\n    &#8211;mini-lb<br \/>\n\u200b<\/p>\n<h3>3 ais_bench \u914d\u7f6e<\/h3>\n<h4>3.1 \u4fee\u6539\u6d4b\u8bd5\u53c2\u6570<\/h4>\n<p>\u8c03\u6574Python\u6d4b\u8bd5\u4ee3\u7801\u914d\u7f6e&#xff1a;<\/p>\n<p><span class=\"token function\">vim<\/span> ais_bench\/benchmark\/configs\/models\/vllm_api\/vllm_api_stream_chat.py<\/p>\n<p><span class=\"token comment\"># vllm_api_stream_chat.py<\/span><br 
\/>\n<span class=\"token keyword\">from<\/span> ais_bench<span class=\"token punctuation\">.<\/span>benchmark<span class=\"token punctuation\">.<\/span>models <span class=\"token keyword\">import<\/span> VLLMCustomAPIChatStream<br \/>\n<span class=\"token keyword\">from<\/span> ais_bench<span class=\"token punctuation\">.<\/span>benchmark<span class=\"token punctuation\">.<\/span>utils<span class=\"token punctuation\">.<\/span>model_postprocessors <span class=\"token keyword\">import<\/span> extract_non_reasoning_content<\/p>\n<p>models <span class=\"token operator\">&#061;<\/span> <span class=\"token punctuation\">[<\/span><br \/>\n    <span class=\"token builtin\">dict<\/span><span class=\"token punctuation\">(<\/span><br \/>\n        attr<span class=\"token operator\">&#061;<\/span><span class=\"token string\">&#034;service&#034;<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        <span class=\"token builtin\">type<\/span><span class=\"token operator\">&#061;<\/span>VLLMCustomAPIChatStream<span class=\"token punctuation\">,<\/span><br \/>\n        abbr<span class=\"token operator\">&#061;<\/span><span class=\"token string\">&#039;vllm-api-stream-chat&#039;<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        path<span class=\"token operator\">&#061;<\/span><span class=\"token string\">&#034;\/mnt\/share\/weights\/Qwen3-235B-A22B-W8A8&#034;<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        model<span class=\"token operator\">&#061;<\/span><span class=\"token string\">&#034;Qwen3&#034;<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        request_rate <span class=\"token operator\">&#061;<\/span> <span class=\"token number\">10.5<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        retry <span class=\"token operator\">&#061;<\/span> <span class=\"token number\">2<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        host_ip <span class=\"token operator\">&#061;<\/span> <span 
class=\"token string\">&#034;127.0.0.1&#034;<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        host_port <span class=\"token operator\">&#061;<\/span> <span class=\"token number\">6688<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        max_out_len <span class=\"token operator\">&#061;<\/span> <span class=\"token number\">1500<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        batch_size <span class=\"token operator\">&#061;<\/span> <span class=\"token number\">960<\/span><span class=\"token punctuation\">,<\/span> <span class=\"token comment\">#880<\/span><br \/>\n        trust_remote_code<span class=\"token operator\">&#061;<\/span><span class=\"token boolean\">False<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        generation_kwargs <span class=\"token operator\">&#061;<\/span> <span class=\"token builtin\">dict<\/span><span class=\"token punctuation\">(<\/span><br \/>\n            temperature <span class=\"token operator\">&#061;<\/span> <span class=\"token number\">0<\/span><span class=\"token punctuation\">,<\/span><br \/>\n            ignore_eos <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">True<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        <span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">,<\/span><br \/>\n        pred_postprocessor<span class=\"token operator\">&#061;<\/span><span class=\"token builtin\">dict<\/span><span class=\"token punctuation\">(<\/span><span class=\"token builtin\">type<\/span><span class=\"token operator\">&#061;<\/span>extract_non_reasoning_content<span class=\"token punctuation\">)<\/span><br \/>\n    <span class=\"token punctuation\">)<\/span><br \/>\n<span class=\"token punctuation\">]<\/span><\/p>\n<h4>3.2 \u6267\u884c\u6d4b\u8bd5\u547d\u4ee4<\/h4>\n<p>ais_bench &#8211;models vllm_api_stream_chat &#8211;datasets gsm8k_gen_0_shot_cot_str_perf  &#8211;debug &#8211;summarizer default_perf 
&#8211;mode perf &#8211;num-prompts <span class=\"token number\">4240<\/span><\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u4f5c\u8005&#xff1a;\u6607\u817e\u5b9e\u6218\u6d3e Sglang\u77e5\u8bc6\u5730\u56fe&#xff1a; https:\/\/blog.csdn.net\/weixin_41406651\/article\/details\/156754353?spm&#061;1001.2014.3001.5502<br \/>\n\u80cc\u666f\u6982\u8ff0<br \/>\nQwen3-235B\u6a21\u578b\u7528Atlas 800I A3\u6216Atlas 800T A3\u5747\u53ef\u90e8\u7f72&#xff0c;\u672c\u6587\u6863\u4ee5Atlas 800T A3\u4e3a\u4f8b&#xff0c;\u8bb0\u5f55\u4e86\u4f7f\u7528SGLang\u6846\u67b6\u90e8\u7f72Qwen3-235B\u6a21\u578b\u76841P2D<\/p>\n","protected":false},"author":2,"featured_media":64642,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1],"tags":[66],"topic":[],"class_list":["post-64644","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-server","tag-ai"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v20.3 - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>PD\u5206\u79bb\u90e8\u7f72\uff1a\u57fa\u4e8eAtlas 800T A3\u670d\u52a1\u5668+SGLang 1P2D\u90e8\u7f72Qwen3-235B\u6307\u5357 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.wsisp.com\/helps\/64644.html\" \/>\n<meta property=\"og:locale\" content=\"zh_CN\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"PD\u5206\u79bb\u90e8\u7f72\uff1a\u57fa\u4e8eAtlas 800T A3\u670d\u52a1\u5668+SGLang 1P2D\u90e8\u7f72Qwen3-235B\u6307\u5357 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\" \/>\n<meta property=\"og:description\" content=\"\u4f5c\u8005&#xff1a;\u6607\u817e\u5b9e\u6218\u6d3e Sglang\u77e5\u8bc6\u5730\u56fe&#xff1a; 
https:\/\/blog.csdn.net\/weixin_41406651\/article\/details\/156754353?spm1001.2014.3001.5502 \u80cc\u666f\u6982\u8ff0 Qwen3-235B\u6a21\u578b\u7528Atlas 800I A3\u6216Atlas 800T A3\u5747\u53ef\u90e8\u7f72&#xff0c;\u672c\u6587\u6863\u4ee5Atlas 800T A3\u4e3a\u4f8b&#xff0c;\u8bb0\u5f55\u4e86\u4f7f\u7528SGLang\u6846\u67b6\u90e8\u7f72Qwen3-235B\u6a21\u578b\u76841P2D\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.wsisp.com\/helps\/64644.html\" \/>\n<meta property=\"og:site_name\" content=\"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\" \/>\n<meta property=\"article:published_time\" content=\"2026-01-23T12:56:42+00:00\" \/>\n<meta property=\"og:image\" content=\"https:\/\/www.wsisp.com\/helps\/wp-content\/uploads\/2026\/01\/20260123125641-697370096aad5.png\" \/>\n<meta name=\"author\" content=\"admin\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"\u4f5c\u8005\" \/>\n\t<meta name=\"twitter:data1\" content=\"admin\" \/>\n\t<meta name=\"twitter:label2\" content=\"\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4\" \/>\n\t<meta name=\"twitter:data2\" content=\"5 \u5206\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/64644.html\",\"url\":\"https:\/\/www.wsisp.com\/helps\/64644.html\",\"name\":\"PD\u5206\u79bb\u90e8\u7f72\uff1a\u57fa\u4e8eAtlas 800T A3\u670d\u52a1\u5668+SGLang 1P2D\u90e8\u7f72Qwen3-235B\u6307\u5357 - 
\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\",\"isPartOf\":{\"@id\":\"https:\/\/www.wsisp.com\/helps\/#website\"},\"datePublished\":\"2026-01-23T12:56:42+00:00\",\"dateModified\":\"2026-01-23T12:56:42+00:00\",\"author\":{\"@id\":\"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41\"},\"breadcrumb\":{\"@id\":\"https:\/\/www.wsisp.com\/helps\/64644.html#breadcrumb\"},\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/www.wsisp.com\/helps\/64644.html\"]}]},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/64644.html#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"\u9996\u9875\",\"item\":\"https:\/\/www.wsisp.com\/helps\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"PD\u5206\u79bb\u90e8\u7f72\uff1a\u57fa\u4e8eAtlas 800T A3\u670d\u52a1\u5668+SGLang 1P2D\u90e8\u7f72Qwen3-235B\u6307\u5357\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/#website\",\"url\":\"https:\/\/www.wsisp.com\/helps\/\",\"name\":\"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\",\"description\":\"\u9999\u6e2f\u670d\u52a1\u5668_\u9999\u6e2f\u4e91\u670d\u52a1\u5668\u8d44\u8baf_\u670d\u52a1\u5668\u5e2e\u52a9\u6587\u6863_\u670d\u52a1\u5668\u6559\u7a0b\",\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/www.wsisp.com\/helps\/?s={search_term_string}\"},\"query-input\":\"required 
name=search_term_string\"}],\"inLanguage\":\"zh-Hans\"},{\"@type\":\"Person\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41\",\"name\":\"admin\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/image\/\",\"url\":\"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery\",\"contentUrl\":\"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery\",\"caption\":\"admin\"},\"sameAs\":[\"http:\/\/wp.wsisp.com\"],\"url\":\"https:\/\/www.wsisp.com\/helps\/author\/admin\"}]}<\/script>\n<!-- \/ Yoast SEO plugin. -->","yoast_head_json":{"title":"PD\u5206\u79bb\u90e8\u7f72\uff1a\u57fa\u4e8eAtlas 800T A3\u670d\u52a1\u5668+SGLang 1P2D\u90e8\u7f72Qwen3-235B\u6307\u5357 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.wsisp.com\/helps\/64644.html","og_locale":"zh_CN","og_type":"article","og_title":"PD\u5206\u79bb\u90e8\u7f72\uff1a\u57fa\u4e8eAtlas 800T A3\u670d\u52a1\u5668+SGLang 1P2D\u90e8\u7f72Qwen3-235B\u6307\u5357 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","og_description":"\u4f5c\u8005&#xff1a;\u6607\u817e\u5b9e\u6218\u6d3e Sglang\u77e5\u8bc6\u5730\u56fe&#xff1a; https:\/\/blog.csdn.net\/weixin_41406651\/article\/details\/156754353?spm1001.2014.3001.5502 \u80cc\u666f\u6982\u8ff0 Qwen3-235B\u6a21\u578b\u7528Atlas 800I A3\u6216Atlas 800T A3\u5747\u53ef\u90e8\u7f72&#xff0c;\u672c\u6587\u6863\u4ee5Atlas 800T 
A3\u4e3a\u4f8b&#xff0c;\u8bb0\u5f55\u4e86\u4f7f\u7528SGLang\u6846\u67b6\u90e8\u7f72Qwen3-235B\u6a21\u578b\u76841P2D","og_url":"https:\/\/www.wsisp.com\/helps\/64644.html","og_site_name":"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","article_published_time":"2026-01-23T12:56:42+00:00","og_image":[{"url":"https:\/\/www.wsisp.com\/helps\/wp-content\/uploads\/2026\/01\/20260123125641-697370096aad5.png"}],"author":"admin","twitter_card":"summary_large_image","twitter_misc":{"\u4f5c\u8005":"admin","\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4":"5 \u5206"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.wsisp.com\/helps\/64644.html","url":"https:\/\/www.wsisp.com\/helps\/64644.html","name":"PD\u5206\u79bb\u90e8\u7f72\uff1a\u57fa\u4e8eAtlas 800T A3\u670d\u52a1\u5668+SGLang 1P2D\u90e8\u7f72Qwen3-235B\u6307\u5357 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","isPartOf":{"@id":"https:\/\/www.wsisp.com\/helps\/#website"},"datePublished":"2026-01-23T12:56:42+00:00","dateModified":"2026-01-23T12:56:42+00:00","author":{"@id":"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41"},"breadcrumb":{"@id":"https:\/\/www.wsisp.com\/helps\/64644.html#breadcrumb"},"inLanguage":"zh-Hans","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.wsisp.com\/helps\/64644.html"]}]},{"@type":"BreadcrumbList","@id":"https:\/\/www.wsisp.com\/helps\/64644.html#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"\u9996\u9875","item":"https:\/\/www.wsisp.com\/helps"},{"@type":"ListItem","position":2,"name":"PD\u5206\u79bb\u90e8\u7f72\uff1a\u57fa\u4e8eAtlas 800T A3\u670d\u52a1\u5668+SGLang 
1P2D\u90e8\u7f72Qwen3-235B\u6307\u5357"}]},{"@type":"WebSite","@id":"https:\/\/www.wsisp.com\/helps\/#website","url":"https:\/\/www.wsisp.com\/helps\/","name":"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","description":"\u9999\u6e2f\u670d\u52a1\u5668_\u9999\u6e2f\u4e91\u670d\u52a1\u5668\u8d44\u8baf_\u670d\u52a1\u5668\u5e2e\u52a9\u6587\u6863_\u670d\u52a1\u5668\u6559\u7a0b","potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/www.wsisp.com\/helps\/?s={search_term_string}"},"query-input":"required name=search_term_string"}],"inLanguage":"zh-Hans"},{"@type":"Person","@id":"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41","name":"admin","image":{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/image\/","url":"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery","contentUrl":"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery","caption":"admin"},"sameAs":["http:\/\/wp.wsisp.com"],"url":"https:\/\/www.wsisp.com\/helps\/author\/admin"}]}},"_links":{"self":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/posts\/64644","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/users\/2"}],"replies":[{"embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/comments?post=64644"}],"version-history":[{"count":0,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/posts\/64644\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/media\/64642"}],"wp:attachment":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/media?parent=64644"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.wsi
sp.com\/helps\/wp-json\/wp\/v2\/categories?post=64644"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/tags?post=64644"},{"taxonomy":"topic","embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/topic?post=64644"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}