{"id":74,"date":"2025-07-04T17:55:09","date_gmt":"2025-07-04T09:55:09","guid":{"rendered":"http:\/\/blog.thirdbody.cn\/?p=74"},"modified":"2025-07-22T17:38:37","modified_gmt":"2025-07-22T09:38:37","slug":"%e4%bd%bf%e7%94%a8xorbits-inference%e9%83%a8%e7%bd%b2%e6%a8%a1%e5%9e%8b","status":"publish","type":"post","link":"http:\/\/blog.thirdbody.cn\/index.php\/2025\/07\/04\/%e4%bd%bf%e7%94%a8xorbits-inference%e9%83%a8%e7%bd%b2%e6%a8%a1%e5%9e%8b\/","title":{"rendered":"\u4f7f\u7528Xorbits Inference\u90e8\u7f72\u6a21\u578b"},"content":{"rendered":"<h3>1. \u542f\u52a8xinference\u670d\u52a1<\/h3>\n<pre><code>xinference-local --host 0.0.0.0 --port 9997<\/code><\/pre>\n<h3>2. \u6d4f\u89c8\u5668\u8bbf\u95ee<\/h3>\n<p>\u6d4f\u89c8\u5668\u8bbf\u95ee\u4e0a\u8ff0\u670d\u52a1\u5730\u5740(\u5982\uff1a<a href=\"http:\/\/10.0.14.55:9997\">http:\/\/10.0.14.55:9997<\/a>)\uff0c\u5373\u53ef\u4f7f\u7528\u9875\u9762:<\/p>\n<p><img decoding=\"async\" src=\"http:\/\/cdn.thirdbody.cn\/blog\/xinference-1.png\" alt=\"\" \/><\/p>\n<h3>3. 
\u542f\u52a8\u6a21\u578b<\/h3>\n<h4>3.1 \u542f\u52a8\u5d4c\u5165\u6a21\u578b<\/h4>\n<pre><code># --endpoint\u6362\u4e3a\u5b9e\u9645\u7684xinference\u670d\u52a1\u5730\u5740(\u7b2c\u4e00\u6b65\u7684\u670d\u52a1\u5730\u5740)\nxinference launch --model_path \/home\/module\/xinference\/models\/bge-m3 --endpoint http:\/\/10.0.14.55:9997 --model-name bge-m3 --model-type embedding --device cpu<\/code><\/pre>\n<h4>3.2 \u542f\u52a8\u91cd\u6392\u5e8f\u6a21\u578b<\/h4>\n<pre><code># --endpoint\u6362\u4e3a\u5b9e\u9645\u7684xinference\u670d\u52a1\u5730\u5740(\u7b2c\u4e00\u6b65\u7684\u670d\u52a1\u5730\u5740)\nxinference launch --model_path \/home\/qll\/models\/bge-reranker-v2-m3 --endpoint http:\/\/10.0.14.55:9997 --model-name bge-reranker-v2-m3 --model-type rerank<\/code><\/pre>\n<h4>3.3 \u76f8\u5173\u53c2\u6570\u542b\u4e49\u5982\u4e0b\uff1a<\/h4>\n<ul>\n<li>model_path: \u6a21\u578b\u6743\u91cd\u8def\u5f84<\/li>\n<li>endpoint: xinference\u670d\u52a1\u5730\u5740<\/li>\n<li>model-name: \u542f\u52a8\u7684\u6a21\u578b\u7684\u540d\u79f0<\/li>\n<li>model-type: \u6a21\u578b\u7c7b\u578b\uff0c\u652f\u6301<code>LLM<\/code>\u3001<code>embedding<\/code>\u3001<code>rerank<\/code>\u3001<code>image<\/code><\/li>\n<li>device: cpu\u3001cuda\u7b49<\/li>\n<\/ul>\n<h3>4. \u4f7f\u7528\u65b9\u5f0f<\/h3>\n<ul>\n<li>\n<p>\u53ef\u4ee5\u4f7f\u7528openai API\u8c03\u7528\uff0c\u53ea\u9700\u5982\u4e0b\u8bbe\u7f6e\u5373\u53ef\uff1a<\/p>\n<pre><code>openai.api_base = \"http:\/\/10.0.14.55:9997\/v1\"\nopenai.api_key = \"\"<\/code><\/pre>\n<\/li>\n<li>\n<p>\u4f7f\u7528\u9875\u9762\u8fdb\u884c\u6d4b\u8bd5:<\/p>\n<p><img decoding=\"async\" src=\"http:\/\/cdn.thirdbody.cn\/blog\/xinference-2.png\" alt=\"\" \/><\/p>\n<\/li>\n<\/ul>\n","protected":false},"excerpt":{"rendered":"<p>1. 
\u542f\u52a8xinference\u670d\u52a1 xinference-local &#8211;host 0.0.0.0 &#8211;por [&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":75,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[25],"tags":[40,28],"class_list":["post-74","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-model_deployment","tag-xinference","tag-28"],"_links":{"self":[{"href":"http:\/\/blog.thirdbody.cn\/index.php\/wp-json\/wp\/v2\/posts\/74","targetHints":{"allow":["GET"]}}],"collection":[{"href":"http:\/\/blog.thirdbody.cn\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"http:\/\/blog.thirdbody.cn\/index.php\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"http:\/\/blog.thirdbody.cn\/index.php\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"http:\/\/blog.thirdbody.cn\/index.php\/wp-json\/wp\/v2\/comments?post=74"}],"version-history":[{"count":3,"href":"http:\/\/blog.thirdbody.cn\/index.php\/wp-json\/wp\/v2\/posts\/74\/revisions"}],"predecessor-version":[{"id":91,"href":"http:\/\/blog.thirdbody.cn\/index.php\/wp-json\/wp\/v2\/posts\/74\/revisions\/91"}],"wp:featuredmedia":[{"embeddable":true,"href":"http:\/\/blog.thirdbody.cn\/index.php\/wp-json\/wp\/v2\/media\/75"}],"wp:attachment":[{"href":"http:\/\/blog.thirdbody.cn\/index.php\/wp-json\/wp\/v2\/media?parent=74"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"http:\/\/blog.thirdbody.cn\/index.php\/wp-json\/wp\/v2\/categories?post=74"},{"taxonomy":"post_tag","embeddable":true,"href":"http:\/\/blog.thirdbody.cn\/index.php\/wp-json\/wp\/v2\/tags?post=74"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}