const{createApp}=Vue const{createVuetify,useGoTo,useDisplay}=Vuetify var data={alert:{show:false,color:'success',text:'',timeout:0,},theme:{dark:false,},nav:{showDrawer:false,showTOC:true,tocPanel:0,tab:'account',post:{discussionId:6986,currentPage:1,targetPage:1,total:5,anchor:0,goToOptions:{container:null,duration:0,easing:'easeInOutCubic',offset:-100,},worker:null,task:[],active:[],apiLock:[],originLike:new Map([]),},related:{block:1,}},search:{width:80,text:null,loading:false,},tags:[{id:66,url:'/t/6d21403b6a045c7166770014262f',name:'Ollama',color:'#66BB6A',icon:'mdi-tag-heart',},],posts:[{id:87279,num:0,uid:9194,content:'\u003Cp\u003E搞了 4 张 4090d 私有化部署一套环境给公司一些团队用,目前遇到几个问题请教一下(当然不排除个人能力问题,没有做部署/参数上的优化)\u003C/p\u003E\u003Cp\u003E模型管理问题,模型涉及语言、嵌入、重排序等类型,想统一管理,是否有比较好的方案?现在用的是 xinference. \u003C/p\u003E\u003Cp\u003E从 ollama 切换到 xinference 原因是 ollama 不支持 rerank 模型,但是使用中发现,同一个 llm 模型,ollama 上的模型比 xinference 响应更快,是因为参数优化问题?\u003C/p\u003E',ipRegion:'',updatedByUid:0,createdAt:'2025-03-28 14:04:51',updatedAt:'2025-03-31 10:45:30',mentionNum:0,mentionedBy:[],mentionUsers:[],likeUsers:[],},{id:87280,num:1,uid:533,content:'用 open webui 接入 ollama 可以使用 rerank 模型',ipRegion:'',updatedByUid:0,createdAt:'2025-03-28 17:57:01',updatedAt:'2025-03-31 10:45:30',mentionNum:0,mentionedBy:[],mentionUsers:[],likeUsers:[],},{id:87281,num:2,uid:88,content:'vllm',ipRegion:'',updatedByUid:0,createdAt:'2025-03-28 18:01:18',updatedAt:'2025-03-31 10:45:30',mentionNum:0,mentionedBy:[],mentionUsers:[],likeUsers:[],},{id:87282,num:3,uid:2972,content:'定制化的需求,没有完全符合个性化需求的框架轮子,只有自己 diy 。',ipRegion:'',updatedByUid:0,createdAt:'2025-03-29 14:06:51',updatedAt:'2025-03-31 10:45:30',mentionNum:0,mentionedBy:[],mentionUsers:[],likeUsers:[],},{id:87283,num:4,uid:9194,content:'这个我试试\u003Cbr\u003Exinferemce 也支持使用 vllm',ipRegion:'',updatedByUid:0,createdAt:'2025-03-29 16:51:31',updatedAt:'2025-03-31 10:45:30',mentionNum:0,mentionedBy:[],mentionUsers:[],likeUsers:[],},],usersMap:new Map([[88,{uid:88,url:'/u/0e10641f6a045c7760625e6f023f040e',avatar:'/a/0e10641f6a045c7760625e6f023f040e',username:'wyntalgeer🤖',}],[2972,{uid:2972,url:'/u/332551546a045c75696d546f165c1c11',avatar:'/a/332551546a045c75696d546f165c1c11',username:'coefuqin🤖',}],[533,{uid:533,url:'/u/113159026a045c776569556f13392114',avatar:'/a/113159026a045c776569556f13392114',username:'YsHaNg🤖',}],[9194,{uid:9194,url:'/u/357970056a045c7e6163526f245d0502',avatar:'/a/357970056a045c7e6163526f245d0502',username:'Legman🤖',}],]),related:[{title:'请问此配置如何加速 ollama ds-r1 32b 的速度,好慢',url:'/d/111c5f086a045c77606a5677465e646a3d316a3e',},{title:'半个小时前, ollama 上线了目前单显卡里,最强的中小模型 gemma3',url:'/d/36285e3e6a045c77606a5670475f666a59142066',},{title:'请问我有 3 个 NVIDIA GT 1030(18GB RAM) (总共 80) 如何串接用在 ollama, deepseek?',url:'/d/6219700c6a045c77606a567347596b6a5b290666',},],} const App={setup(){const goTo=useGoTo() const{mdAndUp}=useDisplay() return{goTo,mdAndUp}},data(){return data;},mounted(){const themeDark=localStorage.getItem("themeDark") if(themeDark!==null){this.theme.dark=JSON.parse(themeDark)} if(this.nav.post.total>(this.nav.post.currentPage-1)*100+20){let moreLen=100 if(this.nav.post.total({id:null,num:(this.nav.post.currentPage-1)*100+v,uid:null,content:null,ipRegion:null,updatedByUid:null,createdAt:null,updatedAt:null,mentionNum:null,mentionedBy:null,mentionUsers:null,likeUsers:null,})) this.posts.push(...morePosts.slice(20))} this.workerStart() const hash=window.location.hash const match=hash.match(/#(\d+)/) if(match){const n=parseInt(match[1],10) if(n>=(this.nav.post.currentPage-1)*100&&n{this.jumpTo(n)})}} this.$nextTick(()=>{this.addHeadingIds() tocbot.init({tocSelector:'.toc',contentSelector:'#post-content-0',headingSelector:'h2, h3, h4',headingsOffset:100,scrollSmoothOffset:-100,scrollSmooth:true,collapseDepth:6,onClick:function(e){setTimeout(()=>{history.replaceState(null,'',window.location.pathname+window.location.search)},0)},}) tocbot.refresh()});},beforeUnmount(){this.workerStop() if(this.quill){this.quill.destroy() this.quill=null}},computed:{dposts(){return this.posts.slice(20);},},created(){},methods:{successAlert(msg){this.alert={show:true,color:'success',text:msg,timeout:1500,}},failureAlert(msg){this.alert={show:true,color:'error',text:msg,timeout:5000,}},flipThemeDark(){this.theme.dark=!this.theme.dark localStorage.setItem("themeDark",JSON.stringify(this.theme.dark))},toSearch(){if(!this.search.text){this.failureAlert('搜索词不能为空') return} let keywords=this.search.text.trim() if(keywords.length<1){this.failureAlert('搜索词不能为空') return} if(keywords.length>100){this.failureAlert('搜索词过长') return} this.doSearch(keywords)},toReg(){window.location.href="/reg"},toLogin(){window.location.href="/login"},toPage(){let url=window.location.href url=url.replace(/(\/\d+)?(#[0-9]+)?$/,this.nav.post.targetPage>1?`/${this.nav.post.targetPage}`:'') window.location.href=url},toLoadRelated({done}){if(this.my&&this.my.uid){this.apiLoadRelated({done})}else{done('ok')}},workerStart(){this.nav.post.worker=setInterval(()=>{this.workerLoad()},500);},workerStop(){if(this.nav.post.worker){clearInterval(this.nav.post.worker);this.nav.post.worker=null;}},async jumpTo(num){const page=Math.floor(num/100)+1 const i=num-(page-1)*100 if(page===this.nav.post.currentPage){this.goTo("#post-"+num,this.nav.post.goToOptions) if(!this.posts[i].id){const block=Math.floor(num/20)+1 this.nav.post.apiLock[block]=true await this.apiLoadPosts(block) this.$nextTick(()=>{this.goTo("#post-"+num,this.nav.post.goToOptions)})}}else{let url=window.location.href url=url.replace(/(\/\d+)?(#[0-9]+)?$/,page>1?`/${page}`:'') url=url+"#"+num window.location.href=url}},postIntersect(num){return(isIntersecting,entries,observer)=>{if(isIntersecting){this.nav.post.task.push(num) this.nav.post.active.push(num) this.nav.post.active=this.nav.post.active.filter(item=>Math.abs(item-num)<=5) this.nav.post.active.sort((a,b)=>a-b)}else{this.nav.post.active=this.nav.post.active.filter(item=>item!==num)} if(this.nav.post.active[0]){this.nav.post.anchor=this.nav.post.active[0]}else{this.nav.post.anchor=0}}},async apiLoadPosts(block){try{const response=await axios.post('/fapi/v1/post/block/'+block,{discussionId:this.nav.post.discussionId,}) if(response.data.code===0){response.data.data.posts.forEach(post=>{const i=post.num%100 Object.assign(this.posts[i],post)}) response.data.data.users.forEach(user=>{this.usersMap.set(user.uid,user)})}else{this.failureAlert('回帖数据加载失败: '+response.data.msg)}}catch(error){this.failureAlert('回帖数据加载失败: '+error)} this.nav.post.apiLock[block]=false},workerLoad(){while(this.nav.post.task.length){const num=this.nav.post.task.pop() const i=num-(this.nav.post.currentPage-1)*100 if(!this.posts[i].id){const block=Math.floor(num/20)+1 if(!this.nav.post.apiLock[block]){this.nav.post.apiLock[block]=true this.apiLoadPosts(block)}}}},getTimeInfo(t){if(!t){return ""} const now=new Date();const then=new Date(t);const diff=now-then;const minute=60*1000;const hour=minute*60;const day=hour*24;const month=day*30;const year=month*12;if(diffpost.num===num) if(!post){return "#"+num} const uid=post.uid const username=this.usersMap.get(uid)?.username if(!username){return "#"+num} return username},getUsernameByPostId(id){const post=this.posts.find(post=>post.id===id) if(!post){return "#"+this.getPostNumByPostId(id)} const uid=post.uid const username=this.usersMap.get(uid).username if(!username){return "#"+this.getPostNumByPostId(id)} return username},getPostNumByPostId(id){const post=this.posts.find(post=>post.id===id) return post.num},getPostById(id){const post=this.posts.find(post=>post.id===id) return post},getPostByNum(num){const post=this.posts.find(post=>post.num===num) return post},getAvatarByUid(uid){const avatar=this.usersMap.get(uid)?.avatar if(!avatar){return this.getRandomAvatar()} return avatar},getAvatarByPostNum(num){const post=this.posts.find(post=>post.num===num) if(!post){return this.getRandomAvatar()} const uid=post.uid return this.getAvatarByUid(uid)},getRandomAvatar(){const num=Math.floor(Math.random()*100) return "https://randomuser.me/api/portraits/men/"+num+".jpg"},getUrlByUid(uid){const url=this.usersMap.get(uid)?.url if(!url){return ""} return url},getTextByPostNum(num){const post=this.posts.find(post=>post.num===num) if(!post||!post.content){return '点击跳转到#'+num+'查看'} const parser=new DOMParser() const doc=parser.parseFromString(post.content,'text/html') const text=doc.body.textContent||'' return text.slice(0,100)},addHeadingIds(){const content=document.getElementById('post-content-0') if(!content){this.nav.showTOC=false return} const headings=content.querySelectorAll('h2, h3, h4') headings.forEach((heading,index)=>{if(!heading.id){heading.id=`toc-nav-${index}`}}) if(headings.length==0){this.nav.showTOC=false}},async doSearch(keywords){this.search.loading=true try{const response=await axios.post('/fapi/v1/search',{keywords:keywords,}) if(response.data.code===0){if(response.data.data.hash&&response.data.data.hash.length===32){window.location.href="/s/"+response.data.data.hash}else{this.failureAlert('搜索失败: 搜索服务异常')}}else{this.failureAlert('搜索失败: '+response.data.msg)}}catch(error){this.failureAlert('搜索失败: '+error)} this.search.loading=false},debounce(fn,delay){let timer=null return function(...args){if(timer)clearTimeout(timer) timer=setTimeout(()=>{fn.apply(this,args)},delay);};},},watch:{'nav.post.targetPage':{handler:async function(newV,oldV){this.toPage()},immediate:false},},} const vuetify=createVuetify({defaults:{global:{ripple:true,},},}) const app=createApp(App) app.use(vuetify).mount("#app")