From e9146919285afa562e8d1163f6fbfa715987f192 Mon Sep 17 00:00:00 2001 From: Sanket Sudake Date: Thu, 18 Jul 2024 14:42:54 +0530 Subject: [PATCH] Update ai-stack chart to use pvc and secret (#13) * Update ai-stack chart to use pvc and secret Signed-off-by: Sanket Sudake * add reranker support in ai-stack Signed-off-by: Sanket Sudake --------- Signed-off-by: Sanket Sudake --- charts/ai-stack/Chart.lock | 11 +- charts/ai-stack/Chart.yaml | 22 +++- charts/ai-stack/README.md | 6 + charts/ai-stack/charts/chromadb-0.1.19.tgz | Bin 0 -> 6031 bytes .../text-embeddings-inference-0.1.1.tgz | Bin 4302 -> 0 bytes .../text-embeddings-inference-0.1.3.tgz | Bin 0 -> 4742 bytes .../text-generation-inference-0.1.1.tgz | Bin 4285 -> 0 bytes .../text-generation-inference-0.1.3.tgz | Bin 0 -> 4762 bytes charts/ai-stack/templates/_helpers.tpl | 62 ++++++++++ charts/ai-stack/templates/pvc.yaml | 24 ++++ charts/ai-stack/values.yaml | 115 +++++++++++++++++- 11 files changed, 228 insertions(+), 12 deletions(-) create mode 100644 charts/ai-stack/charts/chromadb-0.1.19.tgz delete mode 100644 charts/ai-stack/charts/text-embeddings-inference-0.1.1.tgz create mode 100644 charts/ai-stack/charts/text-embeddings-inference-0.1.3.tgz delete mode 100644 charts/ai-stack/charts/text-generation-inference-0.1.1.tgz create mode 100644 charts/ai-stack/charts/text-generation-inference-0.1.3.tgz create mode 100644 charts/ai-stack/templates/_helpers.tpl create mode 100644 charts/ai-stack/templates/pvc.yaml diff --git a/charts/ai-stack/Chart.lock b/charts/ai-stack/Chart.lock index 99bdddb..e1921d6 100644 --- a/charts/ai-stack/Chart.lock +++ b/charts/ai-stack/Chart.lock @@ -1,9 +1,12 @@ dependencies: - name: text-generation-inference repository: https://infracloudio.github.io/charts - version: 0.1.1 + version: 0.1.3 - name: text-embeddings-inference repository: https://infracloudio.github.io/charts - version: 0.1.1 -digest: sha256:03b9860baccbba01ab701b07ab16fd12c6558b3a1920f806b623bef2cc5d03bd -generated: "2024-07-16T15:49:37.371821+05:30" + version: 0.1.3 +- name: chromadb + repository: https://amikos-tech.github.io/chromadb-chart/ + version: 0.1.19 +digest: sha256:05ba005e3d493eccad2f831ffa151ee9de81b24597c4f347741d8cb1624feec8 +generated: "2024-07-17T13:32:27.60585+05:30" diff --git a/charts/ai-stack/Chart.yaml b/charts/ai-stack/Chart.yaml index a86d670..acff08c 100644 --- a/charts/ai-stack/Chart.yaml +++ b/charts/ai-stack/Chart.yaml @@ -15,7 +15,7 @@ type: application # This is the chart version. This version number should be incremented each time you make changes # to the chart and its templates, including the app version. # Versions are expected to follow Semantic Versioning (https://semver.org/) -version: 0.1.0 +version: 0.2.0 # This is the version number of the application being deployed. This version number should be # incremented each time you make changes to the application. Versions are not expected to @@ -25,13 +25,25 @@ appVersion: "" dependencies: - name: text-generation-inference - version: 0.1.1 + version: 0.1.3 repository: "https://infracloudio.github.io/charts" alias: tgi condition: tgi.enabled - + - name: text-embeddings-inference - version: 0.1.1 + version: 0.1.3 repository: "https://infracloudio.github.io/charts" alias: tei - condition: tei.enabled \ No newline at end of file + condition: tei.enabled + + - name: text-embeddings-inference + version: 0.1.3 + repository: "https://infracloudio.github.io/charts" + alias: reranker + condition: reranker.enabled + + - name: chromadb + version: 0.1.19 + repository: https://amikos-tech.github.io/chromadb-chart/ + alias: vectordb + condition: vectordb.enabled \ No newline at end of file diff --git a/charts/ai-stack/README.md b/charts/ai-stack/README.md index fd6aca2..4223dc3 100644 --- a/charts/ai-stack/README.md +++ b/charts/ai-stack/README.md @@ -20,6 +20,12 @@ See [helm repo](https://helm.sh/docs/helm/helm_repo/) for command documentation. ## Installing the Chart +Create a secret with HuggingFace token: + +```bash +kubectl create secret generic hf-api-token --from-literal HF_API_TOKEN= +``` + To install the chart with the release name `ai-stack`: ```bash diff --git a/charts/ai-stack/charts/chromadb-0.1.19.tgz b/charts/ai-stack/charts/chromadb-0.1.19.tgz new file mode 100644 index 0000000000000000000000000000000000000000..4ffb30af2ce8d2966c28c74f2a3cd001537feab5 GIT binary patch literal 6031 zcmV;A7jWnwiwG0|00000|0w_~VMtOiV@ORlOnEsqVl!4SWK%V1T2nbTPgYhoO;>Dc zVQyr3R8em|NM&qo0PH>ebKAC({h5Eo9^*{xzKD`PVyB$xo2S}NqNzVLmXf}_wxfZ_ zm4uokSOB!GI=;XC1^`Ks6!qc6b#iw`W*iv;7Q2hx#R9v4y$NR_@rTXB3E|S2k}&x0 zp-ZdPYVGgs>Hk};R`vhZ!Tzi7w)b9bZ@=0(*gH7*uC={$aPaCoXgxS4H6;;}@b6k* zJXV#s|0RXQ^aFB1S>(dijz!`)|Fz}pIoo@dkHX_Lmb$JD?=T3#Q^Eox#^F%Q4;=jj zSLjK`K}g2Yny?UEm`E85x7i$1IZ1|&$HFEF=_L~liQc4{$zDT)v#6&=sOe+cH9W?# z=`&9>hXETlTfI3N;*V_6)v zXdbd8k}hmp77fW5UF#VD$CwE!8K1f^o_O4$tfcToKqiNux)FU1i@UTC6HfH58IxniLwBmK`%y+ zjwlMao}io{2Lfq3Af_RR2}=TBam?dLB>EPlpIneUK@F%KMNDc<*6by|ul|!0tb(%u z$gHgkw{WKc^e3oI5wKBRHw7&b=;*ec5kyRaKnW!BQ)HA3D0E%|F@UImF-FK0%8&>e zjWytmIr((wHc&AsJF;ZvD$1dX%o+Sd|Fi3<%-sx%~q>)4(kpNf}Of@bijQBs1 zfJ7d0-2`t;6U(B}n4=I1GDb=eeHTU~5DEb=AVQpFSk$se5q_Brkw>URl(J?D(9xY; zh{iO!vF4k}Ks1P_K`Z_!@DnDaMg*Xte{qdIHSmUnaez+1JQC>d0b(L2X=BqtRk+a1 zYfO{A=2k~_4>2;xr{d))W(KLWDg>bcLQC*jx}FrqZpc8GMg=^dWnrUJBDgiu z^b0~F5)uSc;OMb1#K_k&BN+&d)D-;GsN}u%1WE=0k}CwM>=0A zi8oQhpVEk``E-=jPgw#!gKH9%C@FMHB15e-vd)5lUDIf+p$9ZlO^E+TBJ}s68X!Us zg&=(TQq#{dWSV*eFX6!yhMZ{Lj3jb+F=O=$Cj}bP*&KOs;=*>T6{f$37;5vkz4Q8% z8sqtAf_hT*l+N1gU(3xcl1L^z63}Q|t2H5wE{vTP%0>f(5-TWX+R~# zd=h-l;_Pz++9xNeY!UxF3Z@r~$u~4WF%=TSf(hqI)D~wfQVpur?*($rQNyi~c*|K5 zyRc(wYRr}5fTAIFL^Wp=3Q7h=m$RWZu_Ho*gkyigQA}9iD~O6uG(?ujoH5&~GOjW! zpjWs8+TQxml#eBocnPqS{JEZnSW1E;49K)NjFm0%3Se;?W1EeOHuXwHFHoSI2{sj7 z)lx`|W>XQHsw2v^_)T4C(#Xe~fls7z8v-^yWYLI@)$E=y<5#=NdX4C~8L;udeANE4 zo-`IsL;4r`eN;AEDvW|eTE`>p;l}RQ}64V@k<(w9cv*lfn#OJoSyk#!PEM|uaLjfYnI(|^uI#A zl(AZ@mA2~1QoQ-Vf+WNq{Yx!@+i$5|u9u9HF&?IiXcB1NBywU%&W%nw3z=JBOLmEo zqA+Gc&|!e7ck05B2PgYL!ohtARQMWH7c zG)vR2D2q9}qCRrrypx(fUkP+i&u=@ClS7U^MoQn5=If^RdI;SE3C&*TC-qZ}X-2>2 za7FsxbWVpq zYI5eYk87{5jn9%KKXpa0|=^yb-l|G4MK8~IRUtT_MK z+nGE6-P=3Ze>(qpjI!;(TQnP*!igcgzc_*6RQab-y0;eyYWG8w`(@qUHk5gCKA1zp zY_puM=WutYTW}JM5jNCD6Wkx?TI&s{Y6~!H?dTn`shvm}-`=W$HmZGPpxTJrTTq+N zyF0hpyuCF;X}EBAcYAAq%|pc=z74z&O~JC(3=l+%L?N4X~k9^S-^OE^0} zIv#Y-FZw@jY^t54Cj%IxghoS|2N4qwK_PO1f!eq_XL;@29W)sHAy}l4{L#L3)Q;0p zP{psU-<>E$;?B;FYlMPCBQHpNREC6b>0}2kHaKv1w^c!`)2*PTfQrvTj!FzQUP2O? z2#5H-nh4Z&=`VM-M!=geJ#}ugxsjsbZsd$w!1LnS&N99OfU-|6bR>ji3X)u^#c+hz zYR8($^aNAMbLqIK(@lM2az$vM#MCL;=Z`D_k3?`yq&G2VWSUN3qoN+Xxc3~3D-Rmi zD`)P-Z06Kb(mAY|JPm4{F;@)+jYeke!M?qf*ycP;@Bx4?5U1F&NFhx z#Fz7ZXe6X!){oV(6pt1vREUzO9g~KgGSZNCcz)Jzcg~J4>MTsm{PpPD$T(DMZ@l~% zLE(~HpS;?bpnP`i4^&W@P4f26f!-u;yRTcXTj?>fIqxqlCdzHfFkcH}g+*h;_%-2v z0ev-wyHRFJ(U|Wz&}W)A%C`b<=D;cab**gGQjT#ZR%LfATfa8(&jl^C_@&!Zr3lu& z2-8}uedDtGTb&s#4tkI~8$PKmF7EF^qv4~+e5@{D4?>dOll=`O!6*3RPiSy>v1!Q4 zw&?H){$&XBx8NUOyEgm-(l*)7yV&MMf$XpCH2ohcHU9r#fe|L9p zr{e#=+TGuI^8X*B+}<|7w~lXO9iFL#3DYp}_s!JM_&B0bWhrdTzS998$K(;|RWGwQ z#c(Nn0?CuegZ*9ok%qlwG@>_PH|&aYZfV>OO#qVQBPd^H3V$Xfpd*UDT4^-aj`a%~ z*t)$`BPdJ-4ACQMVG=Av_&Hy)4Xq=JfiHk?G~pIZgR4})=5VU{aCFvFZIuJ4*32!( z>WqLJYiNMvu8T>GF(Fc!AIfCMJwzj)V!ME?GgqxKv+o%vtHI}tV++4uhug~iN3$cC^SR-6r@v-kd(M~o@1uIn|Gu0Y$fG%%ysz$e7Q&tLxRyz3)o|D6 zcPu8Sn7eYe$o7<*IcZ`@#r$tB-gs^;f)o|0E9iR$(@sCkZ3b%r%<1&kUSYrOQse&> zBAE{}#tQ#$XK!b_>i=!;Kb`+RN-5?4Zd;c$@?9{okW&&{+2MqnCvvSiTxtYt+%O`P z_R)LAd4ra1A*~F4C5rCCr-nYF(~g7As&L+-1iL=yu9n7#Mrz9sdkSo$(I{?@HwA`Q z$PZZ7CTwTw2YhBaKSM#t9SqlulL$K=lhbEcXAClrq0 z>LO4k&iH9&#&vYD9mErImV~go16%M3hWmRMdBqjjOb#8vVm@g2v&iaPVAY)T>+dz1 zb~}+1#?u@jdv4h3Y5wP+P!87C;PCH;$!l-)O(Mc7Bnltb6T5@IRqP6fIbTWaW{DUJ zCC_956pn*xSUgMHSOKPRVzfYpxAzywaAoekwn2X6QnUVNF}4SD09M6+Td(HNf1d9D zJWeT?t3}b=Y%j2(7W%XFfMAIakhd3Co=)yA#C~(#EvJ+f_Z!8t>{1rC9(prkvc{-x zJKL`tEwz^}R9u`x~xgJva=;4LYXBKUcNTF^X*d5u5P%!2OVyRk`%_QcEKBok@_gg zZ4Fb*de<>*toLSTVy&5Lw*GGJc~%5H$j>z@?xtz2lg^jTyKY%b>CFd{>>~+-MSxR! zM4Ifpp00eEnwY^;u!plt6osXDe$0jLS$zgadU+vdLYf4!sBLzoqHtxR(5sM8k|k*= zT+0sYtXGcVEM;v*;OzIT%^XqrFFXlwB@HFyvWp>VB%Q7@hoX+K=IBo zk(5(l%Dpq`$*z|yk(P~nh|8?Z?yY2K^ov;>izdR9A@MFT@~g>%t8Cm_m{!LEDBMdb zmqkXRTw=!Md|!Yl35V&9B3}#Vx))EqYOy+71BbM!$Z`B?nH+kkh zTKC@lV$LMv&1HA{bT>rQC zcV1QVzxQ{Z^1mOa6!o9PvD!psMj#b~UhPTY8it^7cxW#=J+vRdV3hnMdlh1~x$t?a z!^0s)GJ6fc?h;Od00SG+hYtiwNux1@NFo7pLQI}~fiXJifwLe$p5Mb82F$zE`Hxf8 z*_$XgT|g2^8tDFbLxqOhWj;^=7su_RkB)iMpm5)|Y)nETy~#;|Q}?zn`{{No)$`?j#uv)-{!z77*v|p54GZIb72k3z%K1krlEXfQF#Po)^zT9jL&CP&A7$8-?L_= z8{uC%-Zv7ENx50R!Cg49Fy=M8#@EQMD;9QZ=Cu^Jr z3l8?Rehd{@pe=;#SV%A|lgQ zFILdj?sf*9)9%TAW+Df?mYglZZ}!l}dhCC9-n);0mcTy*qH{+fOOfsOyXJD%y)mAR zb04g~h4ii}S`~M{E+Z-3+hBB6@M5=j)?>1MX+Wnh4f+@Dv!3Gj;N5Y%`tCr^_7xdm zh4iTPA~fHeOT8xVO}@~YysxFbaQZl#qtb=R`yDH0rF4{7VKd`7y!@3gCwuR!<}34Z zSZRpa>tf3^zXo~*(fpOMB9S%SK4tSzVDR4kgliF9)#m9tY4r%DT|OV3+RC~u{_4Gb zioy~c?&*imzdSWBQKf|3ViC#EKwAdo%Urwy%J%K;O8>2D_cIdGSGd-dn{Ul1J;)Yn z3E}f^zs-vD;vVxZaV|oA|G0@M^KZA6)UJq$Q*B#?Ree2fF{Eg49@_d@-;y-U zAzA<6Vv*CLP(KTltq;gvHjTBOUF;Sp5$Djo%NK0^zfx7{x8+E>7Po0 zBJ?C>(U)Wbtjhm+Rek?$r?u01ivK@Ksm=fCGQTF|zuM+jWadkP`!#`NJG+`bVeHa& zL5-Ft0aW7&+0t@7MwwcmG=eZp#B|7R@;HPE?ZB@uRMQuku_b)0jPZ+AG%tDFO2gu) zSN|-CaE4dNza=}C>%XJ8OUDu8_|Rjl)c@UT{?G3A)BT^vDbJuwq(pB1w1k;|xSn7H z!-NJtjm8iY?~;sB{|lgPK8L4;%T z!sKSmaYS#>H;DlMl|6mSBHdG=q?~j8u)bqCN4-H$|0SMhkUnYg;jjlj<-&5tR5tZb zgTCbq|Kd&kGpm@4o9ajQtGJ4qGeAS)T_&;qlP1FY-VxWa^}RDBm)7@=4Ap1G>Dc=I zzpZERfpE$a0iB~`VL35pf1oEVhx$mGra5PSSk9I3n2*hGNzWIRT>tBDRX@lWEA(Hf z{#^cVtM#P+k5Tf+R<fQ`rc?+d)q57%dZ{l_e^={_o5nm4y>7m_RL zF&;UpAC1ON`j>^?Wc_qg1I2|G&o=|S!oZk;Edjqi-z375G{i0OJ3QYEQ3x`|Eny;o ziNJx!0>)<#$?KQqaTIE3e&c!Ac>WQdzjL3Ty3c#6m)Te?L$R$}d?tooKrxa7;`@9{ zKm+XOo9V7+psd!Gu;KZpc}sJk3_?cAQmiK=@`E}a=j?a0dR?9VftrkmnF+t9*eIW@_=h9%K1atty?<*#CLyKoI%jXrzqX=2m8bGlp2`E4{|Nv9|Nkfm JC*uHi008Wi>XiTh literal 0 HcmV?d00001 diff --git a/charts/ai-stack/charts/text-embeddings-inference-0.1.1.tgz b/charts/ai-stack/charts/text-embeddings-inference-0.1.1.tgz deleted file mode 100644 index 9ff92adae50bb193def28d1a4f2d188ca3009f3f..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 4302 zcmV;<5Har`iwG0|00000|0w_~VMtOiV@ORlOnEsqVl!4SWK%V1T2nbTPgYhoO;>Dc zVQyr3R8em|NM&qo0PH+zbK|y>`OII@%kir@Hlhw6Gs~*kEkBQ6;)=(kvOV)Qn@YJL zvLzt~0R{kND~|WKZvo&f$&&4flYM1;uqCk3-Dsc>G@8g*@(O$p@9FvS`aO-WgdgZ1F zyccjjr3$D50zdA5JnoEzOo-MP!k#^$cS(61!Ut<#66D(Rl$J!}WFErJtq1S|q+pEl$>%gC8bjL! zkdW)MOis`sDSJM1G9#23Zi;?qV@~TRJdY-1Vlhcfg`!%>c?gqfBm*kCQ)j})B*N}$ z+Xawjj12{&(L98s@rlqwiOS5tko`16DQRqkGDWcTK$8hvO@%^;^R=Mvv9q(4O%6OT zz#;g)=S3n(h>_7xew!OcG9FD)`agRf@|hD&2b|gc_~XUl$(M^S`=_~l?81kT%sa?u zof(lG+hd=eVm_}Brdp>e?AFB)M4}suNUat}H)8aH$Vq0FP=N;(8=pQL9$y@N@StMh z@B8~l-O&U)jK~RgkauSNV7ESK|GzH|j*kvc&M*GHe}3@&#o5vS9M&=T{oY{5uZ=kU zd}d$|emFnfKWKuEGsgUU&4(FdXBbJ;DukbYwjQcjDl2XSywK?>lrtLPeiYe#YejaJ zVnoLj6ORKWx}8l{dQQzkkvhzm)V=D~w}Esexe5%0IS zOGSK4M#$VZ^Ysj)Oj12R5Zvs{at>qlofKIb!l2jdnblhk7Lk;UD5IL9D$GhOMOu9B z!2a>Evp`7VPn^w9h0y8Q)hYf*XK#_h*GNgnrJ7m8PNK4ATM2lty_p zGzLXT9m2bw=TSb9s4P>+jWvry7!#%p)`$_MP6|OSTSP`fXpAlu-5g(F$A-Ws zlwU6e)J%0qWO18G82nSAwB^JI#C!>zz3SjKNm7OZ6A@wdIY3JEGzWGAOh*Xavd4j( z+qoZ^;l^NC?sI*LjA)qCPP+^pP*!2xlpCZwnyGxPDmGsfq?d8&NmL?}5mp=ip9q=C ztnNuP#uj;Ox3w0aEKl>&UYDcoe%AsRk{NRCq}+@Xa$W1_^=xz?C#VmGpFeBL=x!N5+=63t9i{P=9G#9l4d!dH3Yg`Qcfhuk{0ItU3Q}?`-#4=fAga2iwo*zo%&Z z0KP+K>1+8G_s=m_{l32vBt@81N*6$b{Z`l1{38G z%VLCuGhcN^F9K*E0=T_>-D37=*kaWXQV(L7YD_GzN)w%_fW)y`9JGD;ms{U55KV<$ z&am6v%Gn6FO5v?ohhstFzY}IcAbHnX0Dv)3AslH)$Q(4eL?AH6E8{aWU1T+;2z8Wj zG|V#-WpW^>#iQ_}$RHvdu85ANK(zul&$?o~y!WE3Sp=P{2QB5xYAMeSPrn=;ELly9 zeiJ?(!T@wSg;xOo=ElFd$+h+sd*ZxvEoYP|A=Kxug?O{+?u z{uipKE*8E&cpLPBUeFKU_1^XJe1c09);yCrc@~^+#IfO`GZylS$hgM7p%HF1g;Mtn zf3{zKs*=L2qv`c#i*`qTSqd-*|`Dsm)uoQhYY+ z5O{C8xxKX~sSPYzr-HZHk-%LgTjN!j<$5j^em5s79>LzW{YaCuY&@pd;CK91z~)(g z4_rc#loX7cn!~RdVRTF}HU`7aB=G);4!4EZhJu-uf)Pf<*cT-dgda-F>*hbE$YKRV zqRUNSo-3saUXA8fHXlyT46KO(jOlwFct>N9&HysY*<+pG-qML8HieONWfn)q*L_id~GW6 zl2)((B5A6+vwmKBQ9FE_4zmS|(`8s*$vz~D;6ZNZ+@*+B+4VSBY1n@UPI-)6!;Zmb z!mlvT@KJa1T<~4HQK{!9ZFxt2ZBm_d24$$VQk#7VjjI_g( z5FJgAYZBO428&LvqPyov6|<#Cx4s|%n;`CT=vF>BLU zW15dz>>8Qn6LC^$L*32r0?Wm2T1uo{DpKKDC?a``&=#HBri!-AEe3VO&4P!eOjZJI zl~F9`zRLO3ulGyqP!CXRQon41uFFm@d~VQP5xEs6}Rg(w^iJ?e^olQYyAqUe%Jpn zYJYa3!Dg$2={||bD-NpO==l4IJq_qyrD$JZ^nJF zp@{c$2$X;A6NBaP+?GO};@II{b{;bQ3+3q6v^{1{BrbPXK^98!KTp0Lwyg%XB zP;OnASt`^I$F_R@YYH0a7?z3VKQT)uNxW&K70)-rNCUzOYl zHL1~T55a4V+Nw&#+Jow~qk0Bxf#zaXe1+-JMGjZjS0JwrUIkmcgVZ{U=c8(s#;$cNuk}0K`lwbi zwt73k4642_4J#X8WX5pq92(3OZ&DdbwvKs$MO!UbvfFyEYE>n5HE;I{O0zb)Il9ea_UTV42$*_7aGdJZ+?zkEk zY0W$SuW+Hi^CY(Q9{QhGYu(=rtkwVBeoOxc{kPBg|0ii170k7dTWv#;gFo0_+)=jh z2cN`R^Zkkkvhp`Lnld^Um&liyp^}AS+|xu^o9MqrrQP37Bsj;&zD&Kj8Ca|Tdu{#S z-r0Vx|9g_QRIP_1UZTtXL!5u7wQc;buG0%D>K7&FQz0(>5DW)p)X*+hD#~H5CaCMR zTp^4yH6MxVvdpRYwWXH^^ySY*#etkC)AMv8q^dSg9#HOSJX=Ri|A+ zHV47&NW&7ODD5xK1YYpr?BYxdiQWsyUrYINa0W4z$_pk`ckN%tz88#slU@6_=$KBr z=1=ie&3Ly$G$PSumfD}MQ{J0EU8UZeU_>sxH-S#fXCdjtd-K2E3;04L6`6vg4~NPN wQYn7HNP7W|k#rrn6u)@EOhqEb?sI13xjnb%_E&EI7XSeN|9oN`5&&8N0C)jzEC2ui diff --git a/charts/ai-stack/charts/text-embeddings-inference-0.1.3.tgz b/charts/ai-stack/charts/text-embeddings-inference-0.1.3.tgz new file mode 100644 index 0000000000000000000000000000000000000000..7f440ad8e5840469c1793da8f335f3bebabd2feb GIT binary patch literal 4742 zcmV;15_#<(iwG0|00000|0w_~VMtOiV@ORlOnEsqVl!4SWK%V1T2nbTPgYhoO;>Dc zVQyr3R8em|NM&qo0PH;dQyaOG`}6!2eTG;0xOi;ymE6?jUGadoOKn0ZAbGc!N)dUc zZEMj;vy#T(Wx2ooO459Lj16Sj-7EA1cxGDNt(N*jQcD`IbQj|xMiJ#>)unud5_yQd zy$O-ppOKh-_rTKc_xn3rTlRmy-*5i!Z}(q+H`v*m(UN^dCxi zm69q=JB&Mt+FRN!?%Bej1Q3`4IA?cXa9w#vdw;)g=l_6SM6Ri^!^m=2eC+W}+Mck|4>n+BiX9)&Cl7!Ka7*TlB zTuOa^;BR_=bT{6+EY|-iVJWI_VE~rs|Mu&hK~w*?UT;0=|6`Oj*vAn`nFiP2R;w2d z3g26Uvk6r|6%hDo_x-!>NXVFIjS-9}vjF=TG9nSCL{c(js6Y!CA|ym9jDT`2U?x&S zCQca9sC>_pXmx8(q+ACu@VpDkqX71;eTk84&r@0wjpJDW*Eb%(8c4wy<>QY@L^KBW z6+ld`PE$EXgQR%#k&`K*%y5&xcPf2SMd5igCS!|9Vj>jPLe2shPeSQav7)H}NK(d* z1*73CfWy&|(8m&$X@Md8VTw}H$OvVEVCjJ-W4N3Mg%D+ZLEUF(XG@#xdtiVA=yW_U z6md+9j6Qdo+%S^zaDuY)#ene<9XsiqO%RN^1TnJsV-X=Uy^|{RVUKXrO$6S5*gtr8 zez*@r0i(+Ft>EyVx%Hfk{8034UG;Zh^aA0lo*-ul%HCLGcSsa|^)1E2k?CqM9Y_T) zFuwxiQz`{FABuqjmm*~mXmWv&NDMKuV-7rUoF486@Q>Zy!`^U=T}I>>yU4rKfxqo} z$fp5({$h!qVAdHyVeu<{XPA#fs22BOFJ$zb$Z=}8Q($p+!TFi@yZ?Q@_wMlE=4&p|fOtOfYRK$HPCxMo}KLOHGxMdW1Vc|9jA<)Vkl87+Za4SYL6vwnqWvr6ct=fP)|?-fea3a0|Yg(@*X0D5{bshgX~uT zTBc|b?WS79MAMKkHiOt!Byd_I`Aos?@u8_3nT{q*{g($oOiicHB{t55wjR`41rkN( zpBak{=1lz(wov)z2yQkh8_W6F<3fW%4TMKo%dBe26kh>xh^T@wax|tTf>fCp#URcl zT^K13vfeZjPeioa;4Tr-J2FJ(p3LJZhN+}_wkNn5YDF7H>U$~DB!G>6zi)c49V{dX z8B#_yHNlG;G?5fZ{<{mi@7_5(h$Q;J+3Z9J{ZGnJ&6LKtB6XSaU3Db50cgJds89wl z$XKz`G!&e9++(TIC=ZW~SrbwR@TTv1l#eAU%M@~>xKRKj!j!=pGNRN`E~vInG?XvW zAxe(M^i$Ex@cFiG0DMgORV$!os!KwP+cd)9p9rNbCq^LVA#hf+i&rF082U_vgxT)^ z3DJ`b*i|qu0_YWQ9LSk%`=P0BEP&-c)2GmghN;5TKo^u%Sl8ql>8@rf>#LH@wVZSt zm!8BtTFpnnzYtQDTHTXqOg{3+4r?tyS)OKv*C=Y+@va3hBvS-!95yiyI}}`nRHTlr za3YNAScg9`WKjCfyA!4aP;N9vp)#!U(EXQMnPFr6LB)bAxTJaljB3rYp_Q}p3RD_S z4EgtzQ`4P(?i3;cmxR|^QmK}5*IMn=Q7|ShDIZ(xjB*1)qMuV`zsH6E#}Jhwa`wu$ zUt%n5>k-0KvKb5|v9cLyl<=$+^)o+18q>0m!X&j?5$8b!#x@ujY`l3-vv+(-BTDQv zVr;>)rvH+ndMGB3(J69N>R5`Q)kx#YzDMnbZ#HlzNSL0uHjkZ0@xy=Ps|SZx&& z6BV^8cue_;i`A5CaZIi%FZz8OqsTGpz2lD`HD&Zyt3bynL!(S4GJDf^A(#bwZ{@KV z(p!VwD5B;IVK5aejZv8aXnIzpI!SdUOf5fN2ct+?>aRbk(WL1sh znS07UiNq1lh0w;)d*goY#FneEfH&(mk8MYFdZ@$RNQjR8k{kQXj(c20c!~@|Eu?cj zS}^0zoXP$C#q-F>(sqG!BmQ3;1QpSF@94wX!KtsW^gZVoOXh!@TbupH{O|Sar}dx5 zDFYwAM`vRz%Ny|Vr8M2>efOjUad6nX!PI8w()`A0w4J<$j?OPx1-Wr2+eQgM>H|uI*S>LrzQL+K_rLf&W8$Wh2f4~% zqC8}2gfKVfE9dBW=-L4vZf;&Qm_0mhuxbdYdofHk#+Fy5iB6SIqR4a(+IQK*O~*12 zPK52wpx0Z^*a+4O;VtNgcY;L!Aj||G^0vMJ0Ar#8IMfi6nVUco7~!SyR;kWcH6{pE zlyG>QtxOb)1AZkEgr7tTA>nXIbT|R36}Wa*730~RJ6%mf=w9BdE1#8Jd3td2>2R;5 zH!b>A__z-P(Cy}40Xo;$o$KpNYoAjd;T7ZqfmNiOt1R?iSf%u>W;*@r+_VgjvT1=~ zzR~Np^$Rt(n6Ip$y2l^(&yRNBA2bA*h-g)9V9+5+;@9UWrsCVxgj)*s)jS@`l{Nx= z+oW&gwonse)FdLBSlpR#U32$79G&eR9vz&tnX5!ZtF?JOms+dw$~pq2<)tuX#cOBJ ziXQKLqKfLg;|CkB{l4G#2f>^En|?NvcMF9T&t&F&Ip-^JY`Ex-guEm&s<3Zp1nYI7 zR6WBV?Ux^`tP=m7Pmm=jm9LX~Z3Qfg|8}-F>ha%3e`jOoDgJwma(&%<=^b1pcEzBv zxMt`3zW1`1*;_k@S;3-pOL)63;k&J5YrJx^TwTS4-^^Twhp@A0f719g9gXM}bh@2J zz~)(g_uNt*DJU2>HG^ML!sv)%WDJIFiSPXj9c~M+4F%IG1w#ypu`f!*2tO8<*R_8{ zkwprKM7Jt{*(xPf@O(J4ve`d6HLxZIFsAQ??;VanIs@d86kf@#;=9F04VRQL6LX}> z@Tp9kk}{TYdk0aMo;eqHB_MCE6X#M~_43*yj{JEOCAfkI3!Kq=J>3= zyd!goq+E}n^EcJ~o9Z-hIijl%xb~m5VOZ&3qea=yu<2Xd$Ju~!P>c+b-Kn2#y|R;= zjjPJt{m%A^;5U$%FyjR~|K5SldFSqGCgNCd$FsT%&#s1JdV(zW)ud`FahYIti+wcnZ9d{Ew)9ObF<0d`_$3t@8-kk05))3w7%+I!f z8t&=&-R40r7GdXADOBuHPN$Ron46olBABx|zmNZ4CH{+wWz73!gDlJc7z`TuUmJtX zt*7|!QA#!cizJEaO$S-(MP>4BUYH@6&n|;vGxR>I2p(j1&TU6nm0ga56^8vc;FL$m zHEbDdCj1Jr6+Y^=d~?1ldl}WWNt@o0ZCF%VSxrH4U`57B!KfBLk(iYVoB=d>s;xHy zbzh|uPp+p3Dz<`(@b;(Dq< zE0d)_8wm{U+?Q)U)s6MSI#dJHiqvo6Ws#~aWM;5Y$Lx~0pi@z8`^qnqy5Qy}nER~B z7=CNcXlg-Yr%C0wlIk^wugn9h^H(HpRcd7K>VU|n^J1w)H^`^;3ax@OP>Y4tGW=R; zxim6A%fo5{7uiu+epl^dk?T}zZw*}~xL(SdT~-WQ$=e<5I_cWlV~vI8igLYPB83*A zU;&)%9ap~1ZOh*(`x^8uy)eIHe=FKL_^o)0?B}H@^W2fe*yikEZR@)RTHE4YNP7vb zTGuZiUZI=s_CLh*&QYmuua{u8P4{m~FW;-LxZ-^G{+rUNBngyI)y#qWQTwCA*{5>H zvda8#l8^@-16VTu+vsm>&*gt?4xZ+Jk5L+Ke!+~XHcKo)dee<;viO6L^jG6**|CUr zGYFJ_?ir)y@ysTno#4pfZkrFA_jAV)tQ&Ypi)x8xDGZnU`B?H;f&a%`YJ4hx!m^70&y()%8v`uy|67Cp=G^}O=Ejr%e~hvu zlQZ8_SvT(MDBJYCqqi$?sA*_s;niHw+9bTPfkSvS$5U~%1fFxD;km+iigHiH36Th$ zzrP*$gE!rN2mHOt(HZ~8bcp%+x$mjYe!h57uG40##?L22{fM(Ux|Ow1=-hI0rBgw< zer{T+P~RWh;`T2|Xr&`)6U~3DDw=E$v5bQ_>PsOnjAOZYUX z&}>%0D~;UzRCQP<6c@W4Ix)6~q~-Yj=Fw)`I&#Zcu#j`h?h7X0^P3EfU63XE^DxzM z#51&e<$uK=H3GE zG#;XK^>e2(8|@(3Or<>#p3r8a!q-+%$S~L3;(amD)E0Fr2S6ue}8AQng7w> z+3Y{X|Bq2>_y6RnA6c&2pL_LA7cOMsNsr1_VK+PEx^x53Eu9>fCt@>G-m)K9+jOkw zczlC|j;%+rt#{D>EL-pHW?-rQZ#VA$+1S|VKdt{iN?9pkvN_#q8j1}3-uB{_w3Xj^ zCe~>0H=K|ax1ZEybS5s4x0#`Wg}mP5L|Loozec6q-)<;4$Iu>QU)>BW)&J)GUmKfS zTbob%{}`oJt&c_2qRXB8IR9>A*mSAThYJ!Zxn2DiFYNmYr3M4Y3=@jicPvt$~k+%jM$L@xS=ZVA-y~4;jkF0l(pQ&>_tGDd3-6_`WAj@`I`&@vueS!Dh@>J_aJYY7iT)2ZH=6fvdxY!r!ux)opB)^&`11U|ckRBIzc1MLytOqrMV%(@ z{^64%k=ygWe*HQmYGThB+G{)QrGk`?Bng>Fqi%LK9z0D0}XqfqcKYrM8`GYw(fNMSP{a%9*7O<ViW-MfoU5aXiip*B1NXGvw*xaY`RG!LH U`7@ON3jhHB|DN}MhX7e!8<^TWy literal 0 HcmV?d00001 diff --git a/charts/ai-stack/charts/text-generation-inference-0.1.1.tgz b/charts/ai-stack/charts/text-generation-inference-0.1.1.tgz deleted file mode 100644 index ed6b639e447dfd961d2f821245a845238eeea08b..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 4285 zcmV;u5JK-CiwG0|00000|0w_~VMtOiV@ORlOnEsqVl!4SWK%V1T2nbTPgYhoO;>Dc zVQyr3R8em|NM&qo0PH;dQyaOG`FZ||z6r1Laq-wDK=P(4cf|oOOKk!!AbGd7wMEG@ zZCi^*nw2yLFX8_7D@pTh8ym>7`(B|Rz}B?7TP^j6T0Pcyr8{HfD2b+mcPJmBL>^&x zZ$hLFW+Y+H9@u)lUT%l_~6dhP$c&7GZR{jHs??al4}+wHAqz5dST_Pb}$dnn;` zTBbCS&w3B0)t=nHNFyozic(R*Lzr%QBu&e&n?XP5doij=(p1~7UHAc60+HDoFcK1C zOqrNbK87>A((tj|NN`weBp6ANzz^AYY{33OBJ?;(FodOB&(pIMLm+9&Xk?#x(}Jm< zW$MqC+P_a*uK!cQGF0Eg0Ibme?d^H}-`?DQ(*MV3&tV@&Bx4%fdRwhtx+wzhIh;+X z0;+((PrIK#bw)xaL~D#;M41KH$A}S$FeQ?bAwvaPzz`uNN?{C?YXLKn88S)Ah(;B7 zoX1J5_%v}nHd~d25lqo&NcD9e($J&kv6VU(U|Yj(_x-OpAnQ8WF~3kl29)P8%d&DA*kwnz1o*ZG`;a z9sn^Tol;fUI2YP3lvPa<$L62ea4qJ{_zJevyR!*ese%|S8fB1W3Ihv!I07y-DAYiB zoX^beZ<*m6APx~#knbLhAyXz$Fo+9DmzKhVd^wH8QxWgBxJyO+i42jsZ|3VMMwz5~ zwkNpRq~#n&>Z24{8p39;*E6fP7%UBUXWhIr6*B|Oh#C3_DG4HxbjKDvpZaeZs)u6o7@Z7;0fg?E?`n_#tFHqb@X~R zP>^HPdxI}uG-dR6t3U&kkx?cS9=-3mILLy1w(?jG={<+tIHu+aVK5aeOHi2&XjWEa zI?Z$~Rx`>#xrGkA9N21W6@`q1@Ql!%;)b46$+{XRGxsfjBvMDb5W*skJ{$LQC$`*( zCA?X`Ij{@mcTq>(kr2LpQW*Q(j(c3hc!~@oEu?cjTChAAa@ajGvb0_F`e#S|Ra+jp zmC!6AWj@%kVrH zQwaHqLxtY;bqDAOg0C(|P{a39bp{3j8Ax<3LF5 zmn`QoSzrP(hYzoey@sRX{e$zt@yXeTjhDu+Mw-DGHFP@0l&F+M2!@dpWX6pLM`iEL z4Ri$jssuMoe(R4;tivZk;{PGc z#69x1wEzHPqCz;-kdPT@a)Cf#gqOxqX1d5~Oc3fQ;c$>=Cd%YMPzyrgCy_x!I9w7P zO@L|zZk~0;cyZ@NSJMbOm-kxA7u8ap9-MqV+*`1k7X3PW+=l_^bPBHk{`IwgeVuFV zOUh%sf?^}Env@Hbh2ATxl!4Vur+@y zCBRg~>uLi7pQLHfJRX^WAJ!9YCD=Ffcqmue2=GIjzLDEfO-xXem}p{g=fZW<-8()y z+dVuwI9X(_QW38==Z!*Y3yoL45GXA#r70`Bojog8-2X}y)y2a1H{S)lpcnMR_r3SM zJc-~Eg*DG)j++JNYjJG2=!}HCBr>kCZ)k)YO`+61!=LS!AFHhs|D8{er6^UP(|cV7 ztcw43wl|yc-)3)Td+RCwdyIB{-F@vHT%|Ty(aP)DR72ps?&kK^9-r2*Xq^h)rbGgF zm28byVV3I&RQP6&Q9Od3xAr4VPP5U7UV-27TLGJA`Q39_L{d^PZfXX1O zJCnfsCpz2~UK5Q#1!fq8VKZto!K$}<<@t_9@n6m=oR zrO(${0po4+&l`3&;fM8?xZ<&ti$l`(ZH~`I=N*|#CFObq{@+yRZ_01sazxkPaEm`S zwqb33jTYrs)n;w&8s{6vK`}B!cBgf=nnsn_v!ZpLreA0nqYn>4)&%S)hNe8tZmkVaMyhk(7<|D4M z#=yi9b3?wtZ<)~864X4Fgm5y(xHFuEji4mItXU}NB6V~RQMc#aS;&;jYuz;}U4W>F zO2fH;>oyH(JC?;4Mt7Tb{p#yznH_9`1^Mk$%RRlk+d1gfGVHuAg_=Do==k}ExwFYa z1amg$kMaNO#D8&_LA_r!$cp%HYx~{XR{YoB>h+)EzsG3x`Y)2EsyprHr5Clsx9Koj zusB_Y#=DH+w`Cz7yAfpdU1PmO#dKw+dEo`mRV@~I|)wPi5xv3@JsCity*i&})$D2o!0<=EzIN8^UN0ou5UUP^lft%d~RF@KF*=4(W^ZpQ37CQy;0$KfZcZ<>~UQ;mZk8KjLhTZY>uE{w*&}_%)Op=Vq1)_5HCepZ|)2MmmB; zqWSx}qRH=&syK+Fz7+DpIF^g|?y9WcD8O1oZtJ^}8=@vPn(ZNYrIDMDstN0a;$pW$ zC&tAgX|=zyiWIe3H491z({*4^tgSJV(1%y=zp@fX&gI&x$WG zJ-W!@>iP=g)xpbPix-btXYqVgtw>z3WJafj_vwd(Dzf{n9! zDetm{aBWDU3*>RwNC%NPt@N*5e|7TrD_34>xzx#^dKoh}Qx4pQfY~c?+iM8hY9S>yX4{tPObS5s4 zFET?V3&ps{iL%zwe~n7Jznw^Mj*)$XdVMpnQvY|_`u}$8-BbPFqqK!;JrMB%UH0$e z{5!2}<9~OZo>Ni3C^?@9ap8wxI4GlrcDYhf4s$t1U9aT|VVJ4eP+XN|PQ|Y+y)d9J zekm#rV_S^RT|IXIV z+b8{hjP@J`L~E4pr=Z+&!{r1y3^U4N%EyqB=z@$h9yW*+Mk&TykP(I z{8S5x-gC%bOZmEY3Ne++3&vD;?O(^f7Yu)wUHiA_n2fvTPw`bvdAC9|B+*5d+Mlme z-s?bJrrzsdNG`nBflkb4A?etA{eRwb_(~)dnS#Up1LXy&6u)Amy@19@x(-~5U%gSl|Q09pV5Qdx6P diff --git a/charts/ai-stack/charts/text-generation-inference-0.1.3.tgz b/charts/ai-stack/charts/text-generation-inference-0.1.3.tgz new file mode 100644 index 0000000000000000000000000000000000000000..91b386c78eec7d76c3b2a17b6c3dd81dc3666270 GIT binary patch literal 4762 zcmV;L5@qcliwG0|00000|0w_~VMtOiV@ORlOnEsqVl!4SWK%V1T2nbTPgYhoO;>Dc zVQyr3R8em|NM&qo0PH;dQzN&M`FZ||KEtd1xb@iPYxhmvzAFxR8!Eft0(Re}QYnyU z+O~p5nn)Uh!*YN7m8AK$jSXx_@(TR`o|#s6tEFzWS}ke3*6k5;ltfd(+msJcA`h{% zHzrd1Qxdc99$C8GZg*#E%l_|nyUqXI?QZwG-qz06_SSZ9bL;JQ-QLc|_QrS6eJtTs zN~$!G-*q2NtJ%1}NFfRRf>Kez1DI@hBuR?L4Zr92ya-h&X`=0`UHBeZ451ksFccCZ zOqiHbK7up6*6^ViNN|`BBp6B&!}sZEWWfGOLi8?idL?9}0K<82f zJYB!%Z+d@p|2?)W*8d4%DXMQ_0G8Ew15FZLX^S?DAxj}A~j^< zgb|I(_dJPK#r8zXbpSojyQDk{VBgx87`gU5r6tigng(!l>jA8R6pT?m`kX{WV_;ta z#N_%kl_NAriZ`D*nGnhhH~D*~*(X&Lo=0OcvX~?$LQyT`G=R}Kls*+JS`2_BWvnk4 z4W|Jd4v&QHOH`%>hV1bKrKFJ&${4}Y15HM7H5LjX%KC!3&(6-4Hre;U00+=&d0r^u zm>3!T)M|3WNXo-8%GS>Yj1TF^N#|^gV5}yHp~WAI2$|`fRG|-hgqv<6@acH};N$t> zJ`e?rD$}=u!++&QbUgG!(Xn;aKY-Cogo{z4H!eU(xHwLb?K46U|V0;dUvbVyOb)fn{{ zB@oEqfH*)U7L7 z!qk6z0L0XE`d?z>TxirjQ$5 zjsh4GrVQ4Q5v7iDLCxz#L-{ftpyX(#3Mx7oKHt_2fR8A@o(rg%YLn37HjOa&$3kh# zi4ll-2%ME|<28vBhCUM^VfH&fLi9KTb`{Kv06N7R2XbcHerT#2lV!Qj^eHr=VX81b z&<14{)-}0Cx~-YY`l@7eEhjyXOHX3%H1& z{82IL3a+Rg1EX5AY-r`IyaAPlV?+KE<L?f!SCo$| zc1F1YA<-|XvfpDvfMbYC5jlNh+b=N|w)F^MD%lhUl33XcHA;9p%Eo^^)a&GS<`<_Q9Txu$LIt(D%F=_U^UWAZXZy);hPQI zF%qW7?u}JX1LPTdKp$AwGge!L#CTD26+EW=#QAp0wKyi%l^5Nv^=ae?^kIWoVSicyjN$&SkS;pR7C^WN2wSNBfUnpgfn~wJdgXi`7}@==kj5 z)YsSgfi#w^|2MZboAJN5Z+Cjn>;I=HJs&=xn=>m>F8F-%5e8E;b@R-_RS4ONQw845 zO&jPC{4Xv>lsjaZ@rT=63n2*~A*>r;27>o9(ALK>umB~rZ+$NJ)=V%rH-^x9v#w?a zM%~#*wmk;r90C#vv;yI8d+olPNSbLcukmTtVwdMA#Qnw+fasN7pxA zuEU4dW)g&>42w`T;U&d(irAP~WxV?SVVD_-zVAT*( z4`P^Vj4iK96P+rbM3LznwC}Qq+m>Y@91Gi>L8r5xu@S5n!duV}9|ej2hcM$z%Degk z0E~$W;7~(MrY=T6V2D@7`$%;j)fyvIQNm$Ai%b>4A;03;!;d0`kZ`ynIvfMl3S2v@ zit*y!ovtP!w67l2l`qP!JUux1a=16AH!b>A_;?5d&~E3m0<>;!S~oYD*1n`X!fVI} z0;@h_QK&yRLL9W(@(h-g)9 zV9+8-;@8)lrsDh6gj)*s%`6_ul{Nx=-=uHkwonse)FdLBSlpR#U32%2kIr@vj}A`e znX5!ZtF?JOm)cz8m30J4%S&O(ir3Db6+PbiLKW3{$M-hg`dz>4_kwrbcik*9;{wH% znaQl-bIw=d*l^Jv3VB6jRAJxH2-fRDsm=_4^t}93WflMLe2gqXseGM0Xe(%$|F^Tf zQTP8gx;s1FXaDah%FRvZwRdox*a%P~SZd=pzW2J5*;~6NUBRNYOL!Y+@?9!{HD0+{ zu12Ndt67`!5Oy~0Pa2=5!y&zfR=d@3*gVVco(s*Af`XZ*rtoV@7#&iKjKQ!i@x6bc z!)@WUp$Ww)`_;R+_LrM|AZ8H~(jC7*_h% zXi=6RVEWefaW-Ha6e9y<_v&X`uk7Sz`hf;lQz94+kmRH zvYLYAz>18cf>AAgBrz)$I0I<%REswPwQcw!CRPX=;;AG9i}ZD09iQXkyj1~Z>E8Nt`)il*i?wwhG>l~lhOd}SVBoxdV+uTmp> zR|iBsnH5XLyFoswSC}g}1GQLKbB5nsS}u*y&r7_~pzoqaC%EUT>l#tC`UF_0zezm4w3_H6#g=JWdRDN19S zU$A1TtrAO+&SWE7EPgK}{mo3ZtS_S73`O%roWAN&(Mmcdf>4ZsI zym17o{(wVOp;!4vCMd}WD<2m&c{R=(v*J=o+>vSeKw-FC-lvks3j9B1sPVb{3Ck+; zf1Y&rP#<8){J+)fZqDxiZ#~cdPf?a+a^`y~>t^~o$~JxPIolOD)Fd>k@MEJ-n(|U1^!;;D3t$0I>7w=+BnTZx52>yDF1tqRKZbJI$N`r+6Xw|_}OD;>f-(foZ?(PVpwr60sm zUkQ0>CYH;0ZmYCcOTe2)ZtI(p8=xi?n$0SBt&y9bst)Uf;(WJ5C&u|MX*s^Xxwknl zjyz{9Sjd^M`+~*y>?T8F7i5Y4JWh2S@eJ)=d4R7P0iB^ayDPH5^yoZ>ud6+fWrr_< z%}?_+;ucx0N~XChZOiMtu;ZLye0k2tR4Sk6x|OvDnKE43h8lDEnM6a$=CRMPXtN~? zb{i)Y7iH3y?RJN`>bddt+WF|oPd45$TGsC|T*^`&natTZtEO@<>Ihc`B)mi(1&wg+ zGP}1Dr?XMu$^qAUS!6is#h#O!c?-bPc!1K?&nLy1>eV!Yxm+Esz(WRF1izP%Ys!1h zis^Z^@NZRC@&9ut?RWD3yE~iB{EzO=&h!0GPf}|4Kjo<(S+3fjJ9?*!DP-YEkIGhI zJ3F+zbOX?ZPWt5u=ggGP*$=F3I@WVMzCl9A)|1%Qd+2|bt#^MjuvGuI8}~nLY;0^k z$N!(Ctdua>Ty8ZDMF#$0dvQnF%I~}qYqa+pF35`8Z0a&P6PL*6nW2J(yx!AzS*z&3 zMy1`~b|^T<&|XWhx*1ri|2s|n-`sk;{jC2_QRb?3Uqo|sx%H6Azug!%t#7W=Gb-B3 zj~tAJxNHSrI4Hb^X1ZFQI&?KcUCreSV34ZmKwKATZuxC%FAV65pY!YtIa223Lu7Nu z`BsZxq8XbyPcS>e3CeG62NvtUZ^TGPTu6K*jb-}3z1iIV-`U!E`>g*@QP!YOv_|Rf zS99GBS7YQbNGXdbA3;LGOEN-LT>hxi#Cq1C#>g0qm>9UEX39rzKq4cWPSD1AD(?x8 zyfxrBayLx8Oe7BJHAZei{*PBa9CJ1W!EH^$5+o??-A%sd@1LHZY9Y~EgX~z+m%USn zs8pUmqPk=MI`%z(@SE(|zxj*tsAK-*k7~j@C87ZdFVnjf1*MWVdt+98Ck6VCkMOx zpAP&udNhqC`rq5!Xx{(2z0-ZZ|Mf}A+8q}td%G|$uY1-ayY1N?;reOeea|n?J{-RK z`Q<~eTz)lsU$pOeYin?dI!)aD(B;`X%LMGCvo!vs0 z^HYAI!q1qa!W~ak6)dT{687Ta!t+iM;iuwL*|yx#uos4!2m9yT0Cis3J4f=o?ns1b zaW|lA&mmWu*xP5VKyA9Y=bZ_l?nC9&sI`#hv39`tLXYT0(2zh;c|>Q0aL2W^ww-Hh z@R`#^e5Jg~nWYZp(Xb{X73dLl=+DN*9YWb{dkS)Nl_S`ph!er>HGxDa5mI~AW+8*@ oQd}ccWVS*@GX7t|=02C_@?4(FpP~GJ00030{~+GWbO2-k06nv9ApigX literal 0 HcmV?d00001 diff --git a/charts/ai-stack/templates/_helpers.tpl b/charts/ai-stack/templates/_helpers.tpl new file mode 100644 index 0000000..7fcc456 --- /dev/null +++ b/charts/ai-stack/templates/_helpers.tpl @@ -0,0 +1,62 @@ +{{/* +Expand the name of the chart. +*/}} +{{- define "ai-stack.name" -}} +{{- default .Chart.Name .Values.nameOverride | trunc 63 | trimSuffix "-" }} +{{- end }} + +{{/* +Create a default fully qualified app name. +We truncate at 63 chars because some Kubernetes name fields are limited to this (by the DNS naming spec). +If release name contains chart name it will be used as a full name. +*/}} +{{- define "ai-stack.fullname" -}} +{{- if .Values.fullnameOverride }} +{{- .Values.fullnameOverride | trunc 63 | trimSuffix "-" }} +{{- else }} +{{- $name := default .Chart.Name .Values.nameOverride }} +{{- if contains $name .Release.Name }} +{{- .Release.Name | trunc 63 | trimSuffix "-" }} +{{- else }} +{{- printf "%s-%s" .Release.Name $name | trunc 63 | trimSuffix "-" }} +{{- end }} +{{- end }} +{{- end }} + +{{/* +Create chart name and version as used by the chart label. +*/}} +{{- define "ai-stack.chart" -}} +{{- printf "%s-%s" .Chart.Name .Chart.Version | replace "+" "_" | trunc 63 | trimSuffix "-" }} +{{- end }} + +{{/* +Common labels +*/}} +{{- define "ai-stack.labels" -}} +helm.sh/chart: {{ include "ai-stack.chart" . }} +{{ include "ai-stack.selectorLabels" . }} +{{- if .Chart.AppVersion }} +app.kubernetes.io/version: {{ .Chart.AppVersion | quote }} +{{- end }} +app.kubernetes.io/managed-by: {{ .Release.Service }} +{{- end }} + +{{/* +Selector labels +*/}} +{{- define "ai-stack.selectorLabels" -}} +app.kubernetes.io/name: {{ include "ai-stack.name" . }} +app.kubernetes.io/instance: {{ .Release.Name }} +{{- end }} + +{{/* +Create the name of the service account to use +*/}} +{{- define "ai-stack.serviceAccountName" -}} +{{- if .Values.serviceAccount.create }} +{{- default (include "ai-stack.fullname" .) .Values.serviceAccount.name }} +{{- else }} +{{- default "default" .Values.serviceAccount.name }} +{{- end }} +{{- end }} diff --git a/charts/ai-stack/templates/pvc.yaml b/charts/ai-stack/templates/pvc.yaml new file mode 100644 index 0000000..4e87283 --- /dev/null +++ b/charts/ai-stack/templates/pvc.yaml @@ -0,0 +1,24 @@ +{{- if .Values.huggingface.cache.enabled }} +{{- if not .Values.huggingface.cache.existingClaim}} +apiVersion: v1 +kind: PersistentVolumeClaim +metadata: + name: {{ .Values.huggingface.cache.persistentVolumeClaim.name }} + labels: + {{- include "ai-stack.labels" . | nindent 4 }} + {{- with .Values.huggingface.cache.persistentVolumeClaim.labels }} + {{- toYaml . | nindent 4 }} + {{- end }} + annotations: + {{- with .Values.huggingface.cache.persistentVolumeClaim.annotations }} + {{- toYaml . | nindent 4 }} + {{- end }} +spec: + storageClassName: {{ .Values.huggingface.cache.persistentVolumeClaim.storageClassName }} + accessModes: + {{- toYaml .Values.huggingface.cache.persistentVolumeClaim.accessModes | nindent 4 }} + resources: + requests: + storage: {{ .Values.huggingface.cache.persistentVolumeClaim.size }} +{{- end }} +{{- end }} \ No newline at end of file diff --git a/charts/ai-stack/values.yaml b/charts/ai-stack/values.yaml index d55049f..ef14643 100644 --- a/charts/ai-stack/values.yaml +++ b/charts/ai-stack/values.yaml @@ -2,7 +2,8 @@ # This is a YAML-formatted file. # Declare variables to be passed into your templates. -# Values for the text-generation-inference chart +# Values for tgi: the text-generation-inference chart +# Reference: https://artifacthub.io/packages/helm/infracloud-charts/text-generation-inference?modal=values tei: enabled: true @@ -14,6 +15,11 @@ tei: value: "1024" - name: RUST_BACKTRACE value: "full" + - name: HF_API_TOKEN + valueFrom: + secretKeyRef: + name: hf-api-token + key: HF_API_TOKEN resources: limits: @@ -28,7 +34,18 @@ tei: type: LoadBalancer port: 80 -# Values for the text-embeddings-inference chart + volumeMounts: + - name: hf-cache + mountPath: /data + + volumes: + - name: hf-cache + persistentVolumeClaim: + claimName: hf-cache + + +# Values for tei: the text-embeddings-inference chart +# Reference: https://artifacthub.io/packages/helm/infracloud-charts/text-embeddings-inference?modal=values tgi: enabled: true @@ -40,6 +57,11 @@ tgi: value: "6144" - name: MAX_TOTAL_TOKENS value: "8192" + - name: HF_API_TOKEN + valueFrom: + secretKeyRef: + name: hf-api-token + key: HF_API_TOKEN resources: limits: @@ -52,4 +74,91 @@ tgi: service: type: LoadBalancer - port: 80 \ No newline at end of file + port: 80 + + volumeMounts: + - name: hf-cache + mountPath: /data + + volumes: + - name: hf-cache + persistentVolumeClaim: + claimName: hf-cache + - name: shm + emptyDir: + medium: Memory + sizeLimit: "1Gi" + + +# Values for vector: the chromadb chart +# Reference: https://artifacthub.io/packages/helm/chromadb-helm/chromadb?modal=values +vectordb: + enabled: true + + service: + type: LoadBalancer + +huggingface: + + cache: + enabled: true + + existingClaim: "" + + persistentVolumeClaim: + ## Ref: http://kubernetes.io/docs/user-guide/persistent-volum + accessModes: + - ReadWriteMany + + name: "hf-cache" + + labels: {} + + annotations: + nfs.io/storage-path: "hf/hub" + + storageClassName: "controller-nfs" + + size: "50Gi" + + +# Values for reranker: the text-generation-inference chart +# Reference: https://artifacthub.io/packages/helm/infracloud-charts/text-generation-inference?modal=values +reranker: + enabled: true + + config: + modelID: "BAAI/bge-reranker-large" + + env: + - name: MAX_CLIENT_BATCH_SIZE + value: "1024" + - name: RUST_BACKTRACE + value: "full" + - name: HF_API_TOKEN + valueFrom: + secretKeyRef: + name: hf-api-token + key: HF_API_TOKEN + + resources: + limits: + nvidia.com/gpu: 1 + requests: + nvidia.com/gpu: 1 + + strategy: + type: Recreate + + service: + type: LoadBalancer + port: 80 + + volumeMounts: + - name: hf-cache + mountPath: /data + + volumes: + - name: hf-cache + persistentVolumeClaim: + claimName: hf-cache \ No newline at end of file