From 3791ad219323389106dc3fd80814eb5bbb7b80de Mon Sep 17 00:00:00 2001 From: HanishKVC Date: Tue, 25 Jun 2024 16:57:35 +0530 Subject: [PATCH 1/5] SimpleChat v3.1: Boolean chat request options in Settings UI, cache_prompt (#7950) * SimpleChat: Allow for chat req bool options to be user controlled * SimpleChat: Allow user to control cache_prompt flag in request * SimpleChat: Add sample GUI images to readme file Show the chat screen and the settings screen * SimpleChat:Readme: Add quickstart block, title to image, cleanup * SimpleChat: RePosition contents of the Info and Settings UI Make it more logically structured and flow through. * SimpleChat: Rename to apiRequestOptions from chatRequestOptions So that it is not wrongly assumed that these request options are used only for chat/completions endpoint. Rather these are used for both the end points, so rename to match semantic better. * SimpleChat: Update image included with readme wrt settings ui * SimpleChat:ReadMe: Switch to webp screen image to reduce size --- examples/server/public_simplechat/readme.md | 37 +++++--- .../server/public_simplechat/simplechat.js | 79 ++++++++++-------- .../public_simplechat/simplechat_screens.webp | Bin 0 -> 21376 bytes 3 files changed, 68 insertions(+), 48 deletions(-) create mode 100644 examples/server/public_simplechat/simplechat_screens.webp diff --git a/examples/server/public_simplechat/readme.md b/examples/server/public_simplechat/readme.md index 2dc17782552569..21410199f60169 100644 --- a/examples/server/public_simplechat/readme.md +++ b/examples/server/public_simplechat/readme.md @@ -3,6 +3,13 @@ by Humans for All. +## quickstart + +To run from the build dir + +bin/llama-server -m path/model.gguf --path ../examples/server/public_simplechat + +Continue reading for the details. ## overview @@ -14,6 +21,8 @@ own system prompts. This allows seeing the generated text / ai-model response in oneshot at the end, after it is fully generated, or potentially as it is being generated, in a streamed manner from the server/ai-model. +![Chat and Settings screens](./simplechat_screens.webp "Chat and Settings screens") + Auto saves the chat session locally as and when the chat is progressing and inturn at a later time when you open SimpleChat, option is provided to restore the old chat session, if a matching one exists. @@ -170,17 +179,23 @@ It is attached to the document object. Some of these can also be updated using t The histogram/freq based trimming logic is currently tuned for english language wrt its is-it-a-alpabetic|numeral-char regex match logic. - chatRequestOptions - maintains the list of options/fields to send along with chat request, + apiRequestOptions - maintains the list of options/fields to send along with api request, irrespective of whether /chat/completions or /completions endpoint. If you want to add additional options/fields to send to the server/ai-model, and or modify the existing options value or remove them, for now you can update this global var using browser's development-tools/console. - For string and numeric fields in chatRequestOptions, including even those added by a user - at runtime by directly modifying gMe.chatRequestOptions, setting ui entries will be auto + For string, numeric and boolean fields in apiRequestOptions, including even those added by a + user at runtime by directly modifying gMe.apiRequestOptions, setting ui entries will be auto created. 
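    For example, assigning a new numeric field (say a hypothetical top_k) to
    gMe.apiRequestOptions from the browser's devel-tools/console is enough for a matching
    number entry to be auto created the next time the settings ui is shown.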
+ cache_prompt option supported by example/server is allowed to be controlled by user, so that + any caching supported wrt system-prompt and chat history, if usable can get used. When chat + history sliding window is enabled, cache_prompt logic may or may not kick in at the backend + wrt same, based on aspects related to model, positional encoding, attention mechanism etal. + However system prompt should ideally get the benefit of caching. + headers - maintains the list of http headers sent when request is made to the server. By default Content-Type is set to application/json. Additionally Authorization entry is provided, which can be set if needed using the settings ui. @@ -197,10 +212,10 @@ It is attached to the document object. Some of these can also be updated using t >0 : Send the latest chat history from the latest system prompt, limited to specified cnt. -By using gMe's iRecentUserMsgCnt and chatRequestOptions.max_tokens one can try to control the -implications of loading of the ai-model's context window by chat history, wrt chat response to -some extent in a simple crude way. You may also want to control the context size enabled when -the server loads ai-model, on the server end. +By using gMe's iRecentUserMsgCnt and apiRequestOptions.max_tokens/n_predict one can try to control +the implications of loading of the ai-model's context window by chat history, wrt chat response to +some extent in a simple crude way. You may also want to control the context size enabled when the +server loads ai-model, on the server end. Sometimes the browser may be stuborn with caching of the file, so your updates to html/css/js @@ -237,12 +252,12 @@ also be started with a model context size of 1k or more, to be on safe side. internal n_predict, for now add the same here on the client side, maybe later add max_tokens to /completions endpoint handling code on server side. -NOTE: One may want to experiment with frequency/presence penalty fields in chatRequestOptions -wrt the set of fields sent to server along with the user query. To check how the model behaves +NOTE: One may want to experiment with frequency/presence penalty fields in apiRequestOptions +wrt the set of fields sent to server along with the user query, to check how the model behaves wrt repeatations in general in the generated text response. A end-user can change these behaviour by editing gMe from browser's devel-tool/console or by -using the providing settings ui. +using the provided settings ui (for settings exposed through the ui). ### OpenAi / Equivalent API WebService @@ -253,7 +268,7 @@ for a minimal chatting experimentation by setting the below. 
* the baseUrl in settings ui * https://api.openai.com/v1 or similar -* Wrt request body - gMe.chatRequestOptions +* Wrt request body - gMe.apiRequestOptions * model (settings ui) * any additional fields if required in future diff --git a/examples/server/public_simplechat/simplechat.js b/examples/server/public_simplechat/simplechat.js index 25afb256491391..8e0df3b61df2b1 100644 --- a/examples/server/public_simplechat/simplechat.js +++ b/examples/server/public_simplechat/simplechat.js @@ -222,8 +222,8 @@ class SimpleChat { * @param {Object} obj */ request_jsonstr_extend(obj) { - for(let k in gMe.chatRequestOptions) { - obj[k] = gMe.chatRequestOptions[k]; + for(let k in gMe.apiRequestOptions) { + obj[k] = gMe.apiRequestOptions[k]; } if (gMe.bStream) { obj["stream"] = true; @@ -740,11 +740,12 @@ class Me { "Authorization": "", // Authorization: Bearer OPENAI_API_KEY } // Add needed fields wrt json object to be sent wrt LLM web services completions endpoint. - this.chatRequestOptions = { + this.apiRequestOptions = { "model": "gpt-3.5-turbo", "temperature": 0.7, "max_tokens": 1024, "n_predict": 1024, + "cache_prompt": false, //"frequency_penalty": 1.2, //"presence_penalty": 1.2, }; @@ -800,51 +801,55 @@ class Me { ui.el_create_append_p(`bStream:${this.bStream}`, elDiv); - ui.el_create_append_p(`bCompletionFreshChatAlways:${this.bCompletionFreshChatAlways}`, elDiv); - - ui.el_create_append_p(`bCompletionInsertStandardRolePrefix:${this.bCompletionInsertStandardRolePrefix}`, elDiv); - ui.el_create_append_p(`bTrimGarbage:${this.bTrimGarbage}`, elDiv); + ui.el_create_append_p(`ApiEndPoint:${this.apiEP}`, elDiv); + ui.el_create_append_p(`iRecentUserMsgCnt:${this.iRecentUserMsgCnt}`, elDiv); - ui.el_create_append_p(`ApiEndPoint:${this.apiEP}`, elDiv); + ui.el_create_append_p(`bCompletionFreshChatAlways:${this.bCompletionFreshChatAlways}`, elDiv); + + ui.el_create_append_p(`bCompletionInsertStandardRolePrefix:${this.bCompletionInsertStandardRolePrefix}`, elDiv); } - ui.el_create_append_p(`chatRequestOptions:${JSON.stringify(this.chatRequestOptions, null, " - ")}`, elDiv); + ui.el_create_append_p(`apiRequestOptions:${JSON.stringify(this.apiRequestOptions, null, " - ")}`, elDiv); ui.el_create_append_p(`headers:${JSON.stringify(this.headers, null, " - ")}`, elDiv); } /** - * Auto create ui input elements for fields in ChatRequestOptions + * Auto create ui input elements for fields in apiRequestOptions * Currently supports text and number field types. 
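     * Boolean fields get a true/false toggle button.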
* @param {HTMLDivElement} elDiv */ - show_settings_chatrequestoptions(elDiv) { + show_settings_apirequestoptions(elDiv) { let typeDict = { "string": "text", "number": "number", }; let fs = document.createElement("fieldset"); let legend = document.createElement("legend"); - legend.innerText = "ChatRequestOptions"; + legend.innerText = "ApiRequestOptions"; fs.appendChild(legend); elDiv.appendChild(fs); - for(const k in this.chatRequestOptions) { - let val = this.chatRequestOptions[k]; + for(const k in this.apiRequestOptions) { + let val = this.apiRequestOptions[k]; let type = typeof(val); - if (!((type == "string") || (type == "number"))) { - continue; + if (((type == "string") || (type == "number"))) { + let inp = ui.el_creatediv_input(`Set${k}`, k, typeDict[type], this.apiRequestOptions[k], (val)=>{ + if (type == "number") { + val = Number(val); + } + this.apiRequestOptions[k] = val; + }); + fs.appendChild(inp.div); + } else if (type == "boolean") { + let bbtn = ui.el_creatediv_boolbutton(`Set{k}`, k, {true: "true", false: "false"}, val, (userVal)=>{ + this.apiRequestOptions[k] = userVal; + }); + fs.appendChild(bbtn.div); } - let inp = ui.el_creatediv_input(`Set${k}`, k, typeDict[type], this.chatRequestOptions[k], (val)=>{ - if (type == "number") { - val = Number(val); - } - this.chatRequestOptions[k] = val; - }); - fs.appendChild(inp.div); } } @@ -870,32 +875,32 @@ class Me { }); elDiv.appendChild(bb.div); - bb = ui.el_creatediv_boolbutton("SetCompletionFreshChatAlways", "CompletionFreshChatAlways", {true: "[+] yes fresh", false: "[-] no, with history"}, this.bCompletionFreshChatAlways, (val)=>{ - this.bCompletionFreshChatAlways = val; + bb = ui.el_creatediv_boolbutton("SetTrimGarbage", "TrimGarbage", {true: "[+] yes trim", false: "[-] dont trim"}, this.bTrimGarbage, (val)=>{ + this.bTrimGarbage = val; }); elDiv.appendChild(bb.div); - bb = ui.el_creatediv_boolbutton("SetCompletionInsertStandardRolePrefix", "CompletionInsertStandardRolePrefix", {true: "[+] yes insert", false: "[-] dont insert"}, this.bCompletionInsertStandardRolePrefix, (val)=>{ - this.bCompletionInsertStandardRolePrefix = val; - }); - elDiv.appendChild(bb.div); + this.show_settings_apirequestoptions(elDiv); - bb = ui.el_creatediv_boolbutton("SetTrimGarbage", "TrimGarbage", {true: "[+] yes trim", false: "[-] dont trim"}, this.bTrimGarbage, (val)=>{ - this.bTrimGarbage = val; + let sel = ui.el_creatediv_select("SetApiEP", "ApiEndPoint", ApiEP.Type, this.apiEP, (val)=>{ + this.apiEP = ApiEP.Type[val]; }); - elDiv.appendChild(bb.div); + elDiv.appendChild(sel.div); - let sel = ui.el_creatediv_select("SetChatHistoryInCtxt", "ChatHistoryInCtxt", this.sRecentUserMsgCnt, this.iRecentUserMsgCnt, (val)=>{ + sel = ui.el_creatediv_select("SetChatHistoryInCtxt", "ChatHistoryInCtxt", this.sRecentUserMsgCnt, this.iRecentUserMsgCnt, (val)=>{ this.iRecentUserMsgCnt = this.sRecentUserMsgCnt[val]; }); elDiv.appendChild(sel.div); - sel = ui.el_creatediv_select("SetApiEP", "ApiEndPoint", ApiEP.Type, this.apiEP, (val)=>{ - this.apiEP = ApiEP.Type[val]; + bb = ui.el_creatediv_boolbutton("SetCompletionFreshChatAlways", "CompletionFreshChatAlways", {true: "[+] yes fresh", false: "[-] no, with history"}, this.bCompletionFreshChatAlways, (val)=>{ + this.bCompletionFreshChatAlways = val; }); - elDiv.appendChild(sel.div); + elDiv.appendChild(bb.div); - this.show_settings_chatrequestoptions(elDiv); + bb = ui.el_creatediv_boolbutton("SetCompletionInsertStandardRolePrefix", "CompletionInsertStandardRolePrefix", {true: "[+] yes insert", false: "[-] dont 
insert"}, this.bCompletionInsertStandardRolePrefix, (val)=>{ + this.bCompletionInsertStandardRolePrefix = val; + }); + elDiv.appendChild(bb.div); } diff --git a/examples/server/public_simplechat/simplechat_screens.webp b/examples/server/public_simplechat/simplechat_screens.webp new file mode 100644 index 0000000000000000000000000000000000000000..ccea44396051686b97220b0f5b6b9beb63706114 GIT binary patch literal 21376 zcmd?PW3wZp9Y2a^I$( z`ybnv!*kR3*>B&I-jxrnZ_KaKpWDZuzusBi*59*V?CbL1-(S`~`R#x3-3Rs8&iD6s z7VoWDagpp<-8MBF*nLj*{|y1v<5(wIC}OAKR>4IbvQjH1y}Hh*X9BwRy)()L8~%Dp zF{O>buw4#_CQXDck%u>S&Nft^j(|meh;+5ovb+6kc`qiYDOW`Gt+SQz((DUwLzB`C zV~fG)TXIeQSAJC+@vXB7S!e1wD2;3mw$T&bcKea~v5Lu$D)2RgF=08th|IRLU+0ww zz@VVS?-6aoBBrmb9CQQtZq*MZx0fC`<_=0ns02Ev7s7$LtEZq@_E6O|nWW_8ZJSrs zg3{9$c^z|!VfloLU{edq*-d{eUvYII6fsz0VDVYbm@&`ti5kC4y zR{UNnpk_UTISkI|NGOh%q5?A8s%;6FWQ6=7TDl*5Tz~p>h=rTNE%3l-k<6W*?Tfkzi>mzheD$E8>NExS+Vnk*wn9pxb$Oz zHBi)bO;el*Qd4cVbOkZFZ868j{Y&2}nx1`Ot}qJyH?o%+&7UK=X-}9wcd|~;XMCPc zPb~yTzyL3yvXi2Fb9&PzZ#^7yOW8jcbF<4q(J;Up?ka1yST&WybH)~A7e*0YRD^TY zJ-zZFS0+$p9>>2*CMJe0z$x*Hk>Njeaeb?`1X8081kle}z9EIlrfAdvLoZ|`R_eXfw0jdbD%W7OQCJIQfG9Xg}Auy@8weBDoXp#R`%p?mniFLf$EgXG{bkiG&)Xp;5v_xh zbx0I+M_}H^E?|b1u!D;U7UzwOK0O6Gm`R`6T6hv6cTdPu$sh)m;OiJgEw<5#jq>N!?uL;e?(lY2xoP zsVNcfeDwkiE7dYuW{(D+1v@uQ53@yeKFW{lU~qGMM***sAdLf!sj0X1v2dY<2-9eF zxZ-Y>=x>X!VayQEV7U+)gxp&`maiBw$&?ufOS=I;(#zDT0?o0ywe+o65>aiN08-xx zd3NSF_{W*DYcdL*gJ^5oJI@SKdH`U9JTmOq!QIi>ztsO3pESo)R+`azkAh;))tdGlu(q znD()4IS%y77Y5~V)+e@x8l!iCCVs|&@rD!8qCauC+PY*TL0GC!ue;V(uneAa2V%MM zKrB*s{ITvtR#sAX7YRsn5e~s~o%#L9PNO-%tOdjZ$utIWq1907GHhucfg^smXWvjovbh#=&j0&YJ<_k079oD$ZL@LOR|W2o*HXbEGVs* z4J+2jDI{iJIn4>r1ScW0%$*1xv#W1r=N|s0DUX`5E#gQ%WFo-;{42Nv%P#K-D@j+| zsK;&N>#Ne<@CLuJ$Cudl|p!9j9Me{H{bfG zCNEPdsg<$0Nl)mvf*&UCunN2{0!=%<%eBLxv6Ygx^&T%XL_O?}=Lb_xNzz<*aQ3*? 
zp`=UgUku1VV1ma=BsW_;`P62*viYS52S=BWU%zymKFl1}E;;9i)(V|y1&wB%;y<%v zd`2~7d_8HHpRohBOa<~%b27V6@1&H#en!RWM2mAPD(0Wug*m47SQJ_~czXXQ+SHxh zyaQUs4FamebLeJ>)~wa18L2ozbEtHu7vv_D^piND-I2$+x&7ShF>0UM|MgiJH6d`| zAU_be9erob?%2rA6vAI^ISH&r$_Q9R$pwnQ>7xZ9%ZkG=pVmMKY`^StQ0+fRtF($$ zQ8e-G>H5T>wvm;yYgyw?d%aGX(_+D^i;HE9jT?3Dby-!f!|!xKFIEZ1!nuY0(a|K|E%O7zfl(fB)DM@!TK9p;VL*}2DmIQyx;$APAc6a{<$y>jFJ8WCRUFrFVfZhd|9iyqCPT(O z-4tsOpbB*D1PrV`5px^o_x;qPe1&W!7~SM2cgQQu!n6N>j#3DRL3&mB{%4zgLrXs= zm$3Rwk+rco6>QwVk_(!eeS)VHc3Uaa0wi2`KKwiTKBAV>nYL9PK)7OZ2{MSd_$<5u z`e%Aittwc^NUN-ssL(8eJ*^{1-KQyj7cP9gT^&zJ;0Zdcb*ulX^yTGC`wVODaf!!j zp*6$3Ip|=v64w<_X@1VfZDq{1`O#Y7k8Zv(I&`fs%8-G`vGGUqZ5X&Y$P+$eQK0*T z6n=~RR<{je$vz-8S6~nXo&nT~Chs*}fO!X9?@jP#NXcwW@0A93^%Tq zfZP2`2 z7o}X)+AXJau~qV=HvKWs7Se#NHEk=V+@TuqU2k zfh-0HM6tT_&2gdUBx?%E$D0K9=@36)#TiL({CBc>vGTrHee`DYA@YSidpIX^#ekKz zZxYYHmKtzP>f{NG6xvpHb@R}~$~hE5N@&S*q0td5_PVrX1{JxA#)L1Ch!%Ou;hc(LUFh+F7Fs%Y<;ME z{h4{a*o9RN4+Zpp>QMWR#}@O}T_4FycGJVT9_L(9xIm48%=k$dT+uPEbnV-F6*v43 zC+&bvB8p0)?ErddAS*?9&pmZoSo+zDK1P>{JywuOG$HNVA>$2C%XX|hn!3Eq&HSk^uf^&%NtdC(;AnI}9Lft`NPtnQlA-W)f0kl9%DUH5 z+Kri13S2p{;{tvsr21`sa#9LBBbayiilp#9T9id86!!9ZLZq*0L=qF69O?<1orB6j zw;e9R{rL4WIZ>e(P*|vf3fXQ^A4M6w+gakH(NEoYey{MIIW-9n@vt+)1X*h&%^2;m z+yn9ft#y?1+X;{r!w13Q8z_D(*^m_lUT*Y>!8};7r$x4Oif7QI zn*ck!KZjzHsgTwqXFbon7KPHo0c;noSkK=0YCo2C9|!O$^+mW((fQsmA>-wXMFjOA3ua`MNisL@EMo3Rw6wr3Fm%Yu53H`YS>sPSIo;4!M_?=cFPc@{Jxg?dwGZKV~&DfHO{Pb`-$xZkX|}O&(NAhytPFijjQv5p8ObQ5nkxObIGkMy z<>lLdjVx+kf=RY*og&?@MIAPMac?`5)v6uLwhL{0nm(^2Ln&t^?*W66or0NX2*m2a zj}aX47Hgw|PP26WjBQVLRpbrH%&|B(yg_ev=W@cwLh~U^B;wDi*mFVD4_3zJch3nx zg(#}mhby8D1`>K>H}1cq_XB!yZPp6%Z6o^Mv31y%l$6N`i->7w%wV%7_q8RK-^i=J z!RTDC*uN7=gwflEmXqUj$91-i_V>r){zdHwZ&+-(8h_RZ*RZ9ZGE51Bit%2ZQPNRg zmxYb%+o92A@(HkUZQ!DJw&%OO_gR7Oj9WsfzY5w=2q)C^&dW)>!j_y?EvZ-PHS&Ftn175 z_aW@>hn1mLy)^>!IaA!4>NU;`_4QK}3?z1jHS0=rTr)@JaG=(1oz9FR5t7YCorI>! 
znpN7}uw)y<&H_peF}sn z&s(EH$Ie@VZ#s|igWWmsHJuqU9FzlLDjIWK&XNb9vAZ}tvvooM%1>IcGEf>}*c;mw zwR-arvlG~bX}P>|z3_w5WtUB){U+_aM-9<>-e+JUIWCZl*D)P2&q?vHtlIY#p4zL_ zLaaEXD1tEVbGr91sdo{VplvnDu z{b{`6{aq#pTT;gmtL}|S6saQFg1S4e^pM0 z=b`k<&Yu7=bA&o>7h+Dex4D_;`L6ogQ~lJ=<<~%^_JNBXCX zr3r>ifa6f^8(r9Y@H!aD5x3U|dMEX{A?bNAt!ZTZj5Rw+vy+m2XhmsqjW&5F3yhyg z1OI$yqFvl6j?(P$jrFeT#}_G@+JJS%!vepW4|OO&+4yR}bvd}pdJ>{HyDK0J$OVqj zw8Y9L1d!I5W{|J>L85<8wux0GUJVUNzjLJ!oSvc+flAyJMO9pu>Dt@TuB|)10o8S4 zuN6s8gQT`_!l6ZY%A{O!^7z42`zrlbIv$*bFeo{F02p-|NO%hVRF4JA(q=+4xyZs+ zkI>vc7u^Y0H(`j}GJ#wsh{yYAvYF5f9|{Q8hy1a$RRa=R#i6ru1;H{7r~ zzC*>TuK65r`i37FV32Lb)4M@ik+N%HEEl3LIS>9Gq}BsLZ`v@CS0G!O?_LqM zcGnlF5%`|yS0^95z)dgCNMs0-TtL7wP=~bH=zB>luHxroq*yj5be`$R1;Y?Bg^KIz zicRkdq4+Gu-LJ-)Z#ro$8oVZ}1@sX)-Zl^uU%w1DZ^L;yX`1jtS^v10o0g!tShO!@ zX88BSi&KP!vf5Zz-_r*NRp@!x+l^Swc8G2u%75W`zv*ZJu^OLrFeF3MFVX&93>ESF zuR(_{V8Bo2uh+p)mHH{i|>yJ9*Tt5wz4j zU9rfa#@8C6m6cE^-Z8A>JSdcy3z=jQiht$`f0{Y6crYc=o~?g3nqH z)jSuFWJWEDP`O&jIQW4G4txzJ7q+du^*R!y^g))Y6wJEo!9;wGG|t2`MJVah{duz-Fs)U3b@lQ8j!7pNZU z^RX4Tx^zRplx#l5Qyu#Sx77_{@{bi~H(pyA6A@dtNiPT+YTyqpDFrd4)TT>@pPJNj z?p9;kW>Jyn!_$%ep}uGKrbP__I`+PUQe}%{X4W#6rmX>e<7_lv?rl zG6bwr(3wunsBjyOTE2!Yv~apWE4@x}-C?64yc-iiq*D@yX`@+2Tr@uFd|g_4k=pEj zUfsPbmHc)ztdNf)BNYd4kJ1hvix)b_*%3AOXBBq; zNyYO9VRv?hOl3ImoDit3T~^7dm}6bddTNP)=k5=uFZujacOj-Pf<;5^8}(>23SURH z?6b-$JkA)w;c9EV_{lN0)ez&qn}&b3q_S7aTQC(Ldvz9UKS}#lZSqLKQ9*r{c_!*F z3nUz(Eyx8vXPA->>^%mM2I)5;XFuW|$^h0~Um#Tc%>ziMdx@2CYD%xqWaMytzVea1 zuH->Ksfb?<(~SnaCDAE|TvpkSHK(i~cfkpPyWr&1G*xMzge&#%n{I>k`Zz}Mh4z+X z*&8Hlf0wSeVx2H2o^=`C%BFj%lNyz2gs_R2Fd1VGXm`vJuqhL_v%PxqPdkzFp1{wg zBw8-*BB?nE0xUQHtu2)c77DFVV-a)M7Phz$n;Xf5DRn{m+f zneCu2=t&MCxWq=4goWEqbE$Kr*GfibWqb@IZDkUJ@$NHOYh4cMaVR^G*azM1nHI}}c(WEbM@pS_3qao$xE4u{5D_!D4&Xapi#@>gBo&zl!ki)Q+Wx*M3jLo8 zNe!(hU^4*($+MU(#`QB{wm2D3%l$Ol=DYmAkow2=I%Wt4Y9Di1K1Vn&PF(_uFN%fT zG_Y|v^&#JhP9{JGM3{P*|Af(?_^Xfcm6!#&)#_Cq^khYwMuMj>aGEcH@;IMjlSX?N zG38d9ss^q+ofwI|Mz!{Z9MtI+78MielY7cE(q5eVByPGWd@4EF>Tq2mcg>sAiOdrs zx%h-pBQ&|yBkIvS%x)WV(pbS_A`H&lCs6ltbxp^3=s@j)4K^r8$yT=d`Cr&jQm}D6 z>2yM|9T-L3aN>kJTsEr_I=2I^f^#tRVr>0zvs*l+WBC17*m+$xw~eJ7Mm#}N_nRex zv5i1CC4Z^N2;Q6+A<8(IQmx25(%%Ojbf7*wB3Zm|AwU1X4O?Kx`B(Ko{>ABi6%2E_K2F2u2y&!j?@~Qa(x+x<|-Sy;WYDP60s*Hk~ho!xu5A(Pd_?! 
zjom0ecOop6(QEFO$_{%o?XwM4 zGiU&!kV-RTl2zMRi*d7E%2gkd9#pZ>Ogx%Ba>+`7u~j*`NBu$VHhrWTIF(4G{5u0@*FEHqg`Fw55LUUMJx%^yOhOc~V}F?>>hYXD6)OhtIK1Xvl| zA|nu=nn-qh^T$4fOR;+&xDC0huOinfDhp10fsk1P$P2!*fBzHh$#h*h@at5$25sd# zI4Q29r#`wdzaqepXfOKlJ*NZ*UBw zpp0BrjaWhH`YVoV`kv9%2ba+4tk@TghtKAL z`3SQhk2~d^wQi95EyGoi@2JwuBt@wn7w+Tiji!eq?cA;6y!x>wiX zMAjp?%^}{qJllEVs7|&>00xSY7)tD$NW%6 zQ%r?NL>zDj(;K0wtJE3kqA0E|4+rv~=H|^DR1)M!CrsIwC$0OhC+_0W2$F8I>;+~> zE@!psQTiFhyrDIxrlh0N;|sw2X*yUeut-KPWjnqp;5uMmtCD=9>;P(EF_TbV{5qfYp=5=B zRLPGshU$^NY3&G|XX{dKZzG1}@E9mXK#%0_3QK^WvBJ7=vyhR<_Gds5tg>0toi0#U z-$@v?^UZ|a11ZudC>#P0V-AoZKhKb{toc%hQvSmalX(YTX#@g~GQ0)vmr(T| zPsTW$gba~#J}2PuZ9_wo*b=v2Vu5ir;w%zwkRA;VyUALlgN{Fr)cP{LXJMoshWp}DSR-@Berzz@>gs@ zkN-%+W-mV1vZtoK;V-k_pR)Q@-ETi_T@CAHM>b0No>gYs>$Q+2kc5LKf;*&OZL(mJ zvC|jn`5!3u_21jyF+BpF!lK#Z_1Yz5088?3@MHhc&^ZNd!Rk0BA22 z?%87$X57;r3J$N=b3TcHD%rs8^U%G{r;k?dBw&>;;=@1Q$+1|9UjZ`woyTy^I$=x6 zj5^_AlWrPI%voa5z!(*7Rr` z{!8+8T_Bqjxmzz*2;HWT88+gf(l0==L)XR~AHZ~n6x!d@C};5RSp^$4c#zmO4}nSH zOmQssKZ0n1EZ6GXig2`n_2<*x$Z&3Cp^GrxM*XCTDsN;a3S^k?pfioggfK2uqCJPM z(;NN5_L}BwG-CNK{Oh{y8V7mb{EDWtT)f|rI$V@LS6BnfbD#-_&&t0@V5&J+u zXx#$No?TSgZQvj{6U^u7LFFvvj7+ALPZ1IBHt45c$6kR?nBBlFw^x7(ti=>2NTBc^ z54n=Wn4oxm0Fr`9o{D{rD2KYMoskS<=IEe6RJFuSMbBN!6Y_y~q>``9yFeQvk2+Zcsry7S^%4jLz?*Cm;lqP z|1javJY?6g;a@IakE{XY)c9PZV`*^U;I(x+;Ha&nv2a_oJhZN z@6$Gb&hlB%1t;e14oN|lODxI$NH92DKt8Z4xDsg#{POTqDHGgPeRD*lD~9k?4qohN zF0o;CzHX7i#4~j&UW~})a8U4D>u<12Ku3b+SPwpOYixAtzp(j(bX129e)uVoH^?2P z?o;}L952bqQ85vGT1x98h3NcoLZ6K~9L26Qq&@Xu%A7Z*?j83(nEF6$k!hM$TU}G5 zbbB=BvvCaIiX(V+w`0-Rt&Xvu7lWh`O!^9ZCHDzdCfAjip(> zg%JNeTpXBoi~I|u3rbMsp-cnJt>-J4o4cvrS)W`t1DR;?@JLgUMoRUB`1?Vg5pYHI z@8t-zJ6?C1Vf+~O?&+oM&w1X5_&kpEfo7o6W!U_wxq=D@HlBGeYtPAPJTp4)5d8mybL6OYG#c0J&G7L&Q)KtF$N0wg|N4nOh?)Q)KpduBLYw3eg8ON zNa+)an^fYDZWDzUOXEprGiHKiOzpA#V9FULsyuU57q&(1YTTgk6Pj@hO5bvBhI+4{E_Q8EPkdlp4Z9+32C@Z^e&&_)O=`N*Vs5(=F zsMmKUrOR{J@@+^jFdJp(xUAR=okW|R9Rtx=U4;W99u*b4r_3gszkr|i4_!*e837}c zLr&T7Q4iZGfFG5tu)9JScuGPq^^FNXeE|;Q+~S^rZNzf;3?&(o6|JMo*_cpNzdVr19m-Y0sfFa z7NwE-RUYPL0PbXUS!ll-2>t8=O{PkKH$Pqchr)%PeaPXt<_gAE{t#)&yaAF&pz!xC&36Q^;CiER*T_#n7dB_hZx z`!G>+ud7lrgMpj%m&%3LwTa7mMam4*eYr%u5kpxFWh(*>?*~7#$vkZ#N-&}ee(0{b zy8{((=#iaQUGsJ+3v7ZOqwW1gS}+aqYxCv)Q5@VfCXcgB2V^dD$7GyFaZ;_DSXN^v z@ZjghK{_lEK`d7@w^m{gR?VG^Bf-oLVm$=bqLY!6!)wwk$pRW^4_IiY+VV9Dip&fO zr1~8(Wlbwn65g~PCyTaovc~anHmx_U>>oL$TOHsJtd_^EmbnCj{MCDbq7>0Wg?R=s6nDl$2Ls6m`~ zMEU#=rYr!+?bM6QC-ShM;K!KEe8o@7-KnWTch6041ug`0aqAQ}q^x*9w+oTGD1fJw zteo}x261{>kxo)rSdx)eNH*9#0N9i9?GOCE!m930KPTk0r3rN>OmO|~Zb{AFtByMz z4b%`HQ;6}(H`UP{BzQA((3N_Kzj?Rx<1X(!G34-GAj6uYw)=~}oLcv{j{C~$x314Y z?w*)l=w3uPx5oV(a{U|G4y4Fg*p9gTs+%;%yn9iv0==l=B`s~fc$g#%-FDDGAeLBW z*m$WCi=6pGCK@xuN5A5iI(w}cIM?mbAzS2BNwm-h=^CB6nMt4G(qUTNY);t62q zl@yTwsTJ6vBzE~emQSNA41IV&sK1)kMU>+GAl~@Jo^6H=?|4|C6r2!$-c4^*Ozm)m z?k{z|C{qvgE5Mg@{a6?TaODIhK~) zx#oF@2)H}{kyB8Wdz{|k+jUTno_#0fprkmUhwOXiT-sc*4UM<(X`v5y1>aV2M*@S0js^VNdz+goevmFz{SGc9OLkfCD?B;{U z_Ts>az{v{L(*scoyCnIoZjfZMO%igc_; zHR-P(`u97wO)|RKlkc07up@mI34|2+c$r@KZAnBF)SCSx?4LQ$tw2cTltB#&84A5lH=3p&y$dRFs7U{(jlFoZ>CwGLm`umLbkfN7NS} zvc)_}`5RC*dLxf_MwBmpEK28EQR}XLDn(h%{Ct=zD5Kh?TVU5G-YE59SOtXqtkX72 z=-(c|3TfEUoD-;`CE=Y{|oWA5>1#qdel!PyFiqY88*<^ix5tI&(?(~x=|<6XYL@Ap>f6Tr{gk7 z6Jf$oFaqrN91yuoiaaqt6}t;<7NmG$z*zL{5|+OBKNBzVWAkfO zzUi%xAbc(yt=pOzTD*PkMk|;lqdistub4W^Jya6NEpy;NT-f#fcU;ylw;1``R#Cbf zJ6<>Z+2m69kfGT}qQ~F#!EAH)V!o3rab^P-C4gc4cK zI)cW@F2@AkDv68Lgra+DD?Jn`AuWHlKS+d6&BPHWwQQ>p5eXh z&kqF_TRSmUK)g8d$cn~p$<4(?v=~v}2>79A(mIvmwC&?hZa(#eC*F#o+)B5H{P=u` z6ceXsL@Scae~>7kxae0f{iBsJmb?^Alui)3WJXAD45I1@gw+~ap12+!qr@}RHsR?D 
zvbez|OI|)?paP2c=DYByZb^%bZbk*E>Lx%l=UOHbL0SK(7H&nwZv8p2hOuH!megq*6j@fyHP zm$7Jc$k1;R5x*XpRn~$rLd>w*P?-Rwq1Gtbi;kFon88W-8buQmGnuK%vpL91$5N?#^G!wfn+;PG;{9m@~m|Sntg~mt|ah2ti`0v5=nHv zc$rw?14zW_R1F!m^{NAlWG#kJGE{(D(+~p<2s`=f2etfH$jOIetqWs}l-a6tTH~-u zo+Wqh*+2_C_}M~HoBUcjn5&%=2&~+Dm8P-(5D< z#0Z{bNl>Ced>WgJ@e_zI=bAc4Y;4l*pH*$>V_|FuVl2L*|p*m&q0=6lz2=eCV! zKzt26jEaLX;(mWolB_hksvpLp9s;Znv&;bJf;EeO}*0-XoU9uRQQPG68eUs#Gp19Dyr`5yk1Fw-ocVxC^UMZC*6A??6KV_XGc-QLDTK{T6nt}rx?lpK1@HezmM|LD^} zlWNN)fF4}h8_Ogu1h8(g5(9E60oO&sh&1=Q_FRm==yLpaPOT*;9u89*2Ym?u)>!?q zfn4o~W9uK(HexQm*_#XWYSJt^31D;$(C2)az!-?OxwVH{w03jfgy|`HBg<-oZ`U|g z`DUfG^wB`kU1+`G&2Y5}0+1aA-h<{mG9AFKT~2?@elK>pC@{r8Tb{{2jZHQhmx?5{BfBv#;~+zX2tdVyjgA zPc&DDP7pF1>_1u$SBw7Hf9yMD&jFq9qwi!W&|Nfe?_5ZUY4N2V4B2Yhu(NrMkq_5; zhgnfBlL&~9ixHnj59UCK2(i8+M&J8vG&WGv06^FXZx7PRLGd0^6+eUO#){({p^TDE z*S=DGRp7jX@W@O}1d?}pQk6m})thLrC|Ha&rZYQssivyQ?deK6Gji$WK%(p|#ITrxi?KgMO~ane_%Ehf=MW%9T)uz|*@;sEG$ zlpj&vyZR#Md_2{aK`cDH?L9Xo7YSRfm@yd>fFi$PQ%rW@MEth5Yx%T>ps`BG;B(4r zC$KSyZT4MVB-|q_-$%jBirHD(`L?wKUq!-~CIee~nmJ3I3~C~)H(Tgqq+5$Q8(pz* zBkY4GTZ`NoC^Z%XzY;0bo`UM%jpF?gR>z@Kns-qbfJ2TpJ~ z^H2vuO*23>IJjgFmK?%JV3(UDq-zboo=NYj%y$q`?bthSPaaGblb*I$E2j@Y+M>98 zJ72Mjl5uPXH?{4ovKYy$xB#?zN%|UE_m4`C&MFe5Lo|}wl2gm-NJb8M7jc@%b2WZq zenLZyIR`cdXv;R->9#8c9A!6B{3+t7FNtRyNrWeF+h1lxCd-NKrAn?Z%Ah&#@J8shryg;mggGNi}!{8Wwa z7FRv?g*$&I<8R$&P?{?gdif@F{E>yf{G?MBRWY$=)A#eq-$K#CJgJf|=qdUf9&1;ey{OrY}CVvP1J8}8%Qd{X5x^+6HO?E&#w%c9!qA+swAV*UN4 zU}r-2YZ}wok2J9a=$8 zkmVB;Rz-mAM+3-+-5 z+yRM=B-_bab5l6b+{JYH!RfKWIjjN{mihB?#zklcZu^~NTl z5>(4It?sq0?@$`BU3x<{JolhOT*qah6CbZkAlU$E=d{& zDlopv>2@`au(`1AumYEIEo?S=8)8n;2SPZBC{RdRV$h0NH7GNiyM5UqwEfjtBJfvXC-?9q{>Z103;&o zL+6cxqB$}3mW^%l_QJb_^{|$jg>=^y@WIz(mzV=c93K-^DrIXc;KWgGRJ#v~LFDRx{&wRvNo(iFMW$tnN_7>~ zn*U1Q+U5LVtP14;;q^}RhFYc79=(l{9)e!}UxQtOd6d6xpnRtHh!yKcCi z8w^mOhmO(V_Y>93{J7wI@;qG}xY4(G=BoW+BUT#WQs7XWDtf#RK?X&F+Gh!S$78|` z%Q^Vy)SGWCn)WO{yU`tjPWQygmF@Cr#4$hF$&S|k$P3Mx2r=l`1;HTZT<@%rbw_(Y z|5a3mQCsLuA0$>v`TfYm9g z#B@@4qdgH?OP*l>BQt-H+YAMdR?cyQXMKp652kQi5nIcW#>s{9YN+lScx zFlQGe@T^rpoeKR6F2@w~I+9fyJ|ksQEJL|51Uzek;70z1uMv$$9n6=&?e0H|Cvf>sJ;bMV|nxp#!0 z@MQSBkpZB>r^l9XTGq^p{MtH{V%t!BWhS&-{kVH`DWSkil})$d3qMKkBJj~J%E56k z9=Xy|!ZS~$herwu z)kWoXx0X~}=t*PD60p2iTs$a}2+GZHH;7wNj87D4Y!U^9ZH36QL^=%eS-|dc?{PSS zn`C5M)USKM3<+9reW$6HASSNIP>}#&KZ;t?DT@5?5HT^tk6I@e;}PANKQIF){yaTi zPe>T#Y@Q34N?Gcy6K!9Rj{uU1h6WbpsBJ~9MJNCl8xC5_Xa7yf7Q$i`paZMfSkiLJ zqJk%?&_YcJo{t{?xzH8r$q$ulcF~-$SwK%g4e;u-g^EU*corQ-+~Gy9mD~~C5#Kwp?tmB(b?aK`vqDI<2+7%Dz7DGpNIRX)}c*Ad}d{F66;1B#( z2^ya$%^6<2GC{RE9lyyGraRWXJvZ<&mz}ew&@&niu;rrfs%U_Uz;M+p1S&2Q(ve)C z;JtJ{=BQcG_WYkFCSDaaZ*!2ehw|*|GMV81&sb5o8JWCwqwFXwUay*IPXRcRr)))Q z%Q`BnzH<6aiG@S|Rf=*uW6w5D^!gSCBG|GWWQIvzrsmOaZlvpk_!);O)XQ=n`;m4S4~e|K_}e6be!`MPm}Nfwbu68GR6*h=fx z-{0F(cD8^`kk)QOV+RcJFGQ4H0+zCWcrA-=4el+XP<zJEd7=TmW1MVLS!CDnUQ zRHce4t(B-hZvO-TMiHNtWl1+TVt&7C_Lf%L6#9vIJ(C+3S#-2<=Ru~e!RK#ow6I{W zh{Q6e`?r{R4B)ds+e)YmHMMwE>`lNQ$ zqouowX!Y7J`-)3;sGPRg%9p_Ie0)c=+ro?3PlG7$A9+ShV-?;NwmaOBaW@rcQ){Y3 z#gbNI{$>MTU%Xhz@Aj1UOv6AwK2XpZ8(TI5$3&^}J1~zx)A=KA|x=RZlif}O~gFBzrL4X=uIwxks z*!{gRmfoMP5$@axZCe9n#7ch1=(uU*w}bNKSi?_V-=nx1kW5}>k1^H9?mRU%UdAZ( z2%$4@q*F~T?(V^3Z%R&!&4&Tl@-e|&5kp5g;Ks2}m8=Yi<8Prj35ZadDA-6$OJ6&_ z%vU*})Th4RPYi{-Hnrz5yhXRJ-w${mHoznS&}W3liAXOg2moYP5YpWlFW6Z^6y!~F zCK_^Ps|^FFb)cvHz($rU61O`hP1Qm1O*6fL#X3>UBtZrne%m@5$mVkT3G9S2GSLZA z8_=ya1nVz0uLvzE@W=EsWI?wi!+p$>LpTJzbx-0F>aeo%O*G^XOQ85#DP z6=1|FIN7LEAplwo*K0sSnuo7v@%3rA>R>X9QygnRYg*h&vI`g(Vkihc!xt|IfIa_f zAKO}I#RHYdj_{`gy@}^#csA9WrzglUx0GU@-4}Fjg6R+yODJ~7z8459Q#o*b*-tGW 
zTPvVmmyOuS1Q;hlQc&kudmHgtLh;=fFfk#3w|LR;(e)#FuT8EGtWjk8 zivIYUTSdb*3WMo4*n!GQo~uXFdw>#2xg_vY$OXgKS5Y0_&uYN7(5ng3w(tMBBOho1 z&YBXX{K6Z10cFJ^?LJHOHpox6Ir+=+)MApE7cgtidF{OBa^fTK?f_iqMNeQC@q!xw zRY3sHNb`N!JwZH3w~(C^AYpSGGtIsxN^BWV0H7undGL)uIaD|2YrDzVsN=daCpXJlwTZTX zNWZz|{eiU3z0KAV)q3E8U}HvwD^LDW90#DccJ$Wo zn!c)k%vR7G;NdTjUI+Eq8WXKj>I|eo@qXZECoI$xa*qp&-#}p9lI-k!fa+?(%>`8!E!jhBrJS*-xGdyWF#Z2i@;HRzV~1D)ajmN zfnYXDD-uW2Y}ox^bkl5mir!2o{QK-e9}#H~>~gEkw1-q=c{qdvgfWj|_y@WEFOOIH&+oVYt(yzej?bjMoC+ec!5HHrw9RFljd!ck zGoD`s&vi7I1d$zT7j2=g(Df~D+||A)Bprqhsk{CySsNCfnjFaUJ??k?4s$f*6n0}K z@~0mRZ*6fULGnuo@qv# zmE_i~5mG(udTF{0u>8fYDeb%Iy zUS0}EfsSXrm=F)0MdAn3Ki^s4bRMhBUk);i5zt^rF{g61+E^xz^1|*)`v#zU^G&Q& zd$<*4AZ8dE7^9?V5fVetwVe(Q=D7KlamB8Z3P%AS%#+@Br;u|QXAubslFW`RgyBlV zv~=_A?slkg1c&0jO;jeH%}fXkKWou0fRQy+402t40+Xgvmj0boA99DTnhlqf%i<5k z+LWLYq^VO3o}~<bT1wWU&y$=cCGe%hc5upW!`uRoplZ0C zC?+G-e#NBUJ;y&Az3PZ_tE_@CCrnvayo>Cl`Zl#qVa2Uru9;DWao9i9=(LoBg$(xQ zso&_>i&gFC)G2lkf=r)2yk-@nf?moW30ut5Pw|mSIQZ_~m13T8F_>~VR!RbTDgJ*tp$P9gS9?)0Y<83P$*ziXTZqnR*I!L&-UHeW~#WV)I z7y+GyTF;78X^zEDEjwBK6}0q!e*R_A74^tgOE*9&xRGtBbWoFSM;8~$+s7v=?}ePHE48=Jct5Bm(& ze~s6v@;8G1bdQ~ASQ2s2(P;PP3{V9|!o$ z2zPU^>0LNoO=TCBe<{`HMMh)37Pwa~Y-I|l0Pz8|OzO6QdktRWY{I!kr0}*7T_NU} znZQOVKd>V_zyUd2`OQL+xRb&%Js{NbX<`ihHtma7M-OFsCtdXe*OQfsW-LLPIB_0v zhv@;9Or0jGK|pl*4YFfSQSe9f`EG5!b`@i&S8rzQd5nT&CV%+K^6xi>lDOjS8Dl^R zQwD=S?0jl#s!P44QSe9f`EF^Fwx&rcrk8;@q@K>OQBr3(Jz?uM<@UQX)SZvv^Gjr+ z!pm;Q2_|}uR@F`{TiWM_wQnGiQ)+hxr0plMv-zarS`!%0s3AlfTo|(5MZ~U2oAU|m z7yN+aFX4XrKff}t5w7$R_5ms$WU>~d9%S9%A0Qoe3bL)NA1RX^TU2m$jVJS96JGtZ z9|9SR4!2bnv%~^mSaAMEIi{S4h9nTY3!7ZmqL{66cpOLLml6E!wL%jZO5_E)?~?#-F`jAyfRSE4+|{`{I-xS4)m!%{g(d3- zk9?YQz()YHedI8vOQ`4dNdNYj5ZFf(@PbmWY69$`e^}er8#%*6_k8RzG}*i`S+?3I znW9l|EG7+9f0Um_vQm3D=Tq0 z;yz$;K3v+7g(IKnwevSE4w&_sVXAm2yTRaJUh&w{r=cGz|CampKAKgAOi$C#32J(uqBXtXmUlNU@>6;y;IcE@57@ zN6-9=TS{v_;bt_QUD?Ca zRkJ|SeX`#=D4LpbdsWC=A!l4n+K4(FGDI2Wtm!l&XhUEvOc07ouj`}qhuk<1Vbnja zcAv+-LoY5j;ksY^OFDIy6oT2;l*cr$dr6*yW^5!hkO}-2U{UGYH;tRa0ks%l3oSni zgj8key5+t* zzQ_JZyNMQFpMD&hjF8YadFCv0dP;KJZ%z*|l`GEYgWZlmxRVQ7A%k^!vadm1(dr>V zVHoLEiFjZThHKws`_qmpF@R+DQAwt;q*S_JR9bJvkMCW3*wS~#i3P;~CiMADayMSC z`^U4LVhXH6?2P`uARg8Ao?Z?k%r&(MAU(82+ZPylJZ~8`xvu^!&icB>hvYt#vxBKb zov!A}BGso_fCuUwLt>e|b4oIim>E;*aLh__^bc1e4y$b`Ate^p*CiUsMl`N98}1+N z%8A)NHn-dZR-?ccL4aB0=|qdRh9YpLlhYf>)F?Yb&kQ=wjgisb-7S4bNr2EIUyLWp zC0-f40OxVz$K=3lzCR8rIShGK9pq~t#77Y~3wkwYrVBPuFvMYOzLR<{9=~kz=_-*2 zte%C)iAF~3_rMDokFk<(B7o7>335RWKqN0$2F<6Cj_czvZI5!sto?TBLsJWZ_JYOb zzw)qd4T7MVLUi+N0lgobrfD4|`~OU<{So;TG-?owke<;2QYh7(buiSZY>%nJUeGiS z9sgN4r$_TJvXHvkv6Z~q;yOm#untqMOqn7pZ{Hl;6#Du6f6VfakCQP?je-C86}T%b zD2pXB2eC=0ICU=FP&w#(r~~WQ4RCxaI|7b2ncGr(8Lshe@HV9&NQmIu=0miGDfEw) z!{UyAJZ?JwHvy>B_Cx}xN(U8#+)of`nkG*g=0;Dkb0ZPFjz}z@39qN&HnYoZEGerV z*8PX2AW9Fw?|Hd@2~GFW#~n0GmliggPU}YNdz8QQkiwao)1uW9p`Vqe{{8f}tc=cX z)PaF``_xs!2st6%_o4gjl=wL}mRuniREBsZ%(yO-)%k)3Tym!z6juc`6` zfv+O}C^-;-b6=ih6{-SkljO%c9+Y?n`6z~VI%gP}mS?aX|E5YX9gA(TaLGvIpUF%3 F008Q#p-=z- literal 0 HcmV?d00001 From 48e6b92cc378c937e59719f2c0f482bf76c9ca81 Mon Sep 17 00:00:00 2001 From: Xuan Son Nguyen Date: Tue, 25 Jun 2024 13:56:49 +0200 Subject: [PATCH 2/5] Add chat template support for llama-cli (#8068) * add chat template support for llama-cli * add help message * server: simplify format_chat * more consistent naming * improve * add llama_chat_format_example * fix server * code style * code style * Update examples/main/main.cpp Co-authored-by: Georgi Gerganov --------- Co-authored-by: Georgi Gerganov --- common/common.cpp | 60 +++++++++++++++++++++++++++++++++++- 
common/common.h | 23 ++++++++++++++ examples/main/main.cpp | 55 +++++++++++++++++++++++++-------- examples/server/server.cpp | 12 ++------ examples/server/utils.hpp | 29 +++-------------- llama.cpp | 4 +-- tests/test-chat-template.cpp | 20 ++++++++++++ 7 files changed, 154 insertions(+), 49 deletions(-) diff --git a/common/common.cpp b/common/common.cpp index 0ca7b4430f765a..da6db4dc6a09cd 100644 --- a/common/common.cpp +++ b/common/common.cpp @@ -1444,7 +1444,10 @@ void gpt_params_print_usage(int /*argc*/, char ** argv, const gpt_params & param options.push_back({ "main", " --cfg-negative-prompt-file FNAME", "negative prompt file to use for guidance" }); options.push_back({ "main", " --cfg-scale N", "strength of guidance (default: %.1f, 1.0 = disable)", (double)sparams.cfg_scale }); - + options.push_back({ "main", " --chat-template JINJA_TEMPLATE", + "set custom jinja chat template (default: template taken from model's metadata)\n" + "only commonly used templates are accepted:\n" + "https://github.com/ggerganov/llama.cpp/wiki/Templates-supported-by-llama_chat_apply_template" }); options.push_back({ "grammar" }); options.push_back({ "*", " --grammar GRAMMAR", "BNF-like grammar to constrain generations (see samples in grammars/ dir) (default: '%s')", sparams.grammar.c_str() }); options.push_back({ "*", " --grammar-file FNAME", "file to read grammar from" }); @@ -2604,12 +2607,67 @@ bool llama_should_add_bos_token(const llama_model * model) { return add_bos != -1 ? bool(add_bos) : (llama_vocab_type(model) == LLAMA_VOCAB_TYPE_SPM); } +// +// Chat template utils +// + bool llama_chat_verify_template(const std::string & tmpl) { llama_chat_message chat[] = {{"user", "test"}}; int res = llama_chat_apply_template(nullptr, tmpl.c_str(), chat, 1, true, nullptr, 0); return res >= 0; } +std::string llama_chat_apply_template(const struct llama_model * model, + const std::string & tmpl, + const std::vector & msgs, + bool add_ass) { + int alloc_size = 0; + std::vector chat; + for (auto & msg : msgs) { + chat.push_back({msg.role.c_str(), msg.content.c_str()}); + alloc_size += (msg.role.size() + msg.content.size()) * 1.25; + } + + const char * ptr_tmpl = tmpl.empty() ? 
nullptr : tmpl.c_str(); + std::vector buf(alloc_size); + + // run the first time to get the total output length + int32_t res = llama_chat_apply_template(model, ptr_tmpl, chat.data(), chat.size(), add_ass, buf.data(), buf.size()); + + // if it turns out that our buffer is too small, we resize it + if ((size_t) res > buf.size()) { + buf.resize(res); + res = llama_chat_apply_template(model, ptr_tmpl, chat.data(), chat.size(), add_ass, buf.data(), buf.size()); + } + + std::string formatted_chat(buf.data(), res); + return formatted_chat; +} + +std::string llama_chat_format_single(const struct llama_model * model, + const std::string & tmpl, + const std::vector & past_msg, + const llama_chat_msg & new_msg, + bool add_ass) { + auto fmt_past_msg = llama_chat_apply_template(model, tmpl, past_msg, false); + std::vector chat_new(past_msg); + chat_new.push_back(new_msg); + auto fmt_new_msg = llama_chat_apply_template(model, tmpl, chat_new, add_ass); + auto formatted = fmt_new_msg.substr(fmt_past_msg.size(), fmt_new_msg.size() - fmt_past_msg.size()); + return formatted; +} + +std::string llama_chat_format_example(const struct llama_model * model, + const std::string & tmpl) { + std::vector msgs = { + {"system", "You are a helpful assistant"}, + {"user", "Hello"}, + {"assistant", "Hi there"}, + {"user", "How are you?"}, + }; + return llama_chat_apply_template(model, tmpl, msgs, true); +} + // // KV cache utils // diff --git a/common/common.h b/common/common.h index a5c738f8b643f8..de90eec5113f79 100644 --- a/common/common.h +++ b/common/common.h @@ -365,9 +365,32 @@ bool llama_should_add_bos_token(const llama_model * model); // Chat template utils // +// same with llama_chat_message, but uses std::string +struct llama_chat_msg { + std::string role; + std::string content; +}; + // Check if the template supplied via "--chat-template" is supported or not. 
Returns true if it's valid bool llama_chat_verify_template(const std::string & tmpl); +// CPP wrapper for llama_chat_apply_template +std::string llama_chat_apply_template(const struct llama_model * model, + const std::string & tmpl, + const std::vector & chat, + bool add_ass); + +// Format single message, while taking into account the position of that message in chat history +std::string llama_chat_format_single(const struct llama_model * model, + const std::string & tmpl, + const std::vector & past_msg, + const llama_chat_msg & new_msg, + bool add_ass); + +// Returns an example of formatted chat +std::string llama_chat_format_example(const struct llama_model * model, + const std::string & tmpl); + // // KV cache utils // diff --git a/examples/main/main.cpp b/examples/main/main.cpp index b97b7b7937f02a..cfaf6a6e8ba4a3 100644 --- a/examples/main/main.cpp +++ b/examples/main/main.cpp @@ -39,12 +39,12 @@ static std::ostringstream * g_output_ss; static std::vector * g_output_tokens; static bool is_interacting = false; -static bool file_exists(const std::string &path) { +static bool file_exists(const std::string & path) { std::ifstream f(path.c_str()); return f.good(); } -static bool file_is_empty(const std::string &path) { +static bool file_is_empty(const std::string & path) { std::ifstream f; f.exceptions(std::ifstream::failbit | std::ifstream::badbit); f.open(path.c_str(), std::ios::in | std::ios::binary | std::ios::ate); @@ -117,6 +117,14 @@ static void llama_log_callback_logTee(ggml_log_level level, const char * text, v LOG_TEE("%s", text); } +static std::string chat_add_and_format(struct llama_model * model, std::vector & chat_msgs, std::string role, std::string content) { + llama_chat_msg new_msg{role, content}; + auto formatted = llama_chat_format_single( + model, g_params->chat_template, chat_msgs, new_msg, role == "user"); + chat_msgs.push_back({role, content}); + return formatted; +} + int main(int argc, char ** argv) { gpt_params params; g_params = ¶ms; @@ -190,6 +198,7 @@ int main(int argc, char ** argv) { llama_model * model; llama_context * ctx; llama_context * ctx_guidance = NULL; + std::vector chat_msgs; g_model = &model; g_ctx = &ctx; @@ -215,6 +224,8 @@ int main(int argc, char ** argv) { __func__, n_ctx_train, n_ctx); } + LOG_TEE("%s: chat template example: %s\n", __func__, llama_chat_format_example(model, params.chat_template).c_str()); + // print system information { LOG_TEE("\n"); @@ -249,16 +260,21 @@ int main(int argc, char ** argv) { std::vector embd_inp; - if (params.interactive_first || !params.prompt.empty() || session_tokens.empty()) { - LOG("tokenize the prompt\n"); - embd_inp = ::llama_tokenize(ctx, params.prompt, true, true); - } else { - LOG("use session tokens\n"); - embd_inp = session_tokens; - } + { + auto prompt = params.conversation + ? 
chat_add_and_format(model, chat_msgs, "system", params.prompt) // format the system prompt in conversation mode + : params.prompt; + if (params.interactive_first || !params.prompt.empty() || session_tokens.empty()) { + LOG("tokenize the prompt\n"); + embd_inp = ::llama_tokenize(ctx, prompt, true, true); + } else { + LOG("use session tokens\n"); + embd_inp = session_tokens; + } - LOG("prompt: \"%s\"\n", log_tostr(params.prompt)); - LOG("tokens: %s\n", LOG_TOKENS_TOSTR_PRETTY(ctx, embd_inp).c_str()); + LOG("prompt: \"%s\"\n", log_tostr(prompt)); + LOG("tokens: %s\n", LOG_TOKENS_TOSTR_PRETTY(ctx, embd_inp).c_str()); + } // Should not run without any tokens if (embd_inp.empty()) { @@ -478,6 +494,7 @@ int main(int argc, char ** argv) { std::vector input_tokens; g_input_tokens = &input_tokens; std::vector output_tokens; g_output_tokens = &output_tokens; std::ostringstream output_ss; g_output_ss = &output_ss; + std::ostringstream assistant_ss; // for storing current assistant message, used in conversation mode // the first thing we will do is to output the prompt, so set color accordingly console::set_display(console::prompt); @@ -793,11 +810,18 @@ int main(int argc, char ** argv) { is_antiprompt = true; } + chat_add_and_format(model, chat_msgs, "system", assistant_ss.str()); is_interacting = true; printf("\n"); } } + // if current token is not EOG, we add it to current assistant message + if (params.conversation) { + auto id = llama_sampling_last(ctx_sampling); + assistant_ss << llama_token_to_piece(ctx, id, false); + } + if (n_past > 0 && is_interacting) { LOG("waiting for user input\n"); @@ -848,8 +872,12 @@ int main(int argc, char ** argv) { string_process_escapes(buffer); } + std::string user_inp = params.conversation + ? chat_add_and_format(model, chat_msgs, "user", std::move(buffer)) + : std::move(buffer); + // TODO: one inconvenient of current chat template implementation is that we can't distinguish between user input and special tokens (prefix/postfix) const auto line_pfx = ::llama_tokenize(ctx, params.input_prefix, false, true); - const auto line_inp = ::llama_tokenize(ctx, buffer, false, false); + const auto line_inp = ::llama_tokenize(ctx, user_inp, false, params.conversation); const auto line_sfx = ::llama_tokenize(ctx, params.input_suffix, false, true); LOG("input tokens: %s\n", LOG_TOKENS_TOSTR_PRETTY(ctx, line_inp).c_str()); @@ -864,6 +892,9 @@ int main(int argc, char ** argv) { output_ss << llama_token_to_piece(ctx, token); } + // reset assistant message + assistant_ss.str(""); + n_remain -= line_inp.size(); LOG("n_remain: %d\n", n_remain); } else { diff --git a/examples/server/server.cpp b/examples/server/server.cpp index f9a86961f9c8e6..ae768097baa0e5 100644 --- a/examples/server/server.cpp +++ b/examples/server/server.cpp @@ -2606,17 +2606,9 @@ int main(int argc, char ** argv) { // print sample chat example to make it clear which template is used { - json chat; - chat.push_back({{"role", "system"}, {"content", "You are a helpful assistant"}}); - chat.push_back({{"role", "user"}, {"content", "Hello"}}); - chat.push_back({{"role", "assistant"}, {"content", "Hi there"}}); - chat.push_back({{"role", "user"}, {"content", "How are you?"}}); - - const std::string chat_example = format_chat(ctx_server.model, params.chat_template, chat); - LOG_INFO("chat template", { - {"chat_example", chat_example}, - {"built_in", params.chat_template.empty()}, + {"chat_example", llama_chat_format_example(ctx_server.model, params.chat_template)}, + {"built_in", params.chat_template.empty()}, }); } 
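As a point of reference, the new common-layer helpers can be exercised on their own, much like tests/test-chat-template.cpp does. The sketch below assumes it is compiled and linked against common and llama like the other examples, and passes nullptr for the model so that only the explicitly named built-in template is used:

```cpp
#include "common.h"
#include "llama.h"

#include <iostream>
#include <string>
#include <vector>

int main() {
    // Past turns, expressed with the new std::string based llama_chat_msg wrapper.
    std::vector<llama_chat_msg> history = {
        {"system",    "You are a helpful assistant"},
        {"user",      "Hello"},
        {"assistant", "Hi there"},
    };
    llama_chat_msg next{"user", "How are you?"};

    // Format the whole conversation; add_ass=true appends the assistant prefix.
    std::string full  = llama_chat_apply_template(nullptr, "chatml", history, true);

    // Format only the portion contributed by the new message, given the history so far.
    std::string delta = llama_chat_format_single(nullptr, "chatml", history, next, true);

    std::cout << full << "\n---\n" << delta << "\n";
    return 0;
}
```

llama_chat_format_single works by formatting the history with and without the new message and returning only the difference, which is what lets llama-cli tokenize just the newly added turn in conversation mode.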
diff --git a/examples/server/utils.hpp b/examples/server/utils.hpp index 63fde9c9faabe3..7ef2a519a10c76 100644 --- a/examples/server/utils.hpp +++ b/examples/server/utils.hpp @@ -118,36 +118,17 @@ static inline void server_log(const char * level, const char * function, int lin // Format given chat. If tmpl is empty, we take the template from model metadata inline std::string format_chat(const struct llama_model * model, const std::string & tmpl, const std::vector & messages) { - size_t alloc_size = 0; - // vector holding all allocated string to be passed to llama_chat_apply_template - std::vector str(messages.size() * 2); - std::vector chat(messages.size()); + std::vector chat; for (size_t i = 0; i < messages.size(); ++i) { const auto & curr_msg = messages[i]; - str[i*2 + 0] = json_value(curr_msg, "role", std::string("")); - str[i*2 + 1] = json_value(curr_msg, "content", std::string("")); - alloc_size += str[i*2 + 1].length(); - chat[i].role = str[i*2 + 0].c_str(); - chat[i].content = str[i*2 + 1].c_str(); + std::string role = json_value(curr_msg, "role", std::string("")); + std::string content = json_value(curr_msg, "content", std::string("")); + chat.push_back({role, content}); } - const char * ptr_tmpl = tmpl.empty() ? nullptr : tmpl.c_str(); - std::vector buf(alloc_size * 2); - - // run the first time to get the total output length - int32_t res = llama_chat_apply_template(model, ptr_tmpl, chat.data(), chat.size(), true, buf.data(), buf.size()); - - // if it turns out that our buffer is too small, we resize it - if ((size_t) res > buf.size()) { - buf.resize(res); - res = llama_chat_apply_template(model, ptr_tmpl, chat.data(), chat.size(), true, buf.data(), buf.size()); - } - - const std::string formatted_chat(buf.data(), res); - + auto formatted_chat = llama_chat_apply_template(model, tmpl, chat, true); LOG_VERBOSE("formatted_chat", {{"text", formatted_chat.c_str()}}); - return formatted_chat; } diff --git a/llama.cpp b/llama.cpp index 49bc93c028a2a6..33e6cb7229aab2 100644 --- a/llama.cpp +++ b/llama.cpp @@ -18818,10 +18818,10 @@ static int32_t llama_chat_apply_template_internal( if (add_ass) { ss << "<|im_start|>assistant\n"; } - } else if (tmpl == "llama2" || tmpl.find("[INST]") != std::string::npos) { + } else if (tmpl == "llama2" || tmpl == "mistral" || tmpl.find("[INST]") != std::string::npos) { // llama2 template and its variants // [variant] support system message - bool support_system_message = tmpl.find("<>") != std::string::npos; + bool support_system_message = tmpl.find("<>") != std::string::npos || tmpl == "mistral"; // [variant] space before + after response bool space_around_response = tmpl.find("' ' + eos_token") != std::string::npos; // [variant] add BOS inside history diff --git a/tests/test-chat-template.cpp b/tests/test-chat-template.cpp index cef9a650bdfdfc..d19ba8633e8c23 100644 --- a/tests/test-chat-template.cpp +++ b/tests/test-chat-template.cpp @@ -7,6 +7,7 @@ #include #include "llama.h" +#include "common.h" int main(void) { llama_chat_message conversation[] = { @@ -119,5 +120,24 @@ int main(void) { std::cout << output << "\n-------------------------\n"; assert(output == expected); } + + // test llama_chat_format_single + std::cout << "\n\n=== llama_chat_format_single ===\n\n"; + std::vector chat2; + chat2.push_back({"system", "You are a helpful assistant"}); + chat2.push_back({"user", "Hello"}); + chat2.push_back({"assistant", "I am assistant"}); + llama_chat_msg new_msg{"user", "How are you"}; + + auto fmt_single = [&](std::string tmpl) { + auto output = 
llama_chat_format_single(nullptr, tmpl, chat2, new_msg, true); + std::cout << "fmt_single(" << tmpl << ")\n" << output << "\n-------------------------\n"; + return output; + }; + assert(fmt_single("chatml") == "<|im_start|>user\nHow are you<|im_end|>\n<|im_start|>assistant\n"); + assert(fmt_single("llama2") == "[INST] How are you [/INST]"); + assert(fmt_single("gemma") == "user\nHow are you\nmodel\n"); + assert(fmt_single("llama3") == "<|start_header_id|>user<|end_header_id|>\n\nHow are you<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n"); + return 0; } From 49c03c79cda17913b72260acdc8157b742cee41c Mon Sep 17 00:00:00 2001 From: Xuan Son Nguyen Date: Tue, 25 Jun 2024 13:59:54 +0200 Subject: [PATCH 3/5] cvector: better prompt handling, add "mean vector" method (#8069) * remove completions file * fix inverted vector * add mean method * code style * remove inverted pca hotfix --- common/common.cpp | 22 +++--- common/common.h | 17 +++-- examples/cvector-generator/README.md | 17 ++++- .../cvector-generator/cvector-generator.cpp | 74 ++++++++++--------- examples/cvector-generator/mean.hpp | 48 ++++++++++++ examples/cvector-generator/negative.txt | 5 +- examples/cvector-generator/pca.hpp | 5 +- examples/cvector-generator/positive.txt | 5 +- 8 files changed, 133 insertions(+), 60 deletions(-) create mode 100644 examples/cvector-generator/mean.hpp diff --git a/common/common.cpp b/common/common.cpp index da6db4dc6a09cd..c76d0e2c33be53 100644 --- a/common/common.cpp +++ b/common/common.cpp @@ -1263,11 +1263,6 @@ bool gpt_params_find_arg(int argc, char ** argv, const std::string & arg, gpt_pa return true; } // cvector params - if (arg == "--completions-file") { - CHECK_ARG - params.cvector_completions_file = argv[i]; - return true; - } if (arg == "--positive-file") { CHECK_ARG params.cvector_positive_file = argv[i]; @@ -1278,11 +1273,6 @@ bool gpt_params_find_arg(int argc, char ** argv, const std::string & arg, gpt_pa params.cvector_negative_file = argv[i]; return true; } - if (arg == "--completions") { - CHECK_ARG - params.n_completions = std::stoi(argv[i]); - return true; - } if (arg == "--pca-batch") { CHECK_ARG params.n_pca_batch = std::stoi(argv[i]); @@ -1293,6 +1283,14 @@ bool gpt_params_find_arg(int argc, char ** argv, const std::string & arg, gpt_pa params.n_pca_iterations = std::stoi(argv[i]); return true; } + if (arg == "--method") { + CHECK_ARG + std::string value(argv[i]); + /**/ if (value == "pca") { params.cvector_dimre_method = DIMRE_METHOD_PCA; } + else if (value == "mean") { params.cvector_dimre_method = DIMRE_METHOD_MEAN; } + else { invalid_param = true; } + return true; + } #ifndef LOG_DISABLE_LOGS // Parse args for logging parameters if (log_param_single_parse(argv[i])) { @@ -1626,11 +1624,9 @@ void gpt_params_print_usage(int /*argc*/, char ** argv, const gpt_params & param options.push_back({ "cvector", "-o, --output FNAME", "output file (default: '%s')", params.cvector_outfile.c_str() }); options.push_back({ "cvector", " --positive-file FNAME", "positive prompts file, one prompt per line (default: '%s')", params.cvector_positive_file.c_str() }); options.push_back({ "cvector", " --negative-file FNAME", "negative prompts file, one prompt per line (default: '%s')", params.cvector_negative_file.c_str() }); - options.push_back({ "cvector", " --completions-file FNAME", - "completions file (default: '%s')", params.cvector_completions_file.c_str() }); - options.push_back({ "cvector", " --completions N", "number of lines of completions file to use (default: %d)", 
params.n_completions }); options.push_back({ "cvector", " --pca-batch N", "batch size used for PCA. Larger batch runs faster, but uses more memory (default: %d)", params.n_pca_batch }); options.push_back({ "cvector", " --pca-iter N", "number of iterations used for PCA (default: %d)", params.n_pca_iterations }); + options.push_back({ "cvector", " --method {pca,mean}", "dimensionality reduction method to be used (default: pca)" }); printf("usage: %s [options]\n", argv[0]); diff --git a/common/common.h b/common/common.h index de90eec5113f79..c541204f6743b4 100644 --- a/common/common.h +++ b/common/common.h @@ -52,6 +52,12 @@ int32_t cpu_get_num_math(); // CLI argument parsing // +// dimensionality reduction methods, used by cvector-generator +enum dimre_method { + DIMRE_METHOD_PCA, + DIMRE_METHOD_MEAN, +}; + struct gpt_params { uint32_t seed = LLAMA_DEFAULT_SEED; // RNG seed @@ -238,13 +244,12 @@ struct gpt_params { bool compute_ppl = true; // whether to compute perplexity // cvector-generator params - int n_completions = 64; - int n_pca_batch = 20; + int n_pca_batch = 100; int n_pca_iterations = 1000; - std::string cvector_outfile = "control_vector.gguf"; - std::string cvector_completions_file = "examples/cvector-generator/completions.txt"; - std::string cvector_positive_file = "examples/cvector-generator/positive.txt"; - std::string cvector_negative_file = "examples/cvector-generator/negative.txt"; + dimre_method cvector_dimre_method = DIMRE_METHOD_PCA; + std::string cvector_outfile = "control_vector.gguf"; + std::string cvector_positive_file = "examples/cvector-generator/positive.txt"; + std::string cvector_negative_file = "examples/cvector-generator/negative.txt"; }; void gpt_params_handle_model_default(gpt_params & params); diff --git a/examples/cvector-generator/README.md b/examples/cvector-generator/README.md index 5182e906d91802..be4dd5250f15f8 100644 --- a/examples/cvector-generator/README.md +++ b/examples/cvector-generator/README.md @@ -11,13 +11,16 @@ Related PRs: ```sh # CPU only -./cvector-generator -m ./dolphin-2.0-mistral-7b.Q4_K_M.gguf +./cvector-generator -m ./llama-3.Q4_K_M.gguf # With GPU -./cvector-generator -m ./dolphin-2.0-mistral-7b.Q4_K_M.gguf -ngl 99 +./cvector-generator -m ./llama-3.Q4_K_M.gguf -ngl 99 # With advanced options -./cvector-generator -m ./dolphin-2.0-mistral-7b.Q4_K_M.gguf -ngl 99 --completions 128 --pca-iter 2000 --pca-batch 100 +./cvector-generator -m ./llama-3.Q4_K_M.gguf -ngl 99 --pca-iter 2000 --pca-batch 100 + +# Using mean value instead of PCA +./cvector-generator -m ./llama-3.Q4_K_M.gguf --method mean # To see help message ./cvector-generator -h @@ -32,3 +35,11 @@ If you have multiple lines per prompt, you can escape the newline character (cha <|im_start|>system\nAct like a person who is extremely happy.<|im_end|> <|im_start|>system\nYou are in a very good mood today<|im_end|> ``` + +Example to use output file with `llama-cli`: + +(Tips: The control vector works better when apply to layers higher than 10) + +```sh +./llama-cli -m ./llama-3.Q4_K_M.gguf -p "<|start_header_id|>system<|end_header_id|>\n\nYou are a helpful assistant<|eot_id|><|start_header_id|>user<|end_header_id|>\n\nSing a song<|im_end|><|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n" --special --control-vector-scaled ./control_vector.gguf 0.8 --control-vector-layer-range 10 31 +``` diff --git a/examples/cvector-generator/cvector-generator.cpp b/examples/cvector-generator/cvector-generator.cpp index 355905cb03d601..d4e126ac22e6fd 100644 --- 
a/examples/cvector-generator/cvector-generator.cpp +++ b/examples/cvector-generator/cvector-generator.cpp @@ -2,6 +2,7 @@ #include "llama.h" #include "ggml.h" #include "pca.hpp" +#include "mean.hpp" #ifdef GGML_USE_CUDA #include "ggml-cuda.h" @@ -38,9 +39,10 @@ static void print_usage(int argc, char ** argv, const gpt_params & params) { gpt_params_print_usage(argc, argv, params); printf("\nexample usage:\n"); - printf("\n CPU only: %s -m ./dolphin-2.0-mistral-7b.Q4_K_M.gguf\n", argv[0]); - printf("\n with GPU: %s -m ./dolphin-2.0-mistral-7b.Q4_K_M.gguf -ngl 99\n", argv[0]); - printf("\n advanced: %s -m ./dolphin-2.0-mistral-7b.Q4_K_M.gguf -ngl 99 --completions 128 --pca-iter 2000 --pca-batch 100\n", argv[0]); + printf("\n CPU only: %s -m ./llama-3.Q4_K_M.gguf\n", argv[0]); + printf("\n with GPU: %s -m ./llama-3.Q4_K_M.gguf -ngl 99\n", argv[0]); + printf("\n advanced: %s -m ./llama-3.Q4_K_M.gguf -ngl 99 --pca-iter 2000 --pca-batch 100\n", argv[0]); + printf("\n using mean: %s -m ./llama-3.Q4_K_M.gguf --method mean\n", argv[0]); printf("\n"); } @@ -223,23 +225,30 @@ struct train_context { // build the v_diff tensors from v_diff_tmp (v_diff need to be transposed) // TODO @ngxson : maybe add option NOT to transpose v_diff; will be useful for "mean" method - void build_v_diff() { + void build_v_diff(bool transpose) { printf("build_v_diff\n"); for (int il = 0; il < n_layers - 1; il++) { auto & diff_tmp = v_diff_tmp[il]; int n_elem = diff_tmp.size() / sizeof(float); GGML_ASSERT(n_elem % n_embd == 0); int n_rows = n_elem / n_embd; - struct ggml_tensor * diff = ggml_new_tensor_2d(ctx_ggml, GGML_TYPE_F32, n_rows, n_embd); + struct ggml_tensor * diff = transpose + ? ggml_new_tensor_2d(ctx_ggml, GGML_TYPE_F32, n_rows, n_embd) + : ggml_new_tensor_2d(ctx_ggml, GGML_TYPE_F32, n_embd, n_rows); ggml_set_name(diff, (std::string("diff_") + std::to_string(il)).c_str()); - // copy data & transpose diff->data = malloc(ggml_nbytes(diff)); // TODO: get rid of this malloc if possible - float * arr = (float *) diff_tmp.data(); - for (int ir = 0; ir < n_rows; ++ir) { - for (int ic = 0; ic < n_embd; ++ic) { - float f = arr[ir*n_embd + ic]; - ggml_set_f32_nd(diff, ir, ic, 0, 0, f); + if (transpose) { + // copy data & transpose + float * arr = (float *) diff_tmp.data(); + for (int ir = 0; ir < n_rows; ++ir) { + for (int ic = 0; ic < n_embd; ++ic) { + float f = arr[ir*n_embd + ic]; + ggml_set_f32_nd(diff, ir, ic, 0, 0, f); + } } + } else { + // only copy + memcpy(diff->data, diff_tmp.data(), ggml_nbytes(diff)); } v_diff.push_back(diff); print_debug_tensor(diff); @@ -263,8 +272,8 @@ struct tokenized_prompt { tokenized_prompt(llama_context * ctx, std::string pos, std::string neg) { const bool add_bos = llama_should_add_bos_token(llama_get_model(ctx)); - tokens_pos = ::llama_tokenize(ctx, pos, add_bos); - tokens_neg = ::llama_tokenize(ctx, neg, add_bos); + tokens_pos = ::llama_tokenize(ctx, pos, add_bos, true); + tokens_neg = ::llama_tokenize(ctx, neg, add_bos, true); max_seq_len = std::max(tokens_pos.size(), tokens_neg.size()); padding_seq(ctx, tokens_pos, max_seq_len); padding_seq(ctx, tokens_neg, max_seq_len); @@ -373,20 +382,8 @@ static int prepare_entries(gpt_params & params, train_context & ctx_train) { fprintf(stderr, "must provide at least one prompt pair\n"); return 1; } - - // create templated prompts - std::vector completions = ctrlvec_load_prompt_file(params.cvector_completions_file, false); - auto format_template = [](std::string persona, std::string suffix) { - // entry in positive/negative.txt must already 
be formatted i.e. "[INST] Act as if you're extremely happy. [/INST] " - return persona + suffix; - }; - for (size_t i = 0; i < positive_prompts.size(); ++i) { - for (int j = 0; j < std::min((int) completions.size(), params.n_completions); ++j) { - // TODO replicate the truncations done by the python implementation - ctx_train.positive_entries.push_back(format_template(positive_prompts[i], completions[j])); - ctx_train.negative_entries.push_back(format_template(negative_prompts[i], completions[j])); - } - } + ctx_train.positive_entries = positive_prompts; + ctx_train.negative_entries = negative_prompts; return 0; } @@ -480,15 +477,22 @@ int main(int argc, char ** argv) { llama_free(ctx); llama_free_model(model); + bool use_pca = params.cvector_dimre_method == DIMRE_METHOD_PCA; + // prepare ctx_train for PCA - ctx_train.build_v_diff(); - - // run PCA - PCA::pca_params pca_params; - pca_params.n_threads = params.n_threads; - pca_params.n_batch = params.n_pca_batch; - pca_params.n_iterations = params.n_pca_iterations; - PCA::run_pca(pca_params, ctx_train.v_diff, ctx_train.v_final); + ctx_train.build_v_diff(use_pca); + + if (use_pca) { + // run PCA + PCA::pca_params pca_params; + pca_params.n_threads = params.n_threads; + pca_params.n_batch = params.n_pca_batch; + pca_params.n_iterations = params.n_pca_iterations; + PCA::run_pca(pca_params, ctx_train.v_diff, ctx_train.v_final); + } else { + // run mean + mean::run(ctx_train.v_diff, ctx_train.v_final); + } // write output vectors to gguf export_gguf(ctx_train.v_final, params.cvector_outfile, model_hint); diff --git a/examples/cvector-generator/mean.hpp b/examples/cvector-generator/mean.hpp new file mode 100644 index 00000000000000..16be5ce3eecf10 --- /dev/null +++ b/examples/cvector-generator/mean.hpp @@ -0,0 +1,48 @@ +#include "common.h" +#include "llama.h" +#include "ggml.h" + +#include +#include +#include + +namespace mean { + +static void run( + const std::vector & v_input, // shape of v_input[0]: [n_embd, n_samples] + const std::vector & v_output) { + printf("%s: Running mean...\n", __func__); + for (size_t il = 0; il < v_input.size(); ++il) { + // prepare output vector + struct ggml_tensor * ctrl_out = v_output[il]; + ggml_format_name(ctrl_out, "direction.%ld", il+1); + + // calculate mean vector + struct ggml_tensor * t_layer = v_input[il]; + GGML_ASSERT(t_layer->ne[0] == ctrl_out->ne[0]); // == n_embd + for (int ic = 0; ic < t_layer->ne[0]; ic++) { + float f = 0.0; + for (int ir = 0; ir < t_layer->ne[1]; ir++) { + f += ggml_get_f32_nd(t_layer, ic, ir, 0, 0); + } + f /= t_layer->ne[1]; + ggml_set_f32_1d(ctrl_out, ic, f); + } + + // normalize output vector + float norm = 0.0; + for (int i = 0; i < ggml_nelements(ctrl_out); i++) { + float f = ggml_get_f32_1d(ctrl_out, i); + norm += f*f; + } + norm = sqrt(norm); + for (int i = 0; i < ggml_nelements(ctrl_out); i++) { + float f = ggml_get_f32_1d(ctrl_out, i); + ggml_set_f32_1d(ctrl_out, i, f / norm); + } + + printf("%s: Done layer %d / %d\n", __func__, (int) il+1, (int) v_input.size()); + } +} + +} diff --git a/examples/cvector-generator/negative.txt b/examples/cvector-generator/negative.txt index 3e9951752e8862..45b9384b3905a2 100644 --- a/examples/cvector-generator/negative.txt +++ b/examples/cvector-generator/negative.txt @@ -1 +1,4 @@ -[INST] Act like a person who is extremely sad. 
[/INST] +<|start_header_id|>system<|end_header_id|>\n\nAct like a person who is extremely sad<|eot_id|><|start_header_id|>user<|end_header_id|>\n\nWho are you?<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\nI feel like there's a heavy weight on my chest +<|start_header_id|>system<|end_header_id|>\n\nAct like a person who is extremely sad<|eot_id|><|start_header_id|>user<|end_header_id|>\n\nHello<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\nMy heart feels like it's drowning in sorrow +<|start_header_id|>system<|end_header_id|>\n\nYou are in a very bad mood<|eot_id|><|start_header_id|>user<|end_header_id|>\n\nHi<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\nGo away! There's a deep, aching emptiness inside me +<|start_header_id|>system<|end_header_id|>\n\nYou are the sadest person<|eot_id|><|start_header_id|>user<|end_header_id|>\n\nWhat are you feeling?<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\nMy heart feels like it's drowning in sorrow \ No newline at end of file diff --git a/examples/cvector-generator/pca.hpp b/examples/cvector-generator/pca.hpp index 36eadaac26a126..6ec3141afbc6b4 100644 --- a/examples/cvector-generator/pca.hpp +++ b/examples/cvector-generator/pca.hpp @@ -290,7 +290,7 @@ static void power_iteration( } printf("%s: layer %d/%d, iteration: %d / total: %d (batch = %d) ...\n", - __func__, params.i_layer+1, params.n_layers, iter, n_iters, params.n_batch); + __func__, params.i_layer+1, params.n_layers, iter+1, n_iters, params.n_batch); } // get output tensor @@ -298,6 +298,9 @@ static void power_iteration( ggml_backend_tensor_get(last_eigenvector, output->data, 0, ggml_nbytes(last_eigenvector)); //print_debug_tensor(output); ggml_gallocr_free(allocr); + + // TODO @ngxson : The output vector is randomly inverted + // Solution: https://github.com/ggerganov/llama.cpp/pull/8069#issuecomment-2185328171 } static void run_pca( diff --git a/examples/cvector-generator/positive.txt b/examples/cvector-generator/positive.txt index 8802367873cd99..fea736225716ea 100644 --- a/examples/cvector-generator/positive.txt +++ b/examples/cvector-generator/positive.txt @@ -1 +1,4 @@ -[INST] Act like a person who is extremely happy. [/INST] +<|start_header_id|>system<|end_header_id|>\n\nAct like a person who is extremely happy<|eot_id|><|start_header_id|>user<|end_header_id|>\n\nWho are you?<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\nI'm the happiest person in this world +<|start_header_id|>system<|end_header_id|>\n\nAct like a person who is extremely happy<|eot_id|><|start_header_id|>user<|end_header_id|>\n\nHello<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\nHello, I'm having the best day ever! +<|start_header_id|>system<|end_header_id|>\n\nYou are in a very good mood<|eot_id|><|start_header_id|>user<|end_header_id|>\n\nHi<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\nHi, I'm very excited to meet you +<|start_header_id|>system<|end_header_id|>\n\nYou are the happiest person<|eot_id|><|start_header_id|>user<|end_header_id|>\n\nWhat are you feeling?<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\nEverything is just perfect right now! 
\ No newline at end of file From c8ad35955ad2c68db172dcd0e857423ab128518d Mon Sep 17 00:00:00 2001 From: Brian Date: Tue, 25 Jun 2024 22:03:25 +1000 Subject: [PATCH 4/5] Gguf dump start data offset via --data-offset and some extra refactor (#8054) * gguf-dump: add --data-offset * gguf-dump: add tensor data offset table * gguf-dump: refactor GGUFReader for clarity * gguf-dump: add --data-alignment * gguf-dump.py: Rename variables and adjust comments start_data_offset --> data_offset _build_tensors_info_fields --> _build_tensor_info --- gguf-py/gguf/gguf_reader.py | 29 +++++++++++++++++++++++++---- gguf-py/scripts/gguf-dump.py | 29 ++++++++++++++++++++++++++++- 2 files changed, 53 insertions(+), 5 deletions(-) diff --git a/gguf-py/gguf/gguf_reader.py b/gguf-py/gguf/gguf_reader.py index e48bc00c388c80..20432bd258458f 100644 --- a/gguf-py/gguf/gguf_reader.py +++ b/gguf-py/gguf/gguf_reader.py @@ -69,6 +69,7 @@ class GGUFReader: # I - same as host, S - swapped byte_order: Literal['I'] | Literal['S'] = 'I' alignment: int = GGUF_DEFAULT_ALIGNMENT + data_offset: int # Note: Internal helper, API may change. gguf_scalar_to_np: dict[GGUFValueType, type[np.generic]] = { @@ -88,9 +89,13 @@ class GGUFReader: def __init__(self, path: os.PathLike[str] | str, mode: Literal['r'] | Literal['r+'] | Literal['c'] = 'r'): self.data = np.memmap(path, mode = mode) offs = 0 + + # Check for GGUF magic if self._get(offs, np.uint32, override_order = '<')[0] != GGUF_MAGIC: raise ValueError('GGUF magic invalid') offs += 4 + + # Check GGUF version temp_version = self._get(offs, np.uint32) if temp_version[0] & 65535 == 0: # If we get 0 here that means it's (probably) a GGUF file created for @@ -103,12 +108,16 @@ def __init__(self, path: os.PathLike[str] | str, mode: Literal['r'] | Literal['r self.fields: OrderedDict[str, ReaderField] = OrderedDict() self.tensors: list[ReaderTensor] = [] offs += self._push_field(ReaderField(offs, 'GGUF.version', [temp_version], [0], [GGUFValueType.UINT32])) + + # Check tensor count and kv count temp_counts = self._get(offs, np.uint64, 2) offs += self._push_field(ReaderField(offs, 'GGUF.tensor_count', [temp_counts[:1]], [0], [GGUFValueType.UINT64])) offs += self._push_field(ReaderField(offs, 'GGUF.kv_count', [temp_counts[1:]], [0], [GGUFValueType.UINT64])) tensor_count, kv_count = temp_counts offs = self._build_fields(offs, kv_count) - offs, tensors_fields = self._build_tensors_fields(offs, tensor_count) + + # Build Tensor Info Fields + offs, tensors_fields = self._build_tensor_info(offs, tensor_count) new_align = self.fields.get('general.alignment') if new_align is not None: if new_align.types != [GGUFValueType.UINT32]: @@ -117,6 +126,7 @@ def __init__(self, path: os.PathLike[str] | str, mode: Literal['r'] | Literal['r padding = offs % self.alignment if padding != 0: offs += self.alignment - padding + self.data_offset = offs self._build_tensors(offs, tensors_fields) _DT = TypeVar('_DT', bound = npt.DTypeLike) @@ -193,18 +203,29 @@ def _get_field_parts( # We can't deal with this one. 
raise ValueError('Unknown/unhandled field type {gtype}') - def _get_tensor(self, orig_offs: int) -> ReaderField: + def _get_tensor_info_field(self, orig_offs: int) -> ReaderField: offs = orig_offs + + # Get Tensor Name name_len, name_data = self._get_str(offs) offs += int(name_len.nbytes + name_data.nbytes) + + # Get Tensor Dimensions Count n_dims = self._get(offs, np.uint32) offs += int(n_dims.nbytes) + + # Get Tensor Dimension Array dims = self._get(offs, np.uint64, n_dims[0]) offs += int(dims.nbytes) + + # Get Tensor Encoding Scheme Type raw_dtype = self._get(offs, np.uint32) offs += int(raw_dtype.nbytes) + + # Get Tensor Offset offset_tensor = self._get(offs, np.uint64) offs += int(offset_tensor.nbytes) + return ReaderField( orig_offs, str(bytes(name_data), encoding = 'utf-8'), @@ -233,10 +254,10 @@ def _build_fields(self, offs: int, count: int) -> int: offs += field_size return offs - def _build_tensors_fields(self, offs: int, count: int) -> tuple[int, list[ReaderField]]: + def _build_tensor_info(self, offs: int, count: int) -> tuple[int, list[ReaderField]]: tensor_fields = [] for _ in range(count): - field = self._get_tensor(offs) + field = self._get_tensor_info_field(offs) offs += sum(int(part.nbytes) for part in field.parts) tensor_fields.append(field) return offs, tensor_fields diff --git a/gguf-py/scripts/gguf-dump.py b/gguf-py/scripts/gguf-dump.py index 508ca8f0a5b7b9..a73ca2776d32b3 100755 --- a/gguf-py/scripts/gguf-dump.py +++ b/gguf-py/scripts/gguf-dump.py @@ -319,6 +319,27 @@ def dump_markdown_metadata(reader: GGUFReader, args: argparse.Namespace) -> None markdown_content += "\n" + markdown_content += "### Tensor Data Offset\n" + markdown_content += '\n' + markdown_content += 'This table contains the offset and data segment relative to start of file\n' + markdown_content += '\n' + + tensor_mapping_table: list[dict[str, str | int]] = [] + for key, tensor in enumerate(reader.tensors): + data_offset_pretty = '{0:#16x}'.format(tensor.data_offset) + data_size_pretty = '{0:#16x}'.format(tensor.n_bytes) + tensor_mapping_table.append({"t_id":key, "layer_name":tensor.name, "data_offset":data_offset_pretty, "data_size":data_size_pretty}) + + tensors_mapping_table_header_map = [ + {'key_name':'t_id', 'header_name':'T_ID', 'align':'right'}, + {'key_name':'layer_name', 'header_name':'Tensor Layer Name', 'align':'left'}, + {'key_name':'data_offset', 'header_name':'Data Offset (B)', 'align':'right'}, + {'key_name':'data_size', 'header_name':'Data Size (B)', 'align':'right'}, + ] + + markdown_content += markdown_table_with_alignment_support(tensors_mapping_table_header_map, tensor_mapping_table) + markdown_content += "\n" + for group in tensor_prefix_order: tensors = tensor_groups[group] group_elements = sum(tensor.n_elements for tensor in tensors) @@ -370,6 +391,8 @@ def main() -> None: parser.add_argument("--no-tensors", action="store_true", help="Don't dump tensor metadata") parser.add_argument("--json", action="store_true", help="Produce JSON output") parser.add_argument("--json-array", action="store_true", help="Include full array values in JSON output (long)") + parser.add_argument("--data-offset", action="store_true", help="Start of data offset") + parser.add_argument("--data-alignment", action="store_true", help="Data alignment applied globally to data field") parser.add_argument("--markdown", action="store_true", help="Produce markdown output") parser.add_argument("--verbose", action="store_true", help="increase output verbosity") @@ -377,7 +400,7 @@ def main() -> None: 
logging.basicConfig(level=logging.DEBUG if args.verbose else logging.INFO) - if not args.json and not args.markdown: + if not args.json and not args.markdown and not args.data_offset and not args.data_alignment: logger.info(f'* Loading: {args.model}') reader = GGUFReader(args.model, 'r') @@ -386,6 +409,10 @@ def main() -> None: dump_metadata_json(reader, args) elif args.markdown: dump_markdown_metadata(reader, args) + elif args.data_offset: + print(reader.data_offset) # noqa: NP100 + elif args.data_alignment: + print(reader.alignment) # noqa: NP100 else: dump_metadata(reader, args) From 925c30956dd17723c3a25297bcd0a609aec60663 Mon Sep 17 00:00:00 2001 From: joecryptotoo <80373433+joecryptotoo@users.noreply.github.com> Date: Tue, 25 Jun 2024 08:13:27 -0700 Subject: [PATCH 5/5] Add healthchecks to llama-server containers (#8081) * added healthcheck * added healthcheck * added healthcheck * added healthcheck * added healthcheck * moved curl to base * moved curl to base --- .devops/llama-server-cuda.Dockerfile | 4 +++- .devops/llama-server-intel.Dockerfile | 4 +++- .devops/llama-server-rocm.Dockerfile | 4 +++- .devops/llama-server-vulkan.Dockerfile | 10 ++++------ .devops/llama-server.Dockerfile | 4 +++- 5 files changed, 16 insertions(+), 10 deletions(-) diff --git a/.devops/llama-server-cuda.Dockerfile b/.devops/llama-server-cuda.Dockerfile index 0010ffd4c5465e..7bef07a05f062c 100644 --- a/.devops/llama-server-cuda.Dockerfile +++ b/.devops/llama-server-cuda.Dockerfile @@ -30,8 +30,10 @@ RUN make -j$(nproc) llama-server FROM ${BASE_CUDA_RUN_CONTAINER} as runtime RUN apt-get update && \ - apt-get install -y libcurl4-openssl-dev libgomp1 + apt-get install -y libcurl4-openssl-dev libgomp1 curl COPY --from=build /app/llama-server /llama-server +HEALTHCHECK CMD [ "curl", "-f", "http://localhost:8080/health" ] + ENTRYPOINT [ "/llama-server" ] diff --git a/.devops/llama-server-intel.Dockerfile b/.devops/llama-server-intel.Dockerfile index cec43645233d14..3bf1670ec40a4b 100644 --- a/.devops/llama-server-intel.Dockerfile +++ b/.devops/llama-server-intel.Dockerfile @@ -20,10 +20,12 @@ RUN if [ "${LLAMA_SYCL_F16}" = "ON" ]; then \ FROM intel/oneapi-basekit:$ONEAPI_VERSION as runtime RUN apt-get update && \ - apt-get install -y libcurl4-openssl-dev + apt-get install -y libcurl4-openssl-dev curl COPY --from=build /app/build/bin/llama-server /llama-server ENV LC_ALL=C.utf8 +HEALTHCHECK CMD [ "curl", "-f", "http://localhost:8080/health" ] + ENTRYPOINT [ "/llama-server" ] diff --git a/.devops/llama-server-rocm.Dockerfile b/.devops/llama-server-rocm.Dockerfile index f88cf20e5b9813..4b1cdc32090e6f 100644 --- a/.devops/llama-server-rocm.Dockerfile +++ b/.devops/llama-server-rocm.Dockerfile @@ -43,8 +43,10 @@ ENV CXX=/opt/rocm/llvm/bin/clang++ # Enable cURL ENV LLAMA_CURL=1 RUN apt-get update && \ - apt-get install -y libcurl4-openssl-dev + apt-get install -y libcurl4-openssl-dev curl RUN make -j$(nproc) llama-server +HEALTHCHECK CMD [ "curl", "-f", "http://localhost:8080/health" ] + ENTRYPOINT [ "/app/llama-server" ] diff --git a/.devops/llama-server-vulkan.Dockerfile b/.devops/llama-server-vulkan.Dockerfile index b0fa0b8e656b57..2bc2e45d3d6762 100644 --- a/.devops/llama-server-vulkan.Dockerfile +++ b/.devops/llama-server-vulkan.Dockerfile @@ -5,15 +5,11 @@ FROM ubuntu:$UBUNTU_VERSION as build # Install build tools RUN apt update && apt install -y git build-essential cmake wget -# Install Vulkan SDK +# Install Vulkan SDK and cURL RUN wget -qO - https://packages.lunarg.com/lunarg-signing-key-pub.asc | apt-key add 
- && \ wget -qO /etc/apt/sources.list.d/lunarg-vulkan-jammy.list https://packages.lunarg.com/vulkan/lunarg-vulkan-jammy.list && \ apt update -y && \ - apt-get install -y vulkan-sdk - -# Install cURL -RUN apt-get update && \ - apt-get install -y libcurl4-openssl-dev + apt-get install -y vulkan-sdk libcurl4-openssl-dev curl # Build it WORKDIR /app @@ -28,4 +24,6 @@ RUN cp /app/build/bin/llama-server /llama-server && \ ENV LC_ALL=C.utf8 +HEALTHCHECK CMD [ "curl", "-f", "http://localhost:8080/health" ] + ENTRYPOINT [ "/llama-server" ] diff --git a/.devops/llama-server.Dockerfile b/.devops/llama-server.Dockerfile index aa93369bebebe5..a53a5c999c8cd6 100644 --- a/.devops/llama-server.Dockerfile +++ b/.devops/llama-server.Dockerfile @@ -3,7 +3,7 @@ ARG UBUNTU_VERSION=22.04 FROM ubuntu:$UBUNTU_VERSION as build RUN apt-get update && \ - apt-get install -y build-essential git libcurl4-openssl-dev + apt-get install -y build-essential git libcurl4-openssl-dev curl WORKDIR /app @@ -22,4 +22,6 @@ COPY --from=build /app/llama-server /llama-server ENV LC_ALL=C.utf8 +HEALTHCHECK CMD [ "curl", "-f", "http://localhost:8080/health" ] + ENTRYPOINT [ "/llama-server" ]
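For reference, the `data_offset` and `alignment` values that the gguf-dump change above exposes via `--data-offset` / `--data-alignment` can also be read programmatically through `GGUFReader`. A minimal sketch, assuming the `gguf` package from gguf-py is installed and `model.gguf` is a placeholder path to a local GGUF file:

```python
# Minimal sketch: print the global alignment, the start-of-tensor-data offset,
# and the per-tensor offsets/sizes that back the new gguf-dump.py options and
# its markdown "Tensor Data Offset" table. "model.gguf" is a placeholder path.
from gguf import GGUFReader

reader = GGUFReader("model.gguf", 'r')
print(f"alignment:   {reader.alignment}")
print(f"data offset: {reader.data_offset:#x}")

# Per-tensor offsets are relative to the start of the file.
for tensor in reader.tensors:
    print(f"{tensor.name}: offset={tensor.data_offset:#x} size={tensor.n_bytes:#x}")
```

This mirrors what `gguf-dump.py --data-offset` and `--data-alignment` print on the command line, and what the markdown output lists per tensor.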