Smooth model switch #166

Merged (11 commits, Jul 26, 2024)
moxin-backend/src/backend_impls/chat_ui.rs (3 additions, 10 deletions)

@@ -316,22 +316,15 @@ fn create_wasi(
     file: &DownloadedFile,
     load_model: &LoadModelOptions,
 ) -> wasmedge_sdk::WasmEdgeResult<WasiModule> {
-    let ctx_size = if load_model.n_ctx > 0 {
-        Some(load_model.n_ctx.to_string())
-    } else {
-        None
-    };
+    let ctx_size = Some(format!("{}", file.context_size));
 
     let n_gpu_layers = match load_model.gpu_layers {
         moxin_protocol::protocol::GPULayers::Specific(n) => Some(n.to_string()),
         moxin_protocol::protocol::GPULayers::Max => None,
     };
 
-    let batch_size = if load_model.n_batch > 0 {
-        Some(load_model.n_batch.to_string())
-    } else {
-        None
-    };
+    // Set n_batch to a fixed value of 128.
+    let batch_size = Some(format!("128"));
 
     let mut prompt_template = load_model.prompt_template.clone();
     if prompt_template.is_none() && !file.prompt_template.is_empty() {

Review comment from the author (Collaborator) on the ctx_size change:

> Context: This change was originally done here https://github.com/moxin-org/moxin/blob/1056e1a0e2789f99bf7fc5ca40149b462a79c997/moxin-backend/src/backend_impls/api_server.rs#L38-L46, which is the currently active backend.
>
> Making the change here as well since I'm removing those values from the protocol, but it does not have real effect right now.
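The net effect of this hunk: the WASI environment values no longer honor the client-supplied n_ctx and n_batch; context size is read from the downloaded file's metadata and batch size is pinned to 128. A minimal standalone sketch of the new derivation (the `DownloadedFile` stand-in below is reduced to the one field this hunk touches, and its `u64` type is an assumption):

```rust
// Sketch of the derivation create_wasi now performs; DownloadedFile is
// pared down to the single field the hunk uses.
struct DownloadedFile {
    context_size: u64, // assumed type; the real definition is not in this diff
}

fn wasi_sizes(file: &DownloadedFile) -> (Option<String>, Option<String>) {
    // ctx_size now always comes from the model file's metadata
    // (format!("{}", x) and x.to_string() are equivalent here).
    let ctx_size = Some(file.context_size.to_string());
    // n_batch is pinned to 128 regardless of what the client requested.
    let batch_size = Some("128".to_string());
    (ctx_size, batch_size)
}

fn main() {
    let file = DownloadedFile { context_size: 4096 };
    assert_eq!(
        wasi_sizes(&file),
        (Some("4096".to_string()), Some("128".to_string()))
    );
}
```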
moxin-backend/src/backend_impls/mod.rs (0 additions, 4 deletions)

@@ -136,8 +136,6 @@ fn test_chat()
         prompt_template: None,
         gpu_layers: moxin_protocol::protocol::GPULayers::Max,
         use_mlock: false,
-        n_batch: 512,
-        n_ctx: 512,
         rope_freq_scale: 0.0,
         rope_freq_base: 0.0,
         context_overflow_policy: moxin_protocol::protocol::ContextOverflowPolicy::StopAtLimit,

@@ -211,8 +209,6 @@ fn test_chat_stop()
         prompt_template: None,
         gpu_layers: moxin_protocol::protocol::GPULayers::Max,
         use_mlock: false,
-        n_batch: 512,
-        n_ctx: 512,
         rope_freq_scale: 0.0,
         rope_freq_base: 0.0,
         context_overflow_policy: moxin_protocol::protocol::ContextOverflowPolicy::StopAtLimit,
moxin-protocol/src/protocol.rs (0 additions, 2 deletions)

@@ -28,8 +28,6 @@ pub struct LoadModelOptions {
     pub prompt_template: Option<String>,
     pub gpu_layers: GPULayers,
     pub use_mlock: bool,
-    pub n_batch: u32,
-    pub n_ctx: u32,
     pub rope_freq_scale: f32,
     pub rope_freq_base: f32,
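Together with the test updates above, this leaves `LoadModelOptions` without any client-tunable sizing fields. A self-contained sketch of the reduced struct, restricted to the fields visible in these hunks (the real struct has more fields above `prompt_template` that the diff does not show, and the enum stand-ins are minimal assumptions with variants taken from the hunks):

```rust
// Minimal stand-ins for the protocol enums so this sketch compiles alone.
pub enum GPULayers {
    Specific(u32),
    Max,
}

pub enum ContextOverflowPolicy {
    StopAtLimit,
}

// LoadModelOptions after this PR, limited to what the diff shows:
// n_batch and n_ctx are gone, so sizing is decided by the backend.
pub struct LoadModelOptions {
    pub prompt_template: Option<String>,
    pub gpu_layers: GPULayers,
    pub use_mlock: bool,
    pub rope_freq_scale: f32,
    pub rope_freq_base: f32,
    pub context_overflow_policy: ContextOverflowPolicy,
}
```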
src/app.rs (1 addition, 1 deletion)

@@ -335,7 +335,7 @@ impl MatchEvent for App {
                 .ui
                 .chat_history_card_options(id!(chat_history_card_options));
             // TODO: Would be cool to listen for this action inside of the widget itself.
-            chat_history_card_options.selected(cx, chat_id, cords);
+            let _ = chat_history_card_options.selected(cx, chat_id, cords);
         }
     }
 }
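The `let _ =` here explicitly discards whatever `selected` returns; its signature is not visible in this diff, so the return type below is a placeholder. The pattern is how Rust code acknowledges and drops a `#[must_use]` value without a compiler warning. A tiny illustration:

```rust
// Hypothetical #[must_use] function standing in for `selected`, whose real
// return type this diff does not show.
#[must_use]
fn selected() -> Result<(), ()> {
    Ok(())
}

fn main() {
    let _ = selected(); // explicitly discard the value; no unused-result warning
}
```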
src/chat/chat_history_card.rs (1 addition, 1 deletion)

@@ -355,7 +355,7 @@ impl ChatHistoryCard {
         &mut self,
         cx: &mut Cx,
         actions: &Actions,
-        scope: &mut Scope,
+        _scope: &mut Scope,
     ) {
         for action in actions {
             if let ChatHistoryCardAction::ActivateTitleEdition(chat_id) =