Skip to content

Commit 4ab26a1

Browse files
committed
Bump llama.cpp to latest as of 11/3/24 (b4020)
* Half-working sampling refactor (grammar support still missing) * Removed the tail-free sampler, since llama.cpp removed it
1 parent fa10708 commit 4ab26a1

File tree

8 files changed

+386
-639
lines changed

8 files changed

+386
-639
lines changed

examples/simple/src/main.rs

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -252,7 +252,6 @@ either reduce n_len or increase n_ctx"
252252
{
253253
// sample the most likely token
254254
let new_token_id = sampler.sample(&mut ctx, None);
255-
sampler.accept(new_token_id);
256255

257256
// is it an end of stream?
258257
if model.is_eog_token(new_token_id) {

llama-cpp-2/src/context.rs

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,6 @@ use crate::{
1717

1818
pub mod kv_cache;
1919
pub mod params;
20-
pub mod sample;
2120
pub mod session;
2221

2322
/// Safe wrapper around `llama_context`.

llama-cpp-2/src/context/sample.rs

Lines changed: 0 additions & 141 deletions
This file was deleted.

llama-cpp-2/src/context/sample/sampler.rs

Lines changed: 0 additions & 112 deletions
This file was deleted.

llama-cpp-2/src/lib.rs

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -23,7 +23,7 @@ use std::path::PathBuf;
2323
use std::string::FromUtf8Error;
2424

2525
pub mod context;
26-
pub mod grammar;
26+
// pub mod grammar;
2727
pub mod llama_backend;
2828
pub mod llama_batch;
2929
pub mod model;

llama-cpp-2/src/sampler_chain.rs

Lines changed: 25 additions & 23 deletions
Original file line number | Diff line number | Diff line change
@@ -24,6 +24,14 @@ impl Debug for LlamaSampler {
2424
}
2525

2626
impl LlamaSampler {
27+
/// Create a new `LlamaSampler`.
28+
/// ```
29+
/// # use llama_cpp_2::sampler_chain::{LlamaSampler, params::LlamaSamplerChainParams};
30+
/// let mut chain = LlamaSampler::new(LlamaSamplerChainParams::default());
31+
/// chain = chain.add_temp(0.7);
32+
/// chain = chain.add_dist(42);
33+
/// assert_eq!(chain.len(), 2);
34+
/// ```
2735
pub fn new(sampler_chain_params: params::LlamaSamplerChainParams) -> Self {
2836
let sampler = unsafe {
2937
NonNull::new(llama_cpp_sys_2::llama_sampler_chain_init(
@@ -120,22 +128,6 @@ impl LlamaSampler {
120128
self
121129
}
122130

123-
/// Initialize a tail-free sampler with the given z value and add it to the sampler chain.
124-
///
125-
/// Tail Free Sampling described in https://www.trentonbricken.com/Tail-Free-Sampling/.
126-
pub fn add_tail_free(self, z: f32, min_keep: usize) -> Self {
127-
unsafe {
128-
let tail_free_sampler =
129-
NonNull::new(llama_cpp_sys_2::llama_sampler_init_tail_free(z, min_keep))
130-
.expect("llama_sampler_chain_init_tail_free returned null");
131-
llama_cpp_sys_2::llama_sampler_chain_add(
132-
self.sampler.as_ptr(),
133-
tail_free_sampler.as_ptr(),
134-
);
135-
}
136-
self
137-
}
138-
139131
/// Initialize a typical-p sampler with the given value and add it to the sampler chain.
140132
pub fn add_typical_p(self, p: f32, min_keep: usize) -> Self {
141133
unsafe {
@@ -209,6 +201,23 @@ impl LlamaSampler {
209201
self
210202
}
211203

204+
/// Initialize an XTC sampler with the given values and add it to the sampler chain.
205+
pub fn add_xtc(self, p: f32, t: f32, min_keep: usize, seed: u32) -> Self {
206+
unsafe {
207+
let xtc_sampler = NonNull::new(llama_cpp_sys_2::llama_sampler_init_xtc(
208+
p, t, min_keep, seed,
209+
))
210+
.expect("llama_sampler_chain_init_xtc returned null");
211+
llama_cpp_sys_2::llama_sampler_chain_add(self.sampler.as_ptr(), xtc_sampler.as_ptr());
212+
}
213+
self
214+
}
215+
216+
/// Get the number of samplers in the chain.
217+
pub fn len(&self) -> i32 {
218+
unsafe { llama_cpp_sys_2::llama_sampler_chain_n(self.sampler.as_ptr()) }
219+
}
220+
212221
/// Reset the sampler chain.
213222
pub fn reset(&self) {
214223
unsafe {
@@ -225,13 +234,6 @@ impl LlamaSampler {
225234
LlamaToken(token)
226235
}
227236

228-
/// Accept a sampled token.
229-
pub fn accept(&self, token: LlamaToken) {
230-
unsafe {
231-
llama_cpp_sys_2::llama_sampler_accept(self.sampler.as_ptr(), token.0);
232-
}
233-
}
234-
235237
/// Reset the timings for the sampler.
236238
pub fn reset_timings(&self) {
237239
unsafe {

0 commit comments

Comments (0)