Make changes more readable

nkoppel · nkoppel · commit e7e0f934ccfd · 2024-03-11T12:00:55.000-05:00
diff --git a/crates/llama_cpp/src/standard_sampler.rs b/crates/llama_cpp/src/standard_sampler.rs
@@ -121,7 +121,7 @@ impl SamplerStage {
     pub fn from_grammar(grammar: LlamaGrammar, start_position: Option<usize>) -> Self {
         SamplerStage::Grammar(GrammarStage {
             grammar,
-            accepted_to: start_position,
+            accepted_up_to: start_position,
         })
     }
 
@@ -193,7 +193,7 @@ impl SamplerStage {
                     llama_sample_tail_free(context, p_ptr, *z, min_keep);
                 }
                 SamplerStage::Grammar(stage) => {
-                    stage.apply(context, tokens, candidates_p, min_keep)
+                    candidates_p = stage.apply(context, tokens, candidates_p, min_keep)
                 }
             }
         }
@@ -206,7 +206,7 @@ impl SamplerStage {
 #[derive(Clone, Debug)]
 pub struct GrammarStage {
     grammar: LlamaGrammar,
-    accepted_to: Option<usize>,
+    accepted_up_to: Option<usize>,
 }
 
 impl GrammarStage {
@@ -216,15 +216,21 @@ impl GrammarStage {
         tokens: &[Token],
         mut candidates_p: llama_token_data_array,
         _min_keep: usize,
-    ) {
-        let accepted_to = self.accepted_to.unwrap_or(tokens.len());
-        for token in &tokens[accepted_to..] {
+    ) -> llama_token_data_array {
+        // If `accepted_up_to` is `None`, assume that we should start at the end of context.
+        let accepted_up_to = self.accepted_up_to.unwrap_or(tokens.len());
+
+        // Accept all new tokens until the end of context.
+        for token in &tokens[accepted_up_to..] {
             unsafe { llama_grammar_accept_token(context, self.grammar.grammar.as_ptr(), token.0) }
         }
-        self.accepted_to = Some(tokens.len());
+        self.accepted_up_to = Some(tokens.len());
 
+        // Apply grammar sampling to `candidates_p`.
         let p_ptr = addr_of_mut!(candidates_p);
         unsafe { llama_sample_grammar(context, p_ptr, self.grammar.grammar.as_ptr()) };
+
+        candidates_p
     }
 }
 

Original file line number	Diff line number	Diff line change
`@@ -121,7 +121,7 @@ impl SamplerStage {`
`121`	`121`	`pub fn from_grammar(grammar: LlamaGrammar, start_position: Option<usize>) -> Self {`
`122`	`122`	`SamplerStage::Grammar(GrammarStage {`
`123`	`123`	`grammar,`
`124`		`- accepted_to: start_position,`
	`124`	`+ accepted_up_to: start_position,`
`125`	`125`	`})`
`126`	`126`	`}`
`127`	`127`
`@@ -193,7 +193,7 @@ impl SamplerStage {`
`193`	`193`	`llama_sample_tail_free(context, p_ptr, *z, min_keep);`
`194`	`194`	`}`
`195`	`195`	`SamplerStage::Grammar(stage) => {`
`196`		`- stage.apply(context, tokens, candidates_p, min_keep)`
	`196`	`+ candidates_p = stage.apply(context, tokens, candidates_p, min_keep)`
`197`	`197`	`}`
`198`	`198`	`}`
`199`	`199`	`}`
`@@ -206,7 +206,7 @@ impl SamplerStage {`
`206`	`206`	`#[derive(Clone, Debug)]`
`207`	`207`	`pub struct GrammarStage {`
`208`	`208`	`grammar: LlamaGrammar,`
`209`		`- accepted_to: Option<usize>,`
	`209`	`+ accepted_up_to: Option<usize>,`
`210`	`210`	`}`
`211`	`211`
`212`	`212`	`impl GrammarStage {`
`@@ -216,15 +216,21 @@ impl GrammarStage {`
`216`	`216`	`tokens: &[Token],`
`217`	`217`	`mut candidates_p: llama_token_data_array,`
`218`	`218`	`_min_keep: usize,`
`219`		`- ) {`
`220`		`- let accepted_to = self.accepted_to.unwrap_or(tokens.len());`
`221`		`- for token in &tokens[accepted_to..] {`
	`219`	`+ ) -> llama_token_data_array {`
	`220`	``+ // If `accepted_up_to` is `None`, assume that we should start at the end of context.``
	`221`	`+ let accepted_up_to = self.accepted_up_to.unwrap_or(tokens.len());`
	`222`	`+`
	`223`	`+ // Accept all new tokens until the end of context.`
	`224`	`+ for token in &tokens[accepted_up_to..] {`
`222`	`225`	`unsafe { llama_grammar_accept_token(context, self.grammar.grammar.as_ptr(), token.0) }`
`223`	`226`	`}`
`224`		`- self.accepted_to = Some(tokens.len());`
	`227`	`+ self.accepted_up_to = Some(tokens.len());`
`225`	`228`
	`229`	``+ // Apply grammar sampling to `candidates_p`.``
`226`	`230`	`let p_ptr = addr_of_mut!(candidates_p);`
`227`	`231`	`unsafe { llama_sample_grammar(context, p_ptr, self.grammar.grammar.as_ptr()) };`
	`232`	`+`
	`233`	`+ candidates_p`
`228`	`234`	`}`
`229`	`235`	`}`
`230`	`236`