@@ -1530,7 +1530,7 @@ class RbLLaMAModel {
    rb_define_method(rb_cLLaMAModel, "n_embd", RUBY_METHOD_FUNC(_llama_model_get_model_n_embd), 0);
    rb_define_method(rb_cLLaMAModel, "n_layer", RUBY_METHOD_FUNC(_llama_model_get_model_n_layer), 0);
    rb_define_method(rb_cLLaMAModel, "rope_freq_scale_train", RUBY_METHOD_FUNC(_llama_model_rope_freq_scale_train), 0);
-   rb_define_method(rb_cLLaMAModel, "token_to_piece", RUBY_METHOD_FUNC(_llama_model_token_to_piece), 1);
+   rb_define_method(rb_cLLaMAModel, "token_to_piece", RUBY_METHOD_FUNC(_llama_model_token_to_piece), -1);
    rb_define_method(rb_cLLaMAModel, "tokenize", RUBY_METHOD_FUNC(_llama_model_tokenize), -1);
    rb_define_method(rb_cLLaMAModel, "desc", RUBY_METHOD_FUNC(_llama_model_get_model_desc), 0);
    rb_define_method(rb_cLLaMAModel, "size", RUBY_METHOD_FUNC(_llama_model_get_model_size), 0);
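The only change in this first hunk is the arity passed to rb_define_method for token_to_piece, from 1 to -1. In the Ruby C API an arity of -1 means the bound function receives its arguments as (int argc, VALUE* argv, VALUE self) and parses them itself, which is what allows the lstrip/special keyword arguments introduced in the next hunk. A minimal sketch of that calling convention, with illustrative names that are not part of this change:

    #include <ruby.h>

    // Sketch of the arity -1 convention assumed by the registration change above.
    // With arity -1, Ruby passes the raw argument vector so the method can accept
    // optional positional and keyword arguments itself.
    static VALUE example_token_to_piece(int argc, VALUE* argv, VALUE self) {
      VALUE token = Qnil;
      VALUE kw_args = Qnil;
      rb_scan_args(argc, argv, "1:", &token, &kw_args); // one required argument plus optional keywords
      return token;
    }
    // Registered with an arity of -1, e.g.:
    // rb_define_method(klass, "token_to_piece", RUBY_METHOD_FUNC(example_token_to_piece), -1);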
@@ -1691,18 +1691,33 @@ class RbLLaMAModel {
    return DBL2NUM(llama_rope_freq_scale_train(ptr->model));
  }

- static VALUE _llama_model_token_to_piece(VALUE self, VALUE token_) {
+ static VALUE _llama_model_token_to_piece(int argc, VALUE* argv, VALUE self) {
+   VALUE kw_args = Qnil;
+   ID kw_table[2] = { rb_intern("lstrip"), rb_intern("special") };
+   VALUE kw_values[2] = { Qundef, Qundef };
+   VALUE token_ = Qnil;
+   rb_scan_args(argc, argv, "1:", &token_, &kw_args);
+   rb_get_kwargs(kw_args, kw_table, 0, 2, kw_values);
+
    if (!RB_INTEGER_TYPE_P(token_)) {
      rb_raise(rb_eArgError, "token must be an integer");
      return Qnil;
    }
+   if (kw_values[0] != Qundef && !RB_INTEGER_TYPE_P(kw_values[0])) {
+     rb_raise(rb_eArgError, "lstrip must be an integer");
+     return Qnil;
+   }
+
    const llama_token token = NUM2INT(token_);
+   const int32_t lstrip = kw_values[0] != Qundef ? NUM2INT(kw_values[0]) : 0;
+   const bool special = kw_values[1] != Qundef ? RTEST(kw_values[1]) : false;
+
    LLaMAModelWrapper* ptr = get_llama_model(self);
    std::vector<char> result(8, 0);
-   const int n_tokens = llama_token_to_piece(ptr->model, token, result.data(), result.size(), false);
+   const int n_tokens = llama_token_to_piece(ptr->model, token, result.data(), result.size(), lstrip, special);
    if (n_tokens < 0) {
      result.resize(-n_tokens);
-     const int check = llama_token_to_piece(ptr->model, token, result.data(), result.size(), false);
+     const int check = llama_token_to_piece(ptr->model, token, result.data(), result.size(), lstrip, special);
      if (check != -n_tokens) {
        rb_raise(rb_eRuntimeError, "failed to convert");
        return Qnil;
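The rewritten _llama_model_token_to_piece keeps the original grow-and-retry buffer handling but now forwards lstrip and special to llama_token_to_piece, matching the six-argument upstream signature this version of the binding targets. Both keywords are optional at the Ruby level: rb_get_kwargs with 0 required and 2 optional keywords leaves unset entries as Qundef, and the ternaries above fall back to lstrip = 0 and special = false. The retry works because llama_token_to_piece returns the number of bytes written, or a negative value whose magnitude is the buffer size it needs. A condensed sketch of that pattern, assuming the same llama.cpp API as the diff:

    #include <string>
    #include <vector>
    #include "llama.h"

    // Sketch only: the grow-and-retry idiom used in the hunk above.  Assumes
    // llama_token_to_piece returns bytes written, or -(required size) when the
    // buffer is too small.
    static std::string piece_for_token(const llama_model* model, llama_token token,
                                       int32_t lstrip, bool special) {
      std::vector<char> buf(8, 0);
      int n = llama_token_to_piece(model, token, buf.data(), static_cast<int32_t>(buf.size()), lstrip, special);
      if (n < 0) {
        buf.resize(-n); // the first call reported how many bytes are needed
        n = llama_token_to_piece(model, token, buf.data(), static_cast<int32_t>(buf.size()), lstrip, special);
      }
      return std::string(buf.data(), n > 0 ? static_cast<size_t>(n) : 0);
    }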
@@ -2788,7 +2803,7 @@ class RbLLaMAContext {
    ID kw_table[3] = { rb_intern("logits"), rb_intern("logits_guidance"), rb_intern("scale") };
    VALUE kw_values[3] = { Qundef, Qundef, Qundef };
    rb_scan_args(argc, argv, ":", &kw_args);
-   rb_get_kwargs(kw_args, kw_table, 0, 3, kw_values);
+   rb_get_kwargs(kw_args, kw_table, 3, 0, kw_values);

    if (!RB_TYPE_P(kw_values[0], T_ARRAY)) {
      rb_raise(rb_eArgError, "logits must be an Array");
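The RbLLaMAContext hunk swaps the required/optional counts passed to rb_get_kwargs. Its third argument is the number of required keywords and its fourth the number of optional ones, so the old call (0, 3) treated logits, logits_guidance, and scale as all optional, while the new call (3, 0) makes all three mandatory and lets rb_get_kwargs raise ArgumentError itself when one is missing instead of failing later at the type checks. A minimal, self-contained sketch of the distinction; the method name is illustrative and the keyword names are copied from the hunk:

    #include <ruby.h>

    // Sketch of rb_get_kwargs(hash, table, required, optional, values) semantics.
    static VALUE kwargs_demo(int argc, VALUE* argv, VALUE self) {
      VALUE kw_args = Qnil;
      ID kw_table[3] = { rb_intern("logits"), rb_intern("logits_guidance"), rb_intern("scale") };
      VALUE kw_values[3] = { Qundef, Qundef, Qundef };
      rb_scan_args(argc, argv, ":", &kw_args);
      // (0, 3): every keyword optional; a missing one is left as Qundef and only
      //         trips the type checks further down.
      // (3, 0): every keyword required; rb_get_kwargs raises ArgumentError as soon
      //         as one is absent.
      rb_get_kwargs(kw_args, kw_table, 3, 0, kw_values);
      return kw_values[0];
    }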