Commit 8526803
Parent(s): 3db8af6

Upload folder using huggingface_hub

Files changed:
- README.md (+9 -1)
- modeling_functionary.py (+3 -2)
- tokenizer_config.json (+1 -1)
README.md CHANGED
@@ -101,6 +101,14 @@ will yield:
 ```
 <|start_header_id|>system<|end_header_id|>
 
+You are capable of executing available function(s) if required.
+Only execute function(s) when absolutely necessary.
+Ask for the required input to:recipient==all
+Use JSON for function arguments.
+Respond in this format:
+>>>${recipient}
+${content}
+Available functions:
 // Supported function definitions that should be called when necessary.
 namespace functions {
 
@@ -115,7 +123,7 @@ location: string,
 What is the weather for Istanbul?
 ```
 
-A more detailed example is provided [here](https://github.com/MeetKai/functionary/blob/main/tests/
+A more detailed example is provided [here](https://github.com/MeetKai/functionary/blob/main/tests/prompt_test_v3.llama3.txt).
 
 ## Run the model
 
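Note: the lines added to the README's example prompt document the new ">>>" protocol: each assistant segment is prefixed with ">>>" followed by its recipient, where "all" addresses the user and a function name routes JSON arguments to that function. Rendered through the updated chat template, a hypothetical assistant turn answering the Istanbul question could look like the following (the function name and arguments are illustrative, not taken from this commit):

```
>>>all
Let me look up the current weather for you.
>>>get_current_weather
{"location": "Istanbul"}<|eot_id|>
```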
modeling_functionary.py CHANGED
@@ -66,22 +66,23 @@ class FunctionaryForCausalLM(LlamaForCausalLM):
         )
 
         input_ids = kwargs.pop("input_ids")
-        function_call_token = "
+        function_call_token = ">>>"
 
         correct_results = []
         for input_id, result in zip(input_ids, results):
             final_output_json = {"role": "assistant", "content": None, "tool_calls": None}
             tool_calls = []
             raw_output_str = tokenizer.decode(result[len(input_id):].cpu())
-            has_text = False if raw_output_str.startswith(function_call_token) else True
             chunks = raw_output_str.split(function_call_token)
             for i, chunk in enumerate(chunks):
                 if len(chunk) == 0:
                     continue
 
                 chunk = chunk.replace(tokenizer.pad_token, "")
+                has_text = True if chunk.startswith("all") else False
                 if i == 0 and has_text is not False:
                     final_output_json["content"] = chunk.strip()[:-len("<|eot_id|>")] if chunk.endswith("<|eot_id|>") else chunk
+                    final_output_json["content"] = final_output_json["content"][len("all\n"):]
                 else:
                     tool_calls.append(
                         {
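This parsing change pairs with the chat-template change below: because the generation prompt now ends with ">>>", the decoded completion begins directly with a recipient name, so has_text is now decided per chunk by checking for the "all" recipient rather than by looking for a leading function-call token. A minimal standalone sketch of the resulting logic follows; the helper name, the pad-token default, and the tool-call id scheme are our assumptions, and the tool-call construction past tool_calls.append({ is not visible in this diff.

```python
import uuid

def parse_raw_output(raw_output_str: str, pad_token: str = "<|end_of_text|>") -> dict:
    """Rebuild an assistant message from a decoded completion.

    Sketch of the logic in modeling_functionary.py above. The completion is
    assumed to start right after the ">>>" emitted by the generation prompt.
    """
    function_call_token = ">>>"
    message = {"role": "assistant", "content": None, "tool_calls": None}
    tool_calls = []
    for i, chunk in enumerate(raw_output_str.split(function_call_token)):
        if len(chunk) == 0:
            continue
        chunk = chunk.replace(pad_token, "")
        if chunk.endswith("<|eot_id|>"):
            chunk = chunk[: -len("<|eot_id|>")]
        if i == 0 and chunk.startswith("all"):
            # ">>>all" tags plain text addressed to the user.
            message["content"] = chunk[len("all\n"):]
        else:
            # Any other recipient is a function name; the remainder of the
            # chunk is its JSON arguments (kept as a string, OpenAI-style).
            name, _, arguments = chunk.partition("\n")
            tool_calls.append({
                "id": f"call_{uuid.uuid4().hex[:8]}",  # assumed id scheme
                "type": "function",
                "function": {"name": name.strip(), "arguments": arguments.strip()},
            })
    if tool_calls:
        message["tool_calls"] = tool_calls
    return message
```

For example, parse_raw_output('all\nIt is sunny in Istanbul.<|eot_id|>') returns a content-only message, while parse_raw_output('get_current_weather\n{"location": "Istanbul"}<|eot_id|>') returns a single tool call and no content.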
tokenizer_config.json CHANGED
@@ -2050,7 +2050,7 @@
     }
   },
   "bos_token": "<|begin_of_text|>",
-  "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' or message['role'] == 'system' %}\n{{ '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n' + message['content'] + '<|eot_id|>' }}{% elif message['role'] == 'tool' %}\n{{ '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n' + message['content'] + '<|eot_id|>' }}{% else %}\n{{ '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'}}{% if message['content'] is not none %}\n{{ '>>>all\n' + message['content'] }}{% endif %}\n{% if 'tool_calls' in message and message['tool_calls'] is not none %}\n{% for tool_call in message['tool_calls'] %}\n{{ '>>>' + tool_call['function']['name'] + '\n' + tool_call['function']['arguments'] }}{% endfor %}\n{% endif %}\n{{ '<|eot_id|>' }}{% endif %}\n{% endfor %}\n{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% endif %}",
+  "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' or message['role'] == 'system' %}\n{{ '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n' + message['content'] + '<|eot_id|>' }}{% elif message['role'] == 'tool' %}\n{{ '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n' + message['content'] + '<|eot_id|>' }}{% else %}\n{{ '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'}}{% if message['content'] is not none %}\n{{ '>>>all\n' + message['content'] }}{% endif %}\n{% if 'tool_calls' in message and message['tool_calls'] is not none %}\n{% for tool_call in message['tool_calls'] %}\n{{ '>>>' + tool_call['function']['name'] + '\n' + tool_call['function']['arguments'] }}{% endfor %}\n{% endif %}\n{{ '<|eot_id|>' }}{% endif %}\n{% endfor %}\n{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n>>>' }}{% endif %}",
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|eot_id|>",
   "legacy": true,
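The only change here is the trailing ">>>" appended to the generation prompt, so a model prompted with add_generation_prompt=True starts its turn immediately after the recipient marker. A quick way to inspect the effect (the repository id is an assumption; any checkpoint shipping this tokenizer_config.json renders the same):

```python
from transformers import AutoTokenizer

# Repo id assumed for illustration.
tokenizer = AutoTokenizer.from_pretrained("meetkai/functionary-small-v3.2")

messages = [{"role": "user", "content": "What is the weather for Istanbul?"}]
prompt = tokenizer.apply_chat_template(
    messages, tokenize=False, add_generation_prompt=True
)

# The rendered string now ends with the recipient cue:
#   <|start_header_id|>assistant<|end_header_id|>
#
#   >>>
print(prompt)
```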