Update README.md
README.md
CHANGED
@@ -192,8 +192,73 @@ def parse_response(text: str) -> str | dict[str, any]:
     if matches:
         return json.loads(matches[0])
     return text
+
+
+model_name_smollm = "HuggingFaceTB/SmolLM2-1.7B-Instruct"
+model = AutoModelForCausalLM.from_pretrained(model_name_smollm, device_map="auto", torch_dtype="auto", trust_remote_code=True)
+tokenizer = AutoTokenizer.from_pretrained(model_name_smollm)
+
+from datetime import datetime
+import random
+
+def get_current_time() -> str:
+    """Returns the current time in 24-hour format.
+
+    Returns:
+        str: Current time in HH:MM:SS format.
+    """
+    return datetime.now().strftime("%H:%M:%S")
+
+
+def get_random_number_between(min: int, max: int) -> int:
+    """
+    Gets a random number between min and max.
+
+    Args:
+        min: The minimum number.
+        max: The maximum number.
+
+    Returns:
+        A random number between min and max.
+    """
+    return random.randint(min, max)
+
+
+tools = [get_json_schema(get_random_number_between), get_json_schema(get_current_time)]
+
+toolbox = {"get_random_number_between": get_random_number_between, "get_current_time": get_current_time}
+
+query = "Give me a number between 1 and 300"
+
+messages = prepare_messages(query, tools=tools)
+
+inputs = tokenizer.apply_chat_template(messages, add_generation_prompt=True, return_tensors="pt").to(model.device)
+outputs = model.generate(inputs, max_new_tokens=512, do_sample=False, num_return_sequences=1, eos_token_id=tokenizer.eos_token_id)
+result = tokenizer.decode(outputs[0][len(inputs[0]):], skip_special_tokens=True)
+
+tool_calls = parse_response(result)
+# [{'name': 'get_random_number_between', 'arguments': {'min': 1, 'max': 300}}]
+
+# Get tool responses
+tool_responses = [toolbox.get(tc["name"])(*tc["arguments"].values()) for tc in tool_calls]
+# [63]
+
+# For the second turn, rebuild the history of messages:
+history = messages.copy()
+# Add the "parsed response"
+history.append({"role": "assistant", "content": result})
+query = "Can you give me the hour?"
+history.append({"role": "user", "content": query})
+
+inputs = tokenizer.apply_chat_template(history, add_generation_prompt=True, return_tensors="pt").to(model.device)
+outputs = model.generate(inputs, max_new_tokens=512, do_sample=False, num_return_sequences=1, eos_token_id=tokenizer.eos_token_id)
+result = tokenizer.decode(outputs[0][len(inputs[0]):], skip_special_tokens=True)
+
+tool_calls = parse_response(result)
+tool_responses = [toolbox.get(tc["name"])(*tc["arguments"].values()) for tc in tool_calls]
+# ['07:57:25']
 ```
-More details can be found [here](https://huggingface.co/HuggingFaceTB/SmolLM2-1.7B-Instruct/blob/main/instructions_function_calling.md)
+More details, such as parallel function calls and handling tools that are not available, can be found [here](https://huggingface.co/HuggingFaceTB/SmolLM2-1.7B-Instruct/blob/main/instructions_function_calling.md)
 
 ## Limitations
 
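The added snippet relies on three helpers that are defined earlier in the README and not repeated in this hunk: `prepare_messages`, `parse_response` (whose signature and tail appear as context above), and `get_json_schema` from `transformers.utils`. As a rough sketch of those missing pieces — the system-prompt wording and the `<tool_call>` tag format are assumptions here, not the README's exact definitions:

```python
# Sketch only: prepare_messages and the <tool_call> tag format are assumptions;
# the authoritative definitions live earlier in the README.
import json
import re

from transformers import AutoModelForCausalLM, AutoTokenizer
from transformers.utils import get_json_schema  # builds a tool schema from a Google-style docstring


def prepare_messages(query: str, tools: list[dict] | None = None) -> list[dict]:
    """Build a chat history that advertises the available tools in the system prompt."""
    system_prompt = (
        "You are a helpful assistant with access to the following tools:\n"
        + json.dumps(tools or [])
    )
    return [
        {"role": "system", "content": system_prompt},
        {"role": "user", "content": query},
    ]


def parse_response(text: str) -> str | dict[str, any]:
    """Return the parsed tool call(s) if the output contains any, else the raw text."""
    matches = re.findall(r"<tool_call>(.*?)</tool_call>", text, re.DOTALL)  # assumed tag format
    if matches:
        return json.loads(matches[0])
    return text
```

Note that `get_json_schema` derives each tool's schema from the function's signature and Google-style docstring, which is why both tools in the diff document their arguments and return values.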