dottxt-ai
diff --git a/‎its-a-smol-world/README.md‎
Lines changed: 48 additions & 0 deletions b/‎its-a-smol-world/README.md‎
Lines changed: 48 additions & 0 deletions
diff --git a/‎its-a-smol-world/demo.gif‎
5.7 MB b/‎its-a-smol-world/demo.gif‎
5.7 MB
diff --git a/‎its-a-smol-world/requirements.txt‎
Lines changed: 4 additions & 0 deletions b/‎its-a-smol-world/requirements.txt‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎its-a-smol-world/src/__init__.py‎ b/‎its-a-smol-world/src/__init__.py‎
diff --git a/‎its-a-smol-world/src/app.py‎
Lines changed: 56 additions & 0 deletions b/‎its-a-smol-world/src/app.py‎
Lines changed: 56 additions & 0 deletions
diff --git a/‎its-a-smol-world/src/functions.json‎
Lines changed: 72 additions & 0 deletions b/‎its-a-smol-world/src/functions.json‎
Lines changed: 72 additions & 0 deletions
diff --git a/‎its-a-smol-world/src/smol_mind.py‎
Lines changed: 178 additions & 0 deletions b/‎its-a-smol-world/src/smol_mind.py‎
Lines changed: 178 additions & 0 deletions
@@ -0,0 +1,48 @@
+# The Bunny B1: Powered by SmolLM2
+
+This is a demo to celebrate the release of [the `SmolLM2-1.7B` model](https://huggingface.co/collections/HuggingFaceTB/smollm2-6723884218bcda64b34d7db9) from Hugging Face 🤗!
+
+Ever wanted a natural language interface to your local apps? The Bunny B1 demonstrates how to combine the power of SmolLM2 with structured generation using [Outlines](https://github.com/dottxt-ai/outlines) to map natural language requests to application calls, even on smaller devices.
+
+Here's a look at the demo in action:
+
+![Bunny B1](./demo.gif)
+
+## Setting up the environment
+
+```bash
+python3 -m venv .venv
+source .venv/bin/activate
+pip install -r requirements.txt
+```
+
+## Running the demo
+
+To start the demo, run the following command:
+
+```bash
+python3 ./src/app.py
+```
+
+The demo provides an interface for natural language interaction with a mobile device. You can provide natural language commands and the model will choose one of the following actions:
+
+- Send a text message
+- Order a food delivery
+- Order a ride
+- Get the weather
+
+To add a new function, edit `src/functions.json` and follow the pattern used by the existing entries.
+
+## Good Test Examples:
+
+"I'd like to order two coffees from starbucks"
+
+"I need a ride to SEATAC terminal A"
+
+"What's the weather in san francisco today?"
+
+"Text Remi and tell him the project is looking good"
+
+## Customizing
+
+The `src/constants.py` file lets you customize the model, the device, and the torch dtype. This demo was created on a Mac, so the default device is `mps`. You can swap this out for `cuda` if you'd like.
@@ -0,0 +1,4 @@
+outlines==0.1.0
+transformers
+torch
+accelerate>=0.26.0
@@ -0,0 +1,56 @@
+import time
+import itertools
+import threading
+import sys
+import argparse
+from smol_mind import SmolMind, load_functions
+from constants import MODEL_NAME
+
def spinner(stop_event):
    """Animate a one-character console spinner until ``stop_event`` is set.

    Each frame is written to ``sys.stdout`` and flushed, followed by a
    backspace so the next frame overwrites it in place.

    Args:
        stop_event: A ``threading.Event``-like object; the animation ends
            once ``stop_event.is_set()`` returns true.
    """
    # Named ``frames`` so the local does not shadow this function's own name.
    frames = itertools.cycle(['-', '/', '|', '\\'])
    while not stop_event.is_set():
        sys.stdout.write(next(frames))
        sys.stdout.flush()
        sys.stdout.write('\b')
        # Wait on the event rather than sleeping: the pause still lasts at
        # most 0.1s per frame, but ends immediately when the caller sets the
        # event, so joining this thread is not delayed by a full frame.
        stop_event.wait(0.1)
+
def main():
    """Run the interactive Bunny B1 command-line loop.

    Parses the ``--debug`` / ``--instruct`` flags, loads the function
    specifications and the model, then repeatedly reads a request from
    stdin and prints the function call produced by ``SmolMind``. The loop
    ends on ``exit`` / ``quit``, end-of-input, or Ctrl-C at the prompt.
    """
    from pathlib import Path

    # Add command-line argument parsing
    parser = argparse.ArgumentParser(description="SmolMind CLI")
    parser.add_argument('-d', '--debug', action='store_true', help='Enable debug mode')
    parser.add_argument('-i', '--instruct', action='store_true', help='Enable instruct mode (disables continue mode)')
    args = parser.parse_args()

    print("loading SmolMind...")
    # functions.json lives next to this script; resolving it from __file__
    # makes the CLI work regardless of the current working directory.
    functions = load_functions(Path(__file__).resolve().parent / "functions.json")
    sm = SmolMind(functions, model_name=MODEL_NAME, debug=args.debug, instruct=args.instruct)
    if args.debug:
        print("Using model:", sm.model_name)
        print("Debug mode:", "Enabled" if args.debug else "Disabled")
        print("Instruct mode:", "Enabled" if args.instruct else "Disabled")
    print("Welcome to the Bunny B1! What do you need?")
    while True:
        try:
            user_input = input("> ")
        except (EOFError, KeyboardInterrupt):
            # Closed stdin or Ctrl-C at the prompt: leave quietly instead of
            # dumping a traceback.
            print("\nGoodbye!")
            break

        command = user_input.strip()
        if command.lower() in ("exit", "quit"):
            print("Goodbye!")
            break
        if not command:
            # Nothing to ask the model; prompt again.
            continue

        # Shared event used to tell the spinner thread to stop.
        stop_event = threading.Event()
        spinner_thread = threading.Thread(target=spinner, args=(stop_event,), daemon=True)
        spinner_thread.start()

        try:
            response = sm.get_function_call(user_input)
        finally:
            # Always stop the spinner, even when generation raises, so it
            # does not keep drawing over the traceback.
            stop_event.set()
            spinner_thread.join()
            sys.stdout.write(' \b')  # Erase the spinner
            sys.stdout.flush()

        print(response)


if __name__ == "__main__":
    main()
@@ -0,0 +1,72 @@
+{
+ "functions": [
+ {
+ "name": "send_text",
+ "description": "Send a text message to a contact",
+ "parameters": {
+ "type": "dict",
+ "properties": {
+ "to": {
+ "type": "string",
+ "description": "The name of the contact to send the text to."
+ },
+ "message": {
+ "type": "string",
+ "description": "The message to send to the contact."
+ }
+ },
+ "required": ["to", "message"]
+ }
+ },
+ { 
+ "name": "order_food",
+ "description": "Order food from a restaurant",
+ "parameters": {
+ "type": "dict",
+ "properties": {
+ "restaurant": {
+ "type": "string",
+ "description": "The name of the restaurant to order from."
+ },
+ "item": {
+ "type": "string",
+ "description": "The name of the item to order."
+ },
+ "quantity": {
+ "type": "integer",
+ "description": "The quantity of the item to order."
+ }
+ },
+ "required": ["restaurant", "item", "quantity"]
+ }
+ },
+ {
+ "name": "order_ride",
+ "description": "Order a ride from a ride sharing service",
+ "parameters": {
+ "type": "dict",
+ "properties": {
+ "dest": {
+ "type": "string",
+ "description": "The destination of the ride."
+ }
+ },
+ "required": ["dest"]
+ }
+ },
+ {
+ "name": "get_weather",
+ "description": "Get the weather for a city",
+ "parameters": {
+ "type": "dict",
+ "properties": {
+ "city": {
+ "type": "string",
+ "description": "The city to get the weather for."
+ }
+ },
+ "required": ["city"]
+ }
+ }
+ ]
+}
@@ -0,0 +1,178 @@
+import json
+from textwrap import dedent
+import outlines
+from outlines.samplers import greedy
+from transformers import AutoTokenizer, logging
+import warnings
+from constants import MODEL_NAME, DEVICE, T_TYPE
+
+
+logging.set_verbosity_error()
+
def format_functions(functions):
    """Render function specifications as the plain-text list used in prompts.

    Each function becomes a ``name: description`` line followed by one
    ``- arg: description`` line per entry in ``parameters.properties``.
    Function entries are separated by a blank line.

    Args:
        functions: Iterable of function-spec dicts. ``name`` is required;
            ``description``, ``parameters`` and per-argument
            ``description`` are optional.

    Returns:
        The formatted text, or an empty string for an empty iterable.

    Raises:
        KeyError: If a function spec has no ``name``.
    """
    missing = 'No description provided'
    formatted_functions = []
    for func in functions:
        # Use the same fallback for a missing function description as for a
        # missing argument description instead of raising KeyError.
        lines = [f"{func['name']}: {func.get('description', missing)}\n"]
        properties = (func.get('parameters') or {}).get('properties') or {}
        for arg, details in properties.items():
            lines.append(f"- {arg}: {details.get('description', missing)}\n")
        formatted_functions.append("".join(lines))
    return "\n".join(formatted_functions)
+
# System prompt shared by the "continue" and "instruct" prompt builders.
# ``{functions}`` is filled in with the output of ``format_functions``.
# The few-shot examples must use the same argument names as the function
# specs (e.g. ``dest`` for ``order_ride``), because generation is constrained
# by a regex built from those specs.
SYSTEM_PROMPT_FOR_CHAT_MODEL = dedent("""
    You are an expert designed to call the correct function to solve a problem based on the user's request.
    The functions available (with required parameters) to you are:
    {functions}

    You will be given a user prompt and you need to decide which function to call.
    You will then need to format the function call correctly and return it in the correct format.
    The format for the function call is:
    [func1(params_name=params_value)]
    NO other text MUST be included.

    For example:
    Request: I want to order a cheese pizza from Pizza Hut.
    Response: [order_food(restaurant="Pizza Hut", item="cheese pizza", quantity=1)]

    Request: Is it raining in NY.
    Response: [get_weather(city="New York")]

    Request: I need a ride to SFO.
    Response: [order_ride(dest="SFO")]

    Request: I want to send a text to John saying Hello.
    Response: [send_text(to="John", message="Hello!")]
""")


# Canned assistant acknowledgement placed between the system text and the
# user's request when building a chat-style prompt.
ASSISTANT_PROMPT_FOR_CHAT_MODEL = dedent("""
    I understand and will only return the function call in the correct format.
    """
)
# Wrapper for the user's request; ``{user_prompt}`` is the raw input text.
USER_PROMPT_FOR_CHAT_MODEL = dedent("""
    Request: {user_prompt}. 
""")
+
def continue_prompt(question, functions, tokenizer):
    """Build the plain-text (completion-style) prompt for a request.

    The system text, with the formatted function list substituted in, is
    followed by a blank line and the wrapped user request.

    Args:
        question: The user's natural-language request.
        functions: Function-spec dicts passed to ``format_functions``.
        tokenizer: Unused here; accepted so the signature matches
            ``instruct_prompt``.

    Returns:
        The assembled prompt string.
    """
    system_text = SYSTEM_PROMPT_FOR_CHAT_MODEL.format(
        functions=format_functions(functions)
    )
    request_text = USER_PROMPT_FOR_CHAT_MODEL.format(user_prompt=question)
    return f"{system_text}\n\n{request_text}"
+
def instruct_prompt(question, functions, tokenizer):
    """Build the chat-template prompt for an instruction-tuned model.

    The conversation has three turns: the system text (sent with the
    ``user`` role), a canned assistant acknowledgement, and the user's
    request.

    Args:
        question: The user's natural-language request.
        functions: Function-spec dicts passed to ``format_functions``.
        tokenizer: A tokenizer exposing ``apply_chat_template``.

    Returns:
        The rendered prompt string (not tokenized).
    """
    messages = [
        {"role": "user", "content": SYSTEM_PROMPT_FOR_CHAT_MODEL.format(functions=format_functions(functions))},
        {"role": "assistant", "content": ASSISTANT_PROMPT_FOR_CHAT_MODEL},
        {"role": "user", "content": USER_PROMPT_FOR_CHAT_MODEL.format(user_prompt=question)},
    ]
    # add_generation_prompt=True appends the template's assistant-turn header
    # so the model generates a reply rather than continuing from the end of
    # the user's turn.
    fc_prompt = tokenizer.apply_chat_template(
        messages,
        tokenize=False,
        add_generation_prompt=True,
    )
    return fc_prompt
+
# Regex fragments for the literal values allowed as function arguments.
INTEGER = r"(-)?(0|[1-9][0-9]*)"
STRING_INNER = r'([^"\\\x00-\x1F\x7F-\x9F]|\\["\\])'
# Strings are limited to between 1 and 42 characters (or escape pairs).
STRING = f'"{STRING_INNER}{{1,42}}"'
# A float needs a fractional part, i.e. 1 is not a float but 1.0 is.
# The exponent sign is optional, so both 1.0e5 and 1.0e+5 are accepted.
FLOAT = rf"({INTEGER})(\.[0-9]+)([eE][+-]?[0-9]+)?"
BOOLEAN = r"(true|false)"
NULL = r"null"

# Maps the scalar type names used in function specs to their regex.
simple_type_map = {
    "string": STRING,
    "any": STRING,
    "integer": INTEGER,
    "number": FLOAT,
    "float": FLOAT,
    "boolean": BOOLEAN,
    "null": NULL,
}


def build_dict_regex(props):
    """Return a regex matching a ``{"key": value, ...}`` literal.

    Args:
        props: Mapping of property name to its type description (as
            accepted by ``type_to_regex``). Every property is required and
            must appear in the mapping's iteration order.

    Returns:
        The regex source string.
    """
    entries = [f'"{prop}": ' + type_to_regex(meta) for prop, meta in props.items()]
    return r"\{" + ", ".join(entries) + r"\}"


def type_to_regex(arg_meta):
    """Return the regex source matching a value of the described type.

    Args:
        arg_meta: Type description dict with a ``type`` key. ``object`` /
            ``dict`` types additionally need ``properties``; ``array`` /
            ``tuple`` types need ``items``.

    Returns:
        The regex source string. Arrays match between 1 and 9 items
        separated by ``", "``.

    Raises:
        ValueError: If an ``object``/``dict`` description has no
            ``properties``.
        KeyError: If ``type`` (or ``items`` for arrays) is missing, or the
            type name is not in ``simple_type_map``.
    """
    arg_type = arg_meta["type"]
    if arg_type in ("object", "dict"):
        # Raise instead of returning the message: a returned string would be
        # used as if it were a regex by the callers that concatenate it.
        if "properties" not in arg_meta:
            raise ValueError("Definition does not contain 'properties' value.")
        return build_dict_regex(arg_meta["properties"])
    if arg_type in ("array", "tuple"):
        pattern = type_to_regex(arg_meta["items"])
        return r"\[(" + pattern + ", ){0,8}" + pattern + r"\]"
    return simple_type_map[arg_type]
+
def _optional_args_regex(arg_patterns, has_required):
    """Return the regex for optional ``name=value`` arguments, in order."""
    if has_required:
        # Something always precedes each optional argument, so each one
        # simply carries its own leading separator.
        return "".join(f"(, {pattern})?" for pattern in arg_patterns)
    # With no required arguments, the first optional argument that appears
    # must not be preceded by ", ": enumerate which argument comes first.
    alternatives = [
        first + "".join(f"(, {later})?" for later in arg_patterns[index + 1:])
        for index, first in enumerate(arg_patterns)
    ]
    return "(" + "|".join(alternatives) + ")?" if alternatives else ""


def build_standard_fc_regex(function_data):
    """Return a regex matching ``[name(arg=value, ...)]`` for one function.

    Required arguments appear first, in the order they are listed in
    ``parameters.properties``, followed by the optional ones in the same
    relative order.

    Args:
        function_data: Function-spec dict with ``name`` and, optionally,
            ``parameters`` holding ``properties`` and ``required``. A
            missing ``required`` list means no argument is required.

    Returns:
        The regex source string.

    Raises:
        KeyError: If ``name`` is missing.
    """
    parameters = function_data.get("parameters") or {}
    properties = parameters.get("properties") or {}
    required = parameters.get("required") or []

    required_parts = []
    optional_parts = []
    for arg, meta in properties.items():
        part = f"{arg}=" + type_to_regex(meta)
        if arg in required:
            required_parts.append(part)
        else:
            optional_parts.append(part)

    return (
        r"\[" + function_data["name"] + r"\("
        + ", ".join(required_parts)
        + _optional_args_regex(optional_parts, bool(required_parts))
        + r"\)]"
    )
+
def multi_function_fc_regex(fs):
    """Return a regex matching a call to any one of the given functions.

    Args:
        fs: Iterable of function-spec dicts, each accepted by
            ``build_standard_fc_regex``.

    Returns:
        The per-function regexes, each wrapped in a group and joined with
        ``|``. An empty iterable yields an empty string.
    """
    alternatives = []
    for spec in fs:
        alternatives.append("(" + build_standard_fc_regex(spec) + ")")
    return "|".join(alternatives)
+
def load_functions(path):
    """Load the list of function specifications from a JSON file.

    Args:
        path: Path to a JSON document whose top-level object has a
            ``functions`` key.

    Returns:
        The value stored under ``functions``.

    Raises:
        OSError: If the file cannot be opened.
        json.JSONDecodeError: If the file is not valid JSON.
        KeyError: If the document has no ``functions`` key.
    """
    # JSON is UTF-8; do not depend on the platform's default encoding.
    with open(path, "r", encoding="utf-8") as f:
        return json.load(f)['functions']
+
class SmolMind:
    """Maps natural-language requests to function calls with a local model.

    Generation is constrained by a regex built from the supplied function
    specifications and uses greedy sampling.
    """

    def __init__(self, functions, model_name=MODEL_NAME,instruct=True,debug=False):
        """Load the model and tokenizer and prepare the regex generator.

        Args:
            functions: Function-spec dicts describing the callable functions.
            model_name: Model identifier passed to Outlines and to the
                tokenizer loader.
            instruct: When true, prompts are built with the tokenizer's chat
                template; otherwise a plain-text prompt is used.
            debug: When true, ``get_function_call`` prints the function specs
                and the prompt.
        """
        self.model_name = model_name
        self.instruct = instruct
        self.debug = debug
        self.functions = functions
        self.fc_regex = multi_function_fc_regex(functions)

        model_kwargs = {
            "trust_remote_code": True,
            "torch_dtype": T_TYPE,
        }
        self.model = outlines.models.transformers(
            model_name,
            device=DEVICE,
            model_kwargs=model_kwargs,
        )
        self.tokenizer = AutoTokenizer.from_pretrained(model_name)
        self.generator = outlines.generate.regex(
            self.model, self.fc_regex, sampler=greedy()
        )

    def get_function_call(self, user_prompt):
        """Return the function call generated for ``user_prompt``.

        Args:
            user_prompt: The user's natural-language request.

        Returns:
            The generator's output for the constructed prompt.
        """
        # Pick the prompt builder that matches the configured mode.
        build_prompt = instruct_prompt if self.instruct else continue_prompt
        # Warnings raised while building the prompt and generating are
        # suppressed.
        with warnings.catch_warnings():
            warnings.simplefilter("ignore")
            prompt = build_prompt(user_prompt, self.functions, self.tokenizer)
            response = self.generator(prompt)
        if self.debug:
            print(f"functions: {self.functions}")
            print(f"prompt: {prompt}")
        return response