import gradio as gr from transformers import AutoTokenizer import json tokenizer = AutoTokenizer.from_pretrained("HuggingFaceH4/zephyr-7b-beta") demo_conversation = """[ {"role": "system", "content": "You are a helpful chatbot."}, {"role": "user", "content": "Hi there!"}, {"role": "assistant", "content": "Hello, human!"}, {"role": "user", "content": "Can I ask a question?"} ]""" default_template = """{% for message in messages %} {{ "<|im_start|>" + message["role"] + "\\n" + message["content"] + "<|im_end|>\\n" }} {% endfor %} {% if add_generation_prompt %} {{ "<|im_start|>assistant\\n" }} {% endif %}""" description_text = """### This space is a helper app for writing [Chat Templates](https://huggingface.co/docs/transformers/main/en/chat_templating). ### When you're happy with the outputs from your template, you can use the code block at the end to add it to a PR!""" def apply_chat_template(template, test_conversation, add_generation_prompt, cleanup_whitespace): if cleanup_whitespace: template = "".join([line.strip() for line in template.split('\n')]) tokenizer.chat_template = template outputs = [] conversation = json.loads(test_conversation) pr_snippet = ( "CHECKPOINT = \"big-ai-company/cool-new-model\"\n" "tokenizer = AutoTokenizer.from_pretrained(CHECKPOINT)", f"tokenizer.chat_template = \"{template}\"", "tokenizer.push_to_hub(CHECKPOINT, create_pr=True)" ) pr_snippet = "\n".join(pr_snippet) formatted = tokenizer.apply_chat_template(conversation, tokenize=False, add_generation_prompt=add_generation_prompt) return formatted #, pr_snippet def open_pr(template, model_repo): tokenizer = AutoTokenizer.from_pretrained(model_repo) tokenizer.chat_template = template tokenizer.push_to_hub(model_repo, create_pr=True) with gr.Blocks() as demo: gr.Markdown(description_text) with gr.Row(): with gr.Column(): template = gr.TextArea(value=default_template, lines=10, max_lines=30, label="Chat Template") example = gr.TextArea(value=demo_conversation, lines=6, label="Conversation") generate_prompt = gr.Checkbox(value=False, label="Add generation prompt") clean_whitespace = gr.Checkbox(value=True, label="Cleanup template whitespace") btn = gr.Button("Submit") with gr.Column(): output = gr.TextArea(label="Formatted conversation") model_repo = gr.Textbox(label='Model repo to open a PR') btn_pr = gr.Button("Open a PR with template update") btn.click(fn=apply_chat_template, inputs=[template, example, generate_prompt, clean_whitespace], outputs=[output]) btn_pr.click(fn=open_pr, inputs=[template, model_repo]) demo.launch()