Spaces:
Runtime error
Runtime error
| import html | |
| import os | |
| import time | |
| import torch | |
| import transformers | |
| import gradio as gr | |
class FormComponent:
    """Mixin whose ``get_expected_parent`` names ``gr.components.Form``."""

    def get_expected_parent(self):
        """Return ``gr.components.Form`` as the expected parent class."""
        expected_parent = gr.components.Form
        return expected_parent
class FormRow(FormComponent, gr.Row):
    """A ``gr.Row`` variant intended to fit inside gradio forms."""

    def get_block_name(self):
        """Report ``"row"`` as this block's name."""
        block_name = "row"
        return block_name
def wrap_gradio_gpu_call(func, extra_outputs=None):
    """Wrap *func* with ``wrap_gradio_call``, requesting stats.

    NOTE(review): ``wrap_gradio_call`` is neither defined nor imported in the
    visible source, so calling this function would raise ``NameError`` unless
    the name is provided elsewhere -- confirm before using it.

    Args:
        func: Callable to wrap; it is invoked with whatever positional and
            keyword arguments the wrapper receives.
        extra_outputs: Forwarded unchanged to ``wrap_gradio_call``.

    Returns:
        Whatever ``wrap_gradio_call`` returns for the pass-through wrapper.
    """
    def passthrough(*args, **kwargs):
        # Plain delegation: the result of func is returned untouched.
        return func(*args, **kwargs)

    return wrap_gradio_call(passthrough, extra_outputs=extra_outputs, add_stats=True)
class Model:
    """Holder for the currently loaded model, its tokenizer and its name.

    All three attributes default to ``None`` at class level and are assigned
    on an instance once a model has been loaded.
    """

    # Name the loaded model was requested under; None when nothing is loaded.
    name = None
    # Loaded causal language model object; None when nothing is loaded.
    model = None
    # Tokenizer matching ``model``; None when nothing is loaded.
    tokenizer = None
# Model identifiers offered in the "Model" dropdown; the selected one is passed
# to ``from_pretrained`` when generating.
available_models = [
    "0Tick/e621TagAutocomplete",
    "0Tick/danbooruTagAutocomplete",
]

# Single shared holder for whichever model/tokenizer is currently loaded.
current = Model()

# NOTE(review): not read anywhere in the visible source.
job_count = 1
def device():
    """Return the torch device used for the model and its inputs (always CPU)."""
    cpu_device = torch.device("cpu")
    return cpu_device
def generate_batch(input_ids, min_length, max_length, num_beams, temperature, repetition_penalty, length_penalty, sampling_mode, top_k, top_p):
    """Sample one batch of continuations from the currently loaded model.

    Reads the model and tokenizer from the module-level ``current`` holder.

    Args:
        input_ids: Token id tensor passed to ``model.generate`` as the prompt.
        min_length: Minimum length forwarded to ``generate`` (coerced to int).
        max_length: Maximum length forwarded to ``generate`` (coerced to int).
        num_beams: Number of beams (coerced to int).
        temperature: Sampling temperature; clamped to at least ``1e-6``.
        repetition_penalty: Forwarded to ``generate`` (coerced to float).
        length_penalty: Forwarded to ``generate`` (coerced to float).
        sampling_mode: ``'Top K'`` or ``'Top P'``; selects which of
            ``top_k`` / ``top_p`` is forwarded, the other is sent as ``None``.
        top_k: Top-k value, used only when ``sampling_mode == 'Top K'``.
        top_p: Top-p value, used only when ``sampling_mode == 'Top P'``.

    Returns:
        The decoded texts produced by ``tokenizer.batch_decode`` with special
        tokens skipped.
    """
    tokenizer = current.tokenizer

    # Only the parameter matching the chosen sampling mode is forwarded.
    top_p = float(top_p) if sampling_mode == 'Top P' else None
    top_k = int(top_k) if sampling_mode == 'Top K' else None

    # Token id 0 is a legitimate pad id, so fall back to EOS only when the
    # tokenizer has no pad token at all (``or`` would also discard id 0).
    pad_token_id = tokenizer.pad_token_id
    if pad_token_id is None:
        pad_token_id = tokenizer.eos_token_id

    outputs = current.model.generate(
        input_ids,
        do_sample=True,
        # Guard against a temperature of exactly 0.
        temperature=max(float(temperature), 1e-6),
        repetition_penalty=float(repetition_penalty),
        length_penalty=float(length_penalty),
        top_p=top_p,
        top_k=top_k,
        # UI values may arrive as floats; the count/length arguments are
        # coerced to int the same way num_beams already was.
        num_beams=int(num_beams),
        min_length=int(min_length),
        max_length=int(max_length),
        pad_token_id=pad_token_id,
    )

    return tokenizer.batch_decode(outputs, skip_special_tokens=True)
def model_selection_changed(model_name):
    """Unload the current model when the selection is switched to "None".

    Any other selection is a no-op here; loading happens in ``generate``.

    Args:
        model_name: Value of the model dropdown.
    """
    if model_name != "None":
        return

    # Drop every reference held by the shared holder so the objects can be freed.
    current.tokenizer = None
    current.model = None
    current.name = None

    # The original called ``devices.torch_gc()``, but no ``devices`` name is
    # imported in the visible source, so that line raised NameError. Reclaim
    # memory with the standard library and torch directly instead.
    import gc

    gc.collect()
    if torch.cuda.is_available():
        torch.cuda.empty_cache()
def generate(id_task, model_name, batch_count, batch_size, text, *args):
    """Generate prompt continuations and render them as an HTML table.

    Loads the requested model into the module-level ``current`` holder if it
    is not the one already loaded, tokenizes ``text``, runs ``batch_count``
    batches of ``batch_size`` samples through ``generate_batch`` and renders
    every generated text (HTML-escaped) as one table row.

    Args:
        id_task: Unused; kept so the positional interface stays unchanged.
        model_name: Model identifier to load, or ``'None'`` for no model.
        batch_count: Number of batches to run (coerced to int).
        batch_size: Number of samples per batch (coerced to int).
        text: Starting text of the prompt.
        *args: Remaining generation settings, forwarded unchanged to
            ``generate_batch`` after ``input_ids``.

    Returns:
        A ``(markup, '')`` tuple: the HTML table and an empty info string.

    Raises:
        AssertionError: If no model or tokenizer is available after the
            loading step (for example when ``model_name`` is ``'None'``).
    """
    # UI values may arrive as floats; range() and Tensor.repeat() need ints.
    batch_count = int(batch_count)
    batch_size = int(batch_size)

    print(f"Model:{model_name},Count:{batch_count*batch_size},StartingText:{text}")

    if current.name != model_name:
        # Release the previous model before (possibly) loading the new one.
        current.tokenizer = None
        current.model = None
        current.name = None

        if model_name != 'None':
            current.tokenizer = transformers.AutoTokenizer.from_pretrained(model_name)
            current.model = transformers.AutoModelForCausalLM.from_pretrained(model_name)
            current.name = model_name

    # Raised explicitly (same type and message as the former ``assert``) so
    # the checks are not stripped when Python runs with -O.
    if current.model is None:
        raise AssertionError('No model available')
    if current.tokenizer is None:
        raise AssertionError('No tokenizer available')

    current.model.to(device())

    input_ids = current.tokenizer(text, return_tensors="pt").input_ids
    if input_ids.shape[1] == 0:
        # Empty prompt: start generation from the BOS token instead.
        input_ids = torch.asarray([[current.tokenizer.bos_token_id]], dtype=torch.long)
    input_ids = input_ids.to(device())
    # One copy of the prompt per sample in the batch.
    input_ids = input_ids.repeat((batch_size, 1))

    # Collect rows in a list and join once instead of repeated string +=.
    rows = []
    for _ in range(batch_count):
        for generated_text in generate_batch(input_ids, *args):
            index = len(rows) + 1  # 1-based running index across all batches
            rows.append(
                "\n<tr>\n<td>\n"
                '<div class="prompt gr-box gr-text-input">\n'
                f"<p id='promptgen_res_{index}'>{html.escape(generated_text)}</p>\n"
                "</div>\n</td>\n</tr>\n"
            )

    markup = '<table><tbody>' + ''.join(rows) + '</tbody></table>'
    return markup, ''
# Build the gradio UI: a prompt row, then a row holding a settings column and
# a results column, followed by the event wiring.
# NOTE(review): the nesting below is reconstructed from a source whose
# indentation was lost; in particular, whether the num_beams/temperature/
# repetition_penalty Row sits inside the preceding FormRow should be confirmed.
with gr.Blocks(analytics_enabled=False) as space:
    with gr.Row():
        with gr.Column(scale=80):
            # A trailing ``.style(container=False)`` call was commented out
            # in the original and stays disabled here.
            prompt = gr.Textbox(
                label="Prompt",
                elem_id="promptgen_prompt",
                show_label=False,
                lines=2,
                placeholder="Beginning of the prompt",
            )
        with gr.Column(scale=10):
            submit = gr.Button(
                'Generate',
                elem_id="promptgen_generate",
                variant='primary',
            )

    with gr.Row(elem_id="promptgen_main"):
        # Settings column.
        with gr.Column(variant="compact"):
            selected_text = gr.TextArea(
                elem_id='promptgen_selected_text',
                visible=False,
            )

            with FormRow():
                model_selection = gr.Dropdown(
                    label="Model",
                    elem_id="promptgen_model",
                    value=available_models[0],
                    choices=["None"] + available_models,
                )

            with FormRow():
                sampling_mode = gr.Radio(
                    label="Sampling mode",
                    elem_id="promptgen_sampling_mode",
                    value="Top K",
                    choices=["Top K", "Top P"],
                )
                top_k = gr.Slider(
                    label="Top K",
                    elem_id="promptgen_top_k",
                    value=12,
                    minimum=1,
                    maximum=50,
                    step=1,
                )
                top_p = gr.Slider(
                    label="Top P",
                    elem_id="promptgen_top_p",
                    value=0.15,
                    minimum=0,
                    maximum=1,
                    step=0.001,
                )

                with gr.Row():
                    num_beams = gr.Slider(
                        label="Number of beams",
                        elem_id="promptgen_num_beams",
                        value=1,
                        minimum=1,
                        maximum=8,
                        step=1,
                    )
                    temperature = gr.Slider(
                        label="Temperature",
                        elem_id="promptgen_temperature",
                        value=1,
                        minimum=0,
                        maximum=4,
                        step=0.01,
                    )
                    repetition_penalty = gr.Slider(
                        label="Repetition penalty",
                        elem_id="promptgen_repetition_penalty",
                        value=1,
                        minimum=1,
                        maximum=4,
                        step=0.01,
                    )

            with FormRow():
                length_penalty = gr.Slider(
                    label="Length preference",
                    elem_id="promptgen_length_preference",
                    value=1,
                    minimum=-10,
                    maximum=10,
                    step=0.1,
                )
                min_length = gr.Slider(
                    label="Min length",
                    elem_id="promptgen_min_length",
                    value=20,
                    minimum=1,
                    maximum=400,
                    step=1,
                )
                max_length = gr.Slider(
                    label="Max length",
                    elem_id="promptgen_max_length",
                    value=150,
                    minimum=1,
                    maximum=400,
                    step=1,
                )

            with FormRow():
                batch_count = gr.Slider(
                    label="Batch count",
                    elem_id="promptgen_batch_count",
                    value=1,
                    minimum=1,
                    maximum=100,
                    step=1,
                )
                batch_size = gr.Slider(
                    label="Batch size",
                    elem_id="promptgen_batch_size",
                    value=10,
                    minimum=1,
                    maximum=100,
                    step=1,
                )

        # Results column.
        with gr.Column():
            with gr.Group(elem_id="promptgen_results_column"):
                res = gr.HTML()
                res_info = gr.HTML()

    # ``generate`` takes (id_task, model_name, ...); the dropdown is listed
    # twice so its value fills both of those leading parameters.
    submit.click(
        fn=generate,
        inputs=[
            model_selection,
            model_selection,
            batch_count,
            batch_size,
            prompt,
            min_length,
            max_length,
            num_beams,
            temperature,
            repetition_penalty,
            length_penalty,
            sampling_mode,
            top_k,
            top_p,
        ],
        outputs=[res, res_info],
    )

    model_selection.change(
        fn=model_selection_changed,
        inputs=[model_selection],
        outputs=[],
    )

space.launch()