mirror of https://github.com/skygpu/skynet.git
add txt2txt utils and cli, start on dgpu
parent 22e40b766f
commit 4404c82b9a
@@ -97,6 +97,45 @@ def inpaint(model, prompt, input, mask, output, strength, guidance, steps, seed)
         seed=seed
     )
 
+
+@click.command()
+@click.option('--model', '-m', default='microsoft/DialoGPT-small')
+@click.option(
+    '--prompt', '-p', default='a red old tractor in a sunny wheat field')
+@click.option('--output', '-o', default='output.txt')
+@click.option('--temperature', '-t', default=1.0)
+@click.option('--max-length', '-ml', default=256)
+@click.option('--num-return-sequences', '-rs', default=1)
+@click.option('--no-repeat-ngram', '-nr', default=2)
+@click.option('--top-p', '-tp', default=0.95)
+def txt2txt(
+    model,
+    prompt,
+    output,
+    temperature,
+    max_length,
+    num_return_sequences,
+    no_repeat_ngram,
+    top_p
+):
+    from . import utils
+    config = load_skynet_toml()
+    hf_token = load_key(config, 'skynet.dgpu.hf_token')
+    hf_home = load_key(config, 'skynet.dgpu.hf_home')
+    set_hf_vars(hf_token, hf_home)
+    utils.txt2txt(
+        hf_token=hf_token,
+        model=model,
+        prompt=prompt,
+        output=output,
+        temperature=temperature,
+        max_length=max_length,
+        num_return_sequences=num_return_sequences,
+        no_repeat_ngram_size=no_repeat_ngram,
+        top_p=top_p
+    )
+
+
 @click.command()
 @click.option('--input', '-i', default='input.png')
 @click.option('--output', '-o', default='output.png')
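As a quick sanity check, the new command can be driven with click's built-in test runner. A minimal sketch, assuming the command is importable as skynet.cli.txt2txt (the module path is an assumption, not confirmed by this diff):

    # Hypothetical smoke test for the new txt2txt command;
    # `skynet.cli` is an assumed import path.
    from click.testing import CliRunner
    from skynet.cli import txt2txt

    runner = CliRunner()
    result = runner.invoke(txt2txt, [
        '--model', 'microsoft/DialoGPT-small',
        '--prompt', 'hello there',
        '--output', 'reply.txt',
        '--max-length', '128',
    ])
    print(result.exit_code, result.output)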
@@ -8,7 +8,8 @@ import logging
 from hashlib import sha256
 import zipfile
 from PIL import Image
-from diffusers import DiffusionPipeline
+from diffusers import DiffusionPipeline, AutoPipelineForInpainting
+from transformers import AutoModelForCausalLM, AutoTokenizer
 
 import trio
 import torch
@@ -63,6 +64,19 @@ def prepare_params_for_diffuse(
     )
 
 
+def prepare_params_for_transform(
+    params: dict,
+):
+    return (
+        params['prompt'],
+        int(params['num_return_sequences']),
+        int(params['no_repeat_ngram_size']),
+        float(params['top_p']),
+        float(params['temperature']),
+        int(params['max_length']),
+    )
+
+
 class SkynetMM:
 
     def __init__(self, config: dict):
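The helper returns a fixed-order tuple, so call sites unpack it positionally. A small illustration with a made-up request payload (string values mirror how fields would arrive over the wire; the payload itself is hypothetical):

    # Illustration only: unpacking the fixed-order tuple returned by
    # prepare_params_for_transform for a made-up payload.
    params = {
        'prompt': 'hello there',
        'num_return_sequences': '1',
        'no_repeat_ngram_size': '2',
        'top_p': '0.95',
        'temperature': '1.0',
        'max_length': '256',
    }
    (prompt, num_return_sequences, no_repeat_ngram_size,
     top_p, temperature, max_length) = prepare_params_for_transform(params)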
@@ -100,7 +114,9 @@ class SkynetMM:
             self._model = pipeline_for(
                 name, mode, cache_dir=self.cache_dir)
 
-    def get_model(self, name: str, mode: str) -> DiffusionPipeline:
+    def get_model(
+        self, name: str, mode: str
+    ) -> DiffusionPipeline | AutoPipelineForInpainting | AutoModelForCausalLM:
         if name not in MODELS:
             raise DGPUComputeError(f'Unknown model {name}')
 
@@ -167,6 +183,26 @@ class SkynetMM:
 
                     output_hash = sha256(output_binary).hexdigest()
 
+                case 'txt2txt':
+                    arguments = prepare_params_for_transform(params)
+                    prompt, num_return_sequences, no_repeat_ngram_size, top_p, temperature, max_length = arguments
+                    tokenizer = AutoTokenizer.from_pretrained(params['model'])
+
+                    self.get_model(params['model'], method)
+                    tokenized_input = tokenizer.encode(prompt, return_tensors='pt')
+                    tokenized_output = self._model.generate(
+                        tokenized_input,
+                        max_length=max_length,
+                        num_return_sequences=num_return_sequences,
+                        no_repeat_ngram_size=no_repeat_ngram_size,
+                        top_p=top_p,
+                        temperature=temperature,
+                    )
+
+                    output = tokenizer.decode(tokenized_output[0], skip_special_tokens=True)
+
+                    output_hash = sha256(output.encode('utf-8')).hexdigest()
+
                 case _:
                     raise DGPUComputeError('Unsupported compute method')
 
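Note that generate returns a batch of token rows, which is why only row 0 is decoded above; if num_return_sequences is ever raised past 1, each row needs its own decode. A sketch of that variant, reusing the names from the hunk:

    # Sketch: decoding every returned sequence instead of just row 0.
    # (transformers also expects sampling or beam search when asking
    # for more than one sequence.)
    outputs = [
        tokenizer.decode(row, skip_special_tokens=True)
        for row in tokenized_output
    ]
    output = '\n'.join(outputs)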
@@ -22,6 +22,7 @@ from diffusers import (
     EulerAncestralDiscreteScheduler
 )
 from realesrgan import RealESRGANer
+from transformers import AutoTokenizer, AutoModelForCausalLM
 from huggingface_hub import login
 import trio
 
@@ -68,7 +69,7 @@ def pipeline_for(
     mode: str,
     mem_fraction: float = 1.0,
     cache_dir: str | None = None
-) -> DiffusionPipeline:
+) -> DiffusionPipeline | AutoPipelineForInpainting | AutoModelForCausalLM:
 
     assert torch.cuda.is_available()
     torch.cuda.empty_cache()
@@ -109,6 +110,10 @@ def pipeline_for(
     if 'inpaint' in mode:
         pipe_class = AutoPipelineForInpainting
 
+    elif 'txt2txt' in mode:
+        # TODO: unsure about pipe
+        pipe_class = AutoModelForCausalLM
+
     else:
         pipe_class = DiffusionPipeline
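The TODO above is fair: AutoModelForCausalLM is a transformers model class, not a diffusers pipeline, so the shared from_pretrained call will load it, but pipeline-only steps (scheduler swaps and the like) have to be skipped for this mode. A minimal sketch of the loading path on its own, assuming fp16 on CUDA the way the image pipelines are set up (both are assumptions here):

    # Sketch, not the repo's code: loading a causal LM where a
    # diffusers pipeline would otherwise be built. fp16 + CUDA are
    # assumptions carried over from the image-model setup.
    import torch
    from transformers import AutoModelForCausalLM

    model = AutoModelForCausalLM.from_pretrained(
        'microsoft/DialoGPT-small',
        torch_dtype=torch.float16,
    ).to('cuda')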
@@ -233,6 +238,36 @@ def inpaint(
     image.save(output)
 
 
+def txt2txt(
+    hf_token: str,
+    model: str = 'tiiuae/falcon-40b-instruct',
+    prompt: str = 'who is ur faja?',
+    output: str = 'output.txt',
+    num_return_sequences: int = 1,
+    no_repeat_ngram_size: int = 2,
+    top_p: float = 0.95,
+    temperature: float = 1.0,
+    max_length: int = 256,
+):
+    login(token=hf_token)
+    tokenizer = AutoTokenizer.from_pretrained(model)
+    pipe = pipeline_for(model, 'txt2txt')
+
+    tokenized_input = tokenizer.encode(prompt, return_tensors='pt')
+    tokenized_output = pipe.generate(
+        tokenized_input,
+        max_length=max_length,
+        num_return_sequences=num_return_sequences,
+        no_repeat_ngram_size=no_repeat_ngram_size,
+        top_p=top_p,
+        temperature=temperature
+    )
+    response = tokenizer.decode(
+        tokenized_output[0], skip_special_tokens=True)
+    with open(output, 'w', encoding='utf-8') as f:
+        f.write(response)
+
+
 def init_upscaler(model_path: str = 'weights/RealESRGAN_x4plus.pth'):
     return RealESRGANer(
         scale=4,
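For completeness, a sketch of calling the new helper directly; the skynet.utils import path and the token value are placeholders, not confirmed by this diff:

    # Hypothetical direct call to the new helper; the token and
    # import path are placeholders.
    from skynet import utils

    utils.txt2txt(
        hf_token='hf_...',  # placeholder
        model='microsoft/DialoGPT-small',
        prompt='hello there',
        output='reply.txt',
        max_length=128,
    )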