min-dalle-test/replicate_predictor.py

from min_dalle import MinDalle
import tempfile
import torch, torch.backends.cudnn
from typing import Iterator
from cog import BasePredictor, Path, Input

# Do not force cuDNN into deterministic mode.  The commit that introduced this
# flag describes it as "faster inference with cuda/cudnn backends flags".
torch.backends.cudnn.deterministic = False


class ReplicatePredictor(BasePredictor):
    """Cog predictor that streams images produced by a ``MinDalle`` model."""

    def setup(self):
        """Create the ``MinDalle`` model and keep it on the instance.

        Also called from the error path of :meth:`predict` to rebuild the
        model after a failed run.
        """
        self.model = MinDalle(is_mega=True, is_reusable=True)

    def predict(
        self,
        text: str = Input(
            description='For long prompts, only the first 64 tokens will be used to generate the image.',
            default='Dali painting of WALL·E'
        ),
        intermediate_outputs: bool = Input(
            description='Whether to show intermediate outputs while running.  This adds less than a second to the run time.',
            default=True
        ),
        grid_size: int = Input(
            description='Size of the image grid.  5x5 takes around 16 seconds, 8x8 takes around 36 seconds',
            ge=1,
            le=8,
            default=4
        ),
        log2_supercondition_factor: int = Input(
            description='Higher values result in better agreement with the text but a narrower variety of generated images',
            ge=1,
            le=6,
            default=4
        ),
    ) -> Iterator[Path]:
        """Yield the path of every image emitted by the model's image stream.

        Each image from ``generate_image_stream`` is saved as
        ``min-dalle-iter-<n>.jpg`` (``n`` starting at 1) inside a fresh
        temporary directory, and the saved path is yielded.

        Args:
            text: Prompt forwarded to the model.
            intermediate_outputs: When true, ``log2_mid_count=3`` is passed to
                the model; otherwise ``0``.
            grid_size: Forwarded to the model unchanged.
            log2_supercondition_factor: Forwarded to the model unchanged.

        Yields:
            Path of each saved JPEG, in the order the stream produced them.

        Raises:
            Exception: If generation or saving fails.  The model is rebuilt
                first, and the original error is attached as ``__cause__``.
        """
        try:
            # NOTE(review): presumably -1 asks the model to pick its own
            # seed -- confirm against MinDalle.generate_image_stream.
            seed = -1
            log2_mid_count = 3 if intermediate_outputs else 0
            image_stream = self.model.generate_image_stream(
                text,
                seed,
                grid_size=grid_size,
                log2_mid_count=log2_mid_count,
                log2_supercondition_factor=log2_supercondition_factor,
                is_verbose=True
            )

            output_dir = Path(tempfile.mkdtemp())
            # enumerate replaces the hand-maintained counter that used to
            # shadow the builtin ``iter``.
            for index, image in enumerate(image_stream, start=1):
                image_path = output_dir / 'min-dalle-iter-{}.jpg'.format(index)
                image.save(str(image_path))
                yield image_path
        except Exception as err:
            # Deliberately ``Exception`` rather than a bare ``except``: this is
            # a generator, so closing it early raises GeneratorExit at the
            # ``yield``.  A bare except would treat that (and
            # KeyboardInterrupt / SystemExit) as a failure, reload the model
            # and raise out of ``close()``.
            print("An error occured, deleting model")
            del self.model
            torch.cuda.empty_cache()
            self.setup()
            # Chain the cause so the real failure stays visible in tracebacks.
            raise Exception("There was an error, please try again") from err
generate_image_stream 2022-07-05 00:02:33 +00:00			`from min_dalle import MinDalle`
updated replicate predict.py file 2022-06-29 19:53:25 +00:00			`import tempfile`
faster inference with cuda/cudnn backends flags 2022-07-09 10:48:51 +00:00			`import torch, torch.backends.cudnn`
generate_image_stream 2022-07-05 00:02:33 +00:00			`from typing import Iterator`
updated replicate predict.py file 2022-06-29 19:53:25 +00:00			`from cog import BasePredictor, Path, Input`

faster inference with cuda/cudnn backends flags 2022-07-09 10:48:51 +00:00			`torch.backends.cudnn.deterministic = False`

updated replicate predict.py file 2022-06-29 19:53:25 +00:00
update replicate files 2022-07-05 09:47:35 +00:00			`class ReplicatePredictor(BasePredictor):`
updated replicate predict.py file 2022-06-29 19:53:25 +00:00			`def setup(self):`
update replicate_predictor.py 2022-07-05 11:07:29 +00:00			`self.model = MinDalle(is_mega=True, is_reusable=True)`
updated replicate predict.py file 2022-06-29 19:53:25 +00:00
			`def predict(`
			`self,`
			`text: str = Input(`
properly limit input to 64 tokens 2022-07-06 02:14:19 +00:00			`description='For long prompts, only the first 64 tokens will be used to generate the image.',`
update replicate, clear cuda cache if cuda available 2022-07-04 11:28:44 +00:00			`default='Dali painting of WALL·E'`
updated replicate predict.py file 2022-06-29 19:53:25 +00:00			`),`
boolean intermediate_outputs 2022-07-05 13:43:41 +00:00			`intermediate_outputs: bool = Input(`
			`description='Whether to show intermediate outputs while running. This adds less than a second to the run time.',`
			`default=True`
			`),`
update replicate files 2022-07-02 14:05:16 +00:00			`grid_size: int = Input(`
clamp in place 2022-07-10 12:07:54 +00:00			`description='Size of the image grid. 5x5 takes around 16 seconds, 8x8 takes around 36 seconds',`
update replicate files 2022-07-02 14:32:17 +00:00			`ge=1,`
support bfloat16 2022-07-07 12:21:20 +00:00			`le=8,`
update replicate, clear cuda cache if cuda available 2022-07-04 11:28:44 +00:00			`default=4`
faster decoder self attention 2022-07-04 12:05:55 +00:00			`),`
update replicate files 2022-07-05 09:55:10 +00:00			`log2_supercondition_factor: int = Input(`
wording explaining super condition factor 2022-07-05 09:57:55 +00:00			`description='Higher values result in better agreement with the text but a narrower variety of generated images',`
update replicate files 2022-07-05 09:55:10 +00:00			`ge=1,`
			`le=6,`
			`default=4`
control super condition factor 2022-07-05 01:30:27 +00:00			`),`
generate_image_stream 2022-07-05 00:02:33 +00:00			`) -> Iterator[Path]:`
add try-except to replicate 2022-07-07 16:35:00 +00:00			`try:`
			`seed = -1`
			`log2_mid_count = 3 if intermediate_outputs else 0`
			`image_stream = self.model.generate_image_stream(`
			`text,`
			`seed,`
			`grid_size=grid_size,`
			`log2_mid_count=log2_mid_count,`
			`log2_supercondition_factor=log2_supercondition_factor,`
			`is_verbose=True`
			`)`
update predict.py 2022-07-04 22:37:07 +00:00
add try-except to replicate 2022-07-07 16:35:00 +00:00			`iter = 0`
			`path = Path(tempfile.mkdtemp())`
			`for image in image_stream:`
			`iter += 1`
			`image_path = path / 'min-dalle-iter-{}.jpg'.format(iter)`
			`image.save(str(image_path))`
			`yield image_path`
			`except:`
			`print("An error occured, deleting model")`
			`del self.model`
generate_images_stream and generate_images 2022-07-07 21:03:47 +00:00			`torch.cuda.empty_cache()`
add try-except to replicate 2022-07-07 16:35:00 +00:00			`self.setup()`
			`raise Exception("There was an error, please try again")`