You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

61 lines
2.1 KiB

from min_dalle import MinDalle
import tempfile
import torch, torch.backends.cudnn
from typing import Iterator
from cog import BasePredictor, Path, Input
torch.backends.cudnn.deterministic = False
class ReplicatePredictor(BasePredictor):
def setup(self):
self.model = MinDalle(
is_mega=True,
is_reusable=True,
dtype=torch.float32
)
def predict(
self,
text: str = Input(default='Dali painting of WALL·E'),
save_as_png: bool = Input(default=False),
progressive_outputs: bool = Input(default=True),
grid_size: int = Input(ge=1, le=9, default=5),
temperature: str = Input(
choices=(
['1/{}'.format(2 ** i) for i in range(4, 0, -1)] +
[str(2 ** i) for i in range(5)]
),
default='4',
description='Advanced Setting, see Readme below if interested.'
),
top_k: int = Input(
choices=[2 ** i for i in range(15)],
default=64,
description='Advanced Setting, see Readme below if interested.'
),
supercondition_factor: int = Input(
choices=[2 ** i for i in range(2, 7)],
default=16,
description='Advanced Setting, see Readme below if interested.'
)
) -> Iterator[Path]:
log2_mid_count = 3 if progressive_outputs else 0
image_stream = self.model.generate_image_stream(
text = text,
seed = -1,
grid_size = grid_size,
log2_mid_count = log2_mid_count,
temperature = eval(temperature),
supercondition_factor = float(supercondition_factor),
top_k = top_k,
is_verbose = True
)
i = 0
path = Path(tempfile.mkdtemp())
for image in image_stream:
i += 1
ext = 'png' if i == 2 ** log2_mid_count and save_as_png else 'jpg'
image_path = path / 'min-dalle-iter-{}.{}'.format(i, ext)
image.save(str(image_path))
yield image_path