You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
61 lines
2.1 KiB
61 lines
2.1 KiB
from min_dalle import MinDalle |
|
import tempfile |
|
import torch, torch.backends.cudnn |
|
from typing import Iterator |
|
from cog import BasePredictor, Path, Input |
|
|
|
torch.backends.cudnn.deterministic = False |
|
|
|
class ReplicatePredictor(BasePredictor): |
|
def setup(self): |
|
self.model = MinDalle( |
|
is_mega=True, |
|
is_reusable=True, |
|
dtype=torch.float32 |
|
) |
|
|
|
def predict( |
|
self, |
|
text: str = Input(default='Dali painting of WALL·E'), |
|
save_as_png: bool = Input(default=False), |
|
progressive_outputs: bool = Input(default=True), |
|
grid_size: int = Input(ge=1, le=9, default=5), |
|
temperature: str = Input( |
|
choices=( |
|
['1/{}'.format(2 ** i) for i in range(4, 0, -1)] + |
|
[str(2 ** i) for i in range(5)] |
|
), |
|
default='4', |
|
description='Advanced Setting, see Readme below if interested.' |
|
), |
|
top_k: int = Input( |
|
choices=[2 ** i for i in range(15)], |
|
default=64, |
|
description='Advanced Setting, see Readme below if interested.' |
|
), |
|
supercondition_factor: int = Input( |
|
choices=[2 ** i for i in range(2, 7)], |
|
default=16, |
|
description='Advanced Setting, see Readme below if interested.' |
|
) |
|
) -> Iterator[Path]: |
|
log2_mid_count = 3 if progressive_outputs else 0 |
|
image_stream = self.model.generate_image_stream( |
|
text = text, |
|
seed = -1, |
|
grid_size = grid_size, |
|
log2_mid_count = log2_mid_count, |
|
temperature = eval(temperature), |
|
supercondition_factor = float(supercondition_factor), |
|
top_k = top_k, |
|
is_verbose = True |
|
) |
|
|
|
i = 0 |
|
path = Path(tempfile.mkdtemp()) |
|
for image in image_stream: |
|
i += 1 |
|
ext = 'png' if i == 2 ** log2_mid_count and save_as_png else 'jpg' |
|
image_path = path / 'min-dalle-iter-{}.{}'.format(i, ext) |
|
image.save(str(image_path)) |
|
yield image_path |