min-dalle-test/replicate_predictor.py

51 lines
1.7 KiB
Python
Raw Normal View History

2022-07-05 00:02:33 +00:00
from min_dalle import MinDalle
2022-06-29 19:53:25 +00:00
import tempfile
2022-07-05 00:02:33 +00:00
from typing import Iterator
2022-06-29 19:53:25 +00:00
from cog import BasePredictor, Path, Input
2022-07-05 09:47:35 +00:00
class ReplicatePredictor(BasePredictor):
2022-06-29 19:53:25 +00:00
def setup(self):
2022-07-05 11:07:29 +00:00
self.model = MinDalle(is_mega=True, is_reusable=True)
2022-06-29 19:53:25 +00:00
def predict(
self,
text: str = Input(
2022-07-06 02:14:19 +00:00
description='For long prompts, only the first 64 tokens will be used to generate the image.',
default='Dali painting of WALL·E'
2022-06-29 19:53:25 +00:00
),
2022-07-05 13:43:41 +00:00
intermediate_outputs: bool = Input(
description='Whether to show intermediate outputs while running. This adds less than a second to the run time.',
default=True
),
2022-07-02 14:05:16 +00:00
grid_size: int = Input(
2022-07-07 12:21:20 +00:00
description='Size of the image grid. 4x4 takes about 15 seconds, 8x8 takes about 45 seconds',
2022-07-02 14:32:17 +00:00
ge=1,
2022-07-07 12:21:20 +00:00
le=8,
default=4
2022-07-04 12:05:55 +00:00
),
2022-07-05 09:55:10 +00:00
log2_supercondition_factor: int = Input(
description='Higher values result in better agreement with the text but a narrower variety of generated images',
2022-07-05 09:55:10 +00:00
ge=1,
le=6,
default=4
2022-07-05 01:30:27 +00:00
),
2022-07-05 00:02:33 +00:00
) -> Iterator[Path]:
2022-07-05 13:06:27 +00:00
seed = -1
2022-07-05 13:43:41 +00:00
log2_mid_count = 3 if intermediate_outputs else 0
2022-07-05 00:02:33 +00:00
image_stream = self.model.generate_image_stream(
2022-07-05 00:10:37 +00:00
text,
seed,
2022-07-04 22:37:07 +00:00
grid_size=grid_size,
2022-07-05 13:43:41 +00:00
log2_mid_count=log2_mid_count,
2022-07-05 09:55:10 +00:00
log2_supercondition_factor=log2_supercondition_factor,
2022-07-05 00:02:33 +00:00
is_verbose=True
2022-07-04 22:37:07 +00:00
)
2022-07-05 02:05:32 +00:00
iter = 0
path = Path(tempfile.mkdtemp())
2022-07-05 00:02:33 +00:00
for image in image_stream:
2022-07-05 02:05:32 +00:00
iter += 1
image_path = path / 'min-dalle-iter-{}.jpg'.format(iter)
image.save(str(image_path))
yield image_path