2022-07-05 00:02:33 +00:00
|
|
|
from min_dalle import MinDalle
|
2022-06-29 19:53:25 +00:00
|
|
|
import tempfile
|
2022-07-05 00:02:33 +00:00
|
|
|
from typing import Iterator
|
2022-07-05 00:36:23 +00:00
|
|
|
from math import log2
|
2022-06-29 19:53:25 +00:00
|
|
|
from cog import BasePredictor, Path, Input
|
|
|
|
|
|
|
|
|
|
|
|
class Predictor(BasePredictor):
|
|
|
|
def setup(self):
|
2022-07-01 23:44:24 +00:00
|
|
|
self.model = MinDalle(is_mega=True)
|
2022-06-29 19:53:25 +00:00
|
|
|
|
|
|
|
def predict(
|
|
|
|
self,
|
|
|
|
text: str = Input(
|
2022-07-02 14:46:56 +00:00
|
|
|
description='Text',
|
2022-07-04 11:28:44 +00:00
|
|
|
default='Dali painting of WALL·E'
|
2022-06-29 19:53:25 +00:00
|
|
|
),
|
2022-07-02 14:05:16 +00:00
|
|
|
grid_size: int = Input(
|
2022-07-04 11:28:44 +00:00
|
|
|
description='Size of the image grid',
|
2022-07-02 14:32:17 +00:00
|
|
|
ge=1,
|
2022-07-05 00:38:35 +00:00
|
|
|
le=4,
|
2022-07-04 11:28:44 +00:00
|
|
|
default=4
|
2022-07-04 12:05:55 +00:00
|
|
|
),
|
|
|
|
seed: int = Input(
|
|
|
|
description='Set the seed to a positive number for reproducible results',
|
|
|
|
default=-1
|
|
|
|
),
|
2022-07-05 00:36:23 +00:00
|
|
|
intermediate_image_count: int = Input(
|
|
|
|
description='Set the number of intermediate images to show',
|
|
|
|
choices=[1, 2, 4, 8, 16],
|
|
|
|
default=8
|
2022-07-04 22:37:07 +00:00
|
|
|
),
|
2022-07-05 00:02:33 +00:00
|
|
|
) -> Iterator[Path]:
|
|
|
|
image_stream = self.model.generate_image_stream(
|
2022-07-05 00:10:37 +00:00
|
|
|
text,
|
|
|
|
seed,
|
2022-07-04 22:37:07 +00:00
|
|
|
grid_size=grid_size,
|
2022-07-05 00:36:23 +00:00
|
|
|
log2_mid_count=log2(intermediate_image_count),
|
2022-07-05 00:02:33 +00:00
|
|
|
is_verbose=True
|
2022-07-04 22:37:07 +00:00
|
|
|
)
|
|
|
|
|
2022-07-05 00:02:33 +00:00
|
|
|
for image in image_stream:
|
2022-07-05 00:36:23 +00:00
|
|
|
path = Path(tempfile.mkdtemp()) / 'output.jpg'
|
|
|
|
image.save(str(path))
|
|
|
|
yield path
|