Image Generation¶
Introduction¶
The Images API provides three methods for interacting with images:
- Creating images from scratch based on a text prompt (DALL·E 3 and DALL·E 2)
- Creating edited versions of images by having the model replace some areas of a pre-existing image, based on a new text prompt (DALL·E 2 only)
- Creating variations of an existing image (DALL·E 2 only)
Error Handling¶
API requests can potentially return errors due to invalid inputs, rate limits, or other issues. These errors can be handled with a try...except statement, and the error details can be found in e.error:
Generations¶
The image generations endpoint allows you to create an original image given a text prompt. When using DALL·E 3, images can have a size of 1024x1024, 1024x1792 or 1792x1024 pixels.
By default, images are generated at standard quality, but when using DALL·E 3 you can set quality="hd" for enhanced detail. Square, standard-quality images are the fastest to generate.
You can request 1 image at a time with DALL·E 3 (request more by making parallel requests) or up to 10 images at a time using DALL·E 2 with the n parameter.
Each image can be returned as either a URL or Base64 data, using the response_format parameter. URLs will expire after an hour.
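Since DALL·E 3 only accepts one image per request, a common way to get several images is to issue requests in parallel. Here is a minimal sketch using a thread pool; the generate_in_parallel helper and the generate_one callable are illustrative names, where generate_one would typically wrap a client.images.generate(..., n=1) call and return the resulting URL:

```python
from concurrent.futures import ThreadPoolExecutor

def generate_in_parallel(generate_one, prompts, max_workers=4):
    """Run one image-generation call per prompt concurrently.

    generate_one: a callable taking a prompt string and returning a result,
    e.g. a wrapper around client.images.generate with n=1.
    """
    with ThreadPoolExecutor(max_workers=max_workers) as pool:
        # pool.map preserves the order of the input prompts
        return list(pool.map(generate_one, prompts))
```

Because each request is independent, this sketch simply fans them out and collects the results in prompt order; add your own retry or rate-limit handling as needed.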
Prompting¶
With the release of DALL·E 3, the model now takes the prompt provided and automatically rewrites it, both for safety reasons and to add more detail (more detailed prompts generally result in higher-quality images).
While it is not currently possible to disable this feature, you can use prompting to get outputs closer to your requested image by adding the following to your prompt: I NEED to test how the tool works with extremely simple prompts. DO NOT add any detail, just use it AS-IS:.
The updated prompt is visible in the revised_prompt field of the data response object.
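For example, after a generation call you can read the rewritten prompt straight off the response. A small helper sketch (the response argument is whatever client.images.generate returns; the get_revised_prompt name is illustrative):

```python
def get_revised_prompt(response):
    # The API may rewrite your prompt; the rewritten version is returned
    # alongside each generated image in the revised_prompt field.
    return response.data[0].revised_prompt
```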
from openai import OpenAI
import openai

client = OpenAI()

try:
    response = client.images.generate(
        model="dall-e-3",
        prompt="a white siamese cat",
        size="1024x1024",
        quality="standard",
        n=1,
    )
    image_url = response.data[0].url
    print(f"Generated image url: {image_url}")
except openai.OpenAIError as e:
    print(e)
Generated image url: https://oaidalleapiprodscus.blob.core.windows.net/private/org-WQiPiqMq85IHphFJqtWq0Q4B/user-B9QNgF1Sobj6vm4KI3lFQigJ/img-IZqUZuVQDvda5d69f8O2x5nf.png?st=2024-02-09T07%3A25%3A37Z&se=2024-02-09T09%3A25%3A37Z&sp=r&sv=2021-08-06&sr=b&rscd=inline&rsct=image/png&skoid=6aaadede-4fb3-4698-a8f6-684d7786b067&sktid=a48cca56-e6da-484e-a814-9c849652bcb3&skt=2024-02-09T05%3A02%3A09Z&ske=2024-02-10T05%3A02%3A09Z&sks=b&skv=2021-08-06&sig=m/GVoZU7mT2QBJe3gOvUFDYpSJVBr0DC8i150nPDDEE%3D
from IPython.display import Image
# Display the image
Image(url=image_url)
# Create an image and get the binary data to save
response = client.images.generate(
    model="dall-e-3",
    prompt="a sunlit indoor lounge area with a pool",
    size="1024x1024",
    quality="standard",
    n=1,
    response_format="b64_json"
)
# Save the returned image data as a png file
import base64

image_data_base64 = response.data[0].b64_json
image_data = base64.b64decode(image_data_base64)

generated_image_path = 'output/generated_image.png'
with open(generated_image_path, 'wb') as file:
    file.write(image_data)
# Display the base image
print(f"****** GENERATED IMAGE: {generated_image_path} ******")
Image(filename=generated_image_path)
****** GENERATED IMAGE: output/generated_image.png ******
Edits (DALL·E 2 only)¶
Also known as "inpainting", the image edits endpoint allows you to edit or extend an image by uploading an image and a mask indicating which areas should be replaced. The transparent areas of the mask indicate where the image should be edited, and the prompt should describe the full new image, not just the erased area.
# NOTE: Here I duplicated the image file as 'output/mask_image.png' and manually masked the area as transparent.
base_image_path = 'data/base_image.png'
# Display the base image
print(f"****** BASE IMAGE: {base_image_path} ******")
Image(filename=base_image_path)
****** BASE IMAGE: data/base_image.png ******
mask_image_path = 'data/mask_image.png'
# Display the mask image
print(f"****** MASK IMAGE: {mask_image_path} ******")
Image(filename=mask_image_path)
****** MASK IMAGE: data/mask_image.png ******
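If you'd rather not mask the image by hand in an image editor, you can also produce the mask programmatically. Here is a sketch using PIL that copies the base image and makes a rectangular region fully transparent; the make_rect_mask helper and the box coordinates are illustrative, so adjust them to the area you want the model to replace:

```python
from PIL import Image as PilImage

def make_rect_mask(base_path, mask_path, box):
    """Create an edit mask by making the (left, top, right, bottom) box
    transparent in a copy of the base image."""
    img = PilImage.open(base_path).convert("RGBA")
    # Paste a fully transparent patch over the box; the API edits
    # wherever the mask is transparent.
    patch = PilImage.new("RGBA", (box[2] - box[0], box[3] - box[1]), (0, 0, 0, 0))
    img.paste(patch, (box[0], box[1]))
    img.save(mask_path)
```

The mask must have the same dimensions as the base image, which is why this sketch starts from a copy of the base rather than a blank canvas.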
edit_response = client.images.edit(
    model="dall-e-2",
    image=open(base_image_path, "rb"),
    mask=open(mask_image_path, "rb"),
    prompt="A sunlit indoor lounge area with a pool containing a flamingo",
    n=1,
    size="1024x1024",
    response_format="b64_json"
)
# Save the returned image data as a png file
# (response_format was "b64_json", so read b64_json rather than url)
import base64

image_data_base64 = edit_response.data[0].b64_json
image_data = base64.b64decode(image_data_base64)

edited_image_path = 'output/edited_image.png'
with open(edited_image_path, 'wb') as file:
    file.write(image_data)
# Display the edited image
print(f"****** EDITED IMAGE: {edited_image_path} ******")
Image(filename=edited_image_path)
****** EDITED IMAGE: output/edited_image.png ******
Variations (DALL·E 2 only)¶
The image variations endpoint allows you to generate a variation of a given image. You can define how many variations you want generated using the n parameter.
variation_response = client.images.create_variation(
    image=open(base_image_path, "rb"),
    n=1,
    size="1024x1024",
    response_format="b64_json"
)
# Decode the returned base64 image data
import base64

image_data_base64 = variation_response.data[0].b64_json
image_data = base64.b64decode(image_data_base64)

# Display the first image
print("****** FIRST VARIATION ******")
Image(data=image_data)
****** FIRST VARIATION ******
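When you request more than one variation (n greater than 1), each item in response.data carries its own image. Here is a sketch that decodes and saves every returned image; the save_all_images name, output directory, and filename pattern are illustrative:

```python
import base64
import os

def save_all_images(response, out_dir="output"):
    """Decode each base64 image in the response and write it to disk."""
    os.makedirs(out_dir, exist_ok=True)
    paths = []
    for i, item in enumerate(response.data):
        image_bytes = base64.b64decode(item.b64_json)
        path = os.path.join(out_dir, f"variation_{i}.png")
        with open(path, "wb") as f:
            f.write(image_bytes)
        paths.append(path)
    return paths
```

The same loop works for any endpoint that returns base64 data, since generations, edits, and variations all share the response shape.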
Operating on Image Data¶
It may be useful to perform operations on images before passing them to the API. Here's an example that uses PIL to resize an image:
from io import BytesIO
from PIL import Image as PilImage
from openai import OpenAI
from IPython.display import Image
client = OpenAI()
# Read the image file from disk and resize it
image = PilImage.open(base_image_path)
image = image.resize((256, 256))
# Convert the image to a BytesIO object
byte_stream = BytesIO()
image.save(byte_stream, format='PNG')
byte_array = byte_stream.getvalue()
variation_response2 = client.images.create_variation(
    image=byte_array,
    n=1,
    model="dall-e-2",
    size="1024x1024"
)
# Display the variation image
print("****** VARIATION ******")
Image(url=variation_response2.data[0].url)
****** VARIATION ******