Back to Unilm

import packages

textdiffuser/data/visualize_charseg.ipynb

latest · 757 B
Original Source
python
# import packages
import os 
from PIL import Image, ImageEnhance
import cv2
import numpy as np
python
# Open the example image from the sample directory and render it inline.
# `display` is not imported in this file; it is expected to be provided by
# the notebook (IPython) environment.
root = 'laion-ocr-example/06269/062690093'  # sample directory, reused by the visualization cell
image_path = os.path.join(root, 'image.jpg')
img = Image.open(image_path)  # kept as `img`: the visualization cell resizes it
display(img)
python
# Show the source image and its character segmentation map side by side.
# Relies on `root` and `img` set by the image-display cell, and on the
# notebook-provided `display`.
mask_path = os.path.join(root, 'charseg.npy')
mask = np.load(mask_path)
print(mask.shape)

# Cast the array to 8-bit so PIL can wrap it, then scale brightness by 5.
# NOTE(review): presumably the raw values are small class ids that would
# otherwise render almost black -- confirm against the dataset docs.
mask_image = Image.fromarray(mask.astype(np.uint8))
brightened_mask = ImageEnhance.Brightness(mask_image).enhance(5)

# 512x256 canvas: left half is the image resized to 256x256, right half is
# the brightened mask pasted at its native size.
# NOTE(review): the mask is not resized, so this layout assumes it is
# already 256x256 -- check the shape printed above.
canvas = Image.new('RGB', (512, 256))
canvas.paste(img.resize((256, 256)), (0, 0))
canvas.paste(brightened_mask, (256, 0))
display(canvas)