hydrus/include/HydrusImageHandling.py

661 lines
21 KiB
Python
Executable File

import ClientConstants as CC
import cStringIO
import numpy.core.multiarray # important this comes before cv!
import cv
import cv2
import HydrusConstants as HC
import HydrusExceptions
import HydrusThreading
import lz4
import numpy
import os
from PIL import _imaging
from PIL import Image as PILImage
import shutil
import struct
import threading
import time
import traceback
import wx
#LINEAR_SCALE_PALETTE = [ 0, 0, 0, 1, 1, 1, 2, 2, 2, 3, 3, 3, 4, 4, 4, 5, 5, 5, 6, 6, 6, 7, 7, 7, 8, 8, 8, 9, 9, 9, 10, 10, 10, 11, 11, 11, 12, 12, 12, 13, 13, 13, 14, 14, 14, 15, 15, 15, 16, 16, 16, 17, 17, 17, 18, 18, 18, 19, 19, 19, 20, 20, 20, 21, 21, 21, 22, 22, 22, 23, 23, 23, 24, 24, 24, 25, 25, 25, 26, 26, 26, 27, 27, 27, 28, 28, 28, 29, 29, 29, 30, 30, 30, 31, 31, 31, 32, 32, 32, 33, 33, 33, 34, 34, 34, 35, 35, 35, 36, 36, 36, 37, 37, 37, 38, 38, 38, 39, 39, 39, 40, 40, 40, 41, 41, 41, 42, 42, 42, 43, 43, 43, 44, 44, 44, 45, 45, 45, 46, 46, 46, 47, 47, 47, 48, 48, 48, 49, 49, 49, 50, 50, 50, 51, 51, 51, 52, 52, 52, 53, 53, 53, 54, 54, 54, 55, 55, 55, 56, 56, 56, 57, 57, 57, 58, 58, 58, 59, 59, 59, 60, 60, 60, 61, 61, 61, 62, 62, 62, 63, 63, 63, 64, 64, 64, 65, 65, 65, 66, 66, 66, 67, 67, 67, 68, 68, 68, 69, 69, 69, 70, 70, 70, 71, 71, 71, 72, 72, 72, 73, 73, 73, 74, 74, 74, 75, 75, 75, 76, 76, 76, 77, 77, 77, 78, 78, 78, 79, 79, 79, 80, 80, 80, 81, 81, 81, 82, 82, 82, 83, 83, 83, 84, 84, 84, 85, 85, 85, 86, 86, 86, 87, 87, 87, 88, 88, 88, 89, 89, 89, 90, 90, 90, 91, 91, 91, 92, 92, 92, 93, 93, 93, 94, 94, 94, 95, 95, 95, 96, 96, 96, 97, 97, 97, 98, 98, 98, 99, 99, 99, 100, 100, 100, 101, 101, 101, 102, 102, 102, 103, 103, 103, 104, 104, 104, 105, 105, 105, 106, 106, 106, 107, 107, 107, 108, 108, 108, 109, 109, 109, 110, 110, 110, 111, 111, 111, 112, 112, 112, 113, 113, 113, 114, 114, 114, 115, 115, 115, 116, 116, 116, 117, 117, 117, 118, 118, 118, 119, 119, 119, 120, 120, 120, 121, 121, 121, 122, 122, 122, 123, 123, 123, 124, 124, 124, 125, 125, 125, 126, 126, 126, 127, 127, 127, 128, 128, 128, 129, 129, 129, 130, 130, 130, 131, 131, 131, 132, 132, 132, 133, 133, 133, 134, 134, 134, 135, 135, 135, 136, 136, 136, 137, 137, 137, 138, 138, 138, 139, 139, 139, 140, 140, 140, 141, 141, 141, 142, 142, 142, 143, 143, 143, 144, 144, 144, 145, 145, 145, 146, 146, 146, 147, 147, 147, 148, 148, 148, 149, 149, 149, 150, 150, 150, 151, 151, 151, 152, 152, 152, 153, 153, 153, 154, 154, 154, 155, 155, 155, 156, 156, 156, 157, 157, 157, 158, 158, 158, 159, 159, 159, 160, 160, 160, 161, 161, 161, 162, 162, 162, 163, 163, 163, 164, 164, 164, 165, 165, 165, 166, 166, 166, 167, 167, 167, 168, 168, 168, 169, 169, 169, 170, 170, 170, 171, 171, 171, 172, 172, 172, 173, 173, 173, 174, 174, 174, 175, 175, 175, 176, 176, 176, 177, 177, 177, 178, 178, 178, 179, 179, 179, 180, 180, 180, 181, 181, 181, 182, 182, 182, 183, 183, 183, 184, 184, 184, 185, 185, 185, 186, 186, 186, 187, 187, 187, 188, 188, 188, 189, 189, 189, 190, 190, 190, 191, 191, 191, 192, 192, 192, 193, 193, 193, 194, 194, 194, 195, 195, 195, 196, 196, 196, 197, 197, 197, 198, 198, 198, 199, 199, 199, 200, 200, 200, 201, 201, 201, 202, 202, 202, 203, 203, 203, 204, 204, 204, 205, 205, 205, 206, 206, 206, 207, 207, 207, 208, 208, 208, 209, 209, 209, 210, 210, 210, 211, 211, 211, 212, 212, 212, 213, 213, 213, 214, 214, 214, 215, 215, 215, 216, 216, 216, 217, 217, 217, 218, 218, 218, 219, 219, 219, 220, 220, 220, 221, 221, 221, 222, 222, 222, 223, 223, 223, 224, 224, 224, 225, 225, 225, 226, 226, 226, 227, 227, 227, 228, 228, 228, 229, 229, 229, 230, 230, 230, 231, 231, 231, 232, 232, 232, 233, 233, 233, 234, 234, 234, 235, 235, 235, 236, 236, 236, 237, 237, 237, 238, 238, 238, 239, 239, 239, 240, 240, 240, 241, 241, 241, 242, 242, 242, 243, 243, 243, 244, 244, 244, 245, 245, 245, 246, 246, 246, 247, 247, 247, 248, 248, 248, 249, 249, 249, 250, 250, 250, 251, 251, 251, 252, 252, 252, 253, 253, 253, 254, 254, 254, 255, 255, 255 ]
def ConvertToPngIfBmp( path ):
with open( path, 'rb' ) as f: header = f.read( 2 )
if header == 'BM':
temp_path = HC.GetTempPath()
shutil.move( path, temp_path )
pil_image = GeneratePILImage( temp_path )
pil_image = pil_image.convert( 'P' )
pil_image.save( path, 'PNG' )
os.remove( temp_path )
def EfficientlyResizeNumpyImage( numpy_image, ( target_x, target_y ) ):
( im_y, im_x, depth ) = numpy_image.shape
if target_x >= im_x and target_y >= im_y: return numpy_image
result = numpy_image
# this seems to slow things down a lot, at least for cv!
#if im_x > 2 * target_x and im_y > 2 * target_y: result = cv2.resize( numpy_image, ( 2 * target_x, 2 * target_y ), interpolation = cv2.INTER_NEAREST )
return cv2.resize( result, ( target_x, target_y ), interpolation = cv2.INTER_LINEAR )
def EfficientlyResizePILImage( pil_image, ( target_x, target_y ) ):
( im_x, im_y ) = pil_image.size
if target_x >= im_x and target_y >= im_y: return pil_image
#if pil_image.mode == 'RGB': # low quality resize screws up alpha channel!
#
# if im_x > 2 * target_x and im_y > 2 * target_y: pil_image.thumbnail( ( 2 * target_x, 2 * target_y ), PILImage.NEAREST )
#
return pil_image.resize( ( target_x, target_y ), PILImage.ANTIALIAS )
def EfficientlyThumbnailNumpyImage( numpy_image, ( target_x, target_y ) ):
( im_y, im_x, depth ) = numpy_image.shape
if target_x >= im_x and target_y >= im_y: return numpy_image
( target_x, target_y ) = GetThumbnailResolution( ( im_x, im_y ), ( target_x, target_y ) )
return cv2.resize( numpy_image, ( target_x, target_y ), interpolation = cv2.INTER_AREA )
def EfficientlyThumbnailPILImage( pil_image, ( target_x, target_y ) ):
( im_x, im_y ) = pil_image.size
#if pil_image.mode == 'RGB': # low quality resize screws up alpha channel!
#
# if im_x > 2 * target_x or im_y > 2 * target_y: pil_image.thumbnail( ( 2 * target_x, 2 * target_y ), PILImage.NEAREST )
#
pil_image.thumbnail( ( target_x, target_y ), PILImage.ANTIALIAS )
def GenerateNumpyImage( path ):
numpy_image = cv2.imread( path, flags = -1 ) # flags = -1 loads alpha channel, if present
( y, x, depth ) = numpy_image.shape
if depth == 4: raise Exception( 'CV is bad at alpha!' )
else: numpy_image = cv2.cvtColor( numpy_image, cv2.COLOR_BGR2RGB )
return numpy_image
def GenerateHydrusBitmap( path ):
try:
numpy_image = GenerateNumpyImage( path )
return GenerateHydrusBitmapFromNumPyImage( numpy_image )
except:
pil_image = GeneratePILImage( path )
return GenerateHydrusBitmapFromPILImage( pil_image )
def GenerateHydrusBitmapFromNumPyImage( numpy_image ):
( y, x, depth ) = numpy_image.shape
if depth == 4: return HydrusBitmap( numpy_image.data, wx.BitmapBufferFormat_RGBA, ( x, y ) )
else: return HydrusBitmap( numpy_image.data, wx.BitmapBufferFormat_RGB, ( x, y ) )
def GenerateNumPyImageFromPILImage( pil_image ):
if pil_image.mode == 'RGBA' or ( pil_image.mode == 'P' and pil_image.info.has_key( 'transparency' ) ):
if pil_image.mode == 'P': pil_image = pil_image.convert( 'RGBA' )
else:
if pil_image.mode != 'RGB': pil_image = pil_image.convert( 'RGB' )
( w, h ) = pil_image.size
s = pil_image.tostring()
return numpy.fromstring( s, dtype = 'uint8' ).reshape( ( h, w, len( s ) // ( w * h ) ) )
def GenerateHydrusBitmapFromPILImage( pil_image ):
if pil_image.mode == 'RGBA' or ( pil_image.mode == 'P' and pil_image.info.has_key( 'transparency' ) ):
if pil_image.mode == 'P': pil_image = pil_image.convert( 'RGBA' )
format = wx.BitmapBufferFormat_RGBA
else:
if pil_image.mode != 'RGB': pil_image = pil_image.convert( 'RGB' )
format = wx.BitmapBufferFormat_RGB
return HydrusBitmap( pil_image.tostring(), format, pil_image.size )
def GeneratePerceptualHash( path ):
numpy_image = cv2.imread( path, cv2.CV_LOAD_IMAGE_UNCHANGED )
( y, x, depth ) = numpy_image.shape
if depth == 4:
# create a white greyscale canvas
white = numpy.ones( ( x, y ) ) * 255
# create weight and transform numpy_image to greyscale
numpy_alpha = numpy_image[ :, :, 3 ]
numpy_image_bgr = numpy_image[ :, :, :3 ]
numpy_image_gray = cv2.cvtColor( numpy_image_bgr, cv2.COLOR_BGR2GRAY )
numpy_image_result = numpy.empty( ( y, x ), numpy.float32 )
# paste greyscale onto the white
# can't think of a better way to do this!
# cv2.addWeighted only takes a scalar for weight!
for i in range( y ):
for j in range( x ):
opacity = float( numpy_alpha[ i, j ] ) / 255.0
grey_part = numpy_image_gray[ i, j ] * opacity
white_part = 255 * ( 1 - opacity )
pixel = grey_part + white_part
numpy_image_result[ i, j ] = pixel
numpy_image_gray = numpy_image_result
# use 255 for white weight, alpha for image weight
else:
numpy_image_gray = cv2.cvtColor( numpy_image, cv2.COLOR_BGR2GRAY )
numpy_image_tiny = cv2.resize( numpy_image_gray, ( 32, 32 ), interpolation = cv2.INTER_AREA )
# convert to float and calc dct
numpy_image_tiny_float = numpy.float32( numpy_image_tiny )
dct = cv2.dct( numpy_image_tiny_float )
# take top left 8x8 of dct
dct_88 = dct[:8,:8]
# get mean of dct, excluding [0,0]
mask = numpy.ones( ( 8, 8 ) )
mask[0,0] = 0
average = numpy.average( dct_88, weights = mask )
# make a monochromatic, 64-bit hash of whether the entry is above or below the mean
bytes = []
for i in range( 8 ):
byte = 0
for j in range( 8 ):
byte <<= 1 # shift byte one left
value = dct_88[i,j]
if value > average: byte |= 1
bytes.append( byte )
answer = str( bytearray( bytes ) )
# we good
return answer
def old_GeneratePerceptualHash( path ):
# I think what I should be doing here is going cv2.imread( path, flags = cv2.CV_LOAD_IMAGE_GRAYSCALE )
# then efficiently resize
thumbnail = GeneratePILImage( path )
# convert to 32 x 32 greyscale
if thumbnail.mode == 'P':
thumbnail = thumbnail.convert( 'RGBA' ) # problem with some P images converting to L without RGBA step in between
if thumbnail.mode == 'RGBA':
# this is some code i picked up somewhere
# another great example of PIL failing; it turns all alpha to pure black on a RGBA->RGB
thumbnail.load()
canvas = PILImage.new( 'RGB', thumbnail.size, ( 255, 255, 255 ) )
canvas.paste( thumbnail, mask = thumbnail.split()[3] )
thumbnail = canvas
thumbnail = thumbnail.convert( 'L' )
thumbnail = thumbnail.resize( ( 32, 32 ), PILImage.ANTIALIAS )
# convert to mat
numpy_thumbnail_8 = cv.CreateMatHeader( 32, 32, cv.CV_8UC1 )
cv.SetData( numpy_thumbnail_8, thumbnail.tostring() )
numpy_thumbnail_32 = cv.CreateMat( 32, 32, cv.CV_32FC1 )
cv.Convert( numpy_thumbnail_8, numpy_thumbnail_32 )
# compute dct
dct = cv.CreateMat( 32, 32, cv.CV_32FC1 )
cv.DCT( numpy_thumbnail_32, dct, cv.CV_DXT_FORWARD )
# take top left 8x8 of dct
dct = cv.GetSubRect( dct, ( 0, 0, 8, 8 ) )
# get mean of dct, excluding [0,0]
mask = cv.CreateMat( 8, 8, cv.CV_8U )
cv.Set( mask, 1 )
mask[0,0] = 0
channel_averages = cv.Avg( dct, mask )
average = channel_averages[0]
# make a monochromatic, 64-bit hash of whether the entry is above or below the mean
bytes = []
for i in range( 8 ):
byte = 0
for j in range( 8 ):
byte <<= 1 # shift byte one left
value = dct[i,j]
if value > average: byte |= 1
bytes.append( byte )
answer = str( bytearray( bytes ) )
# we good
return answer
def GeneratePILImage( path ): return PILImage.open( path )
def GeneratePILImageFromNumpyImage( numpy_image ):
( h, w, depth ) = numpy_image.shape
if depth == 3: format = 'RGB'
elif depth == 4: format = 'RGBA'
pil_image = PILImage.fromstring( format, ( w, h ), numpy_image.data )
return pil_image
def GetGIFFrameDurations( path ):
pil_image_for_duration = GeneratePILImage( path )
frame_durations = []
i = 0
while True:
try: pil_image_for_duration.seek( i )
except: break
if 'duration' not in pil_image_for_duration.info: duration = 40 # 25 fps default when duration is missing or too funky to extract. most stuff looks ok at this.
else:
duration = pil_image_for_duration.info[ 'duration' ]
if duration == 0: duration = 40
frame_durations.append( duration )
i += 1
return frame_durations
def GetHammingDistance( phash1, phash2 ):
distance = 0
phash1 = bytearray( phash1 )
phash2 = bytearray( phash2 )
for i in range( len( phash1 ) ):
xor = phash1[i] ^ phash2[i]
while xor > 0:
distance += 1
xor &= xor - 1
return distance
def GetImageProperties( path ):
( ( width, height ), num_frames ) = GetResolutionAndNumFrames( path )
if num_frames > 1:
durations = GetGIFFrameDurations( path )
duration = sum( durations )
else:
duration = None
num_frames = None
return ( ( width, height ), duration, num_frames )
def GetResolutionAndNumFrames( path ):
pil_image = GeneratePILImage( path )
( x, y ) = pil_image.size
try:
pil_image.seek( 1 )
pil_image.seek( 0 )
num_frames = 1
while True:
try:
pil_image.seek( pil_image.tell() + 1 )
num_frames += 1
except: break
except: num_frames = 1
return ( ( x, y ), num_frames )
def GetThumbnailResolution( ( im_x, im_y ), ( target_x, target_y ) ):
im_x = float( im_x )
im_y = float( im_y )
target_x = float( target_x )
target_y = float( target_y )
x_ratio = im_x / target_x
y_ratio = im_y / target_y
ratio_to_use = max( x_ratio, y_ratio )
target_x = int( im_x / ratio_to_use )
target_y = int( im_y / ratio_to_use )
return ( target_x, target_y )
''' # old pil code
def _GetCurrentFramePIL( pil_image, target_resolution, canvas ):
current_frame = EfficientlyResizePILImage( pil_image, target_resolution )
if pil_image.mode == 'P' and 'transparency' in pil_image.info:
# I think gif problems are around here somewhere; the transparency info is not converted to RGBA properly, so it starts drawing colours when it should draw nothing
current_frame = current_frame.convert( 'RGBA' )
if canvas is None: canvas = current_frame
else: canvas.paste( current_frame, None, current_frame ) # yeah, use the rgba image as its own mask, wut.
else: canvas = current_frame
return canvas
def _GetFramePIL( self, index ):
pil_image = self._image_object
pil_image.seek( index )
canvas = self._GetCurrentFramePIL( pil_image, self._target_resolution, canvas )
return GenerateHydrusBitmapFromPILImage( canvas )
def _GetFramesPIL( self ):
pil_image = self._image_object
canvas = None
global_palette = pil_image.palette
dirty = pil_image.palette.dirty
mode = pil_image.palette.mode
rawmode = pil_image.palette.rawmode
# believe it or not, doing this actually fixed a couple of gifs!
pil_image.seek( 1 )
pil_image.seek( 0 )
while True:
canvas = self._GetCurrentFramePIL( pil_image, self._target_resolution, canvas )
yield GenerateHydrusBitmapFromPILImage( canvas )
try:
pil_image.seek( pil_image.tell() + 1 )
if pil_image.palette == global_palette: # for some reason, when we fall back to global palette (no local-frame palette), we reset bunch of important variables!
pil_image.palette.dirty = dirty
pil_image.palette.mode = mode
pil_image.palette.rawmode = rawmode
except: break
'''
# the cv code was initially written by @fluffy_cub
class HydrusBitmap( object ):
def __init__( self, data, format, size ):
self._data = lz4.dumps( data )
self._format = format
self._size = size
def GetWxBitmap( self ):
( width, height ) = self._size
if self._format == wx.BitmapBufferFormat_RGB: return wx.BitmapFromBuffer( width, height, lz4.loads( self._data ) )
else: return wx.BitmapFromBufferRGBA( width, height, lz4.loads( self._data ) )
def GetWxImage( self ):
( width, height ) = self._size
if self._format == wx.BitmapBufferFormat_RGB: return wx.ImageFromBuffer( width, height, lz4.loads( self._data ) )
else:
bitmap = wx.BitmapFromBufferRGBA( width, height, lz4.loads( self._data ) )
image = wx.ImageFromBitmap( bitmap )
wx.CallAfter( bitmap.Destroy )
return image
def GetEstimatedMemoryFootprint( self ): return len( self._data )
def GetSize( self ): return self._size
class RasterContainer( object ):
def __init__( self, media, target_resolution = None ):
if target_resolution is None: target_resolution = media.GetResolution()
self._media = media
self._target_resolution = target_resolution
hash = self._media.GetHash()
mime = self._media.GetMime()
self._path = CC.GetFilePath( hash, mime )
( original_width, original_height ) = self._media.GetResolution()
( my_width, my_height ) = target_resolution
width_zoom = my_width / float( original_width )
height_zoom = my_height / float( original_height )
self._zoom = min( ( width_zoom, height_zoom ) )
if self._zoom > 1.0: self._zoom = 1.0
class ImageContainer( RasterContainer ):
def __init__( self, media, target_resolution = None ):
RasterContainer.__init__( self, media, target_resolution )
self._hydrus_bitmap = None
HydrusThreading.CallToThread( self.THREADRender )
def _GetHydrusBitmap( self ):
try:
numpy_image = GenerateNumpyImage( self._path )
resized_numpy_image = EfficientlyResizeNumpyImage( numpy_image, self._target_resolution )
return GenerateHydrusBitmapFromNumPyImage( resized_numpy_image )
except:
pil_image = GeneratePILImage( self._path )
resized_pil_image = EfficientlyResizePILImage( pil_image, self._target_resolution )
return GenerateHydrusBitmapFromPILImage( resized_pil_image )
def THREADRender( self ):
time.sleep( 0.00001 ) # thread yield
wx.CallAfter( self.SetHydrusBitmap, self._GetHydrusBitmap() )
HC.pubsub.pub( 'finished_rendering', self.GetKey() )
def GetEstimatedMemoryFootprint( self ): return self._hydrus_bitmap.GetEstimatedMemoryFootprint()
def GetHash( self ): return self._media.GetHash()
def GetHydrusBitmap( self ): return self._hydrus_bitmap
def GetKey( self ): return ( self._media.GetHash(), self._target_resolution )
def GetNumFrames( self ): return self._media.GetNumFrames()
def GetResolution( self ): return self._media.GetResolution()
def GetSize( self ): return self._target_resolution
def GetZoom( self ): return self._zoom
def IsRendered( self ): return self._hydrus_bitmap is not None
def IsScaled( self ): return self._zoom != 1.0
def SetHydrusBitmap( self, hydrus_bitmap ): self._hydrus_bitmap = hydrus_bitmap