123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147 |
- local gm = require 'graphicsmagick'
- local ffi = require 'ffi'
- require 'pl'
- local image_loader = {}
- local clip_eps8 = (1.0 / 255.0) * 0.5 - (1.0e-7 * (1.0 / 255.0) * 0.5)
- local clip_eps16 = (1.0 / 65535.0) * 0.5 - (1.0e-7 * (1.0 / 65535.0) * 0.5)
- local background_color = 0.5
- function image_loader.decode_float(blob)
- local im, alpha = image_loader.decode_byte(blob)
- if im then
- im = im:float():div(255)
- end
- return im, alpha, blob
- end
- function image_loader.encode_png(rgb, alpha, depth)
- depth = depth or 8
- if rgb:type() == "torch.ByteTensor" then
- rgb = rgb:float():div(255)
- end
- if alpha then
- if not (alpha:size(2) == rgb:size(2) and alpha:size(3) == rgb:size(3)) then
- alpha = gm.Image(alpha, "I", "DHW"):size(rgb:size(3), rgb:size(2), "SincFast"):toTensor("float", "I", "DHW")
- end
- local rgba = torch.Tensor(4, rgb:size(2), rgb:size(3))
- rgba[1]:copy(rgb[1])
- rgba[2]:copy(rgb[2])
- rgba[3]:copy(rgb[3])
- rgba[4]:copy(alpha)
-
- if depth < 16 then
- rgba:add(clip_eps8)
- rgba[torch.lt(rgba, 0.0)] = 0.0
- rgba[torch.gt(rgba, 1.0)] = 1.0
- else
- rgba:add(clip_eps16)
- rgba[torch.lt(rgba, 0.0)] = 0.0
- rgba[torch.gt(rgba, 1.0)] = 1.0
- end
- local im = gm.Image():fromTensor(rgba, "RGBA", "DHW")
- return im:depth(depth):format("PNG"):toBlob(9)
- else
- if depth < 16 then
- rgb = rgb:clone():add(clip_eps8)
- rgb[torch.lt(rgb, 0.0)] = 0.0
- rgb[torch.gt(rgb, 1.0)] = 1.0
- else
- rgb = rgb:clone():add(clip_eps16)
- rgb[torch.lt(rgb, 0.0)] = 0.0
- rgb[torch.gt(rgb, 1.0)] = 1.0
- end
- local im = gm.Image(rgb, "RGB", "DHW")
- return im:depth(depth):format("PNG"):toBlob(9)
- end
- end
- function image_loader.save_png(filename, rgb, alpha, depth)
- depth = depth or 8
- local blob, len = image_loader.encode_png(rgb, alpha, depth)
- local fp = io.open(filename, "wb")
- if not fp then
- error("IO error: " .. filename)
- end
- fp:write(ffi.string(blob, len))
- fp:close()
- return true
- end
- function image_loader.decode_byte(blob)
- local load_image = function()
- local im = gm.Image()
- local alpha = nil
- local gamma_lcd = 0.454545
-
- im:fromBlob(blob, #blob)
-
- if im:colorspace() == "CMYK" then
- im:colorspace("RGB")
- end
- local gamma = math.floor(im:gamma() * 1000000) / 1000000
- if gamma ~= 0 and gamma ~= gamma_lcd then
- im:gammaCorrection(gamma / gamma_lcd)
- end
- -- FIXME: How to detect that a image has an alpha channel?
- if blob:sub(1, 4) == "\x89PNG" or blob:sub(1, 3) == "GIF" then
- -- split alpha channel
- im = im:toTensor('float', 'RGBA', 'DHW')
- local sum_alpha = (im[4] - 1.0):sum()
- if sum_alpha < 0 then
- alpha = im[4]:reshape(1, im:size(2), im:size(3))
- -- drop full transparent background
- local mask = torch.le(alpha, 0.0)
- im[1][mask] = background_color
- im[2][mask] = background_color
- im[3][mask] = background_color
- end
- local new_im = torch.FloatTensor(3, im:size(2), im:size(3))
- new_im[1]:copy(im[1])
- new_im[2]:copy(im[2])
- new_im[3]:copy(im[3])
- im = new_im:mul(255):byte()
- else
- im = im:toTensor('byte', 'RGB', 'DHW')
- end
- return {im, alpha, blob}
- end
- local state, ret = pcall(load_image)
- if state then
- return ret[1], ret[2], ret[3]
- else
- return nil, nil, nil
- end
- end
- function image_loader.load_float(file)
- local fp = io.open(file, "rb")
- if not fp then
- error(file .. ": failed to load image")
- end
- local buff = fp:read("*a")
- fp:close()
- return image_loader.decode_float(buff)
- end
- function image_loader.load_byte(file)
- local fp = io.open(file, "rb")
- if not fp then
- error(file .. ": failed to load image")
- end
- local buff = fp:read("*a")
- fp:close()
- return image_loader.decode_byte(buff)
- end
- local function test()
- require 'image'
- local img
- img = image_loader.load_float("./a.jpg")
- if img then
- print(img:min())
- print(img:max())
- image.display(img)
- end
- img = image_loader.load_float("./b.png")
- if img then
- image.display(img)
- end
- end
- --test()
- return image_loader
|