# Image pixel values lie in the range [0, 255], so the default dtype is uint8.
# The dtype of an image can be inspected like this:
from skimage import io,data
img=data.chelsea()
print(img.dtype.name)

uint8


# uint8 to float
from skimage import data,img_as_float,color
img=data.chelsea()
print("data.chelsea的格式为：{}".format(img.dtype.name))
dst=img_as_float(img)  # convert the image to a floating-point dtype
print("将其转为float后：{}".format(dst.dtype.name))

gry=color.rgb2gray(img)  # grayscale conversion; the resulting dtype is printed below
print("将其转为灰度图后：{}".format(gry.dtype.name))

data.chelsea的格式为：uint8
将其转为float后：float64
将其转为灰度图后：float64


# float to uint8
from skimage import img_as_ubyte
import numpy as np
img = np.array([0, 0.5, 1], dtype=float)  # small float array used as a stand-in image
print(img.dtype.name)
dst=img_as_ubyte(img)  # convert the float data to unsigned bytes
print(dst.dtype.name)

float64
uint8


# RGB to grayscale:
from skimage import io,data,color
img=data.chelsea()
gray=color.rgb2gray(img)
io.imshow(gray)
# The other conversions are used the same way; common ones are listed below:
# hsv = color.rgb2hsv(img)
# io.imshow(hsv)

# lab= color.rgb2lab(img)
# io.imshow(lab)

# The following convert from other color spaces to RGB; chelsea cannot be
# used as their input.
# gray= color.gray2rgb(img)
# gray= color.hsv2rgb(img)
# gray= color.lab2rgb(img)

<matplotlib.image.AxesImage at 0x26b1ce58b50>


# RGB to HSV using the generic convert_colorspace helper, which takes the
# source and target color-space names as strings.
from skimage import io,data,color
img=data.chelsea()
hsv=color.convert_colorspace(img,'RGB','HSV')
io.imshow(hsv)

<matplotlib.image.AxesImage at 0x26b1cf18610>


# Split the image into three classes by gray level, then color the three
# classes with label2rgb's default colors.
from skimage import io,data,color
import numpy as np
img=data.astronaut()
gray=color.rgb2gray(img)
# Build the label map as a separate integer array. Binding `labels` to the
# same array as `gray` would make the threshold assignments overwrite the
# grayscale image in place, so later masks would be evaluated on values that
# had already been relabelled.
# np.digitize with bins [0.4, 0.75] maps:
#   gray < 0.4 -> 0,  0.4 <= gray < 0.75 -> 1,  gray >= 0.75 -> 2
labels=np.digitize(gray, [0.4, 0.75])
dst=color.label2rgb(labels)
io.imshow(dst)

<matplotlib.image.AxesImage at 0x26b1cf5fd30>


from skimage import transform,data
import matplotlib.pyplot as plt
# Resize the camera image to a fixed output shape and plot it next to the
# original; the axis ticks of the two panels show the change in size.
print('将 camera 图片由原来的 512*512 大小，变成了 80*60 大小。')
print('从下图中的坐标尺，我们能够看出来：')
img = data.camera()
dst=transform.resize(img, (80, 60))  # resize to an 80 x 60 output shape
plt.figure('resize')
plt.subplot(121)  # left panel: original image
plt.title('before resize')
plt.imshow(img,plt.cm.gray)

plt.subplot(122)  # right panel: resized image
plt.title('after resize')
plt.imshow(dst,plt.cm.gray)
plt.show()

将 camera 图片由原来的 512*512 大小，变成了 80*60 大小。
从下图中的坐标尺，我们能够看出来：


from skimage import transform,data
img = data.camera()
# Print the original shape, then the shapes obtained with several scale
# factors: a scalar factor is applied to both axes, a two-element list gives
# one factor per axis.
print("#图片原始大小:{}".format(img.shape)) 
print("#缩小为原来图片大小的 0.1 倍:{}".format(transform.rescale(img, 0.1).shape))
print("#缩小为原来图片行数一半，列数四分之一:{}".format(transform.rescale(img, [0.5,0.25]).shape))
print("#放大为原来图片大小的 2 倍:{}".format(transform.rescale(img, 2).shape) )

#图片原始大小:(512, 512)
#缩小为原来图片大小的 0.1 倍:(51, 51)
#缩小为原来图片行数一半，列数四分之一:(256, 128)
#放大为原来图片大小的 2 倍:(1024, 1024)


from skimage import transform,data
import matplotlib.pyplot as plt
img = data.camera()
print(img.shape) # original image size
img1=transform.rotate(img, 60) # rotate by 60 degrees; the output size is unchanged
print(img1.shape)
img2=transform.rotate(img, 30,resize=True) # rotate by 30 degrees and let the output size change
print(img2.shape) 
# NOTE(review): the figure is still named 'resize' although this cell demonstrates rotation.
plt.figure('resize')
plt.subplot(121)  # left panel: 60-degree rotation
plt.title('rotate 60')
plt.imshow(img1,plt.cm.gray)
plt.subplot(122)  # right panel: 30-degree rotation with resize=True
plt.title('rotate 30')
plt.imshow(img2,plt.cm.gray)

(512, 512)
(512, 512)
(699, 699)

<matplotlib.image.AxesImage at 0x26b1f0e2ef0>


import numpy as np
import matplotlib.pyplot as plt
from skimage import data,transform
image = data.astronaut() # load the astronaut image
rows, cols, dim = image.shape # number of rows, columns and channels
# Build the Gaussian pyramid. channel_axis=-1 declares the last axis as the
# color channels, so only the two spatial axes are smoothed and downscaled.
# Without it the call relies on guessing (RuntimeWarning about (M, N, 3)
# images) or treats the color axis as a third spatial dimension.
pyramid = tuple(transform.pyramid_gaussian(image, downscale=3, channel_axis=-1))
# With downscale=3 a side of 512 shrinks to 171, 57, 19, 7, 3 and 1 pixels:
# 6 reduced layers plus the full-size one, 7 in total (pyramid[0]..pyramid[6]).
composite_image = np.ones((rows, cols + cols//3+1, 3), dtype=np.double) # white canvas wide enough for the second-level layer
composite_image[:rows, :cols, :] = pyramid[0] # full-size layer on the left
i_row = 0
for p in pyramid[1:]:
    n_rows, n_cols = p.shape[:2]
    # Stack the remaining layers top-to-bottom in the right-hand column.
    composite_image[i_row:i_row + n_rows, cols:cols + n_cols] = p
    i_row += n_rows
plt.imshow(composite_image)
plt.show()

d:\Applications\miniconda\envs\dip\lib\site-packages\skimage\_shared\utils.py:348: RuntimeWarning: Images with dimensions (M, N, 3) are interpreted as 2D+RGB by default. Use `multichannel=False` to interpret as 3D image with last dimension of length 3.
  return func(*args, **kwargs)


# Besides the Gaussian pyramid there are other pyramids, e.g. the Laplacian pyramid:
import numpy as np
import matplotlib.pyplot as plt
from skimage import data,transform,img_as_ubyte

image = data.astronaut() # load the astronaut image
rows, cols, dim = image.shape # number of rows, columns and channels
pyramid = tuple(transform.pyramid_laplacian(image,downscale= 2,channel_axis=2)) # build the Laplacian pyramid
# With downscale=2 a side of 512 is halved down to 1 pixel: log2(512)=9
# reduced layers plus the full-size one, about 10 in total
# (pyramid[0]..pyramid[9]).
# The layers are float64, but each one is the difference between an image and
# its smoothed version, so values can be negative and are NOT limited to [0, 1].

composite_image = np.ones((rows, cols + cols//2 + 3, 3),dtype=float) # white canvas
composite_image[:rows,:cols,:]=pyramid[0] # full-size layer on the left
i_row = 0
for p in pyramid[1:]:
    n_rows, n_cols= p.shape[:2]
    # Stack the remaining layers top-to-bottom in the right-hand column.
    composite_image[i_row:i_row + n_rows, cols:cols + n_cols] = p
    i_row += n_rows

# Convert [0, 1] to [0, 255] by hand for display.
# Negative values must be clipped first: casting a negative float directly to
# an unsigned byte does not saturate at 0, which is why a bare
# `(composite_image*255).astype(np.ubyte)` looks different from
# img_as_ubyte(), which clips negative input.
plt.imshow((np.clip(composite_image, 0, 1)*255).astype(np.ubyte))
# plt.imshow(img_as_ubyte(composite_image))
plt.show()


import skimage.io as io
from skimage import data_dir
# Glob pattern matching the PNG sample images shipped in skimage's data
# directory. It is named `pattern` rather than `str` so that the builtin
# `str` type is not shadowed for the rest of the session.
pattern=data_dir + '/*.png'
coll = io.ImageCollection(pattern)
print(len(coll))
# A result of 23 means 23 bundled PNG sample images were matched and placed
# in the collection `coll`.
# To display one of them, index the collection:
io.imshow(coll[10])

23

<matplotlib.image.AxesImage at 0x26b1facf0d0>


import skimage.io as io
from skimage import data_dir

# Previous form, kept for reference: several patterns joined in one string.
# str='d:/pic/*.jpg:d:/pic/*.png'
# Following scikit-image pull request #3928, multiple patterns are passed as a list.
# The list is named `patterns` rather than `str` so that the builtin `str`
# type is not shadowed.
patterns=['./*.png','./*.jpg','./*.tif']

coll = io.ImageCollection(patterns)
print(len(coll))

3


from skimage import data_dir,io,color
def convert_gray(f):
    """Load the image file ``f`` and return it as a floating-point grayscale image.

    Intended as a ``load_func`` for ``io.ImageCollection``. A glob pattern can
    match files that are not 3-channel RGB, so single-channel and RGBA inputs
    are handled explicitly instead of being passed straight to ``rgb2gray``.

    Args:
        f: Path of the image file to read.

    Returns:
        A 2-D float array holding the grayscale image.
    """
    # Local import: this helper needs img_as_float in addition to the names
    # imported alongside it.
    from skimage import img_as_float

    img=io.imread(f)
    if img.ndim == 2:
        # Already single-channel: only normalise the dtype to float.
        return img_as_float(img)
    if img.shape[-1] == 4:
        # Drop the alpha channel before the RGB -> gray conversion.
        img=color.rgba2rgb(img)
    return color.rgb2gray(img)
 
# Load the bundled PNG samples through convert_gray so every item comes back
# as grayscale. The pattern is named `pattern` rather than `str` so that the
# builtin `str` type is not shadowed.
pattern=data_dir+'/*.png'
coll = io.ImageCollection(pattern,load_func=convert_gray)
io.imshow(coll[10])

<matplotlib.image.AxesImage at 0x26b1fb5cee0>


from skimage import data_dir,io,color
from matplotlib import pyplot as plt
import imageio

# ImageCollection can load images from an arbitrary source by combining
# load_pattern with a custom load_func.
# For an ImageCollection ic,
# ic[5] uses load_func(load_pattern[5]) to load the image.

video_file = './rikka.gif'
def vidread_step(f, step):
    """Read all frames of the video/GIF file ``f`` and return every ``step``-th one.

    Args:
        f: Path of the file handed to ``imageio.get_reader``.
        step: Stride used to subsample the frame list (1 keeps every frame).

    Returns:
        A list of frames, starting with the first frame of the file.
    """
    # Use the reader as a context manager so the underlying file is closed
    # even if decoding a frame raises; otherwise the reader stays open.
    with imageio.get_reader(f) as vid:
        seq = list(vid.iter_data())
    return seq[::step]

ic = io.ImageCollection(video_file, load_func=vidread_step, step=1)
# The collection always has length 1: its only entry is the list of frames
# returned by vidread_step for the single file.
sub_plots=[221,222,223,224]  # subplot codes of a 2 x 2 grid
fig = plt.figure()
for i in range(4):
    plt.subplot(sub_plots[i])
    plt.imshow(ic[0][i])  # i-th frame of the only entry
plt.show()


# Look at how the dimensions change before and after concatenating the frames:
from skimage import data_dir,io,color

video_file = './rikka.gif'
def vidread_step(f, step):
    """Read all frames of the video/GIF file ``f`` and return every ``step``-th one.

    Args:
        f: Path of the file handed to ``imageio.get_reader``.
        step: Stride used to subsample the frame list (1 keeps every frame).

    Returns:
        A list of frames, starting with the first frame of the file.
    """
    # Use the reader as a context manager so the underlying file is closed
    # even if decoding a frame raises; otherwise the reader stays open.
    with imageio.get_reader(f) as vid:
        seq = list(vid.iter_data())
    return seq[::step]
coll = io.ImageCollection(video_file, load_func=vidread_step, step=1)

print(len(coll)) # number of entries in the collection
print(coll[0][0].shape) # shape of one frame before concatenation; all frames share it
mat=io.concatenate_images(coll[0])
print(mat.shape) # shape of the array after concatenation

1
(400, 400, 4)
(5, 400, 400, 4)


from PIL import Image, ImageDraw,ImageFont
from matplotlib import pyplot as plt
# Overlay a text watermark on a photo by drawing onto a separate RGBA layer
# and compositing that layer over the photo.
im = Image.open("./dog.jpg").convert('RGBA')
txt=Image.new('RGBA', im.size, (0,0,0,0))  # layer with alpha 0 everywhere, same size as the photo
fnt=ImageFont.truetype("c:/Windows/fonts/Tahoma.ttf", 40)  # NOTE(review): absolute Windows font path; size 40
d=ImageDraw.Draw(txt)
# Draw the text in opaque white at a fixed offset from the right and bottom edges.
d.text((txt.size[0]-240,txt.size[1]-120), " This is YH's\nwater mark",font=fnt, fill=(255,255,255,255))
out=Image.alpha_composite(im, txt)  # composite the text layer over the photo
plt.imshow(out)

<matplotlib.image.AxesImage at 0x26b2134ee00>

3.1 图像数据类型及颜色空间转换¶

一、图像数据类型及转换¶

二、颜色空间及其转换¶

3.2 图像的形变与缩放¶

1、改变图片尺寸 resize¶

2、按比例缩放 rescale¶

3、旋转 rotate¶

4、图像金字塔¶

3.3 图像的批量处理¶