Python遥感开发之FY的批量处理

Python遥感开发之FY的批量处理

  • 0 FY遥感数据
  • 1 批量提取数据
  • 2 批量拼接TIF数据
  • 3 批量HAM转WGS投影(重要)
  • 4 批量掩膜裁剪

介绍FY数据的格式,以及FY数据的批量提取数据、批量拼接数据、批量投影转换、批量掩膜裁剪等操作。
本博客代码参考《 Hammer坐标系转换到WGS1984,以处理FY3D/MERSI NVI数据为例。FY3D/MERSI NVI空间分辨率250m,全球 10°×10°分幅 》,非常感谢博主公开代码!!!


0 FY遥感数据

  • 本博客以《MERSI-II植被指数旬产品(1000M)》数据处理为例子,“FY3D_MERSI_00A0_L3_NVI_MLT_HAM_20191130_AOTD_1000M_MS.HDF”,其中FY3D是卫星名字、MERSI是仪器名称、00A0是数据区域类型(也是该影像的经纬度范围)、L3是数据级别、NVI是数据名称、MLT是通道名称、HAM是投影方式、AOTD是时段类型、1000M是分辨率、HDF是数据名称格式。
  • 最核心最难的就是HAM投影如何转换成常见的WGS投影

1 批量提取数据

MERSI-II植被指数旬产品(1000M)数据包含如下波段,根据需要自己取
CH1表示蓝光波段
CH2表示绿光波段
CH3表示红外波段
CH4表示近红外波段
CH5表示亮温
Python遥感开发之FY的批量处理_第1张图片

Python遥感开发之FY的批量处理_第2张图片
切记
Python遥感开发之FY的批量处理_第3张图片
完整代码如下所示:

import os
from osgeo import gdal
import h5py

def get_data_list(file_path, out = ""):
    list1 = []  # 文件的完整路径
    if os.path.isdir(file_path):
        fileList = os.listdir(file_path)
        if out != "":
            for f in fileList:
                out_data = out + "\\" + f
                out_data = out_data.replace(".HDF", "_ndvi.tif")
                list1.append(out_data)
        else:
            for f in fileList:
                pre_data = file_path + '\\' + f  # 文件的完整路径
                list1.append(pre_data)
        return list1

import numpy as np

def HDF2Tif(in_file,out_file):
    hdf_ds = h5py.File(in_file, "r")
    if type(hdf_ds.attrs['Left-Top X']) is np.ndarray:
        left_x = hdf_ds.attrs['Left-Top X'][0]
    else:
        left_x = float(hdf_ds.attrs['Left-Top X'])

    if type(hdf_ds.attrs['Left-Top Y']) is np.ndarray:
        left_y = hdf_ds.attrs['Left-Top Y'][0]
    else:
        left_y = float(hdf_ds.attrs['Left-Top Y'])

    res_x = hdf_ds.attrs['Resolution X'][0]
    res_y = hdf_ds.attrs['Resolution Y'][0]
    ndviname = list(hdf_ds.keys())[6] #5是evi 6是ndvi
    # print(list(hdf_ds.keys()))

    ndvi_ds = hdf_ds[ndviname]
    rows = ndvi_ds.shape[0]
    cols = ndvi_ds.shape[1]
    data = ndvi_ds[()]
    driver = gdal.GetDriverByName("GTiff")
    outds = driver.Create(out_file, cols, rows, 1, gdal.GDT_Int16)
    outds.SetGeoTransform(
        (float(left_x) * 1000,#切记250m的分辨率需要除以4
         float(res_x) * 1000,
         0,
         float(left_y) * 1000,#切记250m的分辨率需要除以4
         0,
         -1 * float(res_y) * 1000)
    )
    proj = 'PROJCS["World_Hammer",GEOGCS["Unknown datum based upon the custom spheroid",DATUM["Not_specified_based_on_custom_spheroid",SPHEROID["Custom spheroid",6363961,0]],PRIMEM["Greenwich",0],UNIT["Degree",0.0174532925199433]],PROJECTION["Hammer_Aitoff"],PARAMETER["False_Easting",0],PARAMETER["False_Northing",0],PARAMETER["Central_Meridian",0],UNIT["metre",1],AXIS["Easting",EAST],AXIS["Northing",NORTH]]'
    outds.SetProjection(proj)
    outband = outds.GetRasterBand(1)
    outband.WriteArray(data)
    pass

if __name__ == '__main__':
    infile = r"C:\Users\Administrator\Desktop\HDF"
    outfile = r"C:\Users\Administrator\Desktop\01提取ndvi"
    infile_list = get_data_list(infile)
    outfile_list = get_data_list(infile,outfile)
    for in_file,out_file in zip(infile_list,outfile_list):
        print(in_file)
        HDF2Tif(in_file,out_file)

Python遥感开发之FY的批量处理_第4张图片

Python遥感开发之FY的批量处理_第5张图片

2 批量拼接TIF数据

import os
from osgeo import gdal

def get_data_list(file_path, out = ""):
    list1 = []  # 文件的完整路径
    if os.path.isdir(file_path):
        fileList = os.listdir(file_path)
        if out != "":
            for f in fileList:
                out_data = out + "\\" + f
                out_data = out_data.replace(".HDF", "_ndvi.tif")
                list1.append(out_data)
        else:
            for f in fileList:
                pre_data = file_path + '\\' + f  # 文件的完整路径
                list1.append(pre_data)
        return list1

def get_same_list(image, infile_list):
    infile_list02 = []
    for data in infile_list:
        if image in data:
            # print("----", data)
            infile_list02.append(data)
    return infile_list02

def get_same_image_list(infile_list):
    image_list= []
    for file in infile_list:
        filename = file[-31:-23]
        if filename not in image_list:
            image_list.append(filename)
    return list(set(image_list))

def pinjie(infile_list,outfile):
    ds = gdal.Open(infile_list[0])
    cols = ds.RasterXSize
    rows = ds.RasterYSize
    ingeo = ds.GetGeoTransform()
    proj = ds.GetProjection()
    minx = ingeo[0]
    maxy = ingeo[3]
    maxx = ingeo[0] + ingeo[1] * cols
    miny = ingeo[3] + ingeo[5] * rows
    ds = None
    for file in infile_list[1:]:
        ds = gdal.Open(file)
        cols = ds.RasterXSize
        rows = ds.RasterYSize
        geo = ds.GetGeoTransform()
        minx_ = geo[0]
        maxy_ = geo[3]
        maxx_ = geo[0] + geo[1] * cols
        miny_ = geo[3] + geo[5] * rows
        minx = min(minx, minx_)
        maxy = max(maxy, maxy_)
        maxx = max(maxx, maxx_)
        miny = min(miny, miny_)
        geo = None
        ds = None
    newcols = int((maxx - minx) / abs(ingeo[1]))
    newrows = int((maxy - miny) / abs(ingeo[5]))
    driver = gdal.GetDriverByName("GTiff")
    outds = driver.Create(outfile, newcols, newrows, 1, gdal.GDT_Int16)
    outgeo = (minx, ingeo[1], 0, maxy, 0, ingeo[5])
    outds.SetGeoTransform(outgeo)
    outds.SetProjection(proj)
    outband = outds.GetRasterBand(1)
    for file in infile_list:
        ds = gdal.Open(file)
        data = ds.ReadAsArray()
        geo = ds.GetGeoTransform()
        x = int(abs((geo[0] - minx) / ingeo[1]))
        y = int(abs((geo[3] - maxy) / ingeo[5]))
        outband.WriteArray(data, x, y)
        ds = None
    outband.FlushCache()
    pass
if __name__ == '__main__':

    infile = r"C:\Users\Administrator\Desktop\01提取ndvi"
    outfile = r"C:\Users\Administrator\Desktop\02拼接"
    infile_list = get_data_list(infile)
    image_name_list = get_same_image_list(infile_list)
    print(image_name_list)
    for name in image_name_list:
        print(name)
        infile_list02 = get_same_list(name, infile_list)
        pinjie(infile_list02,outfile+"\\"+name+".tif")

Python遥感开发之FY的批量处理_第6张图片

3 批量HAM转WGS投影(重要)

切记:代码中出现的0.01表示1000m分辨率,如果需要换成250m分辨率,请根据代码注释自行更换。
Python遥感开发之FY的批量处理_第7张图片
Python遥感开发之FY的批量处理_第8张图片

完整代码如下:

import os
from osgeo import gdal
import numpy as np
import math
from osgeo import osr

def get_data_list(file_path, out = ""):
    list1 = []  # 文件的完整路径
    if os.path.isdir(file_path):
        fileList = os.listdir(file_path)
        if out != "":
            for f in fileList:
                out_data = out + "\\" + f
                # out_data = out_data.replace(".HDF", "_ndvi.tif")
                list1.append(out_data)
        else:
            for f in fileList:
                pre_data = file_path + '\\' + f  # 文件的完整路径
                list1.append(pre_data)
        return list1

def H2W(infile,outfile):
    ds = gdal.Open(infile)
    ingeo = ds.GetGeoTransform()
    cols = ds.RasterXSize
    rows = ds.RasterYSize
    or_x = ingeo[0]
    or_y = ingeo[3]
    end_x = ingeo[0] + cols * ingeo[1]
    end_y = ingeo[3] + rows * ingeo[5]
    # X方向分块
    xblocksize = int((cols + 1) / 5)
    # Y方向分块
    yblocksize = int((rows + 1) / 5)
    lon_max = -360
    lon_min = 360
    lat_max = -90
    lat_min = 90
    for i in range(0, rows + 1, yblocksize):
        if i + yblocksize < rows + 1:
            numrows = yblocksize
        else:
            numrows = rows + 1 - i
        for j in range(0, cols + 1, xblocksize):
            if j + xblocksize < cols + 1:
                numcols = xblocksize
            else:
                numcols = cols + 1 - j
            # 计算所有点的Hammer坐标系下X方向坐标数组
            x = ingeo[0] + j * ingeo[1]
            y = ingeo[3] + i * ingeo[5]
            xgrid, ygrid = np.meshgrid(np.linspace(x, x + numcols * ingeo[1], num=numcols),
                                       np.linspace(y, y + numrows * ingeo[5], num=numrows))
            # 将hammer坐标转化为经纬度坐标
            # 首先将Hammer转化为-1到1
            xgrid = np.where(xgrid > (18000.0 * 1000.0), (18000.0 * 1000.0) - xgrid, xgrid)
            xgrid = xgrid / (18000.0 * 1000.0)
            ygrid = np.where(ygrid > (9000.0 * 1000.0), (9000.0 * 1000.0) - ygrid, ygrid)
            ygrid = ygrid / (9000.0 * 1000.0)
            z = np.sqrt(1 - np.square(xgrid) / 2.0 - np.square(ygrid) / 2.0)
            lon = 2 * np.arctan(np.sqrt(2) * xgrid * z / (2.0 * (np.square(z)) - 1))
            xgrid = None
            lat = np.arcsin(np.sqrt(2) * ygrid * z)
            ygrid = None
            z = None
            lon = lon / math.pi * 180.0
            lat = lat / math.pi * 180.0
            lon[lon < 0] = lon[lon < 0] + 360.0
            # lat[lat<0]=lat[lat<0]+180
            lon_max = max(lon_max, np.max(lon))
            lon_min = min(lon_min, np.min(lon))
            lon = None
            lat_max = max(lat_max, np.max(lat))
            lat_min = min(lat_min, np.min(lat))
            lat = None

    newcols = math.ceil((lon_max - lon_min) / 0.01)#切记250m的分辨率需要把0.01换成0.0025
    newrows = math.ceil((lat_max - lat_min) / 0.01)#切记250m的分辨率需要把0.01换成0.0025
    driver = gdal.GetDriverByName("GTiff")
    outds = driver.Create(outfile, newcols, newrows, 1, gdal.GDT_Int16)
    geo2 = (lon_min, 0.01, 0, lat_max, 0, -1 * 0.01)#切记250m的分辨率需要把0.01换成0.0025
    oproj_srs = osr.SpatialReference()
    proj_4 = "+proj=longlat +datum=WGS84 +no_defs"
    oproj_srs.ImportFromProj4(proj_4)
    outds.SetGeoTransform(geo2)
    outds.SetProjection(oproj_srs.ExportToWkt())
    outband = outds.GetRasterBand(1)
    datav = ds.ReadAsArray()
    data = np.full((datav.shape[0] + 1, datav.shape[1] + 1), -32750, dtype=int)
    data[0:datav.shape[0], 0:datav.shape[1]] = datav
    xblocksize = int(newcols / 5)
    yblocksize = int(newrows / 5)
    for i in range(0, newrows, yblocksize):
        if i + yblocksize < newrows:
            numrows = yblocksize
        else:
            numrows = newrows - i
        for j in range(0, newcols, xblocksize):
            if j + xblocksize < newcols:
                numcols = xblocksize
            else:
                numcols = newcols - j
            x = lon_min + j * 0.01 + 0.01 / 2.0 #切记250m的分辨率需要把0.01换成0.0025
            y = lat_max + i * (-1 * 0.01) - 0.01 / 2.0#切记250m的分辨率需要把0.01换成0.0025
            newxgrid, newygrid = np.meshgrid(np.linspace(x, x + numcols * 0.01, num=numcols),#切记250m的分辨率需要把0.01换成0.0025
                                             np.linspace(y, y + numrows * (-1 * 0.01), num=numrows))#切记250m的分辨率需要把0.01换成0.0025
            # 将经纬度坐标转化为Hammer坐标
            newxgrid = np.where(newxgrid > 180.0, newxgrid - 360.0, newxgrid)
            newxgrid = newxgrid / 180.0 * math.pi
            newygrid = newygrid / 180.0 * math.pi
            newz = np.sqrt(1 + np.cos(newygrid) * np.cos(newxgrid / 2.0))
            x = np.cos(newygrid) * np.sin(newxgrid / 2.0) / newz
            newxgrid = None
            y = np.sin(newygrid) / newz
            newygrid = None
            newz = None
            x = x * (18000.0 * 1000.0)
            y = y * (9000.0 * 1000.0)
            x_index = (np.floor((x - or_x) / ingeo[1])).astype(int)
            x_index = np.where(x_index < 0, data.shape[1] - 1, x_index)
            x_index = np.where(x_index >= data.shape[1], data.shape[1] - 1, x_index)
            y_index = (np.floor((y - or_y) / ingeo[5])).astype(int)
            y_index = np.where(y_index < 0, data.shape[0] - 1, y_index)
            y_index = np.where(y_index >= data.shape[0], data.shape[0] - 1, y_index)
            newdata = data[y_index, x_index]
            outband.WriteArray(newdata, j, i)
    outband.SetNoDataValue(-32750)
    outband.FlushCache()

if __name__ == '__main__':
    infile_path = r"C:\Users\Administrator\Desktop\02拼接"
    outfile_path = r"C:\Users\Administrator\Desktop\03WGS"
    infile_list = get_data_list(infile_path)
    outfile_list = get_data_list(infile_path,outfile_path)
    for infile,outfile in zip(infile_list,outfile_list):
        print(infile)
        H2W(infile,outfile)

Python遥感开发之FY的批量处理_第9张图片
Python遥感开发之FY的批量处理_第10张图片

4 批量掩膜裁剪

请参考本人博客《Python遥感开发之批量掩膜和裁剪》

你可能感兴趣的:(Python图像遥感,Python遥感开发,HAM转WGS,FY数据处理,Python处理HAM)