from hdfs.client import Client import matplotlib.pyplot as mp import numpy as np import sys import struct import binascii from io import BytesIO def ibm2ieee(ibm): if ibm == 0: return 0.0 sign = ibm >> 31 & 0x01 exponent = ibm >> 24 & 0x7f mantissa = (ibm & 0x00ffffff) / float(pow(2, 24)) return (1 - 2 * sign) * mantissa * pow(16, exponent - 64) client = Client("http://192.168.92.145:9870/") # c = client.list("/") #列出所有hdfs目录 filename = "/input/LX_SEGY005.segy" # hdfs文件路径 with client.read(filename) as fs: fSegy = fs.read() fSegy = BytesIO(fSegy) nTrace = 311 nSample = 783 data = np.zeros((nSample, nTrace)) fSegy.seek(3600, 0) # 跳过3600字节卷头 for iTrace in range(nTrace): fSegy.seek(240, 1) # 每一道都跳过240字节道头 for iSample in range(nSample): tempValue = fSegy.read(4) hexValue = tempValue.hex() # print(hexValue) decValue = int(hexValue, 16) unintValue = struct.unpack('>L', struct.pack('>I', decValue))[ 0] # < > 用于控制大小端转换 floatValue = ibm2ieee(unintValue) data[iSample][iTrace] = floatValue fSegy.close() print(data)
📢📢📢将bytes结果转化为字节流,
fSegy = BytesIO(fSegy)