# Zlib compressor/decompressor classes, the ``level9`` compression-level
# constant, and the stream wrappers used by this example.
from daal.data_management import (
    Compressor_Zlib,
    Decompressor_Zlib,
    level9,
    DecompressionStream,
    CompressionStream,
)
# Put the parent of this script's directory at the front of the module search
# path (only once) so that the ``utils`` module can be imported.
utils_folder = os.path.realpath(
    os.path.abspath(os.path.dirname(os.path.dirname(__file__)))
)
if utils_folder not in sys.path:
    sys.path.insert(0, utils_folder)
# Helpers from the ``utils`` module located via ``utils_folder``.
from utils import getCRC32, readTextFile
# Relative location of the example input data set.
DATA_PREFIX = os.path.join('..', 'data', 'batch')
datasetFileName = os.path.join(DATA_PREFIX, 'logitboost_train.csv')
def printCRC32(rawData, deCompressedData):
    """Print the checksums of both buffers and a single round-trip verdict.

    Args:
        rawData: The original data. Must expose a ``.size`` attribute and be
            accepted by ``getCRC32``.
        deCompressedData: The data recovered after decompression. Same
            requirements as ``rawData``.

    Exactly one verdict line is printed: a size-mismatch error, a
    CRC-mismatch error, or the OK message when neither mismatch occurs.
    """
    # Compute checksums for the raw data and the decompressed data.
    crcRawData = getCRC32(rawData)
    crcDecompressedData = getCRC32(deCompressedData)

    print("\nCompression example program results:\n")

    print("Raw data checksum: 0x{:02X}".format(crcRawData))
    print("Decompressed data checksum: 0x{:02X}".format(crcDecompressedData))

    # Sizes are compared first; the CRC comparison is only reported when the
    # sizes agree.
    if rawData.size != deCompressedData.size:
        print("ERROR: Decompressed data size mismatches with the raw data size")
    elif crcRawData != crcDecompressedData:
        print("ERROR: Decompressed data CRC mismatches with the raw data CRC")
    else:
        # Reached only when both the sizes and the checksums agree.
        print("OK: Decompressed data CRC matches with the raw data CRC")
if __name__ == "__main__":
    # Read the data set that will be compressed.
    rawData = readTextFile(datasetFileName)

    # Configure a Zlib compressor: gzHeader enabled, level set to level9.
    compressor = Compressor_Zlib()
    compressor.parameter.gzHeader = True
    compressor.parameter.level = level9

    # Feed the raw data through a compression stream built on the compressor.
    comprStream = CompressionStream(compressor)
    comprStream.push_back(rawData)

    # Allocate a byte buffer of the reported compressed size and copy the
    # compressed bytes into it.
    compressedData = np.empty(comprStream.getCompressedDataSize(), dtype=np.uint8)
    comprStream.copyCompressedArray(compressedData)

    # Configure a Zlib decompressor with the same gzHeader setting as the
    # compressor.
    decompressor = Decompressor_Zlib()
    decompressor.parameter.gzHeader = True

    # Feed the compressed bytes through a decompression stream.
    deComprStream = DecompressionStream(decompressor)
    deComprStream.push_back(compressedData)

    # Allocate a byte buffer of the reported decompressed size and copy the
    # decompressed bytes into it.
    deCompressedData = np.empty(deComprStream.getDecompressedDataSize(), dtype=np.uint8)
    deComprStream.copyDecompressedArray(deCompressedData)

    # Compare the round-tripped data against the original and report.
    printCRC32(rawData, deCompressedData)