Context Navigation

source: thirdparty/SZ/sz/src/sz_float_pwr.c @ 9ee2ce3

Revision 9ee2ce3, 61.9 KB checked in by Hal Finkel <hfinkel@…>, 6 years ago (diff)
importing new SZ files
Property mode set to `100644`

Rev	Line
[2c47b73]	1	/**
	2	* @file sz_float_pwr.c
	3	* @author Sheng Di
	4	* @date Aug, 2016
	5	* @brief SZ_Init, Compression and Decompression functions
	6	* This file contains the compression/decompression functions related to point-wise relative errors
	7	* (C) 2016 by Mathematics and Computer Science (MCS), Argonne National Laboratory.
	8	* See COPYRIGHT in top-level directory.
	9	*/
	10
	11
	12	#include <stdio.h>
	13	#include <stdlib.h>
	14	#include <string.h>
	15	#include <unistd.h>
	16	#include <math.h>
	17	#include "sz.h"
	18	#include "CompressElement.h"
	19	#include "DynamicByteArray.h"
	20	#include "DynamicIntArray.h"
	21	#include "TightDataPointStorageF.h"
	22	#include "sz_float.h"
	23	#include "sz_float_pwr.h"
	24	#include "zlib.h"
	25	#include "rw.h"
[9ee2ce3]	26	#include "utility.h"
[2c47b73]	27
	28	void compute_segment_precisions_float_1D(float oriData, size_t dataLength, float pwrErrBound, unsigned char* pwrErrBoundBytes, double globalPrecision)
	29	{
	30	size_t i = 0, j = 0, k = 0;
	31	float realPrecision = oriData[0]!=0?fabs(confparams_cpr->pw_relBoundRatio*oriData[0]):confparams_cpr->pw_relBoundRatio;
	32	float approxPrecision;
	33	unsigned char realPrecBytes[4];
	34	float curPrecision;
	35	float curValue;
	36	float sum = 0;
	37	for(i=0;i<dataLength;i++)
	38	{
	39	curValue = oriData[i];
	40	if(i%confparams_cpr->segment_size==0&&i>0)
	41	{
	42	//get two first bytes of the realPrecision
	43	if(confparams_cpr->pwr_type==SZ_PWR_AVG_TYPE)
	44	{
	45	realPrecision = sum/confparams_cpr->segment_size;
	46	sum = 0;
	47	}
	48	realPrecision *= confparams_cpr->pw_relBoundRatio;
	49
	50	if(confparams_cpr->errorBoundMode==ABS_AND_PW_REL\|\|confparams_cpr->errorBoundMode==REL_AND_PW_REL)
	51	realPrecision = realPrecision<globalPrecision?realPrecision:globalPrecision;
	52	else if(confparams_cpr->errorBoundMode==ABS_OR_PW_REL\|\|confparams_cpr->errorBoundMode==REL_OR_PW_REL)
	53	realPrecision = realPrecision<globalPrecision?globalPrecision:realPrecision;
	54
	55	floatToBytes(realPrecBytes, realPrecision);
	56	realPrecBytes[2] = realPrecBytes[3] = 0;
	57	approxPrecision = bytesToFloat(realPrecBytes);
	58	//put the realPrecision in float* pwrErBound
	59	pwrErrBound[j++] = approxPrecision;
	60	//put the two bytes in pwrErrBoundBytes
	61	pwrErrBoundBytes[k++] = realPrecBytes[0];
	62	pwrErrBoundBytes[k++] = realPrecBytes[1];
	63
	64	realPrecision = fabs(curValue);
	65	}
	66
	67	if(curValue!=0)
	68	{
	69	curPrecision = fabs(curValue);
	70
	71	switch(confparams_cpr->pwr_type)
	72	{
	73	case SZ_PWR_MIN_TYPE:
	74	if(realPrecision>curPrecision)
	75	realPrecision = curPrecision;
	76	break;
	77	case SZ_PWR_AVG_TYPE:
	78	sum += curPrecision;
	79	break;
	80	case SZ_PWR_MAX_TYPE:
	81	if(realPrecision<curPrecision)
	82	realPrecision = curPrecision;
	83	break;
	84	}
	85	}
	86	}
	87	if(confparams_cpr->pwr_type==SZ_PWR_AVG_TYPE)
	88	{
	89	int size = dataLength%confparams_cpr->segment_size==0?confparams_cpr->segment_size:dataLength%confparams_cpr->segment_size;
	90	realPrecision = sum/size;
	91	}
	92	if(confparams_cpr->errorBoundMode==ABS_AND_PW_REL\|\|confparams_cpr->errorBoundMode==REL_AND_PW_REL)
	93	realPrecision = realPrecision<globalPrecision?realPrecision:globalPrecision;
	94	else if(confparams_cpr->errorBoundMode==ABS_OR_PW_REL\|\|confparams_cpr->errorBoundMode==REL_OR_PW_REL)
	95	realPrecision = realPrecision<globalPrecision?globalPrecision:realPrecision;
	96	floatToBytes(realPrecBytes, realPrecision);
	97	realPrecBytes[2] = realPrecBytes[3] = 0;
	98	approxPrecision = bytesToFloat(realPrecBytes);
	99	//put the realPrecision in float* pwrErBound
	100	pwrErrBound[j++] = approxPrecision;
	101	//put the two bytes in pwrErrBoundBytes
	102	pwrErrBoundBytes[k++] = realPrecBytes[0];
	103	pwrErrBoundBytes[k++] = realPrecBytes[1];
	104	}
	105
	106	unsigned int optimize_intervals_float_1D_pwr(float oriData, size_t dataLength, float pwrErrBound)
	107	{
	108	size_t i = 0, j = 0;
	109	float realPrecision = pwrErrBound[j++];
	110	unsigned long radiusIndex;
	111	float pred_value = 0, pred_err;
	112	int intervals = (int)malloc(confparams_cpr->maxRangeRadius*sizeof(int));
	113	memset(intervals, 0, confparams_cpr->maxRangeRadius*sizeof(int));
	114	int totalSampleSize = dataLength/confparams_cpr->sampleDistance;
	115	for(i=2;i<dataLength;i++)
	116	{
	117	if(i%confparams_cpr->segment_size==0)
	118	realPrecision = pwrErrBound[j++];
	119	if(i%confparams_cpr->sampleDistance==0)
	120	{
	121	//pred_value = 2*oriData[i-1] - oriData[i-2];
	122	pred_value = oriData[i-1];
	123	pred_err = fabs(pred_value - oriData[i]);
	124	radiusIndex = (unsigned long)((pred_err/realPrecision+1)/2);
	125	if(radiusIndex>=confparams_cpr->maxRangeRadius)
	126	radiusIndex = confparams_cpr->maxRangeRadius - 1;
	127	intervals[radiusIndex]++;
	128	}
	129	}
	130	//compute the appropriate number
	131	size_t targetCount = totalSampleSize*confparams_cpr->predThreshold;
	132	size_t sum = 0;
	133	for(i=0;i<confparams_cpr->maxRangeRadius;i++)
	134	{
	135	sum += intervals[i];
	136	if(sum>targetCount)
	137	break;
	138	}
	139	if(i>=confparams_cpr->maxRangeRadius)
	140	i = confparams_cpr->maxRangeRadius-1;
	141
	142	unsigned int accIntervals = 2*(i+1);
	143	unsigned int powerOf2 = roundUpToPowerOf2(accIntervals);
	144
	145	if(powerOf2<32)
	146	powerOf2 = 32;
	147
	148	free(intervals);
	149	//printf("accIntervals=%d, powerOf2=%d\n", accIntervals, powerOf2);
	150	return powerOf2;
	151	}
	152
	153	void compute_segment_precisions_float_2D(float oriData, float pwrErrBound,
	154	size_t r1, size_t r2, size_t R2, size_t edgeSize, unsigned char* pwrErrBoundBytes, float Min, float Max, double globalPrecision)
	155	{
	156	size_t i = 0, j = 0, k = 0, p = 0, index = 0, J = 0; //I=-1,J=-1 if they are needed
	157	float realPrecision;
	158	float approxPrecision;
	159	unsigned char realPrecBytes[4];
	160	float curValue, curAbsValue;
	161	float* statAbsValues = (float)malloc(R2sizeof(float));
	162
	163	float max = fabs(Min)<fabs(Max)?fabs(Max):fabs(Min); //get the max abs value.
	164	float min = fabs(Min)<fabs(Max)?fabs(Min):fabs(Max);
	165	for(i=0;i<R2;i++)
	166	{
	167	if(confparams_cpr->pwr_type == SZ_PWR_MIN_TYPE)
	168	statAbsValues[i] = max;
	169	else if(confparams_cpr->pwr_type == SZ_PWR_MAX_TYPE)
	170	statAbsValues[i] = min;
	171	else
	172	statAbsValues[i] = 0; //for SZ_PWR_AVG_TYPE
	173	}
	174	for(i=0;i<r1;i++)
	175	{
	176	for(j=0;j<r2;j++)
	177	{
	178	index = i*r2+j;
	179	curValue = oriData[index];
	180	if(((i%edgeSize==edgeSize-1 \|\| i==r1-1) &&j%edgeSize==0&&j>0) \|\| (i%edgeSize==0&&j==0&&i>0))
	181	{
	182	if(confparams_cpr->pwr_type==SZ_PWR_AVG_TYPE)
	183	{
	184	int a = edgeSize, b = edgeSize;
	185	if(j==0)
	186	{
	187	if(r2%edgeSize==0)
	188	b = edgeSize;
	189	else
	190	b = r2%edgeSize;
	191	}
	192	if(i==r1-1)
	193	{
	194	if(r1%edgeSize==0)
	195	a = edgeSize;
	196	else
	197	a = r1%edgeSize;
	198	}
	199	realPrecision = confparams_cpr->pw_relBoundRatiostatAbsValues[J]/(ab);
	200	}
	201	else
	202	realPrecision = confparams_cpr->pw_relBoundRatio*statAbsValues[J];
	203
	204	if(confparams_cpr->errorBoundMode==ABS_AND_PW_REL\|\|confparams_cpr->errorBoundMode==REL_AND_PW_REL)
	205	realPrecision = realPrecision<globalPrecision?realPrecision:globalPrecision;
	206	else if(confparams_cpr->errorBoundMode==ABS_OR_PW_REL\|\|confparams_cpr->errorBoundMode==REL_OR_PW_REL)
	207	realPrecision = realPrecision<globalPrecision?globalPrecision:realPrecision;
	208
	209	floatToBytes(realPrecBytes, realPrecision);
	210	realPrecBytes[2] = realPrecBytes[3] = 0;
	211	approxPrecision = bytesToFloat(realPrecBytes);
	212	//put the realPrecision in float* pwrErBound
	213	pwrErrBound[p++] = approxPrecision;
	214	//put the two bytes in pwrErrBoundBytes
	215	pwrErrBoundBytes[k++] = realPrecBytes[0];
	216	pwrErrBoundBytes[k++] = realPrecBytes[1];
	217
	218	if(confparams_cpr->pwr_type == SZ_PWR_MIN_TYPE)
	219	statAbsValues[J] = max;
	220	else if(confparams_cpr->pwr_type == SZ_PWR_MAX_TYPE)
	221	statAbsValues[J] = min;
	222	else
	223	statAbsValues[J] = 0; //for SZ_PWR_AVG_TYPE
	224	}
	225	if(j==0)
	226	J = 0;
	227	else if(j%edgeSize==0)
	228	J++;
	229	if(curValue!=0)
	230	{
	231	curAbsValue = fabs(curValue);
	232
	233	switch(confparams_cpr->pwr_type)
	234	{
	235	case SZ_PWR_MIN_TYPE:
	236	if(statAbsValues[J]>curAbsValue)
	237	statAbsValues[J] = curAbsValue;
	238	break;
	239	case SZ_PWR_AVG_TYPE:
	240	statAbsValues[J] += curAbsValue;
	241	break;
	242	case SZ_PWR_MAX_TYPE:
	243	if(statAbsValues[J]<curAbsValue)
	244	statAbsValues[J] = curAbsValue;
	245	break;
	246	}
	247	}
	248	}
	249	}
	250
	251	if(confparams_cpr->pwr_type==SZ_PWR_AVG_TYPE)
	252	{
	253	int a = edgeSize, b = edgeSize;
	254	if(r2%edgeSize==0)
	255	b = edgeSize;
	256	else
	257	b = r2%edgeSize;
	258	if(r1%edgeSize==0)
	259	a = edgeSize;
	260	else
	261	a = r1%edgeSize;
	262	realPrecision = confparams_cpr->pw_relBoundRatiostatAbsValues[J]/(ab);
	263	}
	264	else
	265	realPrecision = confparams_cpr->pw_relBoundRatio*statAbsValues[J];
	266
	267	if(confparams_cpr->errorBoundMode==ABS_AND_PW_REL\|\|confparams_cpr->errorBoundMode==REL_AND_PW_REL)
	268	realPrecision = realPrecision<globalPrecision?realPrecision:globalPrecision;
	269	else if(confparams_cpr->errorBoundMode==ABS_OR_PW_REL\|\|confparams_cpr->errorBoundMode==REL_OR_PW_REL)
	270	realPrecision = realPrecision<globalPrecision?globalPrecision:realPrecision;
	271
	272	floatToBytes(realPrecBytes, realPrecision);
	273	realPrecBytes[2] = realPrecBytes[3] = 0;
	274	approxPrecision = bytesToFloat(realPrecBytes);
	275	//put the realPrecision in float* pwrErBound
	276	pwrErrBound[p++] = approxPrecision;
	277	//put the two bytes in pwrErrBoundBytes
	278	pwrErrBoundBytes[k++] = realPrecBytes[0];
	279	pwrErrBoundBytes[k++] = realPrecBytes[1];
	280
	281	free(statAbsValues);
	282	}
	283
	284	unsigned int optimize_intervals_float_2D_pwr(float oriData, size_t r1, size_t r2, size_t R2, size_t edgeSize, float pwrErrBound)
	285	{
	286	size_t i = 0,j = 0, index, I=0, J=0;
	287	float realPrecision = pwrErrBound[0];
	288	unsigned long radiusIndex;
	289	float pred_value = 0, pred_err;
	290	int intervals = (int)malloc(confparams_cpr->maxRangeRadius*sizeof(int));
	291	memset(intervals, 0, confparams_cpr->maxRangeRadius*sizeof(int));
	292	size_t totalSampleSize = (r1-1)*(r2-1)/confparams_cpr->sampleDistance;
	293	size_t ir2;
	294	for(i=1;i<r1;i++)
	295	{
	296	ir2 = i*r2;
	297	if(i%edgeSize==0)
	298	{
	299	I++;
	300	J = 0;
	301	}
	302	for(j=1;j<r2;j++)
	303	{
	304	index = ir2+j;
	305	if(j%edgeSize==0)
	306	J++;
	307
	308	if((i+j)%confparams_cpr->sampleDistance==0)
	309	{
	310	realPrecision = pwrErrBound[I*R2+J];
	311	pred_value = oriData[index-1] + oriData[index-r2] - oriData[index-r2-1];
	312	pred_err = fabs(pred_value - oriData[index]);
	313	radiusIndex = (unsigned long)((pred_err/realPrecision+1)/2);
	314	if(radiusIndex>=confparams_cpr->maxRangeRadius)
	315	radiusIndex = confparams_cpr->maxRangeRadius - 1;
	316	intervals[radiusIndex]++;
	317	}
	318	}
	319	}
	320	//compute the appropriate number
	321	size_t targetCount = totalSampleSize*confparams_cpr->predThreshold;
	322	size_t sum = 0;
	323	for(i=0;i<confparams_cpr->maxRangeRadius;i++)
	324	{
	325	sum += intervals[i];
	326	if(sum>targetCount)
	327	break;
	328	}
	329	if(i>=confparams_cpr->maxRangeRadius)
	330	i = confparams_cpr->maxRangeRadius-1;
	331	unsigned int accIntervals = 2*(i+1);
	332	unsigned int powerOf2 = roundUpToPowerOf2(accIntervals);
	333
	334	if(powerOf2<32)
	335	powerOf2 = 32;
	336
	337	free(intervals);
	338	//printf("confparams_cpr->maxRangeRadius = %d, accIntervals=%d, powerOf2=%d\n", confparams_cpr->maxRangeRadius, accIntervals, powerOf2);
	339	return powerOf2;
	340	}
	341
	342	void compute_segment_precisions_float_3D(float oriData, float pwrErrBound,
	343	size_t r1, size_t r2, size_t r3, size_t R2, size_t R3, size_t edgeSize, unsigned char* pwrErrBoundBytes, float Min, float Max, double globalPrecision)
	344	{
	345	size_t i = 0, j = 0, k = 0, p = 0, q = 0, index = 0, J = 0, K = 0; //I=-1,J=-1 if they are needed
	346	size_t r23 = r2*r3, ir, jr;
	347	float realPrecision;
	348	float approxPrecision;
	349	unsigned char realPrecBytes[4];
	350	float curValue, curAbsValue;
	351
	352	float** statAbsValues = create2DArray_float(R2, R3);
	353	float max = fabs(Min)<fabs(Max)?fabs(Max):fabs(Min); //get the max abs value.
	354	float min = fabs(Min)<fabs(Max)?fabs(Min):fabs(Max);
	355
	356	for(i=0;i<R2;i++)
	357	for(j=0;j<R3;j++)
	358	{
	359	if(confparams_cpr->pwr_type == SZ_PWR_MIN_TYPE)
	360	statAbsValues[i][j] = max;
	361	else if(confparams_cpr->pwr_type == SZ_PWR_MAX_TYPE)
	362	statAbsValues[i][j] = min;
	363	else
	364	statAbsValues[i][j] = 0;
	365	}
	366	for(i=0;i<r1;i++)
	367	{
	368	ir = i*r23;
	369	if(i%edgeSize==0&&i>0)
	370	{
	371	realPrecision = confparams_cpr->pw_relBoundRatio*statAbsValues[J][K];
	372	floatToBytes(realPrecBytes, realPrecision);
	373	memset(&realPrecBytes[2], 0, 2);
	374	approxPrecision = bytesToFloat(realPrecBytes);
	375	//put the realPrecision in float* pwrErBound
	376	pwrErrBound[p++] = approxPrecision;
	377	//put the two bytes in pwrErrBoundBytes
	378	//printf("q=%d, i=%d, j=%d, k=%d\n",q,i,j,k);
	379	pwrErrBoundBytes[q++] = realPrecBytes[0];
	380	pwrErrBoundBytes[q++] = realPrecBytes[1];
	381	if(confparams_cpr->pwr_type == SZ_PWR_MIN_TYPE)
	382	statAbsValues[J][K] = max;
	383	else if(confparams_cpr->pwr_type == SZ_PWR_MAX_TYPE)
	384	statAbsValues[J][K] = min;
	385
	386	}
	387	for(j=0;j<r2;j++)
	388	{
	389	jr = j*r3;
	390	if((i%edgeSize==edgeSize-1 \|\| i == r1-1)&&j%edgeSize==0&&j>0)
	391	{
	392	realPrecision = confparams_cpr->pw_relBoundRatio*statAbsValues[J][K];
	393	floatToBytes(realPrecBytes, realPrecision);
	394	memset(&realPrecBytes[2], 0, 2);
	395	approxPrecision = bytesToFloat(realPrecBytes);
	396	//put the realPrecision in float* pwrErBound
	397	pwrErrBound[p++] = approxPrecision;
	398	//put the two bytes in pwrErrBoundBytes
	399	//printf("q=%d, i=%d, j=%d, k=%d\n",q,i,j,k);
	400	pwrErrBoundBytes[q++] = realPrecBytes[0];
	401	pwrErrBoundBytes[q++] = realPrecBytes[1];
	402	if(confparams_cpr->pwr_type == SZ_PWR_MIN_TYPE)
	403	statAbsValues[J][K] = max;
	404	else if(confparams_cpr->pwr_type == SZ_PWR_MAX_TYPE)
	405	statAbsValues[J][K] = min;
	406	}
	407
	408	if(j==0)
	409	J = 0;
	410	else if(j%edgeSize==0)
	411	J++;
	412
	413	for(k=0;k<r3;k++)
	414	{
	415	index = ir+jr+k;
	416	curValue = oriData[index];
	417	if((i%edgeSize==edgeSize-1 \|\| i == r1-1)&&(j%edgeSize==edgeSize-1\|\|j==r2-1)&&k%edgeSize==0&&k>0)
	418	{
	419	realPrecision = confparams_cpr->pw_relBoundRatio*statAbsValues[J][K];
	420	floatToBytes(realPrecBytes, realPrecision);
	421	memset(&realPrecBytes[2], 0, 2);
	422	approxPrecision = bytesToFloat(realPrecBytes);
	423	//put the realPrecision in float* pwrErBound
	424	pwrErrBound[p++] = approxPrecision;
	425	//put the two bytes in pwrErrBoundBytes
	426	//printf("q=%d, i=%d, j=%d, k=%d\n",q,i,j,k);
	427	pwrErrBoundBytes[q++] = realPrecBytes[0];
	428	pwrErrBoundBytes[q++] = realPrecBytes[1];
	429
	430	if(confparams_cpr->pwr_type == SZ_PWR_MIN_TYPE)
	431	statAbsValues[J][K] = max;
	432	else if(confparams_cpr->pwr_type == SZ_PWR_MAX_TYPE)
	433	statAbsValues[J][K] = min;
	434	}
	435
	436	if(k==0)
	437	K = 0;
	438	else if(k%edgeSize==0)
	439	K++;
	440
	441	if(curValue!=0)
	442	{
	443	curAbsValue = fabs(curValue);
	444	if(confparams_cpr->pwr_type == SZ_PWR_MIN_TYPE)
	445	{
	446	if(statAbsValues[J][K]>curAbsValue)
	447	{
	448	statAbsValues[J][K] = curAbsValue;
	449	}
	450	}
	451	else if(confparams_cpr->pwr_type == SZ_PWR_MAX_TYPE)
	452	{
	453	if(statAbsValues[J][K]<curAbsValue)
	454	{
	455	statAbsValues[J][K] = curAbsValue;
	456	}
	457	}
	458	}
	459	}
	460	}
	461	}
	462
	463	realPrecision = confparams_cpr->pw_relBoundRatio*statAbsValues[J][K];
	464	floatToBytes(realPrecBytes, realPrecision);
	465	realPrecBytes[2] = realPrecBytes[3] = 0;
	466	approxPrecision = bytesToFloat(realPrecBytes);
	467	//put the realPrecision in float* pwrErBound
	468	pwrErrBound[p++] = approxPrecision;
	469	//put the two bytes in pwrErrBoundBytes
	470	pwrErrBoundBytes[q++] = realPrecBytes[0];
	471	pwrErrBoundBytes[q++] = realPrecBytes[1];
	472
	473	free2DArray_float(statAbsValues, R2);
	474	}
	475
	476	unsigned int optimize_intervals_float_3D_pwr(float oriData, size_t r1, size_t r2, size_t r3, size_t R2, size_t R3, size_t edgeSize, float pwrErrBound)
	477	{
	478	size_t i,j,k, ir,jr,index, I = 0,J=0,K=0;
	479	float realPrecision = pwrErrBound[0];
	480	unsigned long radiusIndex;
	481	size_t r23=r2*r3;
	482	size_t R23 = R2*R3;
	483	float pred_value = 0, pred_err;
	484	int intervals = (int)malloc(confparams_cpr->maxRangeRadius*sizeof(int));
	485	memset(intervals, 0, confparams_cpr->maxRangeRadius*sizeof(int));
	486	size_t totalSampleSize = (r1-1)(r2-1)(r3-1)/confparams_cpr->sampleDistance;
	487	for(i=1;i<r1;i++)
	488	{
	489	ir = i*r23;
	490	if(i%edgeSize==0)
	491	{
	492	I++;
	493	J = 0;
	494	}
	495	for(j=1;j<r2;j++)
	496	{
	497	jr = j*r3;
	498	if(j%edgeSize==0)
	499	{
	500	J++;
	501	K = 0;
	502	}
	503	for(k=1;k<r3;k++)
	504	{
	505	index = ir+jr+k;
	506	if(k%edgeSize==0)
	507	K++;
	508	if((i+j+k)%confparams_cpr->sampleDistance==0)
	509	{
	510	realPrecision = pwrErrBound[IR23+JR2+K];
	511	pred_value = oriData[index-1] + oriData[index-r3] + oriData[index-r23]
	512	- oriData[index-1-r23] - oriData[index-r3-1] - oriData[index-r3-r23] + oriData[index-r3-r23-1];
	513	pred_err = fabs(pred_value - oriData[index]);
	514	radiusIndex = (unsigned long)((pred_err/realPrecision+1)/2);
	515	if(radiusIndex>=confparams_cpr->maxRangeRadius)
	516	radiusIndex = confparams_cpr->maxRangeRadius - 1;
	517	intervals[radiusIndex]++;
	518	}
	519	}
	520	}
	521	}
	522	//compute the appropriate number
	523	size_t targetCount = totalSampleSize*confparams_cpr->predThreshold;
	524	size_t sum = 0;
	525	for(i=0;i<confparams_cpr->maxRangeRadius;i++)
	526	{
	527	sum += intervals[i];
	528	if(sum>targetCount)
	529	break;
	530	}
	531	if(i>=confparams_cpr->maxRangeRadius)
	532	i = confparams_cpr->maxRangeRadius-1;
	533	unsigned int accIntervals = 2*(i+1);
	534	unsigned int powerOf2 = roundUpToPowerOf2(accIntervals);
	535
	536	if(powerOf2<32)
	537	powerOf2 = 32;
	538
	539	free(intervals);
	540	//printf("accIntervals=%d, powerOf2=%d\n", accIntervals, powerOf2);
	541	return powerOf2;
	542	}
	543
	544	void SZ_compress_args_float_NoCkRngeNoGzip_1D_pwr(unsigned char** newByteData, float *oriData, double globalPrecision,
	545	size_t dataLength, size_t *outSize, float min, float max)
	546	{
	547	size_t pwrLength = dataLength%confparams_cpr->segment_size==0?dataLength/confparams_cpr->segment_size:dataLength/confparams_cpr->segment_size+1;
	548	float* pwrErrBound = (float)malloc(sizeof(float)pwrLength);
	549	size_t pwrErrBoundBytes_size = sizeof(unsigned char)pwrLength2;
	550	unsigned char* pwrErrBoundBytes = (unsigned char*)malloc(pwrErrBoundBytes_size);
	551
	552	compute_segment_precisions_float_1D(oriData, dataLength, pwrErrBound, pwrErrBoundBytes, globalPrecision);
	553
	554	unsigned int quantization_intervals;
	555	if(exe_params->optQuantMode==1)
	556	{
	557	quantization_intervals = optimize_intervals_float_1D_pwr(oriData, dataLength, pwrErrBound);
	558	updateQuantizationInfo(quantization_intervals);
	559	}
	560	else
	561	quantization_intervals = exe_params->intvCapacity;
	562	size_t i = 0, j = 0;
	563	int reqLength;
	564	float realPrecision = pwrErrBound[j++];
	565	float medianValue = 0;
	566	float radius = fabs(max)<fabs(min)?fabs(min):fabs(max);
	567	short radExpo = getExponent_float(radius);
	568
	569	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	570
	571	int* type = (int) malloc(dataLengthsizeof(int));
	572	//type[dataLength]=0;
	573
	574	float* spaceFillingValue = oriData; //
	575
	576	DynamicByteArray *resiBitLengthArray;
	577	new_DBA(&resiBitLengthArray, DynArrayInitLen);
	578
	579	DynamicIntArray *exactLeadNumArray;
	580	new_DIA(&exactLeadNumArray, DynArrayInitLen);
	581
	582	DynamicByteArray *exactMidByteArray;
	583	new_DBA(&exactMidByteArray, DynArrayInitLen);
	584
	585	DynamicIntArray *resiBitArray;
	586	new_DIA(&resiBitArray, DynArrayInitLen);
	587
	588	type[0] = 0;
	589
	590	unsigned char preDataBytes[4] = {0};
	591	intToBytes_bigEndian(preDataBytes, 0);
	592
	593	int reqBytesLength = reqLength/8;
	594	int resiBitsLength = reqLength%8;
	595	float last3CmprsData[3] = {0};
	596
	597	FloatValueCompressElement vce = (FloatValueCompressElement)malloc(sizeof(FloatValueCompressElement));
	598	LossyCompressionElement lce = (LossyCompressionElement)malloc(sizeof(LossyCompressionElement));
	599
	600	//add the first data
	601	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	602	compressSingleFloatValue(vce, spaceFillingValue[0], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	603	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	604	memcpy(preDataBytes,vce->curBytes,4);
	605	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	606	listAdd_float(last3CmprsData, vce->data);
	607	//printf("%.30G\n",last3CmprsData[0]);
	608
	609	//add the second data
	610	type[1] = 0;
	611	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	612	compressSingleFloatValue(vce, spaceFillingValue[1], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	613	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	614	memcpy(preDataBytes,vce->curBytes,4);
	615	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	616	listAdd_float(last3CmprsData, vce->data);
	617	//printf("%.30G\n",last3CmprsData[0]);
	618
	619	int state;
	620	double checkRadius;
	621	float curData;
	622	float pred;
	623	double predAbsErr;
	624	checkRadius = (exe_params->intvCapacity-1)*realPrecision;
	625	double interval = 2*realPrecision;
	626	int updateReqLength = 0; //a marker: 1 means already updated
	627
	628	for(i=2;i<dataLength;i++)
	629	{
	630	curData = spaceFillingValue[i];
	631	if(i%confparams_cpr->segment_size==0)
	632	{
	633	realPrecision = pwrErrBound[j++];
	634	checkRadius = (exe_params->intvCapacity-1)*realPrecision;
	635	interval = 2*realPrecision;
	636	updateReqLength = 0;
	637	}
	638	//pred = 2*last3CmprsData[0] - last3CmprsData[1];
	639	pred = last3CmprsData[0];
	640	predAbsErr = fabs(curData - pred);
	641	if(predAbsErr<checkRadius)
	642	{
	643	state = (predAbsErr/realPrecision+1)/2;
	644	if(curData>=pred)
	645	{
	646	type[i] = exe_params->intvRadius+state;
	647	pred = pred + state*interval;
	648	}
	649	else //curData<pred
	650	{
	651	type[i] = exe_params->intvRadius-state;
	652	pred = pred - state*interval;
	653	}
	654	listAdd_float(last3CmprsData, pred);
	655	continue;
	656	}
	657
	658	//unpredictable data processing
	659	if(updateReqLength==0)
	660	{
	661	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	662	reqBytesLength = reqLength/8;
	663	resiBitsLength = reqLength%8;
	664	updateReqLength = 1;
	665	}
	666
	667	type[i] = 0;
	668	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	669
	670	compressSingleFloatValue(vce, curData, realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	671	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	672	memcpy(preDataBytes,vce->curBytes,4);
	673	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	674
	675	listAdd_float(last3CmprsData, vce->data);
	676	}//end of for
	677
	678	// char* expSegmentsInBytes;
	679	// int expSegmentsInBytes_size = convertESCToBytes(esc, &expSegmentsInBytes);
	680	int exactDataNum = exactLeadNumArray->size;
	681
	682	TightDataPointStorageF* tdps;
	683
	684	new_TightDataPointStorageF2(&tdps, dataLength, exactDataNum,
	685	type, exactMidByteArray->array, exactMidByteArray->size,
	686	exactLeadNumArray->array,
	687	resiBitArray->array, resiBitArray->size,
	688	resiBitLengthArray->array, resiBitLengthArray->size,
	689	realPrecision, medianValue, (char)reqLength, quantization_intervals, pwrErrBoundBytes, pwrErrBoundBytes_size, radExpo);
	690
	691	//sdi:Debug
	692	/* int sum =0;
	693	for(i=0;i<dataLength;i++)
	694	if(type[i]==0) sum++;
	695	printf("opt_quantizations=%d, exactDataNum=%d, sum=%d\n",quantization_intervals, exactDataNum, sum);
	696	*/
	697	// writeUShortData(type, dataLength, "compressStateBytes.sb");
	698	// unsigned short type_[dataLength];
	699	// SZ_Reset();
	700	// decode_withTree(tdps->typeArray, tdps->typeArray_size, type_);
	701	// printf("tdps->typeArray_size=%d\n", tdps->typeArray_size);
	702
	703	//free memory
	704	free_DBA(resiBitLengthArray);
	705	free_DIA(exactLeadNumArray);
	706	free_DIA(resiBitArray);
	707	free(type);
	708
	709	convertTDPStoFlatBytes_float(tdps, newByteData, outSize);
	710
	711	int floatSize=sizeof(float);
	712	if(outSize>dataLengthfloatSize)
	713	{
	714	size_t k = 0, i;
	715	tdps->isLossless = 1;
	716	size_t totalByteLength = 3 + exe_params->SZ_SIZE_TYPE + 1 + floatSize*dataLength;
	717	newByteData = (unsigned char)malloc(totalByteLength);
	718
	719	unsigned char dsLengthBytes[exe_params->SZ_SIZE_TYPE];
	720	intToBytes_bigEndian(dsLengthBytes, dataLength);//4
	721	for (i = 0; i < 3; i++)//3
	722	(*newByteData)[k++] = versionNumber[i];
	723
	724	if(exe_params->SZ_SIZE_TYPE==4)
	725	{
	726	(*newByteData)[k++] = 16; //=00010000
	727	}
	728	else
	729	{
	730	(*newByteData)[k++] = 80;
	731	}
	732	for (i = 0; i < exe_params->SZ_SIZE_TYPE; i++)//4 or 8
	733	(*newByteData)[k++] = dsLengthBytes[i];
	734
	735
	736	if(sysEndianType==BIG_ENDIAN_SYSTEM)
	737	memcpy((newByteData)+4+exe_params->SZ_SIZE_TYPE, oriData, dataLengthfloatSize);
	738	else
	739	{
	740	unsigned char* p = (*newByteData)+4+exe_params->SZ_SIZE_TYPE;
	741	for(i=0;i<dataLength;i++,p+=floatSize)
	742	floatToBytes(p, oriData[i]);
	743	}
	744	*outSize = totalByteLength;
	745	}
	746
	747	free(pwrErrBound);
	748
	749	free(vce);
	750	free(lce);
	751	free_TightDataPointStorageF(tdps);
	752	free(exactMidByteArray);
	753	}
	754
	755	void SZ_compress_args_float_NoCkRngeNoGzip_2D_pwr(unsigned char** newByteData, float *oriData, double globalPrecision, size_t r1, size_t r2,
	756	size_t *outSize, float min, float max)
	757	{
	758	size_t dataLength=r1*r2;
	759	int blockEdgeSize = computeBlockEdgeSize_2D(confparams_cpr->segment_size);
	760	size_t R1 = 1+(r1-1)/blockEdgeSize;
	761	size_t R2 = 1+(r2-1)/blockEdgeSize;
	762	float* pwrErrBound = (float)malloc(sizeof(float)R1*R2);
	763	size_t pwrErrBoundBytes_size = sizeof(unsigned char)R1R2*2;
	764	unsigned char* pwrErrBoundBytes = (unsigned char*)malloc(pwrErrBoundBytes_size);
	765
	766	compute_segment_precisions_float_2D(oriData, pwrErrBound, r1, r2, R2, blockEdgeSize, pwrErrBoundBytes, min, max, globalPrecision);
	767
	768	unsigned int quantization_intervals;
	769	if(exe_params->optQuantMode==1)
	770	{
	771	quantization_intervals = optimize_intervals_float_2D_pwr(oriData, r1, r2, R2, blockEdgeSize, pwrErrBound);
	772	updateQuantizationInfo(quantization_intervals);
	773	}
	774	else
	775	quantization_intervals = exe_params->intvCapacity;
	776	//printf("quantization_intervals=%d\n",quantization_intervals);
	777
	778	size_t i=0,j=0,I=0,J=0;
	779	int reqLength;
	780	float realPrecision = pwrErrBound[I*R2+J];
	781	float pred1D, pred2D;
	782	float diff = 0.0;
	783	double itvNum = 0;
	784	float P0, P1;
	785
	786	P0 = (float)malloc(r2sizeof(float));
	787	memset(P0, 0, r2*sizeof(float));
	788	P1 = (float)malloc(r2sizeof(float));
	789	memset(P1, 0, r2*sizeof(float));
	790
	791	float medianValue = 0;
	792	float radius = fabs(max)<fabs(min)?fabs(min):fabs(max);
	793	short radExpo = getExponent_float(radius);
	794	int updateReqLength = 1;
	795
	796	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	797
	798	int* type = (int) malloc(dataLengthsizeof(int));
	799	//type[dataLength]=0;
	800
	801	float* spaceFillingValue = oriData; //
	802
	803	DynamicByteArray *resiBitLengthArray;
	804	new_DBA(&resiBitLengthArray, DynArrayInitLen);
	805
	806	DynamicIntArray *exactLeadNumArray;
	807	new_DIA(&exactLeadNumArray, DynArrayInitLen);
	808
	809	DynamicByteArray *exactMidByteArray;
	810	new_DBA(&exactMidByteArray, DynArrayInitLen);
	811
	812	DynamicIntArray *resiBitArray;
	813	new_DIA(&resiBitArray, DynArrayInitLen);
	814
	815	type[0] = 0;
	816
	817	unsigned char preDataBytes[4];
	818	intToBytes_bigEndian(preDataBytes, 0);
	819
	820	int reqBytesLength = reqLength/8;
	821	int resiBitsLength = reqLength%8;
	822
	823	FloatValueCompressElement vce = (FloatValueCompressElement)malloc(sizeof(FloatValueCompressElement));
	824	LossyCompressionElement lce = (LossyCompressionElement)malloc(sizeof(LossyCompressionElement));
	825
	826	/* Process Row-0 data 0*/
	827	type[0] = 0;
	828	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	829	compressSingleFloatValue(vce, spaceFillingValue[0], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	830	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	831	memcpy(preDataBytes,vce->curBytes,4);
	832	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	833	P1[0] = vce->data;
	834
	835	/* Process Row-0 data 1*/
	836	pred1D = P1[0];
	837	diff = spaceFillingValue[1] - pred1D;
	838
	839	itvNum = fabs(diff)/realPrecision + 1;
	840
	841	if (itvNum < exe_params->intvCapacity)
	842	{
	843	if (diff < 0) itvNum = -itvNum;
	844	type[1] = (int) (itvNum/2) + exe_params->intvRadius;
	845	P1[1] = pred1D + 2 * (type[1] - exe_params->intvRadius) * realPrecision;
	846	}
	847	else
	848	{
	849	type[1] = 0;
	850
	851	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	852	compressSingleFloatValue(vce, spaceFillingValue[1], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	853	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	854	memcpy(preDataBytes,vce->curBytes,4);
	855	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	856	P1[1] = vce->data;
	857	}
	858
	859	/* Process Row-0 data 2 --> data r2-1 */
	860	for (j = 2; j < r2; j++)
	861	{
	862	if(j%blockEdgeSize==0)
	863	{
	864	J++;
	865	realPrecision = pwrErrBound[I*R2+J];
	866	updateReqLength = 0;
	867	}
	868
	869	pred1D = 2*P1[j-1] - P1[j-2];
	870	diff = spaceFillingValue[j] - pred1D;
	871
	872	itvNum = fabs(diff)/realPrecision + 1;
	873
	874	if (itvNum < exe_params->intvCapacity)
	875	{
	876	if (diff < 0) itvNum = -itvNum;
	877	type[j] = (int) (itvNum/2) + exe_params->intvRadius;
	878	P1[j] = pred1D + 2 * (type[j] - exe_params->intvRadius) * realPrecision;
	879	}
	880	else
	881	{
	882	if(updateReqLength==0)
	883	{
	884	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	885	reqBytesLength = reqLength/8;
	886	resiBitsLength = reqLength%8;
	887	updateReqLength = 1;
	888	}
	889
	890	type[j] = 0;
	891
	892	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	893	compressSingleFloatValue(vce, spaceFillingValue[j], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	894	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	895	memcpy(preDataBytes,vce->curBytes,4);
	896	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	897	P1[j] = vce->data;
	898	}
	899	}
	900
	901	/* Process Row-1 --> Row-r1-1 */
	902	size_t index;
	903	for (i = 1; i < r1; i++)
	904	{
	905	/* Process row-i data 0 */
	906	index = i*r2;
	907	J = 0;
	908	if(i%blockEdgeSize==0)
	909	I++;
	910	realPrecision = pwrErrBound[I*R2+J]; //J==0
	911	updateReqLength = 0;
	912
	913	pred1D = P1[0];
	914	diff = spaceFillingValue[index] - pred1D;
	915
	916	itvNum = fabs(diff)/realPrecision + 1;
	917
	918	if (itvNum < exe_params->intvCapacity)
	919	{
	920	if (diff < 0) itvNum = -itvNum;
	921	type[index] = (int) (itvNum/2) + exe_params->intvRadius;
	922	P0[0] = pred1D + 2 * (type[index] - exe_params->intvRadius) * realPrecision;
	923	}
	924	else
	925	{
	926	if(updateReqLength==0)
	927	{
	928	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	929	reqBytesLength = reqLength/8;
	930	resiBitsLength = reqLength%8;
	931	updateReqLength = 1;
	932	}
	933
	934	type[index] = 0;
	935
	936	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	937	compressSingleFloatValue(vce, spaceFillingValue[index], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	938	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	939	memcpy(preDataBytes,vce->curBytes,4);
	940	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	941	P0[0] = vce->data;
	942	}
	943
	944	/* Process row-i data 1 --> r2-1*/
	945	for (j = 1; j < r2; j++)
	946	{
	947	index = i*r2+j;
	948
	949	if(j%blockEdgeSize==0)
	950	{
	951	J++;
	952	realPrecision = pwrErrBound[I*R2+J];
	953	updateReqLength = 0;
	954	}
	955	pred2D = P0[j-1] + P1[j] - P1[j-1];
	956
	957	diff = spaceFillingValue[index] - pred2D;
	958
	959	itvNum = fabs(diff)/realPrecision + 1;
	960
	961	if (itvNum < exe_params->intvCapacity)
	962	{
	963	if (diff < 0) itvNum = -itvNum;
	964	type[index] = (int) (itvNum/2) + exe_params->intvRadius;
	965	P0[j] = pred2D + 2 * (type[index] - exe_params->intvRadius) * realPrecision;
	966	}
	967	else
	968	{
	969	if(updateReqLength==0)
	970	{
	971	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	972	reqBytesLength = reqLength/8;
	973	resiBitsLength = reqLength%8;
	974	updateReqLength = 1;
	975	}
	976
	977	type[index] = 0;
	978
	979	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	980	compressSingleFloatValue(vce, spaceFillingValue[index], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	981	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	982	memcpy(preDataBytes,vce->curBytes,4);
	983	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	984	P0[j] = vce->data;
	985	}
	986	}
	987
	988	float *Pt;
	989	Pt = P1;
	990	P1 = P0;
	991	P0 = Pt;
	992	}
	993
	994	if(r2!=1)
	995	free(P0);
	996	free(P1);
	997	int exactDataNum = exactLeadNumArray->size;
	998
	999	TightDataPointStorageF* tdps;
	1000
	1001	new_TightDataPointStorageF2(&tdps, dataLength, exactDataNum,
	1002	type, exactMidByteArray->array, exactMidByteArray->size,
	1003	exactLeadNumArray->array,
	1004	resiBitArray->array, resiBitArray->size,
	1005	resiBitLengthArray->array, resiBitLengthArray->size,
	1006	realPrecision, medianValue, (char)reqLength, quantization_intervals, pwrErrBoundBytes, pwrErrBoundBytes_size, radExpo);
	1007
	1008	//free memory
	1009	free_DBA(resiBitLengthArray);
	1010	free_DIA(exactLeadNumArray);
	1011	free_DIA(resiBitArray);
	1012	free(type);
	1013
	1014	convertTDPStoFlatBytes_float(tdps, newByteData, outSize);
	1015
	1016	free(pwrErrBound);
	1017
	1018	free(vce);
	1019	free(lce);
	1020	free_TightDataPointStorageF(tdps);
	1021	free(exactMidByteArray);
	1022	}
	1023
	1024	void SZ_compress_args_float_NoCkRngeNoGzip_3D_pwr(unsigned char** newByteData, float *oriData, double globalPrecision,
	1025	size_t r1, size_t r2, size_t r3, size_t *outSize, float min, float max)
	1026	{
	1027	size_t dataLength=r1r2r3;
	1028
	1029	int blockEdgeSize = computeBlockEdgeSize_3D(confparams_cpr->segment_size);
	1030	size_t R1 = 1+(r1-1)/blockEdgeSize;
	1031	size_t R2 = 1+(r2-1)/blockEdgeSize;
	1032	size_t R3 = 1+(r3-1)/blockEdgeSize;
	1033	float* pwrErrBound = (float)malloc(sizeof(float)R1R2R3);
	1034	size_t pwrErrBoundBytes_size = sizeof(unsigned char)R1R2R32;
	1035	unsigned char* pwrErrBoundBytes = (unsigned char*)malloc(pwrErrBoundBytes_size);
	1036
	1037	compute_segment_precisions_float_3D(oriData, pwrErrBound, r1, r2, r3, R2, R3, blockEdgeSize, pwrErrBoundBytes, min, max, globalPrecision);
	1038
	1039	unsigned int quantization_intervals;
	1040	if(exe_params->optQuantMode==1)
	1041	{
	1042	quantization_intervals = optimize_intervals_float_3D_pwr(oriData, r1, r2, r3, R2, R3, blockEdgeSize, pwrErrBound);
	1043	updateQuantizationInfo(quantization_intervals);
	1044	}
	1045	else
	1046	quantization_intervals = exe_params->intvCapacity;
	1047	size_t i=0,j=0,k=0, I = 0, J = 0, K = 0;
	1048	int reqLength;
	1049	float realPrecision = pwrErrBound[0];
	1050	float pred1D, pred2D, pred3D;
	1051	float diff = 0.0;
	1052	double itvNum = 0;
	1053	float P0, P1;
	1054
	1055	size_t r23 = r2*r3;
	1056	size_t R23 = R2*R3;
	1057	P0 = (float)malloc(r23sizeof(float));
	1058	P1 = (float)malloc(r23sizeof(float));
	1059	float radius = fabs(max)<fabs(min)?fabs(min):fabs(max);
	1060	float medianValue = 0;
	1061	short radExpo = getExponent_float(radius);
	1062	int updateReqLength = 0;
	1063
	1064	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	1065
	1066	int* type = (int) malloc(dataLengthsizeof(int));
	1067	//type[dataLength]=0;realPrecision
	1068
	1069	float* spaceFillingValue = oriData; //
	1070
	1071	DynamicByteArray *resiBitLengthArray;
	1072	new_DBA(&resiBitLengthArray, DynArrayInitLen);
	1073
	1074	DynamicIntArray *exactLeadNumArray;
	1075	new_DIA(&exactLeadNumArray, DynArrayInitLen);
	1076
	1077	DynamicByteArray *exactMidByteArray;
	1078	new_DBA(&exactMidByteArray, DynArrayInitLen);
	1079
	1080	DynamicIntArray *resiBitArray;
	1081	new_DIA(&resiBitArray, DynArrayInitLen);
	1082
	1083	type[0] = 0;
	1084
	1085	unsigned char preDataBytes[4];
	1086	intToBytes_bigEndian(preDataBytes, 0);
	1087
	1088	int reqBytesLength = reqLength/8;
	1089	int resiBitsLength = reqLength%8;
	1090
	1091	FloatValueCompressElement vce = (FloatValueCompressElement)malloc(sizeof(FloatValueCompressElement));
	1092	LossyCompressionElement lce = (LossyCompressionElement)malloc(sizeof(LossyCompressionElement));
	1093
	1094
	1095	/////////////////////////// Process layer-0 ///////////////////////////
	1096	/* Process Row-0 data 0*/
	1097	type[0] = 0;
	1098	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	1099	compressSingleFloatValue(vce, spaceFillingValue[0], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1100	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1101	memcpy(preDataBytes,vce->curBytes,4);
	1102	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1103	P1[0] = vce->data;
	1104
	1105	/* Process Row-0 data 1*/
	1106	pred1D = P1[0];
	1107	diff = spaceFillingValue[1] - pred1D;
	1108
	1109	itvNum = fabs(diff)/realPrecision + 1;
	1110
	1111	if (itvNum < exe_params->intvCapacity)
	1112	{
	1113	if (diff < 0) itvNum = -itvNum;
	1114	type[1] = (int) (itvNum/2) + exe_params->intvRadius;
	1115	P1[1] = pred1D + 2 * (type[1] - exe_params->intvRadius) * realPrecision;
	1116	}
	1117	else
	1118	{
	1119	if(updateReqLength==0)
	1120	{
	1121	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	1122	reqBytesLength = reqLength/8;
	1123	resiBitsLength = reqLength%8;
	1124	updateReqLength = 1;
	1125	}
	1126
	1127	type[1] = 0;
	1128
	1129	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	1130	compressSingleFloatValue(vce, spaceFillingValue[1], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1131	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1132	memcpy(preDataBytes,vce->curBytes,4);
	1133	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1134	P1[1] = vce->data;
	1135	}
	1136
	1137	/* Process Row-0 data 2 --> data r3-1 */
	1138	for (j = 2; j < r3; j++)
	1139	{
	1140	if(j%blockEdgeSize==0)
	1141	{
	1142	J++;
	1143	realPrecision = pwrErrBound[J];
	1144	updateReqLength = 0;
	1145	}
	1146	pred1D = 2*P1[j-1] - P1[j-2];
	1147	diff = spaceFillingValue[j] - pred1D;
	1148
	1149	itvNum = fabs(diff)/realPrecision + 1;
	1150
	1151	if (itvNum < exe_params->intvCapacity)
	1152	{
	1153	if (diff < 0) itvNum = -itvNum;
	1154	type[j] = (int) (itvNum/2) + exe_params->intvRadius;
	1155	P1[j] = pred1D + 2 * (type[j] - exe_params->intvRadius) * realPrecision;
	1156	}
	1157	else
	1158	{
	1159	if(updateReqLength==0)
	1160	{
	1161	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	1162	reqBytesLength = reqLength/8;
	1163	resiBitsLength = reqLength%8;
	1164	updateReqLength = 1;
	1165	}
	1166
	1167	type[j] = 0;
	1168
	1169	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	1170	compressSingleFloatValue(vce, spaceFillingValue[j], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1171	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1172	memcpy(preDataBytes,vce->curBytes,4);
	1173	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1174	P1[j] = vce->data;
	1175	}
	1176	}
	1177
	1178	/* Process Row-1 --> Row-r2-1 */
	1179	size_t index;
	1180	K = 0;
	1181	for (i = 1; i < r2; i++)
	1182	{
	1183	/* Process row-i data 0 */
	1184	index = i*r3;
	1185
	1186	J = 0;
	1187	if(i%blockEdgeSize==0)
	1188	I++;
	1189	realPrecision = pwrErrBound[I*R3+J]; //J==0
	1190	updateReqLength = 0;
	1191
	1192	pred1D = P1[index-r3];
	1193	diff = spaceFillingValue[index] - pred1D;
	1194
	1195	itvNum = fabs(diff)/realPrecision + 1;
	1196
	1197	if (itvNum < exe_params->intvCapacity)
	1198	{
	1199	if (diff < 0) itvNum = -itvNum;
	1200	type[index] = (int) (itvNum/2) + exe_params->intvRadius;
	1201	P1[index] = pred1D + 2 * (type[index] - exe_params->intvRadius) * realPrecision;
	1202	}
	1203	else
	1204	{
	1205	if(updateReqLength==0)
	1206	{
	1207	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	1208	reqBytesLength = reqLength/8;
	1209	resiBitsLength = reqLength%8;
	1210	updateReqLength = 1;
	1211	}
	1212
	1213	type[index] = 0;
	1214
	1215	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	1216	compressSingleFloatValue(vce, spaceFillingValue[index], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1217	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1218	memcpy(preDataBytes,vce->curBytes,4);
	1219	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1220	P1[index] = vce->data;
	1221	}
	1222
	1223	/* Process row-i data 1 --> data r3-1*/
	1224	for (j = 1; j < r3; j++) //note that this j refers to fastest dimension (lowest order)
	1225	{
	1226	index = i*r3+j;
	1227	if(j%blockEdgeSize==0)
	1228	{
	1229	J++;
	1230	realPrecision = pwrErrBound[I*R3+J];
	1231	updateReqLength = 0;
	1232	}
	1233
	1234	pred2D = P1[index-1] + P1[index-r3] - P1[index-r3-1];
	1235
	1236	diff = spaceFillingValue[index] - pred2D;
	1237
	1238	itvNum = fabs(diff)/realPrecision + 1;
	1239
	1240	if (itvNum < exe_params->intvCapacity)
	1241	{
	1242	if (diff < 0) itvNum = -itvNum;
	1243	type[index] = (int) (itvNum/2) + exe_params->intvRadius;
	1244	P1[index] = pred2D + 2 * (type[index] - exe_params->intvRadius) * realPrecision;
	1245	}
	1246	else
	1247	{
	1248	if(updateReqLength==0)
	1249	{
	1250	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	1251	reqBytesLength = reqLength/8;
	1252	resiBitsLength = reqLength%8;
	1253	updateReqLength = 1;
	1254	}
	1255
	1256	type[index] = 0;
	1257
	1258	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	1259	compressSingleFloatValue(vce, spaceFillingValue[index], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1260	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1261	memcpy(preDataBytes,vce->curBytes,4);
	1262	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1263	P1[index] = vce->data;
	1264	}
	1265	}
	1266	}
	1267
	1268	/////////////////////////// Process layer-1 --> layer-r1-1 ///////////////////////////
	1269
	1270	for (k = 1; k < r1; k++)
	1271	{
	1272	/* Process Row-0 data 0*/
	1273	index = k*r23;
	1274	I = 0;
	1275	J = 0;
	1276	if(k%blockEdgeSize==0)
	1277	K++;
	1278	realPrecision = pwrErrBound[K*R23]; //J==0
	1279	updateReqLength = 0;
	1280
	1281	pred1D = P1[0];
	1282	diff = spaceFillingValue[index] - pred1D;
	1283
	1284	itvNum = fabs(diff)/realPrecision + 1;
	1285
	1286	if (itvNum < exe_params->intvCapacity)
	1287	{
	1288	if (diff < 0) itvNum = -itvNum;
	1289	type[index] = (int) (itvNum/2) + exe_params->intvRadius;
	1290	P0[0] = pred1D + 2 * (type[index] - exe_params->intvRadius) * realPrecision;
	1291	}
	1292	else
	1293	{
	1294	if(updateReqLength==0)
	1295	{
	1296	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	1297	reqBytesLength = reqLength/8;
	1298	resiBitsLength = reqLength%8;
	1299	updateReqLength = 1;
	1300	}
	1301
	1302	type[index] = 0;
	1303
	1304	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	1305	compressSingleFloatValue(vce, spaceFillingValue[index], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1306	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1307	memcpy(preDataBytes,vce->curBytes,4);
	1308	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1309	P0[0] = vce->data;
	1310	}
	1311
	1312	/* Process Row-0 data 1 --> data r3-1 */
	1313	for (j = 1; j < r3; j++)
	1314	{
	1315	index = k*r23+j;
	1316
	1317	if(j%blockEdgeSize==0)
	1318	{
	1319	J++;
	1320	realPrecision = pwrErrBound[K*R23+J];
	1321	updateReqLength = 0;
	1322	}
	1323	pred2D = P0[j-1] + P1[j] - P1[j-1];
	1324	diff = spaceFillingValue[index] - pred2D;
	1325
	1326	itvNum = fabs(diff)/realPrecision + 1;
	1327
	1328	if (itvNum < exe_params->intvCapacity)
	1329	{
	1330	if (diff < 0) itvNum = -itvNum;
	1331	type[index] = (int) (itvNum/2) + exe_params->intvRadius;
	1332	P0[j] = pred2D + 2 * (type[index] - exe_params->intvRadius) * realPrecision;
	1333	/* if(type[index]==0)
	1334	printf("err:type[%d]=0, index4\n", index); */
	1335	}
	1336	else
	1337	{
	1338	if(updateReqLength==0)
	1339	{
	1340	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	1341	reqBytesLength = reqLength/8;
	1342	resiBitsLength = reqLength%8;
	1343	updateReqLength = 1;
	1344	}
	1345
	1346	type[index] = 0;
	1347
	1348	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	1349	compressSingleFloatValue(vce, spaceFillingValue[index], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1350	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1351	memcpy(preDataBytes,vce->curBytes,4);
	1352	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1353	P0[j] = vce->data;
	1354	}
	1355	}
	1356
	1357	/* Process Row-1 --> Row-r2-1 */
	1358	size_t index2D;
	1359	for (i = 1; i < r2; i++)
	1360	{
	1361	/* Process Row-i data 0 */
	1362	index = kr23 + ir3;
	1363	J = 0;
	1364	if(i%blockEdgeSize==0)
	1365	I++;
	1366	realPrecision = pwrErrBound[KR23+IR3+J]; //J==0
	1367	updateReqLength = 0;
	1368
	1369	index2D = i*r3;
	1370	pred2D = P0[index2D-r3] + P1[index2D] - P1[index2D-r3];
	1371	diff = spaceFillingValue[index] - pred2D;
	1372
	1373	itvNum = fabs(diff)/realPrecision + 1;
	1374
	1375	if (itvNum < exe_params->intvCapacity)
	1376	{
	1377	if (diff < 0) itvNum = -itvNum;
	1378	type[index] = (int) (itvNum/2) + exe_params->intvRadius;
	1379	P0[index2D] = pred2D + 2 * (type[index] - exe_params->intvRadius) * realPrecision;
	1380	}
	1381	else
	1382	{
	1383	if(updateReqLength==0)
	1384	{
	1385	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	1386	reqBytesLength = reqLength/8;
	1387	resiBitsLength = reqLength%8;
	1388	updateReqLength = 1;
	1389	}
	1390
	1391	type[index] = 0;
	1392
	1393	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	1394	compressSingleFloatValue(vce, spaceFillingValue[index], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1395	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1396	memcpy(preDataBytes,vce->curBytes,4);
	1397	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1398	P0[index2D] = vce->data;
	1399	}
	1400
	1401	/* Process Row-i data 1 --> data r3-1 */
	1402	for (j = 1; j < r3; j++)
	1403	{
	1404	index = kr23 + ir3 + j;
	1405	if(j%blockEdgeSize==0)
	1406	{
	1407	J++;
	1408	realPrecision = pwrErrBound[KR23+IR3+J];
	1409	updateReqLength = 0;
	1410	}
	1411	index2D = i*r3 + j;
	1412	pred3D = P0[index2D-1] + P0[index2D-r3]+ P1[index2D] - P0[index2D-r3-1] - P1[index2D-r3] - P1[index2D-1] + P1[index2D-r3-1];
	1413	diff = spaceFillingValue[index] - pred3D;
	1414
	1415	itvNum = fabs(diff)/realPrecision + 1;
	1416
	1417	if (itvNum < exe_params->intvCapacity)
	1418	{
	1419	if (diff < 0) itvNum = -itvNum;
	1420	type[index] = (int) (itvNum/2) + exe_params->intvRadius;
	1421	P0[index2D] = pred3D + 2 * (type[index] - exe_params->intvRadius) * realPrecision;
	1422	}
	1423	else
	1424	{
	1425	if(updateReqLength==0)
	1426	{
	1427	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	1428	reqBytesLength = reqLength/8;
	1429	resiBitsLength = reqLength%8;
	1430	updateReqLength = 1;
	1431	}
	1432
	1433	type[index] = 0;
	1434
	1435	addDBA_Data(resiBitLengthArray, (unsigned char)resiBitsLength);
	1436	compressSingleFloatValue(vce, spaceFillingValue[index], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1437	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1438	memcpy(preDataBytes,vce->curBytes,4);
	1439	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1440	P0[index2D] = vce->data;
	1441	}
	1442	}
	1443	}
	1444
	1445	float *Pt;
	1446	Pt = P1;
	1447	P1 = P0;
	1448	P0 = Pt;
	1449	}
	1450	if(r23!=1)
	1451	free(P0);
	1452	free(P1);
	1453	int exactDataNum = exactLeadNumArray->size;
	1454
	1455	TightDataPointStorageF* tdps;
	1456
	1457	new_TightDataPointStorageF2(&tdps, dataLength, exactDataNum,
	1458	type, exactMidByteArray->array, exactMidByteArray->size,
	1459	exactLeadNumArray->array,
	1460	resiBitArray->array, resiBitArray->size,
	1461	resiBitLengthArray->array, resiBitLengthArray->size,
	1462	realPrecision, medianValue, (char)reqLength, quantization_intervals, pwrErrBoundBytes, pwrErrBoundBytes_size, radExpo);
	1463
	1464	//sdi:Debug
	1465	/* int sum =0;
	1466	for(i=0;i<dataLength;i++)
	1467	if(type[i]==0) sum++;
	1468	printf("opt_quantizations=%d, exactDataNum=%d, sum=%d\n",quantization_intervals, exactDataNum, sum);
	1469	*/
	1470
	1471	convertTDPStoFlatBytes_float(tdps, newByteData, outSize);
	1472
	1473	//free memory
	1474	free_DBA(resiBitLengthArray);
	1475	free_DIA(exactLeadNumArray);
	1476	free_DIA(resiBitArray);
	1477	free(type);
	1478
	1479
	1480	free(pwrErrBound);
	1481
	1482	free(vce);
	1483	free(lce);
	1484	free_TightDataPointStorageF(tdps);
	1485	free(exactMidByteArray);
	1486	}
	1487
	1488	void createRangeGroups_float(float posGroups, float negGroups, int posFlags, int negFlags)
	1489	{
	1490	size_t size = GROUP_COUNT*sizeof(float);
	1491	size_t size2 = GROUP_COUNT*sizeof(int);
	1492	posGroups = (float)malloc(size);
	1493	negGroups = (float)malloc(size);
	1494	posFlags = (int)malloc(size2);
	1495	negFlags = (int)malloc(size2);
	1496	memset(*posGroups, 0, size);
	1497	memset(*negGroups, 0, size);
	1498	memset(*posFlags, 0, size2);
	1499	memset(*negFlags, 0, size2);
	1500	}
	1501
	1502	void compressGroupIDArray_float(char* groupID, TightDataPointStorageF* tdps)
	1503	{
	1504	size_t dataLength = tdps->dataSeriesLength;
	1505	int* standGroupID = (int)malloc(dataLengthsizeof(int));
	1506
	1507	size_t i;
	1508	standGroupID[0] = groupID[0]+GROUP_COUNT; //plus an offset such that it would not be a negative number.
	1509	char lastGroupIDValue = groupID[0], curGroupIDValue;
	1510	int offset = 2*(GROUP_COUNT + 2);
	1511	for(i=1; i<dataLength;i++)
	1512	{
	1513	curGroupIDValue = groupID[i];
	1514	standGroupID[i] = (curGroupIDValue - lastGroupIDValue) + offset;
	1515	lastGroupIDValue = curGroupIDValue;
	1516	}
	1517
	1518	unsigned char* out = NULL;
	1519	size_t outSize;
	1520
	1521	HuffmanTree* huffmanTree = SZ_Reset();
	1522	encode_withTree(huffmanTree, standGroupID, dataLength, &out, &outSize);
	1523	SZ_ReleaseHuffman(huffmanTree);
	1524
	1525	tdps->pwrErrBoundBytes = out; //groupIDArray
	1526	tdps->pwrErrBoundBytes_size = outSize;
	1527
	1528	free(standGroupID);
	1529	}
	1530
	1531	TightDataPointStorageF* SZ_compress_float_1D_MDQ_pwrGroup(float* oriData, size_t dataLength, int errBoundMode,
	1532	double absErrBound, double relBoundRatio, double pwrErrRatio, float valueRangeSize, float medianValue_f)
	1533	{
	1534	size_t i;
	1535	float posGroups, negGroups, *groups;
	1536	float pos_01_group = 0, neg_01_group = 0; //[0,1] and [-1,0]
	1537	int posFlags, negFlags, *flags;
	1538	int pos_01_flag = 0, neg_01_flag = 0;
	1539	createRangeGroups_float(&posGroups, &negGroups, &posFlags, &negFlags);
	1540	size_t nbBins = (size_t)(1/pwrErrRatio);
	1541	if(nbBins%2==1)
	1542	nbBins++;
	1543	exe_params->intvRadius = nbBins;
	1544
	1545	int reqLength, status;
	1546	float medianValue = medianValue_f;
	1547	float realPrecision = (float)getRealPrecision_float(valueRangeSize, errBoundMode, absErrBound, relBoundRatio, &status);
	1548	if(realPrecision<0)
	1549	realPrecision = pwrErrRatio;
	1550	float realGroupPrecision; //precision (error) based on group ID
	1551	getPrecisionReqLength_float(realPrecision);
	1552	short radExpo = getExponent_float(valueRangeSize/2);
	1553	short lastGroupNum = 0, groupNum, grpNum = 0;
	1554
	1555	double* groupErrorBounds = generateGroupErrBounds(errBoundMode, realPrecision, pwrErrRatio);
	1556	exe_params->intvRadius = generateGroupMaxIntervalCount(groupErrorBounds);
	1557
	1558	computeReqLength_float(realPrecision, radExpo, &reqLength, &medianValue);
	1559
	1560	int* type = (int) malloc(dataLengthsizeof(int));
	1561	char groupID = (char) malloc(dataLength*sizeof(char));
	1562	char *gp = groupID;
	1563
	1564	float* spaceFillingValue = oriData;
	1565
	1566	DynamicIntArray *exactLeadNumArray;
	1567	new_DIA(&exactLeadNumArray, DynArrayInitLen);
	1568
	1569	DynamicByteArray *exactMidByteArray;
	1570	new_DBA(&exactMidByteArray, DynArrayInitLen);
	1571
	1572	DynamicIntArray *resiBitArray;
	1573	new_DIA(&resiBitArray, DynArrayInitLen);
	1574
	1575	unsigned char preDataBytes[4];
	1576	intToBytes_bigEndian(preDataBytes, 0);
	1577
	1578	int reqBytesLength = reqLength/8;
	1579	int resiBitsLength = reqLength%8;
	1580
	1581	FloatValueCompressElement vce = (FloatValueCompressElement)malloc(sizeof(FloatValueCompressElement));
	1582	LossyCompressionElement lce = (LossyCompressionElement)malloc(sizeof(LossyCompressionElement));
	1583
	1584	int state;
	1585	float curData, decValue;
	1586	float pred;
	1587	float predAbsErr;
	1588	double interval = 0;
	1589
	1590	//add the first data
	1591	type[0] = 0;
	1592	compressSingleFloatValue(vce, spaceFillingValue[0], realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1593	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1594	memcpy(preDataBytes,vce->curBytes,4);
	1595	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1596
	1597	curData = spaceFillingValue[0];
	1598	groupNum = computeGroupNum_float(vce->data);
	1599
	1600	if(curData > 0 && groupNum >= 0)
	1601	{
	1602	groups = posGroups;
	1603	flags = posFlags;
	1604	grpNum = groupNum;
	1605	}
	1606	else if(curData < 0 && groupNum >= 0)
	1607	{
	1608	groups = negGroups;
	1609	flags = negFlags;
	1610	grpNum = groupNum;
	1611	}
	1612	else if(curData >= 0 && groupNum == -1)
	1613	{
	1614	groups = &pos_01_group;
	1615	flags = &pos_01_flag;
	1616	grpNum = 0;
	1617	}
	1618	else //curData < 0 && groupNum == -1
	1619	{
	1620	groups = &neg_01_group;
	1621	flags = &neg_01_flag;
	1622	grpNum = 0;
	1623	}
	1624
	1625	listAdd_float_group(groups, flags, groupNum, spaceFillingValue[0], vce->data, gp);
	1626	gp++;
	1627
	1628	for(i=1;i<dataLength;i++)
	1629	{
	1630	curData = oriData[i];
	1631	//printf("i=%d, posGroups[3]=%f, negGroups[3]=%f\n", i, posGroups[3], negGroups[3]);
	1632
	1633	groupNum = computeGroupNum_float(curData);
	1634
	1635	if(curData > 0 && groupNum >= 0)
	1636	{
	1637	groups = posGroups;
	1638	flags = posFlags;
	1639	grpNum = groupNum;
	1640	}
	1641	else if(curData < 0 && groupNum >= 0)
	1642	{
	1643	groups = negGroups;
	1644	flags = negFlags;
	1645	grpNum = groupNum;
	1646	}
	1647	else if(curData >= 0 && groupNum == -1)
	1648	{
	1649	groups = &pos_01_group;
	1650	flags = &pos_01_flag;
	1651	grpNum = 0;
	1652	}
	1653	else //curData < 0 && groupNum == -1
	1654	{
	1655	groups = &neg_01_group;
	1656	flags = &neg_01_flag;
	1657	grpNum = 0;
	1658	}
	1659
	1660	if(groupNum>=GROUP_COUNT)
	1661	{
	1662	type[i] = 0;
	1663	compressSingleFloatValue(vce, curData, realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1664	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1665	memcpy(preDataBytes,vce->curBytes,4);
	1666	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1667	listAdd_float_group(groups, flags, lastGroupNum, curData, vce->data, gp); //set the group number to be last one in order to get the groupID array as smooth as possible.
	1668	}
	1669	else if(flags[grpNum]==0) //the dec value may not be in the same group
	1670	{
	1671	type[i] = 0;
	1672	compressSingleFloatValue(vce, curData, realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1673	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1674	memcpy(preDataBytes,vce->curBytes,4);
	1675	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1676	//decGroupNum = computeGroupNum_float(vce->data);
	1677
	1678	//if(decGroupNum < groupNum)
	1679	// decValue = curData>0?pow(2, groupNum):-pow(2, groupNum);
	1680	//else if(decGroupNum > groupNum)
	1681	// decValue = curData>0?pow(2, groupNum+1):-pow(2, groupNum+1);
	1682	//else
	1683	// decValue = vce->data;
	1684
	1685	decValue = vce->data;
	1686	listAdd_float_group(groups, flags, groupNum, curData, decValue, gp);
	1687	lastGroupNum = curData>0?groupNum + 2: -(groupNum+2);
	1688	}
	1689	else //if flags[groupNum]==1, the dec value must be in the same group
	1690	{
	1691	pred = groups[grpNum];
	1692	predAbsErr = fabs(curData - pred);
	1693	realGroupPrecision = groupErrorBounds[grpNum]; //compute real error bound
	1694	interval = realGroupPrecision*2;
	1695	state = (predAbsErr/realGroupPrecision+1)/2;
	1696	if(curData>=pred)
	1697	{
	1698	type[i] = exe_params->intvRadius+state;
	1699	decValue = pred + state*interval;
	1700	}
	1701	else //curData<pred
	1702	{
	1703	type[i] = exe_params->intvRadius-state;
	1704	decValue = pred - state*interval;
	1705	}
	1706	//decGroupNum = computeGroupNum_float(pred);
	1707
	1708	if((decValue>0&&curData<0)\|\|(decValue<0&&curData>=0))
	1709	decValue = 0;
	1710	//else
	1711	//{
	1712	// if(decGroupNum < groupNum)
	1713	// decValue = curData>0?pow(2, groupNum):-pow(2, groupNum);
	1714	// else if(decGroupNum > groupNum)
	1715	// decValue = curData>0?pow(2, groupNum+1):-pow(2, groupNum+1);
	1716	// else
	1717	// decValue = pred;
	1718	//}
	1719
	1720	if(fabs(curData-decValue)>realGroupPrecision)
	1721	{
	1722	type[i] = 0;
	1723	compressSingleFloatValue(vce, curData, realPrecision, medianValue, reqLength, reqBytesLength, resiBitsLength);
	1724	updateLossyCompElement_Float(vce->curBytes, preDataBytes, reqBytesLength, resiBitsLength, lce);
	1725	memcpy(preDataBytes,vce->curBytes,4);
	1726	addExactData(exactMidByteArray, exactLeadNumArray, resiBitArray, lce);
	1727
	1728	decValue = vce->data;
	1729	}
	1730
	1731	listAdd_float_group(groups, flags, groupNum, curData, decValue, gp);
	1732	lastGroupNum = curData>=0?groupNum + 2: -(groupNum+2);
	1733	}
	1734	gp++;
	1735
	1736	}
	1737
	1738	int exactDataNum = exactLeadNumArray->size;
	1739
	1740	TightDataPointStorageF* tdps;
	1741
	1742	//combineTypeAndGroupIDArray(nbBins, dataLength, &type, groupID);
	1743
	1744	new_TightDataPointStorageF(&tdps, dataLength, exactDataNum,
	1745	type, exactMidByteArray->array, exactMidByteArray->size,
	1746	exactLeadNumArray->array,
	1747	resiBitArray->array, resiBitArray->size,
	1748	resiBitsLength,
	1749	realPrecision, medianValue, (char)reqLength, nbBins, NULL, 0, radExpo);
	1750
	1751	compressGroupIDArray_float(groupID, tdps);
	1752
	1753	free(posGroups);
	1754	free(negGroups);
	1755	free(posFlags);
	1756	free(negFlags);
	1757	free(groupID);
	1758	free(groupErrorBounds);
	1759
	1760	free_DIA(exactLeadNumArray);
	1761	free_DIA(resiBitArray);
	1762	free(type);
	1763	free(vce);
	1764	free(lce);
	1765	free(exactMidByteArray); //exactMidByteArray->array has been released in free_TightDataPointStorageF(tdps);
	1766
	1767	return tdps;
	1768	}
	1769
	1770	void SZ_compress_args_float_NoCkRngeNoGzip_1D_pwrgroup(unsigned char** newByteData, float *oriData,
	1771	size_t dataLength, double absErrBound, double relBoundRatio, double pwrErrRatio, float valueRangeSize, float medianValue_f, size_t *outSize)
	1772	{
	1773	TightDataPointStorageF* tdps = SZ_compress_float_1D_MDQ_pwrGroup(oriData, dataLength, confparams_cpr->errorBoundMode,
	1774	absErrBound, relBoundRatio, pwrErrRatio,
	1775	valueRangeSize, medianValue_f);
	1776
	1777	convertTDPStoFlatBytes_float(tdps, newByteData, outSize);
	1778
	1779	if(outSize>dataLengthsizeof(float))
	1780	SZ_compress_args_float_StoreOriData(oriData, dataLength+2, tdps, newByteData, outSize);
	1781
	1782	free_TightDataPointStorageF(tdps);
	1783	}
[9ee2ce3]	1784
	1785	#include <stdbool.h>
	1786
	1787	void SZ_compress_args_float_NoCkRngeNoGzip_1D_pwr_pre_log(unsigned char** newByteData, float oriData, double pwrErrRatio, size_t dataLength, size_t outSize, float min, float max){
	1788
	1789	float * log_data = (float ) malloc(dataLength sizeof(float));
	1790
	1791	unsigned char * signs = (unsigned char *) malloc(dataLength);
	1792	memset(signs, 0, dataLength);
	1793	// preprocess
	1794	float max_abs_log_data;
	1795	if(min == 0) max_abs_log_data = fabs(log2(fabs(max)));
	1796	else if(max == 0) max_abs_log_data = fabs(log2(fabs(min)));
	1797	else max_abs_log_data = fabs(log2(fabs(min))) > fabs(log2(fabs(max))) ? fabs(log2(fabs(min))) : fabs(log2(fabs(max)));
	1798	float min_log_data = max_abs_log_data;
	1799	bool positive = true;
	1800	for(size_t i=0; i<dataLength; i++){
	1801	if(oriData[i] < 0){
	1802	signs[i] = 1;
	1803	log_data[i] = -oriData[i];
	1804	positive = false;
	1805	}
	1806	else
	1807	log_data[i] = oriData[i];
	1808	if(log_data[i] > 0){
	1809	log_data[i] = log2(log_data[i]);
	1810	if(log_data[i] > max_abs_log_data) max_abs_log_data = log_data[i];
	1811	if(log_data[i] < min_log_data) min_log_data = log_data[i];
	1812	}
	1813	}
	1814
	1815	float valueRangeSize, medianValue_f;
	1816	computeRangeSize_float(log_data, dataLength, &valueRangeSize, &medianValue_f);
	1817	if(fabs(min_log_data) > max_abs_log_data) max_abs_log_data = fabs(min_log_data);
	1818	double realPrecision = log2(1.0 + pwrErrRatio) - max_abs_log_data * 1.2e-7;
	1819	for(size_t i=0; i<dataLength; i++){
	1820	if(oriData[i] == 0){
	1821	log_data[i] = min_log_data - 2.0001*realPrecision;
	1822	}
	1823	}
	1824
	1825	TightDataPointStorageF* tdps = SZ_compress_float_1D_MDQ(log_data, dataLength, realPrecision, valueRangeSize, medianValue_f);
	1826	tdps->minLogValue = min_log_data - 1.0001*realPrecision;
	1827	free(log_data);
	1828	if(!positive){
	1829	unsigned char * comp_signs;
	1830	// compress signs
	1831	unsigned long signSize = sz_lossless_compress(confparams_cpr->losslessCompressor, confparams_cpr->gzipMode, signs, dataLength, &comp_signs);
	1832	tdps->pwrErrBoundBytes = comp_signs;
	1833	tdps->pwrErrBoundBytes_size = signSize;
	1834	}
	1835	else{
	1836	tdps->pwrErrBoundBytes = NULL;
	1837	tdps->pwrErrBoundBytes_size = 0;
	1838	}
	1839	free(signs);
	1840
	1841	convertTDPStoFlatBytes_float(tdps, newByteData, outSize);
	1842	if(outSize>dataLengthsizeof(float))
	1843	SZ_compress_args_float_StoreOriData(oriData, dataLength+2, tdps, newByteData, outSize);
	1844
	1845	free_TightDataPointStorageF(tdps);
	1846	}
	1847
	1848	void SZ_compress_args_float_NoCkRngeNoGzip_2D_pwr_pre_log(unsigned char** newByteData, float oriData, double pwrErrRatio, size_t r1, size_t r2, size_t outSize, float min, float max){
	1849
	1850	size_t dataLength = r1 * r2;
	1851	float * log_data = (float ) malloc(dataLength sizeof(float));
	1852
	1853	unsigned char * signs = (unsigned char *) malloc(dataLength);
	1854	memset(signs, 0, dataLength);
	1855	// preprocess
	1856	float max_abs_log_data;
	1857	if(min == 0) max_abs_log_data = fabs(log2(fabs(max)));
	1858	else if(max == 0) max_abs_log_data = fabs(log2(fabs(min)));
	1859	else max_abs_log_data = fabs(log2(fabs(min))) > fabs(log2(fabs(max))) ? fabs(log2(fabs(min))) : fabs(log2(fabs(max)));
	1860	float min_log_data = max_abs_log_data;
	1861	bool positive = true;
	1862	for(size_t i=0; i<dataLength; i++){
	1863	if(oriData[i] < 0){
	1864	signs[i] = 1;
	1865	log_data[i] = -oriData[i];
	1866	positive = false;
	1867	}
	1868	else
	1869	log_data[i] = oriData[i];
	1870	if(log_data[i] > 0){
	1871	log_data[i] = log2(log_data[i]);
	1872	if(log_data[i] > max_abs_log_data) max_abs_log_data = log_data[i];
	1873	if(log_data[i] < min_log_data) min_log_data = log_data[i];
	1874	}
	1875	}
	1876
	1877	float valueRangeSize, medianValue_f;
	1878	computeRangeSize_float(log_data, dataLength, &valueRangeSize, &medianValue_f);
	1879	if(fabs(min_log_data) > max_abs_log_data) max_abs_log_data = fabs(min_log_data);
	1880	double realPrecision = log2(1.0 + pwrErrRatio) - max_abs_log_data * 1.2e-7;
	1881	for(size_t i=0; i<dataLength; i++){
	1882	if(oriData[i] == 0){
	1883	log_data[i] = min_log_data - 2.0001*realPrecision;
	1884	}
	1885	}
	1886
	1887	TightDataPointStorageF* tdps = SZ_compress_float_2D_MDQ(log_data, r1, r2, realPrecision, valueRangeSize, medianValue_f);
	1888	tdps->minLogValue = min_log_data - 1.0001*realPrecision;
	1889	free(log_data);
	1890	if(!positive){
	1891	unsigned char * comp_signs;
	1892	// compress signs
	1893	unsigned long signSize = sz_lossless_compress(confparams_cpr->losslessCompressor, confparams_cpr->gzipMode, signs, dataLength, &comp_signs);
	1894	tdps->pwrErrBoundBytes = comp_signs;
	1895	tdps->pwrErrBoundBytes_size = signSize;
	1896	}
	1897	else{
	1898	tdps->pwrErrBoundBytes = NULL;
	1899	tdps->pwrErrBoundBytes_size = 0;
	1900	}
	1901	free(signs);
	1902
	1903	convertTDPStoFlatBytes_float(tdps, newByteData, outSize);
	1904	if(outSize>dataLengthsizeof(float))
	1905	SZ_compress_args_float_StoreOriData(oriData, dataLength+2, tdps, newByteData, outSize);
	1906
	1907	free_TightDataPointStorageF(tdps);
	1908	}
	1909
	1910	void SZ_compress_args_float_NoCkRngeNoGzip_3D_pwr_pre_log(unsigned char** newByteData, float oriData, double pwrErrRatio, size_t r1, size_t r2, size_t r3, size_t outSize, float min, float max){
	1911
	1912	size_t dataLength = r1 * r2 * r3;
	1913	float * log_data = (float ) malloc(dataLength sizeof(float));
	1914
	1915	unsigned char * signs = (unsigned char *) malloc(dataLength);
	1916	memset(signs, 0, dataLength);
	1917	// preprocess
	1918	float max_abs_log_data;
	1919	if(min == 0) max_abs_log_data = fabs(log2(fabs(max)));
	1920	else if(max == 0) max_abs_log_data = fabs(log2(fabs(min)));
	1921	else max_abs_log_data = fabs(log2(fabs(min))) > fabs(log2(fabs(max))) ? fabs(log2(fabs(min))) : fabs(log2(fabs(max)));
	1922	float min_log_data = max_abs_log_data;
	1923	bool positive = true;
	1924	for(size_t i=0; i<dataLength; i++){
	1925	if(oriData[i] < 0){
	1926	signs[i] = 1;
	1927	log_data[i] = -oriData[i];
	1928	positive = false;
	1929	}
	1930	else
	1931	log_data[i] = oriData[i];
	1932	if(log_data[i] > 0){
	1933	log_data[i] = log2(log_data[i]);
	1934	if(log_data[i] > max_abs_log_data) max_abs_log_data = log_data[i];
	1935	if(log_data[i] < min_log_data) min_log_data = log_data[i];
	1936	}
	1937	}
	1938
	1939	float valueRangeSize, medianValue_f;
	1940	computeRangeSize_float(log_data, dataLength, &valueRangeSize, &medianValue_f);
	1941	if(fabs(min_log_data) > max_abs_log_data) max_abs_log_data = fabs(min_log_data);
	1942	double realPrecision = log2(1.0 + pwrErrRatio) - max_abs_log_data * 1.2e-7;
	1943	for(size_t i=0; i<dataLength; i++){
	1944	if(oriData[i] == 0){
	1945	log_data[i] = min_log_data - 2.0001*realPrecision;
	1946	}
	1947	}
	1948
	1949	TightDataPointStorageF* tdps = SZ_compress_float_3D_MDQ(log_data, r1, r2, r3, realPrecision, valueRangeSize, medianValue_f);
	1950	tdps->minLogValue = min_log_data - 1.0001*realPrecision;
	1951	free(log_data);
	1952	if(!positive){
	1953	unsigned char * comp_signs;
	1954	// compress signs
	1955	unsigned long signSize = sz_lossless_compress(confparams_cpr->losslessCompressor, confparams_cpr->gzipMode, signs, dataLength, &comp_signs);
	1956	tdps->pwrErrBoundBytes = comp_signs;
	1957	tdps->pwrErrBoundBytes_size = signSize;
	1958	}
	1959	else{
	1960	tdps->pwrErrBoundBytes = NULL;
	1961	tdps->pwrErrBoundBytes_size = 0;
	1962	}
	1963	free(signs);
	1964
	1965	convertTDPStoFlatBytes_float(tdps, newByteData, outSize);
	1966	if(outSize>dataLengthsizeof(float))
	1967	SZ_compress_args_float_StoreOriData(oriData, dataLength+2, tdps, newByteData, outSize);
	1968
	1969	free_TightDataPointStorageF(tdps);
	1970	}

Note: See TracBrowser for help on using the repository browser.

Download in other formats: