-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathFP_ETA1.cpp
250 lines (203 loc) · 5.97 KB
/
FP_ETA1.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
#include <stdio.h>
#include <stdlib.h>
#include <math.h>
#include <random>
#include <iostream>
#include <time.h>
//#include <values.h>
#define bitnum 12
#define mask 0xFFF
/* endianness testing */
const int EndianTest = 0x04030201;
#define LITTLE_ENDIAN() (*((const char *) &EndianTest) == 0x01)
/* extract nth LSB from object stored in lvalue x */
#define GET_BIT(x, n) ((((const char *) &x)[LITTLE_ENDIAN() ? (n) / CHARBITS : sizeof(x) - (n) / CHARBITS - 1] >> ((n) % CHARBITS)) & 0x01)
#define PUT_BIT(x, n) (putchar(GET_BIT((x), (n)) ? '1' : '0'))
#define not_real_number printf("Not real number\n"); \
exit(1);
std::random_device rd; //Will be used to obtain a seed for the random number engine
std::mt19937 generator(rd()); //Standard mersenne_twister_engine seeded with rd()
std::uniform_int_distribution<int> RandomExponent(0, 254);
std::uniform_int_distribution<int> RandomMantisa(0, 0x7FFFFF);
std::uniform_int_distribution<int> RandomSign(0, 1);
int nnn = 1;
int checknum = 0;
//Union 사용
typedef union {
float f;
struct {
unsigned int mantisa : 23;
unsigned int exponent : 8;
unsigned int sign : 1;
} parts;
} float_cast;
float_cast makeFP();
float_cast FPAdder(float_cast a, float_cast b);
float_cast makeFP() {
//exponet => 127(7F) ~ -128(80)
//mantisa => 524287(7FFFF) ~ 0(0)
float_cast num;
num.parts.exponent = RandomExponent(generator); //0~255 -> 2^(exponent - 126) * 1.(mantisa)
//if exponent == 255 -> inf
num.parts.mantisa = RandomMantisa(generator);
num.parts.sign = 0;
return num;
}
unsigned int eta1(unsigned int a, unsigned int b)
{
unsigned int M, N, m, n, inaccuratePart = 0, r, sum = 0;
int carry, imask = 0x800;
M = a & mask;
N = b & mask;
while (1) {
m = a & imask;
n = b & imask;
r = m ^ n;
inaccuratePart += r;
if (r == imask && m == imask && n == imask) {
inaccuratePart += imask - 1;
break;
}
imask /= 2;
}
sum = (a - M) + (b - N) + inaccuratePart;
return sum;
}
float_cast FPAdder(float_cast a, float_cast b) {
//먼저 두 값이 real number인지 판단해야한다. (inf, -inf, 0, -0, NAN)
//0 FF 000000 -> inf, 1 FF 000000 -> -inf, 00000 -> 0, 100000 -> -0
//입력값이 INF일 수 가있나?
if (a.parts.exponent == 0xFF && a.parts.sign == 0) //a is inf
{
not_real_number
}
else if (a.parts.exponent == 0xFF && a.parts.sign == 1)//a is -inf
{
not_real_number
}
if (b.parts.exponent == 0xFF && b.parts.sign == 0) //b is inf
{
not_real_number
}
else if (b.parts.exponent == 0xFF && b.parts.sign == 1)//b is -inf
{
not_real_number
}
float_cast z; //return 값
z.parts.sign = 0;
unsigned int sum = 0;
//굳이 0 따로 볼필요없다.
if (a.f == 0) //a == 0 || b == 0 return a or b
z.f = b.f;
else if (b.f == 0)
z.f = a.f;
int subEx = a.parts.exponent - b.parts.exponent;
if (subEx == 0) {//exponents equal
checknum = 1;
z.parts.exponent = a.parts.exponent;
//eta1
sum = eta1(a.parts.mantisa, b.parts.mantisa);
if (sum == 0)
z.f = 0;
else {
z.parts.mantisa = sum >> 1;
z.parts.exponent++;
if (z.parts.exponent >= 0xFF) {//is it overflow?
printf("Overflow\n");
}
else {
}
//z.parts.mantisa &= 0x7FFFF;
}
}
else { //shift smaller one to bigger one
if (subEx > 0) {// a's exponent > b's exponent => shift mantisa right
//b.parts.exponent = a.parts.exponent;
z.parts.exponent = a.parts.exponent;
if (abs(subEx) >= 23) //shift 가 mantisa의 23비트 넘어서면 0으로 초기화!
b.parts.mantisa = 0;
else {
//a.parts.mantisa >>= abs(subEx);
if (b.parts.exponent != 0)
b.parts.mantisa = (b.parts.mantisa >> 1) + 0x400000;
if (abs(subEx) > 1)
b.parts.mantisa >>= abs(subEx) - 1;
}
}
else {// a's exponent < b's exponent => shift mantisa right
//a.parts.exponent = b.parts.exponent;
z.parts.exponent = b.parts.exponent;
if (abs(subEx) >= 23)//shift 가 mantisa의 23비트 넘어서면 0으로 초기화!
a.parts.mantisa = 0;
else {
//a.parts.mantisa >>= abs(subEx);
if (a.parts.exponent != 0)
a.parts.mantisa = (a.parts.mantisa >> 1) + 0x400000;
if (abs(subEx) > 1)
a.parts.mantisa >>= abs(subEx) - 1;
}
}
//eta1
sum = eta1(a.parts.mantisa, b.parts.mantisa);
//mantisa + matisa가 23비트가 넘어가버리면 자동으로 잘라버림! (왜냐면 union이니깐)
//따라서 우리가 직접 넘어가는 carry값을 처리해줘야한다.
if (sum > 0x7FFFFF) {
z.parts.mantisa = (sum >> 1) - 0x400000;
z.parts.exponent++;
}
else
z.parts.mantisa = sum;
if (z.parts.mantisa == 0)
z.f = 0;
}
return z;
}
int main(void) {
float_cast A, B, ans;
float_cast orgAns;
//FILE* input = fopen("input.txt", "r");
int cnt = 0;
printf("A\t\t+\t\tB\t=\torgANS\t\tmyANS\n");
printf("**********************************************************************\n");
A = makeFP();
B = makeFP();
//A, B 랜덤 지정
//while (!feof(input)) {
// fscanf(input, "%f %f ", &A.f, &B.f);
//A.f = 1.134724000000E-38;
//B.f = 3.848032000000E-36;
//A, B 직접 지정
ans = FPAdder(A, B);
orgAns.f = A.f + B.f;
if (checknum == 1) {
printf("%d: %e + %e = %e, %e\n", nnn, A.f, B.f, orgAns.f, ans.f);
checknum = 0;
printf("\n\n******************************\n");
}
else {
printf("++ %d: %e + %e = %e, %e\n", nnn, A.f, B.f, orgAns.f, ans.f);
printf("\n\n******************************\n");
}
nnn++;
//}
//fclose(input);
}
/*
sign = 1
exponent = 7e
mantisa = 0*/
/*오버플로 언더플로 예시가 생길 수 잇나
오버플로 언더플로 warning 이나 runtime error 발생시키나요? 예외처리
단순히 에러처리하는것으로 보자.
rounding 은 무엇? 어떻게 하나요
shift 할 때 맨첨엔 1넣고 , 담부턴 0으로 넣기?
exponent, mantissa 둘다 랜덤정수로 입력하기
c++ 랜덤정수 넣기
에러체크 , med 이런식으로 검색해보기 (척도가 없어서 그럼)
*/
/*
3.4028235E38
~
-3.4028235E38
0_0000_0000_ 11111111111111111 -> 1.1754942E-38
*/