Commit f7bc922

authored

Fix float 8 cast (#37)

* fix f8
* fix
* cleaning

1 parent 2fde01f, commit f7bc922 (Copy full SHA for f7bc922)

File tree

2 files changed

+145

-63

lines changed

_unittests/ut_validation
- test_f8.py
onnx_array_api/validation
- f8.py

2 files changed

+145

-63

lines changed

`‎_unittests/ut_validation/test_f8.py`

Lines changed: 71 additions & 11 deletions

Original file line number	Diff line number	Diff line change
`@@ -1,9 +1,11 @@`
`1`	`1`	`importos`
`2`	`2`	`importpprint`
	`3`	`+importstruct`
`3`	`4`	`importunittest`
`4`	`5`	`importwarnings`
`5`	`6`	`importnumpy`
`6`	`7`	`importpandas`
	`8`	`+fromonnximportTensorProto`
`7`	`9`	`fromonnx_array_api.validation.f8import (`
`8`	`10`	`CastFloat8,`
`9`	`11`	`UndefinedCastError,`
`@@ -285,6 +287,15 @@ def test_search_float32_into_fe4m3fn(self):`
`285`	`287`	`ok=""ifb==nfelse"WRONG",`
`286`	`288`	`true=value,`
`287`	`289`	`add=add,`
	`290`	`+exponent=(`
	`291`	`+int.from_bytes(`
	`292`	`+struct.pack("<f",numpy.float32(v)),"little"`
	`293`	`+ )`
	`294`	`+&0x7F800000`
	`295`	`+ )`
	`296`	`+>>23,`
	`297`	`+d1=v-fe4m3_to_float32_float(nf),`
	`298`	`+d2=v-fe4m3_to_float32_float(b),`
`288`	`299`	`)`
`289`	`300`	`)`
`290`	`301`	`ifwrong>0:`
`@@ -449,10 +460,13 @@ def test_search_e4m3_pow(self):`
`449`	`460`	`continue`
`450`	`461`	`r2=float32_to_fe4m3(v)`
`451`	`462`	`ifr1!=r2:`
	`463`	`+ex=abs(v-fe4m3_to_float32(r1))==abs(v-fe4m3_to_float32(r2))`
`452`	`464`	`raiseAssertionError(`
`453`	`465`	`f"p={p}, v={v}, "`
`454`	`466`	`f"search={r1}:{display_fe4m3(r1)}={fe4m3_to_float32(r1)} != "`
`455`		`-f"bit={r2}:{display_fe4m3(r2)}={fe4m3_to_float32(r2)}"`
	`467`	`+f"bit={r2}:{display_fe4m3(r2)}={fe4m3_to_float32(r2)} "`
	`468`	`+f"d1={v-fe4m3_to_float32(r1)} d2={v-fe4m3_to_float32(r2)} "`
	`469`	`+f"\|d1\|==\|d2\|={ex}"`
`456`	`470`	`)`
`457`	`471`	`forpinrange(1,40):`
`458`	`472`	`v=-(2** (-p))`
`@@ -462,10 +476,13 @@ def test_search_e4m3_pow(self):`
`462`	`476`	`continue`
`463`	`477`	`r2=float32_to_fe4m3(v)`
`464`	`478`	`ifr1!=r2:`
	`479`	`+ex=abs(v-fe4m3_to_float32(r1))==abs(v-fe4m3_to_float32(r2))`
`465`	`480`	`raiseAssertionError(`
`466`	`481`	`f"p={p}, v={v}, "`
`467`	`482`	`f"search={r1}:{display_fe4m3(r1)}={fe4m3_to_float32(r1)} != "`
`468`		`-f"bit={r2}:{display_fe4m3(r2)}={fe4m3_to_float32(r2)}"`
	`483`	`+f"bit={r2}:{display_fe4m3(r2)}={fe4m3_to_float32(r2)} "`
	`484`	`+f"d1={v-fe4m3_to_float32(r1)} d2={v-fe4m3_to_float32(r2)} "`
	`485`	`+f"\|d1\|==\|d2\|={ex}"`
`469`	`486`	`)`
`470`	`487`
`471`	`488`	`deftest_search_e5m2_pow(self):`
`@@ -478,10 +495,13 @@ def test_search_e5m2_pow(self):`
`478`	`495`	`continue`
`479`	`496`	`r2=float32_to_fe5m2(v)`
`480`	`497`	`ifr1!=r2:`
	`498`	`+ex=abs(v-fe5m2_to_float32(r1))==abs(v-fe5m2_to_float32(r2))`
`481`	`499`	`raiseAssertionError(`
`482`	`500`	`f"p={p}, v={v}, "`
`483`	`501`	`f"search={r1}:{display_fe5m2(r1)}={fe5m2_to_float32(r1)} != "`
`484`		`-f"bit={r2}:{display_fe5m2(r2)}={fe5m2_to_float32(r2)}"`
	`502`	`+f"bit={r2}:{display_fe5m2(r2)}={fe5m2_to_float32(r2)} "`
	`503`	`+f"d1={v-fe4m3_to_float32(r1)} d2={v-fe5m2_to_float32(r2)} "`
	`504`	`+f"\|d1\|==\|d2\|={ex}"`
`485`	`505`	`)`
`486`	`506`	`forpinrange(1,40):`
`487`	`507`	`v=-(2** (-p))`
`@@ -491,10 +511,13 @@ def test_search_e5m2_pow(self):`
`491`	`511`	`continue`
`492`	`512`	`r2=float32_to_fe5m2(v)`
`493`	`513`	`ifr1!=r2:`
	`514`	`+ex=abs(v-fe5m2_to_float32(r1))==abs(v-fe5m2_to_float32(r2))`
`494`	`515`	`raiseAssertionError(`
`495`	`516`	`f"p={p}, v={v}, "`
`496`	`517`	`f"search={r1}:{display_fe5m2(r1)}={fe5m2_to_float32(r1)} != "`
`497`		`-f"bit={r2}:{display_fe5m2(r2)}={fe5m2_to_float32(r2)}"`
	`518`	`+f"bit={r2}:{display_fe5m2(r2)}={fe5m2_to_float32(r2)} "`
	`519`	`+f"d1={v-fe4m3_to_float32(r1)} d2={v-fe5m2_to_float32(r2)} "`
	`520`	`+f"\|d1\|==\|d2\|={ex}"`
`498`	`521`	`)`
`499`	`522`
`500`	`523`	`deftest_float32_to_fe4m3fn_inf(self):`
`@@ -1152,13 +1175,50 @@ def test_float8_e5m2fnuz_negative_nan(self):`
`1152`	`1175`	`self.assertTrue(numpy.isnan(back))`
`1153`	`1176`
`1154`	`1177`	`deftest_fe4m3fn_to_float32_bug(self):`
`1155`		`-cases= [(1.8131605,1.875)]`
`1156`		`-forval,expectedincases:`
`1157`		`-withself.subTest(value=val,expected=expected):`
`1158`		`-res=fe4m3_to_float32(search_float32_into_fe4m3(val))`
`1159`		`-self.assertEqual(expected,res)`
`1160`		`-res=fe4m3_to_float32(float32_to_fe4m3(val))`
`1161`		`-self.assertEqual(expected,res)`
	`1178`	`+cases= [`
	`1179`	`+ (0.00439453125,0.00390625,TensorProto.FLOAT8E4M3FN),`
	`1180`	`+ (0.005859375,0.005859375,TensorProto.FLOAT8E4M3FN),`
	`1181`	`+ (0.005759375,0.005859375,TensorProto.FLOAT8E4M3FN),`
	`1182`	`+ (0.0046875,0.00390625,TensorProto.FLOAT8E4M3FN),`
	`1183`	`+ (0.001953125,0.001953125,TensorProto.FLOAT8E4M3FN),`
	`1184`	`+ (0.0029296875,0.00390625,TensorProto.FLOAT8E4M3FN),`
	`1185`	`+ (0.002053125,0.001953125,TensorProto.FLOAT8E4M3FN),`
	`1186`	`+ (0.00234375,0.001953125,TensorProto.FLOAT8E4M3FN),`
	`1187`	`+ (0.0087890625,0.0078125,TensorProto.FLOAT8E4M3FN),`
	`1188`	`+ (0.001171875,0.001953125,TensorProto.FLOAT8E4M3FN),`
	`1189`	`+ (1.8131605,1.875,TensorProto.FLOAT8E4M3FN),`
	`1190`	`+ (-100,-96,TensorProto.FLOAT8E4M3FNUZ),`
	`1191`	`+ (416,384,TensorProto.FLOAT8E5M2FNUZ),`
	`1192`	`+ ]`
	`1193`	`+forval,expected,ptincases:`
	`1194`	`+withself.subTest(value=val,expected=expected,proto=pt):`
	`1195`	`+ifpt==TensorProto.FLOAT8E4M3FN:`
	`1196`	`+res=fe4m3_to_float32(search_float32_into_fe4m3(val))`
	`1197`	`+self.assertEqual(expected,res)`
	`1198`	`+res=fe4m3_to_float32(float32_to_fe4m3(val))`
	`1199`	`+self.assertEqual(expected,res)`
	`1200`	`+continue`
	`1201`	`+ifpt==TensorProto.FLOAT8E4M3FNUZ:`
	`1202`	`+res=fe4m3_to_float32(`
	`1203`	`+search_float32_into_fe4m3(val,uz=True),uz=True`
	`1204`	`+ )`
	`1205`	`+self.assertEqual(expected,res)`
	`1206`	`+res=fe4m3_to_float32(float32_to_fe4m3(val,uz=True),uz=True)`
	`1207`	`+self.assertEqual(expected,res)`
	`1208`	`+continue`
	`1209`	`+ifpt==TensorProto.FLOAT8E5M2FNUZ:`
	`1210`	`+res=fe5m2_to_float32(`
	`1211`	`+search_float32_into_fe5m2(val,fn=True,uz=True),`
	`1212`	`+fn=True,`
	`1213`	`+uz=True,`
	`1214`	`+ )`
	`1215`	`+self.assertEqual(expected,res)`
	`1216`	`+res=fe5m2_to_float32(`
	`1217`	`+float32_to_fe5m2(val,fn=True,uz=True),fn=True,uz=True`
	`1218`	`+ )`
	`1219`	`+self.assertEqual(expected,res)`
	`1220`	`+continue`
	`1221`	`+raiseAssertionError(f"Unexpected value for pt={pt}.")`
`1162`	`1222`
`1163`	`1223`
`1164`	`1224`	`if__name__=="__main__":`

`‎onnx_array_api/validation/f8.py`

Lines changed: 74 additions & 52 deletions

Original file line number	Diff line number	Diff line change
`@@ -399,10 +399,9 @@ def find_closest_value(value, sorted_values):`
`399`	`399`	`ifd1<d2:`
`400`	`400`	`returnsorted_values[a][1]`
`401`	`401`	`ifd1==d2:`
`402`		`-raiseUndefinedCastError(`
`403`		`-f"Unable to cast{value}, d1={d1}, d2={d2}, "`
`404`		`-f"options are{sorted_values[a][1]} and{sorted_values[b][1]}."`
`405`		`- )`
	`402`	`+# Applies rule tie to even`
	`403`	`+ca,cb=sorted_values[a][1],sorted_values[b][1]`
	`404`	`+returncbifca&1==1elseca`
`406`	`405`	`returnsorted_values[b][1]`
`407`	`406`	`returnsorted_values[a][1]`
`408`	`407`
`@@ -520,28 +519,35 @@ def float32_to_fe4m3(x, fn: bool = True, uz: bool = False, saturate: bool = True`
`520`	`519`	`ife<116:`
`521`	`520`	`pass`
`522`	`521`	`elife<117:`
`523`		`-ret\|=1`
	`522`	`+# first positive number`
	`523`	`+ifm>0:`
	`524`	`+ret\|=1`
`524`	`525`	`if (m>>23)&1:`
`525`	`526`	`# rounding`
`526`	`527`	`ret+=1`
`527`		`-elife<120:# 127 - 8 + 1`
`528`		`-d=119-e`
`529`		`-ret\|=1<< (2-d)`
`530`		`-ret\|=m>> (21+d)`
`531`		`-if (m>> (20+d))&1:`
	`528`	`+elife<120:`
	`529`	`+# denormalized number`
	`530`	`+ex=e-119`
	`531`	`+ret\|=1<< (2+ex)`
	`532`	`+ret\|=m>> (21-ex)`
	`533`	`+mask=1<< (20-ex)`
	`534`	`+ifm&maskand (`
	`535`	`+ret&1`
	`536`	`+orm& (mask-1)>0`
	`537`	`+or (m&maskandm& (mask<<1)andm& (mask-1)==0)`
	`538`	`+ ):`
`532`	`539`	`# rounding`
`533`	`540`	`ret+=1`
`534`		`-elife<135:# 127 + 8`
	`541`	`+elife<135:`
	`542`	`+# normalized number`
`535`	`543`	`ex=e-119# 127 - 8`
`536`	`544`	`ifex==0:`
`537`	`545`	`ret\|=0x4`
`538`	`546`	`ret\|=m>>21`
`539`	`547`	`else:`
`540`	`548`	`ret\|=ex<<3`
`541`	`549`	`ret\|=m>>20`
`542`		`-if (m&0x80000)and (`
`543`		`- (m&0x100000)or (m&0x7FFFF)`
`544`		`- ):# round to nearest even`
	`550`	`+ifm&0x80000and ((m&0x100000)or (m&0x7FFFF)):`
`545`	`551`	`if (ret&0x7F)<0x7F:`
`546`	`552`	`# rounding`
`547`	`553`	`ret+=1`
`@@ -569,19 +575,25 @@ def float32_to_fe4m3(x, fn: bool = True, uz: bool = False, saturate: bool = True`
`569`	`575`	`ife<117:`
`570`	`576`	`pass`
`571`	`577`	`elife<118:`
`572`		`-ret\|=1`
`573`		`-if (m>>23)&1:`
`574`		`-# rounding`
`575`		`-ret+=1`
`576`		`-elife<121:# 127 - 7 + 1`
`577`		`-d=120-e`
`578`		`-ret\|=1<< (2-d)`
`579`		`-ret\|=m>> (21+d)`
`580`		`-if (m>> (20+d))&1:`
	`578`	`+# first positive number`
	`579`	`+ifm>0:`
	`580`	`+ret\|=1`
	`581`	`+elife<121:`
	`582`	`+# denormalized number`
	`583`	`+ex=e-120`
	`584`	`+ret\|=1<< (2+ex)`
	`585`	`+ret\|=m>> (21-ex)`
	`586`	`+mask=1<< (20-ex)`
	`587`	`+ifm&maskand (`
	`588`	`+ret&1`
	`589`	`+orm& (mask-1)>0`
	`590`	`+or (m&maskandm& (mask<<1)andm& (mask-1)==0)`
	`591`	`+ ):`
`581`	`592`	`# rounding`
`582`	`593`	`ret+=1`
`583`		`-elife<136:# 127 + 8 + 1`
`584`		`-ex=e-120# 127 - 7`
	`594`	`+elife<136:`
	`595`	`+# normalized number`
	`596`	`+ex=e-120`
`585`	`597`	`ifex==0:`
`586`	`598`	`ret\|=0x4`
`587`	`599`	`ret\|=m>>21`
`@@ -590,9 +602,7 @@ def float32_to_fe4m3(x, fn: bool = True, uz: bool = False, saturate: bool = True`
`590`	`602`	`ret\|=m>>20`
`591`	`603`	`if (ret&0x7F)==0x7F:`
`592`	`604`	`ret&=0xFE`
`593`		`-if (m&0x80000)and (`
`594`		`- (m&0x100000)or (m&0x7FFFF)`
`595`		`- ):# round to nearest even`
	`605`	`+if (m&0x80000)and ((m&0x100000)or (m&0x7FFFF)):`
`596`	`606`	`if (ret&0x7F)<0x7E:`
`597`	`607`	`# rounding`
`598`	`608`	`ret+=1`
`@@ -633,25 +643,31 @@ def float32_to_fe5m2(x, fn: bool = False, uz: bool = False, saturate: bool = Tru`
`633`	`643`	`ife<109:`
`634`	`644`	`pass`
`635`	`645`	`elife<110:`
`636`		`-ret\|=1`
	`646`	`+# first positive number`
	`647`	`+ifm>0:`
	`648`	`+ret\|=1`
`637`	`649`	`if (m>>23)&1:`
`638`	`650`	`# rounding`
`639`		`-# may be unused`
`640`	`651`	`ret+=1`
`641`		`-elife<112:# 127 - 16 + 1`
`642`		`-d=111-e`
`643`		`-ret\|=1<< (1-d)`
`644`		`-ret\|=m>> (22+d)`
`645`		`-if (m>> (21+d))&1:`
	`652`	`+elife<112:`
	`653`	`+# denormlized number`
	`654`	`+ex=e-111`
	`655`	`+ret\|=1<< (1+ex)`
	`656`	`+ret\|=m>> (22-ex)`
	`657`	`+mask=1<< (21-ex)`
	`658`	`+ifm&maskand (`
	`659`	`+ret&1`
	`660`	`+orm& (mask-1)>0`
	`661`	`+or (m&maskandm& (mask<<1)andm& (mask-1)==0)`
	`662`	`+ ):`
`646`	`663`	`# rounding`
`647`	`664`	`ret+=1`
`648`		`-elife<143:# 127 + 15 + 1`
`649`		`-ex=e-111# 127 - 16`
	`665`	`+elife<143:`
	`666`	`+# normalized number`
	`667`	`+ex=e-111`
`650`	`668`	`ret\|=ex<<2`
`651`	`669`	`ret\|=m>>21`
`652`		`-ifm&0x100000and (`
`653`		`- (m&0xFFFFF)or (m&0x200000)`
`654`		`- ):# round to nearest even`
	`670`	`+ifm&0x100000and ((m&0xFFFFF)or (m&0x200000)):`
`655`	`671`	`if (ret&0x7F)<0x7F:`
`656`	`672`	`# rounding`
`657`	`673`	`ret+=1`
`@@ -681,25 +697,31 @@ def float32_to_fe5m2(x, fn: bool = False, uz: bool = False, saturate: bool = Tru`
`681`	`697`	`ife<110:`
`682`	`698`	`pass`
`683`	`699`	`elife<111:`
`684`		`-ret\|=1`
	`700`	`+# first positive number`
	`701`	`+ifm>0:`
	`702`	`+ret\|=1`
`685`	`703`	`if (m>>23)&1:`
`686`	`704`	`# rounding`
`687`		`-# may be unused`
`688`	`705`	`ret+=1`
`689`		`-elife<113:# 127 - 15 + 1`
`690`		`-d=112-e`
`691`		`-ret\|=1<< (1-d)`
`692`		`-ret\|=m>> (22+d)`
`693`		`-if (m>> (21+d))&1:`
	`706`	`+elife<113:`
	`707`	`+# denormlized number`
	`708`	`+ex=e-112`
	`709`	`+ret\|=1<< (1+ex)`
	`710`	`+ret\|=m>> (22-ex)`
	`711`	`+mask=1<< (21-ex)`
	`712`	`+ifm&maskand (`
	`713`	`+ret&1`
	`714`	`+orm& (mask-1)>0`
	`715`	`+or (m&maskandm& (mask<<1)andm& (mask-1)==0)`
	`716`	`+ ):`
`694`	`717`	`# rounding`
`695`	`718`	`ret+=1`
`696`		`-elife<143:# 127 + 15 + 1`
`697`		`-ex=e-112# 127 - 15`
	`719`	`+elife<143:`
	`720`	`+# normalized number`
	`721`	`+ex=e-112`
`698`	`722`	`ret\|=ex<<2`
`699`	`723`	`ret\|=m>>21`
`700`		`-ifm&0x100000and (`
`701`		`- (m&0xFFFFF)or (m&0x200000)`
`702`		`- ):# round to nearest even`
	`724`	`+ifm&0x100000and ((m&0xFFFFF)or (m&0x200000)):`
`703`	`725`	`if (ret&0x7F)<0x7B:`
`704`	`726`	`# rounding`
`705`	`727`	`ret+=1`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commit f7bc922

File tree

2 files changed

2 files changed

`‎_unittests/ut_validation/test_f8.py`

`‎onnx_array_api/validation/f8.py`

0 commit comments