CE-Programming
diff --git a/‎src/crt/dtof.src‎
Lines changed: 219 additions & 18 deletions b/‎src/crt/dtof.src‎
Lines changed: 219 additions & 18 deletions
diff --git a/‎src/softfloat/f64_to_f32.c‎
Lines changed: 0 additions & 88 deletions b/‎src/softfloat/f64_to_f32.c‎
Lines changed: 0 additions & 88 deletions
diff --git a/‎src/softfloat/include/specialize.h‎
Lines changed: 0 additions & 21 deletions b/‎src/softfloat/include/specialize.h‎
Lines changed: 0 additions & 21 deletions
@@ -1,18 +1,219 @@
-	assume	adl=1
-
-	section	.text
-
-	public	__dtof
-
-__dtof:
-	; f64_ret_f32
-	push	af, iy, bc, de, hl
-	call	___f64_to_f32
-	pop	af
-	ld	a, e
-	pop	de
-	ld	e, a
-	pop	bc, iy, af
-	ret
-
-	extern	___f64_to_f32
+	assume	adl=1
+
+	section	.text
+
+	public	__dtof
+
+	private	__dtof_helper
+__dtof_helper:
+	; This block is placed ahead of __dtof so that
+	; __dtof.ret_copysign can always be reached by jr in all paths.
+.overflow:
+	; reached from __dtof when (BC & $7FFF) >= $47F0; carry is set here
+	pop	hl	; restore the low 24 bits that __dtof pushed last
+	; A = $10 (loaded by __dtof with ld a, l)
+	add	a, c	; attempts to overflow the low 4 bits of the exponent (carry iff the upper nibble of C is $F)
+	rl	b	; (0x7F << 1) | 1 if the input is inf/NaN
+	inc	b	; B will only be zero if the input was inf/NaN
+	jr	nz, .not_inf_nan
+
+	; carry is cleared (rl b shifted out bit 7 of B, which __dtof reset)
+	adc	hl, hl	; Z iff HL bits 0-22 are zero; HL bit 23 moves into carry
+	jr	nz, .has_payload
+	ld	a, e
+	rla	; A = (E << 1) | carry
+	and	a, $3F	; non-zero iff E bits 0-4 or the carried-out HL bit 23 are set
+	jr	z, .no_payload
+.has_payload:
+	set	5, e	; ensure that NaN stays NaN (bit 5 of E lands in bit 0 after the shift by 5)
+.no_payload:
+	ld	a, c	; A = low exponent nibble and top 4 mantissa bits
+	push	de
+	pop	bc	; UBC = UDE
+	ld	l, 5
+	call	__lshru	; presumably A:UBC >>= L, result read from UBC below - confirm against __lshru
+	push	bc
+	pop	hl	; HL = shifted result
+.finish_inf_nan:
+	ld	a, $7F	; A becomes E in .ret_copysign, which also applies the sign bit
+	jr	__dtof.ret_copysign
+.not_inf_nan:
+	; finite input too large for F32: return infinity
+	ld	hl, $800000	; only bit 23 set, mantissa bits all zero
+	jr	.finish_inf_nan
+
+; Convert BC:UDE:UHL F64 to E:UHL F32 (A, BC, D and the upper byte of UDE are restored on return)
+; Rounding: round to nearest with ties to even
+; Behaviour:
+;  Underflow: Returns signed zero. No signals raised.
+;  Subnormal: No signals raised.
+;  Rounded to Infinity: No signals raised.
+;  Overflow: Returns signed infinity. No signals raised.
+;  Signaling NaN: Quiet bit preserved. No signals raised.
+;  Quiet NaN: Quiet bit preserved. No signals raised.
+;  NaN Payloads: Copies the most significant payload bits. The LSB of the mantissa is set if any payload bits were discarded by the truncation.
+__dtof:
+	bit	7, b	; Z = 1 when the sign bit is clear
+	push	af	; preserve A and signbit
+	push	bc
+	push	de
+	push	hl
+	res	7, b	; drop the sign so BC compares as a magnitude
+	ld	hl, -$3810
+	add.s	hl, bc	; carry iff BC >= $3810 (biased exponent >= $381)
+	jr	nc, .maybe_subnormal
+	ld	hl, -$47F0	; $FFB810
+	ld	a, l		; ld a, $10
+	add.s	hl, bc	; carry iff BC >= $47F0 (biased exponent >= $47F)
+	jr	c, __dtof_helper.overflow
+	; result is normal or rounds to infinity
+	; calculate new exponent
+	; we only need the low 8 bits of the exponent
+	add	hl, hl
+	add	hl, hl
+	add	hl, hl
+	add	hl, hl	; H = low 8 bits of (BC - $47F0) >> 4
+	; (-$380) - (-$47F) = $FF = -1 (mod 256), so H is one too high; it is decremented later
+	; H = exponent + 1
+	ld	l, 29		; f64_mant_bits - f32_mant_bits = 52 - 23 = 29
+	ex	(sp), hl	; (SP) = exponent/shift, HL = lo24
+
+	; clear exponent
+	dec	a	; ld	a, $0F
+	and	a, c
+	ld	c, a	; C = top 4 mantissa bits
+	xor	a, a	; A = 0 is the "do not round" flag tested after the shift
+	ld	b, a
+	; test round bit
+	bit	4, e	; highest bit below the 29-bit cut
+	jr	z, .round_down
+	; test guard bit (the bit that becomes the result LSB)
+	ld	a, e
+	and	a, $20	; A != 0 when the LSB is odd; also clears carry
+	jr	nz, .round_up
+	; test sticky bits
+	inc	a	; make A non-zero
+	adc	hl, hl	; Z iff HL bits 0-22 are zero, bit 23 -> carry; HL is presumably fully shifted out below
+	jr	nz, .round_up
+	ld	a, e
+	rla
+	and	a, $1F	; A != 0 iff E bits 0-3 or the carried-out HL bit 23 are set
+.round_up:
+.round_down:
+	call	__llshru	; presumably BC:UDE:UHL >>= 29 with the count read from the stacked L - confirm against __llshru
+	; B, C, and UDE are zero here
+	or	a, a	; A != 0 requests a round up
+	jr	z, .no_round
+	inc	hl	; does not overflow
+.no_round:
+	pop	af	; a = exponent + 1, flags = 29 = ---5H3V-C
+	sbc	a, b	; decrement exponent and clear carry (B = 0 and carry was set)
+	rra	; A = exponent >> 1, carry = exponent LSB
+	jr	nc, .even_exponent
+	ld	bc, $800000	; exponent LSB is stored in bit 23 of HL
+	add	hl, bc	; the result might be rounded to infinity here
+	adc	a, c	; adc a, 0 ; won't overflow
+.even_exponent:
+.subnormal_no_round:
+.ret_copysign:
+	pop	de	; restore the caller's UDE; E is overwritten next
+	ld	e, a	; E = result high byte without the sign
+	pop	bc
+	pop	af	; restores A and the Z flag produced by bit 7, b
+	ret	z	; input was positive
+	set	7, e	; input was negative
+	ret
+
+.ret_zero:
+	; carry is cleared
+	pop	hl	; discard the saved HL
+	xor	a, a
+	sbc	hl, hl	; HL = 0
+	jr	.ret_copysign
+
+.maybe_subnormal:
+	ld	hl, -$3690
+	add.s	hl, bc	; carry iff BC >= $3690 (biased exponent >= $369)
+	jr	nc, .ret_zero
+	; calculate shift
+	; A = (uint8_t)((BC - $3690) >> 4)
+	; A = (uint8_t)((HL << 4) >> 8)
+	add	hl, hl
+	add	hl, hl
+	add	hl, hl
+	add	hl, hl
+	; Shift = -A + 4 + 24
+	ld	a, 4 + 24
+	sub	a, h	; A = 28 - H, which is 5..28 on this path
+	; maximum shift = 24 + 4 + 25 = 24 + 29 = 53
+	; minimum shift = 24 + 4 + 1 = 24 + 5 = 29
+	ld	b, a	; loop counter for djnz
+	ld	e, a	; store shift amount
+	xor	a, a
+	; calculate sticky bits
+	sbc	hl, hl
+	inc	hl	; ld hl, 1
+.shift_loop:
+	add	hl, hl
+	adc	a, a	; A:UHL <<= 1; Z reflects A
+	djnz	.shift_loop
+	; carry won't be set
+	; set C:UDE to A:UHL
+	; shift by an additional 24 bits
+	dec	hl	; leaves flags alone, so Z below still comes from the last adc a, a
+	jr	z, .the_set_bit_is_in_hl
+	dec	a	; the set bit was in A: propagate the borrow so A:UHL = (1 << shift) - 1
+.the_set_bit_is_in_hl:
+	ld	c, a
+	ld	a, e	; restore shift amount
+	ex	de, hl
+	scf
+	sbc	hl, hl	; HL = $FFFFFF
+	; BC:UDE:UHL = (1 << (shift + 24)) - 1, the mask of the sticky bits
+	; (SP) = X (the input saved on entry)
+	call	__lland	; presumably ANDs BC:UDE:UHL with the 64-bit value on the stack - confirm against __lland
+	call	__llcmpzero	; presumably sets Z iff BC:UDE:UHL is zero - confirm against __llcmpzero
+	pop	hl
+	; DE and BC are swapped here
+	pop	bc
+	pop	de
+	push	de
+	push	bc
+
+	; clear exponent and include the implicit mantissa bit
+	ld	d, 0	; D = sticky flag; ld does not disturb Z
+	jr	z, .no_sticky_bits
+	inc	d
+.no_sticky_bits:
+
+	ld	l, a	; L = shift
+	ld	a, e	; E holds the original C after the swap
+	and	a, $0F
+	or	a, $10	; implicit mantissa bit
+
+	call	__lshru	; presumably A:UBC >>= L - confirm against __lshru
+	xor	a, a	; subnormal exponent
+	; HL = BC >> 1
+	scf
+	sbc	hl, hl	; ld hl, -1
+	add	hl, sp	; HL = SP - 1, where push bc stores the upper byte of BC
+	push	bc
+	srl	(hl)	; shift the upper byte in place on the stack
+	pop	hl
+	rr	h
+	rr	l	; round bit shifted out
+
+	jr	nc, .subnormal_no_round
+	dec	d	; Z iff the sticky flag was set
+	jr	z, .subnormal_round_up
+	bit	0, l	; exact tie: round up only when the LSB is odd
+	jr	z, .subnormal_no_round
+.subnormal_round_up:
+	inc	hl	; won't overflow, but may become FLT_MIN
+; .subnormal_no_round:
+	jr	.ret_copysign
+
+	extern	__lland
+	extern	__llcmpzero
+	extern	__llshru
+	extern	__lshru
@@ -145,15 +145,7 @@ void softfloat_f32UIToCommonNaN( uint_fast32_t uiA, struct commonNaN *zPtr );
 | Converts the common NaN pointed to by 'aPtr' into a 32-bit floating-point
 | NaN, and returns the bit pattern of this value as an unsigned integer.
 *----------------------------------------------------------------------------*/
-#if 0
 uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr );
-#else
-/** only used by f64_to_f32 currently */
-static inline uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr )
-{
-    return (uint_fast32_t) aPtr->sign<<31 | 0x7FC00000 | aPtr->v64>>41;
-}
-#endif
 
 /*----------------------------------------------------------------------------
 | Interpreting 'uiA' and 'uiB' as the bit patterns of two 32-bit floating-
@@ -186,20 +178,7 @@ bool softfloat_isSigNaNF64UI(uint64_t a) __attribute__((__const__, __nothrow__,
 | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid
 | exception is raised.
 *----------------------------------------------------------------------------*/
-#if 0
 void softfloat_f64UIToCommonNaN( uint_fast64_t uiA, struct commonNaN *zPtr );
-#else
-/** only used by f64_to_f32 currently */
-static inline void softfloat_f64UIToCommonNaN( uint_fast64_t uiA, struct commonNaN *zPtr )
-{
-    if ( softfloat_isSigNaNF64UI( uiA ) ) {
-        softfloat_raiseFlags( softfloat_flag_invalid );
-    }
-    zPtr->sign = uiA>>63;
-    zPtr->v64  = uiA<<12;
-    zPtr->v0   = 0;
-}
-#endif
 
 /*----------------------------------------------------------------------------
 | Converts the common NaN pointed to by 'aPtr' into a 64-bit floating-point