Mark d2d function as unsafe #34

kitcatier · 2023-04-22T02:09:42Z

This Pull Request fixes/closes #{issue_num}.

It changes the following:

Lines 89 to 300 in c15c208

    
           pub fn d2d(ieee_mantissa: u64, ieee_exponent: u32) -> FloatingDecimal64 { 
        
               let (e2, m2) = if ieee_exponent == 0 { 
        
                   ( 
        
                       // We subtract 2 so that the bounds computation has 2 additional bits. 
        
                       1 - DOUBLE_BIAS - DOUBLE_MANTISSA_BITS as i32 - 2, 
        
                       ieee_mantissa, 
        
                   ) 
        
               } else { 
        
                   ( 
        
                       ieee_exponent as i32 - DOUBLE_BIAS - DOUBLE_MANTISSA_BITS as i32 - 2, 
        
                       (1u64 << DOUBLE_MANTISSA_BITS) | ieee_mantissa, 
        
                   ) 
        
               }; 
        
               let even = (m2 & 1) == 0; 
        
               let accept_bounds = even; 
        
               // Step 2: Determine the interval of valid decimal representations. 
        
               let mv = 4 * m2; 
        
               // Implicit bool -> int conversion. True is 1, false is 0. 
        
               let mm_shift = (ieee_mantissa != 0 || ieee_exponent <= 1) as u32; 
        
               // We would compute mp and mm like this: 
        
               // uint64_t mp = 4 * m2 + 2; 
        
               // uint64_t mm = mv - 1 - mm_shift; 
        
               // Step 3: Convert to a decimal power base using 128-bit arithmetic. 
        
               let mut vr: u64; 
        
               let mut vp: u64; 
        
               let mut vm: u64; 
        
               let mut vp_uninit: MaybeUninit<u64> = MaybeUninit::uninit(); 
        
               let mut vm_uninit: MaybeUninit<u64> = MaybeUninit::uninit(); 
        
               let e10: i32; 
        
               let mut vm_is_trailing_zeros = false; 
        
               let mut vr_is_trailing_zeros = false; 
        
               if e2 >= 0 { 
        
                   // I tried special-casing q == 0, but there was no effect on performance. 
        
                   // This expression is slightly faster than max(0, log10_pow2(e2) - 1). 
        
                   let q = log10_pow2(e2) - (e2 > 3) as u32; 
        
                   e10 = q as i32; 
        
                   let k = DOUBLE_POW5_INV_BITCOUNT + pow5bits(q as i32) - 1; 
        
                   let i = -e2 + q as i32 + k; 
        
                   vr = unsafe { 
        
                       mul_shift_all_64( 
        
                           m2, 
        
                           #[cfg(feature = "small")] 
        
                           &compute_inv_pow5(q), 
        
                           #[cfg(not(feature = "small"))] 
        
                           { 
        
                               debug_assert!(q < DOUBLE_POW5_INV_SPLIT.len() as u32); 
        
                               DOUBLE_POW5_INV_SPLIT.get_unchecked(q as usize) 
        
                           }, 
        
                           i as u32, 
        
                           vp_uninit.as_mut_ptr(), 
        
                           vm_uninit.as_mut_ptr(), 
        
                           mm_shift, 
        
                       ) 
        
                   }; 
        
                   vp = unsafe { vp_uninit.assume_init() }; 
        
                   vm = unsafe { vm_uninit.assume_init() }; 
        
                   if q <= 21 { 
        
                       // This should use q <= 22, but I think 21 is also safe. Smaller values 
        
                       // may still be safe, but it's more difficult to reason about them. 
        
                       // Only one of mp, mv, and mm can be a multiple of 5, if any. 
        
                       let mv_mod5 = (mv as u32).wrapping_sub(5u32.wrapping_mul(div5(mv) as u32)); 
        
                       if mv_mod5 == 0 { 
        
                           vr_is_trailing_zeros = multiple_of_power_of_5(mv, q); 
        
                       } else if accept_bounds { 
        
                           // Same as min(e2 + (~mm & 1), pow5_factor(mm)) >= q 
        
                           // <=> e2 + (~mm & 1) >= q && pow5_factor(mm) >= q 
        
                           // <=> true && pow5_factor(mm) >= q, since e2 >= q. 
        
                           vm_is_trailing_zeros = multiple_of_power_of_5(mv - 1 - mm_shift as u64, q); 
        
                       } else { 
        
                           // Same as min(e2 + 1, pow5_factor(mp)) >= q. 
        
                           vp -= multiple_of_power_of_5(mv + 2, q) as u64; 
        
                       } 
        
                   } 
        
               } else { 
        
                   // This expression is slightly faster than max(0, log10_pow5(-e2) - 1). 
        
                   let q = log10_pow5(-e2) - (-e2 > 1) as u32; 
        
                   e10 = q as i32 + e2; 
        
                   let i = -e2 - q as i32; 
        
                   let k = pow5bits(i) - DOUBLE_POW5_BITCOUNT; 
        
                   let j = q as i32 - k; 
        
                   vr = unsafe { 
        
                       mul_shift_all_64( 
        
                           m2, 
        
                           #[cfg(feature = "small")] 
        
                           &compute_pow5(i as u32), 
        
                           #[cfg(not(feature = "small"))] 
        
                           { 
        
                               debug_assert!(i < DOUBLE_POW5_SPLIT.len() as i32); 
        
                               DOUBLE_POW5_SPLIT.get_unchecked(i as usize) 
        
                           }, 
        
                           j as u32, 
        
                           vp_uninit.as_mut_ptr(), 
        
                           vm_uninit.as_mut_ptr(), 
        
                           mm_shift, 
        
                       ) 
        
                   }; 
        
                   vp = unsafe { vp_uninit.assume_init() }; 
        
                   vm = unsafe { vm_uninit.assume_init() }; 
        
                   if q <= 1 { 
        
                       // {vr,vp,vm} is trailing zeros if {mv,mp,mm} has at least q trailing 0 bits. 
        
                       // mv = 4 * m2, so it always has at least two trailing 0 bits. 
        
                       vr_is_trailing_zeros = true; 
        
                       if accept_bounds { 
        
                           // mm = mv - 1 - mm_shift, so it has 1 trailing 0 bit iff mm_shift == 1. 
        
                           vm_is_trailing_zeros = mm_shift == 1; 
        
                       } else { 
        
                           // mp = mv + 2, so it always has at least one trailing 0 bit. 
        
                           vp -= 1; 
        
                       } 
        
                   } else if q < 63 { 
        
                       // TODO(ulfjack): Use a tighter bound here. 
        
                       // We want to know if the full product has at least q trailing zeros. 
        
                       // We need to compute min(p2(mv), p5(mv) - e2) >= q 
        
                       // <=> p2(mv) >= q && p5(mv) - e2 >= q 
        
                       // <=> p2(mv) >= q (because -e2 >= q) 
        
                       vr_is_trailing_zeros = multiple_of_power_of_2(mv, q); 
        
                   } 
        
               } 
        
               // Step 4: Find the shortest decimal representation in the interval of valid representations. 
        
               let mut removed = 0i32; 
        
               let mut last_removed_digit = 0u8; 
        
               // On average, we remove ~2 digits. 
        
               let output = if vm_is_trailing_zeros || vr_is_trailing_zeros { 
        
                   // General case, which happens rarely (~0.7%). 
        
                   loop { 
        
                       let vp_div10 = div10(vp); 
        
                       let vm_div10 = div10(vm); 
        
                       if vp_div10 <= vm_div10 { 
        
                           break; 
        
                       } 
        
                       let vm_mod10 = (vm as u32).wrapping_sub(10u32.wrapping_mul(vm_div10 as u32)); 
        
                       let vr_div10 = div10(vr); 
        
                       let vr_mod10 = (vr as u32).wrapping_sub(10u32.wrapping_mul(vr_div10 as u32)); 
        
                       vm_is_trailing_zeros &= vm_mod10 == 0; 
        
                       vr_is_trailing_zeros &= last_removed_digit == 0; 
        
                       last_removed_digit = vr_mod10 as u8; 
        
                       vr = vr_div10; 
        
                       vp = vp_div10; 
        
                       vm = vm_div10; 
        
                       removed += 1; 
        
                   } 
        
                   if vm_is_trailing_zeros { 
        
                       loop { 
        
                           let vm_div10 = div10(vm); 
        
                           let vm_mod10 = (vm as u32).wrapping_sub(10u32.wrapping_mul(vm_div10 as u32)); 
        
                           if vm_mod10 != 0 { 
        
                               break; 
        
                           } 
        
                           let vp_div10 = div10(vp); 
        
                           let vr_div10 = div10(vr); 
        
                           let vr_mod10 = (vr as u32).wrapping_sub(10u32.wrapping_mul(vr_div10 as u32)); 
        
                           vr_is_trailing_zeros &= last_removed_digit == 0; 
        
                           last_removed_digit = vr_mod10 as u8; 
        
                           vr = vr_div10; 
        
                           vp = vp_div10; 
        
                           vm = vm_div10; 
        
                           removed += 1; 
        
                       } 
        
                   } 
        
                   if vr_is_trailing_zeros && last_removed_digit == 5 && vr % 2 == 0 { 
        
                       // Round even if the exact number is .....50..0. 
        
                       last_removed_digit = 4; 
        
                   } 
        
                   // We need to take vr + 1 if vr is outside bounds or we need to round up. 
        
                   vr + ((vr == vm && (!accept_bounds || !vm_is_trailing_zeros)) || last_removed_digit >= 5) 
        
                       as u64 
        
               } else { 
        
                   // Specialized for the common case (~99.3%). Percentages below are relative to this. 
        
                   let mut round_up = false; 
        
                   let vp_div100 = div100(vp); 
        
                   let vm_div100 = div100(vm); 
        
                   // Optimization: remove two digits at a time (~86.2%). 
        
                   if vp_div100 > vm_div100 { 
        
                       let vr_div100 = div100(vr); 
        
                       let vr_mod100 = (vr as u32).wrapping_sub(100u32.wrapping_mul(vr_div100 as u32)); 
        
                       round_up = vr_mod100 >= 50; 
        
                       vr = vr_div100; 
        
                       vp = vp_div100; 
        
                       vm = vm_div100; 
        
                       removed += 2; 
        
                   } 
        
                   // Loop iterations below (approximately), without optimization above: 
        
                   // 0: 0.03%, 1: 13.8%, 2: 70.6%, 3: 14.0%, 4: 1.40%, 5: 0.14%, 6+: 0.02% 
        
                   // Loop iterations below (approximately), with optimization above: 
        
                   // 0: 70.6%, 1: 27.8%, 2: 1.40%, 3: 0.14%, 4+: 0.02% 
        
                   loop { 
        
                       let vp_div10 = div10(vp); 
        
                       let vm_div10 = div10(vm); 
        
                       if vp_div10 <= vm_div10 { 
        
                           break; 
        
                       } 
        
                       let vr_div10 = div10(vr); 
        
                       let vr_mod10 = (vr as u32).wrapping_sub(10u32.wrapping_mul(vr_div10 as u32)); 
        
                       round_up = vr_mod10 >= 5; 
        
                       vr = vr_div10; 
        
                       vp = vp_div10; 
        
                       vm = vm_div10; 
        
                       removed += 1; 
        
                   } 
        
                   // We need to take vr + 1 if vr is outside bounds or we need to round up. 
        
                   vr + (vr == vm || round_up) as u64 
        
               }; 
        
               let exp = e10 + removed; 
        
               FloatingDecimal64 { 
        
                   exponent: exp, 
        
                   mantissa: output, 
        
               } 
        
           }

@jasonwilliams Hello, in the above test case, the function has a ’attempt to subtract with overflow’ panicked.

    let _ = d2d(0, 0);

thread 'main' panicked at 'attempt to subtract with overflow'
This function should be marked as unsafe, or subtract using wrapping_sub()

Razican · 2023-04-22T03:08:48Z

Hello,
A panic is never unsafe. Did you find any memory safety?

Rust by default, panics on overflow/under flow on debug mode, and silently wraps on release mode.

You have the non-panicking alternatives if needed, but a panicking function should never be marked as unsafe if it cannot break memory safety.

As an example, if you try to divide by zero in 100% safe Rust, you'll get a panic, which safely unwinds the stack.

An option could be to have a non-panicking alternative, if needed, and document the panic, since I guess 0, 0 are a non-supported combination of parameters and an expected panic for mis-usage of the function. @HalidOdat can maybe confirm.

kitcatier · 2023-04-22T07:29:49Z

Hello, A panic is never unsafe. Did you find any memory safety?

Rust by default, panics on overflow/under flow on debug mode, and silently wraps on release mode.

You have the non-panicking alternatives if needed, but a panicking function should never be marked as unsafe if it cannot break memory safety.

As an example, if you try to divide by zero in 100% safe Rust, you'll get a panic, which safely unwinds the stack.

An option could be to have a non-panicking alternative, if needed, and document the panic, since I guess 0, 0 are a non-supported combination of parameters and an expected panic for mis-usage of the function. @HalidOdat can maybe confirm.

I see, thank you for your answer

HalidOdat · 2023-04-23T10:29:55Z

It is always checked in the format64 function that they are not zero before calling d2d, so the panic will never occur.

Razican · 2023-04-23T17:15:09Z

It is always checked in the format64 function that they are not zero before calling d2d, so the panic will never occur.

Should we add a "Panics" documentation section in d2d?

HalidOdat · 2023-05-04T20:19:34Z

Should we add a "Panics" documentation section in d2d?

Will add this comment on #35 , so closing this :)

Mark d2d function as unsafe

2dc33ee

HalidOdat closed this May 4, 2023

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Mark d2d function as unsafe #34

Mark d2d function as unsafe #34

kitcatier commented Apr 22, 2023 •

edited

Loading

Razican commented Apr 22, 2023

kitcatier commented Apr 22, 2023

HalidOdat commented Apr 23, 2023

Razican commented Apr 23, 2023

HalidOdat commented May 4, 2023

	pub fn d2d(ieee_mantissa: u64, ieee_exponent: u32) -> FloatingDecimal64 {
	let (e2, m2) = if ieee_exponent == 0 {
	(
	// We subtract 2 so that the bounds computation has 2 additional bits.
	1 - DOUBLE_BIAS - DOUBLE_MANTISSA_BITS as i32 - 2,
	ieee_mantissa,
	)
	} else {
	(
	ieee_exponent as i32 - DOUBLE_BIAS - DOUBLE_MANTISSA_BITS as i32 - 2,
	(1u64 << DOUBLE_MANTISSA_BITS) \| ieee_mantissa,
	)
	};
	let even = (m2 & 1) == 0;
	let accept_bounds = even;

	// Step 2: Determine the interval of valid decimal representations.
	let mv = 4 * m2;
	// Implicit bool -> int conversion. True is 1, false is 0.
	let mm_shift = (ieee_mantissa != 0 \|\| ieee_exponent <= 1) as u32;
	// We would compute mp and mm like this:
	// uint64_t mp = 4 * m2 + 2;
	// uint64_t mm = mv - 1 - mm_shift;

	// Step 3: Convert to a decimal power base using 128-bit arithmetic.
	let mut vr: u64;
	let mut vp: u64;
	let mut vm: u64;
	let mut vp_uninit: MaybeUninit<u64> = MaybeUninit::uninit();
	let mut vm_uninit: MaybeUninit<u64> = MaybeUninit::uninit();
	let e10: i32;
	let mut vm_is_trailing_zeros = false;
	let mut vr_is_trailing_zeros = false;
	if e2 >= 0 {
	// I tried special-casing q == 0, but there was no effect on performance.
	// This expression is slightly faster than max(0, log10_pow2(e2) - 1).
	let q = log10_pow2(e2) - (e2 > 3) as u32;
	e10 = q as i32;
	let k = DOUBLE_POW5_INV_BITCOUNT + pow5bits(q as i32) - 1;
	let i = -e2 + q as i32 + k;
	vr = unsafe {
	mul_shift_all_64(
	m2,
	#[cfg(feature = "small")]
	&compute_inv_pow5(q),
	#[cfg(not(feature = "small"))]
	{
	debug_assert!(q < DOUBLE_POW5_INV_SPLIT.len() as u32);
	DOUBLE_POW5_INV_SPLIT.get_unchecked(q as usize)
	},
	i as u32,
	vp_uninit.as_mut_ptr(),
	vm_uninit.as_mut_ptr(),
	mm_shift,
	)
	};
	vp = unsafe { vp_uninit.assume_init() };
	vm = unsafe { vm_uninit.assume_init() };
	if q <= 21 {
	// This should use q <= 22, but I think 21 is also safe. Smaller values
	// may still be safe, but it's more difficult to reason about them.
	// Only one of mp, mv, and mm can be a multiple of 5, if any.
	let mv_mod5 = (mv as u32).wrapping_sub(5u32.wrapping_mul(div5(mv) as u32));
	if mv_mod5 == 0 {
	vr_is_trailing_zeros = multiple_of_power_of_5(mv, q);
	} else if accept_bounds {
	// Same as min(e2 + (~mm & 1), pow5_factor(mm)) >= q
	// <=> e2 + (~mm & 1) >= q && pow5_factor(mm) >= q
	// <=> true && pow5_factor(mm) >= q, since e2 >= q.
	vm_is_trailing_zeros = multiple_of_power_of_5(mv - 1 - mm_shift as u64, q);
	} else {
	// Same as min(e2 + 1, pow5_factor(mp)) >= q.
	vp -= multiple_of_power_of_5(mv + 2, q) as u64;
	}
	}
	} else {
	// This expression is slightly faster than max(0, log10_pow5(-e2) - 1).
	let q = log10_pow5(-e2) - (-e2 > 1) as u32;
	e10 = q as i32 + e2;
	let i = -e2 - q as i32;
	let k = pow5bits(i) - DOUBLE_POW5_BITCOUNT;
	let j = q as i32 - k;
	vr = unsafe {
	mul_shift_all_64(
	m2,
	#[cfg(feature = "small")]
	&compute_pow5(i as u32),
	#[cfg(not(feature = "small"))]
	{
	debug_assert!(i < DOUBLE_POW5_SPLIT.len() as i32);
	DOUBLE_POW5_SPLIT.get_unchecked(i as usize)
	},
	j as u32,
	vp_uninit.as_mut_ptr(),
	vm_uninit.as_mut_ptr(),
	mm_shift,
	)
	};
	vp = unsafe { vp_uninit.assume_init() };
	vm = unsafe { vm_uninit.assume_init() };
	if q <= 1 {
	// {vr,vp,vm} is trailing zeros if {mv,mp,mm} has at least q trailing 0 bits.
	// mv = 4 * m2, so it always has at least two trailing 0 bits.
	vr_is_trailing_zeros = true;
	if accept_bounds {
	// mm = mv - 1 - mm_shift, so it has 1 trailing 0 bit iff mm_shift == 1.
	vm_is_trailing_zeros = mm_shift == 1;
	} else {
	// mp = mv + 2, so it always has at least one trailing 0 bit.
	vp -= 1;
	}
	} else if q < 63 {
	// TODO(ulfjack): Use a tighter bound here.
	// We want to know if the full product has at least q trailing zeros.
	// We need to compute min(p2(mv), p5(mv) - e2) >= q
	// <=> p2(mv) >= q && p5(mv) - e2 >= q
	// <=> p2(mv) >= q (because -e2 >= q)
	vr_is_trailing_zeros = multiple_of_power_of_2(mv, q);
	}
	}

	// Step 4: Find the shortest decimal representation in the interval of valid representations.
	let mut removed = 0i32;
	let mut last_removed_digit = 0u8;
	// On average, we remove ~2 digits.
	let output = if vm_is_trailing_zeros \|\| vr_is_trailing_zeros {
	// General case, which happens rarely (~0.7%).
	loop {
	let vp_div10 = div10(vp);
	let vm_div10 = div10(vm);
	if vp_div10 <= vm_div10 {
	break;
	}
	let vm_mod10 = (vm as u32).wrapping_sub(10u32.wrapping_mul(vm_div10 as u32));
	let vr_div10 = div10(vr);
	let vr_mod10 = (vr as u32).wrapping_sub(10u32.wrapping_mul(vr_div10 as u32));
	vm_is_trailing_zeros &= vm_mod10 == 0;
	vr_is_trailing_zeros &= last_removed_digit == 0;
	last_removed_digit = vr_mod10 as u8;
	vr = vr_div10;
	vp = vp_div10;
	vm = vm_div10;
	removed += 1;
	}
	if vm_is_trailing_zeros {
	loop {
	let vm_div10 = div10(vm);
	let vm_mod10 = (vm as u32).wrapping_sub(10u32.wrapping_mul(vm_div10 as u32));
	if vm_mod10 != 0 {
	break;
	}
	let vp_div10 = div10(vp);
	let vr_div10 = div10(vr);
	let vr_mod10 = (vr as u32).wrapping_sub(10u32.wrapping_mul(vr_div10 as u32));
	vr_is_trailing_zeros &= last_removed_digit == 0;
	last_removed_digit = vr_mod10 as u8;
	vr = vr_div10;
	vp = vp_div10;
	vm = vm_div10;
	removed += 1;
	}
	}
	if vr_is_trailing_zeros && last_removed_digit == 5 && vr % 2 == 0 {
	// Round even if the exact number is .....50..0.
	last_removed_digit = 4;
	}
	// We need to take vr + 1 if vr is outside bounds or we need to round up.
	vr + ((vr == vm && (!accept_bounds \|\| !vm_is_trailing_zeros)) \|\| last_removed_digit >= 5)
	as u64
	} else {
	// Specialized for the common case (~99.3%). Percentages below are relative to this.
	let mut round_up = false;
	let vp_div100 = div100(vp);
	let vm_div100 = div100(vm);
	// Optimization: remove two digits at a time (~86.2%).
	if vp_div100 > vm_div100 {
	let vr_div100 = div100(vr);
	let vr_mod100 = (vr as u32).wrapping_sub(100u32.wrapping_mul(vr_div100 as u32));
	round_up = vr_mod100 >= 50;
	vr = vr_div100;
	vp = vp_div100;
	vm = vm_div100;
	removed += 2;
	}
	// Loop iterations below (approximately), without optimization above:
	// 0: 0.03%, 1: 13.8%, 2: 70.6%, 3: 14.0%, 4: 1.40%, 5: 0.14%, 6+: 0.02%
	// Loop iterations below (approximately), with optimization above:
	// 0: 70.6%, 1: 27.8%, 2: 1.40%, 3: 0.14%, 4+: 0.02%
	loop {
	let vp_div10 = div10(vp);
	let vm_div10 = div10(vm);
	if vp_div10 <= vm_div10 {
	break;
	}
	let vr_div10 = div10(vr);
	let vr_mod10 = (vr as u32).wrapping_sub(10u32.wrapping_mul(vr_div10 as u32));
	round_up = vr_mod10 >= 5;
	vr = vr_div10;
	vp = vp_div10;
	vm = vm_div10;
	removed += 1;
	}
	// We need to take vr + 1 if vr is outside bounds or we need to round up.
	vr + (vr == vm \|\| round_up) as u64
	};
	let exp = e10 + removed;

	FloatingDecimal64 {
	exponent: exp,
	mantissa: output,
	}
	}

Mark d2d function as unsafe #34

Mark d2d function as unsafe #34

Conversation

kitcatier commented Apr 22, 2023 • edited Loading

Razican commented Apr 22, 2023

kitcatier commented Apr 22, 2023

HalidOdat commented Apr 23, 2023

Razican commented Apr 23, 2023

HalidOdat commented May 4, 2023

kitcatier commented Apr 22, 2023 •

edited

Loading