-
Notifications
You must be signed in to change notification settings - Fork 83
fix 128bits ctlz intrinsincs UB #635
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
base: master
Are you sure you want to change the base?
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change | ||||
|---|---|---|---|---|---|---|
|
|
@@ -410,43 +410,15 @@ impl<'a, 'gcc, 'tcx> IntrinsicCallBuilderMethods<'tcx> for Builder<'a, 'gcc, 'tc | |||||
| | sym::saturating_sub => { | ||||||
| match int_type_width_signed(args[0].layout.ty, self) { | ||||||
| Some((width, signed)) => match name { | ||||||
| sym::ctlz | sym::cttz => { | ||||||
| let func = self.current_func(); | ||||||
| let then_block = func.new_block("then"); | ||||||
| let else_block = func.new_block("else"); | ||||||
| let after_block = func.new_block("after"); | ||||||
|
|
||||||
| let arg = args[0].immediate(); | ||||||
| let result = func.new_local(None, self.u32_type, "zeros"); | ||||||
| let zero = self.cx.gcc_zero(arg.get_type()); | ||||||
| let cond = self.gcc_icmp(IntPredicate::IntEQ, arg, zero); | ||||||
| self.llbb().end_with_conditional(None, cond, then_block, else_block); | ||||||
|
|
||||||
| let zero_result = self.cx.gcc_uint(self.u32_type, width); | ||||||
| then_block.add_assignment(None, result, zero_result); | ||||||
| then_block.end_with_jump(None, after_block); | ||||||
|
|
||||||
| // NOTE: since jumps were added in a place | ||||||
| // count_leading_zeroes() does not expect, the current block | ||||||
| // in the state need to be updated. | ||||||
| self.switch_to_block(else_block); | ||||||
|
|
||||||
| let zeros = match name { | ||||||
| sym::ctlz => self.count_leading_zeroes(width, arg), | ||||||
| sym::cttz => self.count_trailing_zeroes(width, arg), | ||||||
| _ => unreachable!(), | ||||||
| }; | ||||||
| self.llbb().add_assignment(None, result, zeros); | ||||||
| self.llbb().end_with_jump(None, after_block); | ||||||
|
|
||||||
| // NOTE: since jumps were added in a place rustc does not | ||||||
| // expect, the current block in the state need to be updated. | ||||||
| self.switch_to_block(after_block); | ||||||
|
|
||||||
| result.to_rvalue() | ||||||
| sym::ctlz => self.count_leading_zeroes(width, args[0].immediate()), | ||||||
|
|
||||||
| sym::ctlz_nonzero => { | ||||||
| self.count_leading_zeroes_nonzero(width, args[0].immediate()) | ||||||
| } | ||||||
| sym::cttz => self.count_trailing_zeroes(width, args[0].immediate()), | ||||||
| sym::cttz_nonzero => { | ||||||
| self.count_trailing_zeroes_nonzero(width, args[0].immediate()) | ||||||
| } | ||||||
| sym::ctlz_nonzero => self.count_leading_zeroes(width, args[0].immediate()), | ||||||
| sym::cttz_nonzero => self.count_trailing_zeroes(width, args[0].immediate()), | ||||||
| sym::ctpop => self.pop_count(args[0].immediate()), | ||||||
| sym::bswap => { | ||||||
| if width == 8 { | ||||||
|
|
@@ -886,6 +858,36 @@ impl<'a, 'gcc, 'tcx> Builder<'a, 'gcc, 'tcx> { | |||||
| } | ||||||
|
|
||||||
| fn count_leading_zeroes(&mut self, width: u64, arg: RValue<'gcc>) -> RValue<'gcc> { | ||||||
| let func = self.current_func(); | ||||||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Please add a comment to this method to describe what it does (return 0 if arg is zero, otherwise call the leading_zero builtin). |
||||||
| let then_block = func.new_block("then"); | ||||||
| let else_block = func.new_block("else"); | ||||||
| let after_block = func.new_block("after"); | ||||||
|
|
||||||
| let result = func.new_local(None, self.u32_type, "zeros"); | ||||||
| let zero = self.cx.gcc_zero(arg.get_type()); | ||||||
| let cond = self.gcc_icmp(IntPredicate::IntEQ, arg, zero); | ||||||
| self.llbb().end_with_conditional(None, cond, then_block, else_block); | ||||||
|
|
||||||
| let zero_result = self.cx.gcc_uint(self.u32_type, width); | ||||||
| then_block.add_assignment(None, result, zero_result); | ||||||
| then_block.end_with_jump(None, after_block); | ||||||
|
|
||||||
| // NOTE: since jumps were added in a place count_leading_zeroes_nonzero() does not expect, | ||||||
| // the current block in the state need to be updated. | ||||||
| self.switch_to_block(else_block); | ||||||
|
|
||||||
| let zeros = self.count_leading_zeroes_nonzero(width, arg); | ||||||
| self.llbb().add_assignment(None, result, zeros); | ||||||
| self.llbb().end_with_jump(None, after_block); | ||||||
|
|
||||||
| // NOTE: since jumps were added in a place rustc does not | ||||||
| // expect, the current block in the state need to be updated. | ||||||
| self.switch_to_block(after_block); | ||||||
|
|
||||||
| result.to_rvalue() | ||||||
| } | ||||||
|
|
||||||
| fn count_leading_zeroes_nonzero(&mut self, width: u64, arg: RValue<'gcc>) -> RValue<'gcc> { | ||||||
| // TODO(antoyo): use width? | ||||||
| let arg_type = arg.get_type(); | ||||||
| let result_type = self.u32_type; | ||||||
|
|
@@ -902,51 +904,44 @@ impl<'a, 'gcc, 'tcx> Builder<'a, 'gcc, 'tcx> { | |||||
| "__builtin_clzll" | ||||||
| } | ||||||
| else if width == 128 { | ||||||
| // Algorithm from: https://stackoverflow.com/a/28433850/389119 | ||||||
| let array_type = self.context.new_array_type(None, arg_type, 3); | ||||||
| // __buildin_clzll is UB when called with 0, so call it on the 64 high bits if they are not 0, | ||||||
| // else call it on the 64 low bits and add 64. In the else case, 64 low bits can't be 0 | ||||||
| // because arg is not 0. | ||||||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Same here, please specify that arg is not 0 because we're in |
||||||
|
|
||||||
| let result = self.current_func() | ||||||
| .new_local(None, array_type, "count_loading_zeroes_results"); | ||||||
| .new_local(None, result_type, "count_leading_zeroes_results"); | ||||||
|
|
||||||
| let ctlz_then_block = self.current_func().new_block("ctlz_then"); | ||||||
| let ctlz_else_block = self.current_func().new_block("ctlz_else"); | ||||||
| let ctlz_after_block = self.current_func().new_block("ctlz_after") | ||||||
| ; | ||||||
| let sixty_four = self.const_uint(arg_type, 64); | ||||||
| let shift = self.lshr(arg, sixty_four); | ||||||
| let high = self.gcc_int_cast(shift, self.u64_type); | ||||||
| let low = self.gcc_int_cast(arg, self.u64_type); | ||||||
|
|
||||||
| let zero = self.context.new_rvalue_zero(self.usize_type); | ||||||
| let one = self.context.new_rvalue_one(self.usize_type); | ||||||
| let two = self.context.new_rvalue_from_long(self.usize_type, 2); | ||||||
|
|
||||||
| let clzll = self.context.get_builtin_function("__builtin_clzll"); | ||||||
|
|
||||||
| let first_elem = self.context.new_array_access(None, result, zero); | ||||||
| let first_value = self.gcc_int_cast(self.context.new_call(None, clzll, &[high]), arg_type); | ||||||
| self.llbb() | ||||||
| .add_assignment(self.location, first_elem, first_value); | ||||||
|
|
||||||
| let second_elem = self.context.new_array_access(self.location, result, one); | ||||||
| let cast = self.gcc_int_cast(self.context.new_call(self.location, clzll, &[low]), arg_type); | ||||||
| let second_value = self.add(cast, sixty_four); | ||||||
| self.llbb() | ||||||
| .add_assignment(self.location, second_elem, second_value); | ||||||
|
|
||||||
| let third_elem = self.context.new_array_access(self.location, result, two); | ||||||
| let third_value = self.const_uint(arg_type, 128); | ||||||
| self.llbb() | ||||||
| .add_assignment(self.location, third_elem, third_value); | ||||||
|
|
||||||
| let not_high = self.context.new_unary_op(self.location, UnaryOp::LogicalNegate, self.u64_type, high); | ||||||
| let not_low = self.context.new_unary_op(self.location, UnaryOp::LogicalNegate, self.u64_type, low); | ||||||
| let not_low_and_not_high = not_low & not_high; | ||||||
| let index = not_high + not_low_and_not_high; | ||||||
| // NOTE: the following cast is necessary to avoid a GIMPLE verification failure in | ||||||
| // gcc. | ||||||
| // TODO(antoyo): do the correct verification in libgccjit to avoid an error at the | ||||||
| // compilation stage. | ||||||
| let index = self.context.new_cast(self.location, index, self.i32_type); | ||||||
|
|
||||||
| let res = self.context.new_array_access(self.location, result, index); | ||||||
|
|
||||||
| return self.gcc_int_cast(res.to_rvalue(), result_type); | ||||||
| let zero_hi = self.const_uint(high.get_type(), 0); | ||||||
| let cond = self.gcc_icmp(IntPredicate::IntNE, high, zero_hi); | ||||||
| self.llbb().end_with_conditional(self.location, cond, ctlz_then_block, ctlz_else_block); | ||||||
| self.switch_to_block(ctlz_then_block); | ||||||
|
|
||||||
| let result_128 = | ||||||
| self.gcc_int_cast(self.context.new_call(None, clzll, &[high]), result_type); | ||||||
|
|
||||||
| ctlz_then_block.add_assignment(self.location, result, result_128); | ||||||
| ctlz_then_block.end_with_jump(self.location, ctlz_after_block); | ||||||
|
|
||||||
| self.switch_to_block(ctlz_else_block); | ||||||
| let low = self.gcc_int_cast(arg, self.u64_type); | ||||||
| let low_leading_zeroes = | ||||||
| self.gcc_int_cast(self.context.new_call(None, clzll, &[low]), result_type); | ||||||
| let sixty_four_result_type = self.const_uint(result_type, 64); | ||||||
| let result_128 = self.add(low_leading_zeroes, sixty_four_result_type); | ||||||
| ctlz_else_block.add_assignment(self.location, result, result_128); | ||||||
| ctlz_else_block.end_with_jump(self.location, ctlz_after_block); | ||||||
| self.switch_to_block(ctlz_after_block); | ||||||
| return result.to_rvalue(); | ||||||
| } | ||||||
| else { | ||||||
| let count_leading_zeroes = self.context.get_builtin_function("__builtin_clzll"); | ||||||
|
|
@@ -961,7 +956,37 @@ impl<'a, 'gcc, 'tcx> Builder<'a, 'gcc, 'tcx> { | |||||
| self.context.new_cast(self.location, res, result_type) | ||||||
| } | ||||||
|
|
||||||
| fn count_trailing_zeroes(&mut self, _width: u64, arg: RValue<'gcc>) -> RValue<'gcc> { | ||||||
| fn count_trailing_zeroes(&mut self, width: u64, arg: RValue<'gcc>) -> RValue<'gcc> { | ||||||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Most of the code of this method is duplicated with |
||||||
| let func = self.current_func(); | ||||||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Same here, please add a comment. |
||||||
| let then_block = func.new_block("then"); | ||||||
| let else_block = func.new_block("else"); | ||||||
| let after_block = func.new_block("after"); | ||||||
|
|
||||||
| let result = func.new_local(None, self.u32_type, "zeros"); | ||||||
| let zero = self.cx.gcc_zero(arg.get_type()); | ||||||
| let cond = self.gcc_icmp(IntPredicate::IntEQ, arg, zero); | ||||||
| self.llbb().end_with_conditional(None, cond, then_block, else_block); | ||||||
|
|
||||||
| let zero_result = self.cx.gcc_uint(self.u32_type, width); | ||||||
| then_block.add_assignment(None, result, zero_result); | ||||||
| then_block.end_with_jump(None, after_block); | ||||||
|
|
||||||
| // NOTE: since jumps were added in a place count_trailing_zeroes_nonzero() does not expect, | ||||||
| // the current block in the state need to be updated. | ||||||
| self.switch_to_block(else_block); | ||||||
|
|
||||||
| let zeros = self.count_trailing_zeroes_nonzero(width, arg); | ||||||
| self.llbb().add_assignment(None, result, zeros); | ||||||
| self.llbb().end_with_jump(None, after_block); | ||||||
|
|
||||||
| // NOTE: since jumps were added in a place rustc does not | ||||||
| // expect, the current block in the state need to be updated. | ||||||
| self.switch_to_block(after_block); | ||||||
|
|
||||||
| result.to_rvalue() | ||||||
| } | ||||||
|
|
||||||
| fn count_trailing_zeroes_nonzero(&mut self, _width: u64, arg: RValue<'gcc>) -> RValue<'gcc> { | ||||||
| let arg_type = arg.get_type(); | ||||||
| let result_type = self.u32_type; | ||||||
| let arg = if arg_type.is_signed(self.cx) { | ||||||
|
|
@@ -985,50 +1010,43 @@ impl<'a, 'gcc, 'tcx> Builder<'a, 'gcc, 'tcx> { | |||||
| ("__builtin_ctzll", self.cx.ulonglong_type) | ||||||
| } | ||||||
| else if arg_type.is_u128(self.cx) { | ||||||
| // Adapted from the algorithm to count leading zeroes from: https://stackoverflow.com/a/28433850/389119 | ||||||
| let array_type = self.context.new_array_type(None, arg_type, 3); | ||||||
| let result = self.current_func() | ||||||
| .new_local(None, array_type, "count_loading_zeroes_results"); | ||||||
|
|
||||||
| let sixty_four = self.gcc_int(arg_type, 64); | ||||||
| let shift = self.gcc_lshr(arg, sixty_four); | ||||||
| let high = self.gcc_int_cast(shift, self.u64_type); | ||||||
| let low = self.gcc_int_cast(arg, self.u64_type); | ||||||
| // __buildin_ctzll is UB when called with 0, so call it on the 64 low bits if they are not 0, | ||||||
| // else call it on the 64 high bits and add 64. In the else case, 64 high bits can't be 0 | ||||||
| // because arg is not 0. | ||||||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Could you please specify that arg is not 0 since we're in the case of |
||||||
|
|
||||||
| let zero = self.context.new_rvalue_zero(self.usize_type); | ||||||
| let one = self.context.new_rvalue_one(self.usize_type); | ||||||
| let two = self.context.new_rvalue_from_long(self.usize_type, 2); | ||||||
|
|
||||||
| let ctzll = self.context.get_builtin_function("__builtin_ctzll"); | ||||||
|
|
||||||
| let first_elem = self.context.new_array_access(self.location, result, zero); | ||||||
| let first_value = self.gcc_int_cast(self.context.new_call(self.location, ctzll, &[low]), arg_type); | ||||||
| self.llbb() | ||||||
| .add_assignment(self.location, first_elem, first_value); | ||||||
|
|
||||||
| let second_elem = self.context.new_array_access(self.location, result, one); | ||||||
| let second_value = self.gcc_add(self.gcc_int_cast(self.context.new_call(self.location, ctzll, &[high]), arg_type), sixty_four); | ||||||
| self.llbb() | ||||||
| .add_assignment(self.location, second_elem, second_value); | ||||||
|
|
||||||
| let third_elem = self.context.new_array_access(self.location, result, two); | ||||||
| let third_value = self.gcc_int(arg_type, 128); | ||||||
| self.llbb() | ||||||
| .add_assignment(self.location, third_elem, third_value); | ||||||
|
|
||||||
| let not_low = self.context.new_unary_op(self.location, UnaryOp::LogicalNegate, self.u64_type, low); | ||||||
| let not_high = self.context.new_unary_op(self.location, UnaryOp::LogicalNegate, self.u64_type, high); | ||||||
| let not_low_and_not_high = not_low & not_high; | ||||||
| let index = not_low + not_low_and_not_high; | ||||||
| // NOTE: the following cast is necessary to avoid a GIMPLE verification failure in | ||||||
| // gcc. | ||||||
| // TODO(antoyo): do the correct verification in libgccjit to avoid an error at the | ||||||
| // compilation stage. | ||||||
| let index = self.context.new_cast(self.location, index, self.i32_type); | ||||||
| let result = self.current_func() | ||||||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. There is also a lot duplication with |
||||||
| .new_local(None, result_type, "count_trailing_zeroes_results"); | ||||||
|
|
||||||
| let res = self.context.new_array_access(self.location, result, index); | ||||||
| let ctlz_then_block = self.current_func().new_block("cttz_then"); | ||||||
| let ctlz_else_block = self.current_func().new_block("cttz_else"); | ||||||
| let ctlz_after_block = self.current_func().new_block("cttz_after"); | ||||||
| let clzll = self.context.get_builtin_function("__builtin_ctzll"); | ||||||
|
|
||||||
| return self.gcc_int_cast(res.to_rvalue(), result_type); | ||||||
| let low = self.gcc_int_cast(arg, self.u64_type); | ||||||
| let sixty_four = self.const_uint(arg_type, 64); | ||||||
| let shift = self.lshr(arg, sixty_four); | ||||||
| let high = self.gcc_int_cast(shift, self.u64_type); | ||||||
| let zero_low = self.const_uint(low.get_type(), 0); | ||||||
| let cond = self.gcc_icmp(IntPredicate::IntNE, low, zero_low); | ||||||
| self.llbb().end_with_conditional(self.location, cond, ctlz_then_block, ctlz_else_block); | ||||||
| self.switch_to_block(ctlz_then_block); | ||||||
|
|
||||||
| let result_128 = | ||||||
| self.gcc_int_cast(self.context.new_call(None, clzll, &[low]), result_type); | ||||||
|
|
||||||
| ctlz_then_block.add_assignment(self.location, result, result_128); | ||||||
| ctlz_then_block.end_with_jump(self.location, ctlz_after_block); | ||||||
|
|
||||||
| self.switch_to_block(ctlz_else_block); | ||||||
| let high_leading_zeroes = | ||||||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I believe you mean:
Suggested change
|
||||||
| self.gcc_int_cast(self.context.new_call(None, clzll, &[high]), result_type); | ||||||
|
|
||||||
| let sixty_four_result_type = self.const_uint(result_type, 64); | ||||||
| let result_128 = self.add(high_leading_zeroes, sixty_four_result_type); | ||||||
| ctlz_else_block.add_assignment(self.location, result, result_128); | ||||||
| ctlz_else_block.end_with_jump(self.location, ctlz_after_block); | ||||||
| self.switch_to_block(ctlz_after_block); | ||||||
| return result.to_rvalue(); | ||||||
| } | ||||||
| else { | ||||||
| let count_trailing_zeroes = self.context.get_builtin_function("__builtin_ctzll"); | ||||||
|
|
||||||
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Is there a UI test that tests this and now pass?
If not, could you please add a test in tests/run?