@@ -135,15 +135,15 @@ static Value *runtime_sym_lookup(
135
135
BasicBlock *dlsym_lookup = BasicBlock::Create (jl_LLVMContext, " dlsym" );
136
136
BasicBlock *ccall_bb = BasicBlock::Create (jl_LLVMContext, " ccall" );
137
137
Constant *initnul = ConstantPointerNull::get ((PointerType*)T_pvoidfunc);
138
- LoadInst *llvmf_orig = irbuilder.CreateAlignedLoad (llvmgv, sizeof (void *));
138
+ LoadInst *llvmf_orig = irbuilder.CreateAlignedLoad (T_pvoidfunc, llvmgv, sizeof (void *));
139
139
// This in principle needs a consume ordering so that load from
140
140
// this pointer sees a valid value. However, this is not supported by
141
141
// LLVM (or agreed on in the C/C++ standard FWIW) and should be
142
142
// almost impossible to happen on every platform we support since this
143
143
// ordering is enforced by the hardware and LLVM has to speculate an
144
144
// invalid load from the `cglobal` but doesn't depend on the `cglobal`
145
145
// value for this to happen.
146
- // llvmf_orig->setAtomic(AtomicOrdering::Consume );
146
+ llvmf_orig->setAtomic (AtomicOrdering::Unordered );
147
147
irbuilder.CreateCondBr (
148
148
irbuilder.CreateICmpNE (llvmf_orig, initnul),
149
149
ccall_bb,
@@ -162,7 +162,7 @@ static Value *runtime_sym_lookup(
162
162
}
163
163
Value *llvmf = irbuilder.CreateCall (prepare_call_in (jl_builderModule (irbuilder), jldlsym_func),
164
164
{ libname, stringConstPtr (irbuilder, f_name), libptrgv });
165
- auto store = irbuilder.CreateAlignedStore (llvmf, llvmgv, sizeof (void *));
165
+ StoreInst * store = irbuilder.CreateAlignedStore (llvmf, llvmgv, sizeof (void *));
166
166
store->setAtomic (AtomicOrdering::Release);
167
167
irbuilder.CreateBr (ccall_bb);
168
168
@@ -231,7 +231,7 @@ static GlobalVariable *emit_plt_thunk(
231
231
IRBuilder<> irbuilder (b0);
232
232
Value *ptr = runtime_sym_lookup (irbuilder, funcptype, f_lib, f_name, plt, libptrgv,
233
233
llvmgv, runtime_lib);
234
- auto store = irbuilder.CreateAlignedStore (irbuilder.CreateBitCast (ptr, T_pvoidfunc), got, sizeof (void *));
234
+ StoreInst * store = irbuilder.CreateAlignedStore (irbuilder.CreateBitCast (ptr, T_pvoidfunc), got, sizeof (void *));
235
235
store->setAtomic (AtomicOrdering::Release);
236
236
SmallVector<Value*, 16 > args;
237
237
for (Function::arg_iterator arg = plt->arg_begin (), arg_e = plt->arg_end (); arg != arg_e; ++arg)
@@ -314,7 +314,7 @@ static Value *emit_plt(
314
314
// consume ordering too. This is even less likely to cause issues though
315
315
// since the only thing we do to this loaded pointer is to call it
316
316
// immediately.
317
- // got_val->setAtomic(AtomicOrdering::Consume );
317
+ got_val->setAtomic (AtomicOrdering::Unordered );
318
318
return ctx.builder .CreateBitCast (got_val, funcptype);
319
319
}
320
320
@@ -429,17 +429,19 @@ static Value *llvm_type_rewrite(
429
429
Value *from;
430
430
Value *to;
431
431
const DataLayout &DL = jl_data_layout;
432
+ unsigned align = std::max (DL.getPrefTypeAlignment (target_type), DL.getPrefTypeAlignment (from_type));
432
433
if (DL.getTypeAllocSize (target_type) >= DL.getTypeAllocSize (from_type)) {
433
434
to = emit_static_alloca (ctx, target_type);
435
+ cast<AllocaInst>(to)->setAlignment (Align (align));
434
436
from = emit_bitcast (ctx, to, from_type->getPointerTo ());
435
437
}
436
438
else {
437
439
from = emit_static_alloca (ctx, from_type);
440
+ cast<AllocaInst>(from)->setAlignment (Align (align));
438
441
to = emit_bitcast (ctx, from, target_type->getPointerTo ());
439
442
}
440
- // XXX: deal with possible alignment issues
441
- ctx.builder .CreateStore (v, from);
442
- return ctx.builder .CreateLoad (to);
443
+ ctx.builder .CreateAlignedStore (v, from, align);
444
+ return ctx.builder .CreateAlignedLoad (to, align);
443
445
}
444
446
445
447
// --- argument passing and scratch space utilities ---
@@ -1604,9 +1606,9 @@ static jl_cgval_t emit_ccall(jl_codectx_t &ctx, jl_value_t **args, size_t nargs)
1604
1606
Value *ptls_i16 = emit_bitcast (ctx, ctx.ptlsStates , T_pint16);
1605
1607
const int tid_offset = offsetof (jl_tls_states_t , tid);
1606
1608
Value *ptid = ctx.builder .CreateGEP (ptls_i16, ConstantInt::get (T_size, tid_offset / 2 ));
1607
- return mark_or_box_ccall_result ( ctx,
1608
- tbaa_decorate (tbaa_const, ctx. builder . CreateLoad (ptid)),
1609
- retboxed, rt, unionall, static_rt);
1609
+ LoadInst *tid = ctx. builder . CreateAlignedLoad (ptid, sizeof ( int16_t ));
1610
+ tbaa_decorate (tbaa_const, tid);
1611
+ return mark_or_box_ccall_result (ctx, tid, retboxed, rt, unionall, static_rt);
1610
1612
}
1611
1613
else if (is_libjulia_func (jl_get_current_task)) {
1612
1614
assert (lrt == T_prjlvalue);
@@ -1615,9 +1617,9 @@ static jl_cgval_t emit_ccall(jl_codectx_t &ctx, jl_value_t **args, size_t nargs)
1615
1617
Value *ptls_pv = emit_bitcast (ctx, ctx.ptlsStates , T_pprjlvalue);
1616
1618
const int ct_offset = offsetof (jl_tls_states_t , current_task);
1617
1619
Value *pct = ctx.builder .CreateGEP (ptls_pv, ConstantInt::get (T_size, ct_offset / sizeof (void *)));
1618
- return mark_or_box_ccall_result ( ctx,
1619
- tbaa_decorate (tbaa_const, ctx. builder . CreateLoad (pct)),
1620
- retboxed, rt, unionall, static_rt);
1620
+ LoadInst *ct = ctx. builder . CreateAlignedLoad (pct, sizeof ( void *));
1621
+ tbaa_decorate (tbaa_const, ct);
1622
+ return mark_or_box_ccall_result (ctx, ct, retboxed, rt, unionall, static_rt);
1621
1623
}
1622
1624
else if (is_libjulia_func (jl_set_next_task)) {
1623
1625
assert (lrt == T_void);
@@ -1636,8 +1638,7 @@ static jl_cgval_t emit_ccall(jl_codectx_t &ctx, jl_value_t **args, size_t nargs)
1636
1638
ctx.builder .CreateCall (prepare_call (gcroot_flush_func));
1637
1639
Value *pdefer_sig = emit_defer_signal (ctx);
1638
1640
Value *defer_sig = ctx.builder .CreateLoad (pdefer_sig);
1639
- defer_sig = ctx.builder .CreateAdd (defer_sig,
1640
- ConstantInt::get (T_sigatomic, 1 ));
1641
+ defer_sig = ctx.builder .CreateAdd (defer_sig, ConstantInt::get (T_sigatomic, 1 ));
1641
1642
ctx.builder .CreateStore (defer_sig, pdefer_sig);
1642
1643
emit_signal_fence (ctx);
1643
1644
return ghostValue (jl_nothing_type);
@@ -1699,7 +1700,9 @@ static jl_cgval_t emit_ccall(jl_codectx_t &ctx, jl_value_t **args, size_t nargs)
1699
1700
idx = ctx.builder .CreateAdd (idx, ConstantInt::get (T_size, ((jl_datatype_t *)ety)->layout ->first_ptr ));
1700
1701
}
1701
1702
Value *slot_addr = ctx.builder .CreateInBoundsGEP (T_prjlvalue, arrayptr, idx);
1702
- Value *load = tbaa_decorate (tbaa_ptrarraybuf, ctx.builder .CreateLoad (T_prjlvalue, slot_addr));
1703
+ LoadInst *load = ctx.builder .CreateAlignedLoad (T_prjlvalue, slot_addr, sizeof (void *));
1704
+ load->setAtomic (AtomicOrdering::Unordered);
1705
+ tbaa_decorate (tbaa_ptrarraybuf, load);
1703
1706
Value *res = ctx.builder .CreateZExt (ctx.builder .CreateICmpNE (load, Constant::getNullValue (T_prjlvalue)), T_int32);
1704
1707
JL_GC_POP ();
1705
1708
return mark_or_box_ccall_result (ctx, res, retboxed, rt, unionall, static_rt);
0 commit comments