@@ -89,15 +89,15 @@ static Value *runtime_sym_lookup(
89
89
BasicBlock *dlsym_lookup = BasicBlock::Create (jl_LLVMContext, " dlsym" );
90
90
BasicBlock *ccall_bb = BasicBlock::Create (jl_LLVMContext, " ccall" );
91
91
Constant *initnul = ConstantPointerNull::get ((PointerType*)T_pvoidfunc);
92
- LoadInst *llvmf_orig = irbuilder.CreateAlignedLoad (llvmgv, sizeof (void *));
92
+ LoadInst *llvmf_orig = irbuilder.CreateAlignedLoad (T_pvoidfunc, llvmgv, sizeof (void *));
93
93
// This in principle needs a consume ordering so that load from
94
94
// this pointer sees a valid value. However, this is not supported by
95
95
// LLVM (or agreed on in the C/C++ standard FWIW) and should be
96
96
// almost impossible to happen on every platform we support since this
97
97
// ordering is enforced by the hardware and LLVM has to speculate an
98
98
// invalid load from the `cglobal` but doesn't depend on the `cglobal`
99
99
// value for this to happen.
100
- // llvmf_orig->setAtomic(AtomicOrdering::Consume );
100
+ llvmf_orig->setAtomic (AtomicOrdering::Unordered );
101
101
irbuilder.CreateCondBr (
102
102
irbuilder.CreateICmpNE (llvmf_orig, initnul),
103
103
ccall_bb,
@@ -116,7 +116,7 @@ static Value *runtime_sym_lookup(
116
116
}
117
117
Value *llvmf = irbuilder.CreateCall (prepare_call_in (jl_builderModule (irbuilder), jldlsym_func),
118
118
{ libname, stringConstPtr (emission_context, irbuilder, f_name), libptrgv });
119
- auto store = irbuilder.CreateAlignedStore (llvmf, llvmgv, sizeof (void *));
119
+ StoreInst * store = irbuilder.CreateAlignedStore (llvmf, llvmgv, sizeof (void *));
120
120
store->setAtomic (AtomicOrdering::Release);
121
121
irbuilder.CreateBr (ccall_bb);
122
122
@@ -172,7 +172,7 @@ static GlobalVariable *emit_plt_thunk(
172
172
IRBuilder<> irbuilder (b0);
173
173
Value *ptr = runtime_sym_lookup (emission_context, irbuilder, funcptype, f_lib, f_name, plt, libptrgv,
174
174
llvmgv, runtime_lib);
175
- auto store = irbuilder.CreateAlignedStore (irbuilder.CreateBitCast (ptr, T_pvoidfunc), got, sizeof (void *));
175
+ StoreInst * store = irbuilder.CreateAlignedStore (irbuilder.CreateBitCast (ptr, T_pvoidfunc), got, sizeof (void *));
176
176
store->setAtomic (AtomicOrdering::Release);
177
177
SmallVector<Value*, 16 > args;
178
178
for (Function::arg_iterator arg = plt->arg_begin (), arg_e = plt->arg_end (); arg != arg_e; ++arg)
@@ -237,7 +237,7 @@ static Value *emit_plt(
237
237
// consume ordering too. This is even less likely to cause issues though
238
238
// since the only thing we do to this loaded pointer is to call it
239
239
// immediately.
240
- // got_val->setAtomic(AtomicOrdering::Consume );
240
+ got_val->setAtomic (AtomicOrdering::Unordered );
241
241
return ctx.builder .CreateBitCast (got_val, funcptype);
242
242
}
243
243
@@ -352,17 +352,19 @@ static Value *llvm_type_rewrite(
352
352
Value *from;
353
353
Value *to;
354
354
const DataLayout &DL = jl_data_layout;
355
+ unsigned align = std::max (DL.getPrefTypeAlignment (target_type), DL.getPrefTypeAlignment (from_type));
355
356
if (DL.getTypeAllocSize (target_type) >= DL.getTypeAllocSize (from_type)) {
356
357
to = emit_static_alloca (ctx, target_type);
358
+ cast<AllocaInst>(to)->setAlignment (Align (align));
357
359
from = emit_bitcast (ctx, to, from_type->getPointerTo ());
358
360
}
359
361
else {
360
362
from = emit_static_alloca (ctx, from_type);
363
+ cast<AllocaInst>(from)->setAlignment (Align (align));
361
364
to = emit_bitcast (ctx, from, target_type->getPointerTo ());
362
365
}
363
- // XXX: deal with possible alignment issues
364
- ctx.builder .CreateStore (v, from);
365
- return ctx.builder .CreateLoad (to);
366
+ ctx.builder .CreateAlignedStore (v, from, align);
367
+ return ctx.builder .CreateAlignedLoad (to, align);
366
368
}
367
369
368
370
// --- argument passing and scratch space utilities ---
@@ -1580,9 +1582,9 @@ static jl_cgval_t emit_ccall(jl_codectx_t &ctx, jl_value_t **args, size_t nargs)
1580
1582
Value *ptls_i16 = emit_bitcast (ctx, ctx.ptlsStates , T_pint16);
1581
1583
const int tid_offset = offsetof (jl_tls_states_t , tid);
1582
1584
Value *ptid = ctx.builder .CreateGEP (ptls_i16, ConstantInt::get (T_size, tid_offset / 2 ));
1583
- return mark_or_box_ccall_result ( ctx,
1584
- tbaa_decorate (tbaa_const, ctx. builder . CreateLoad (ptid)),
1585
- retboxed, rt, unionall, static_rt);
1585
+ LoadInst *tid = ctx. builder . CreateAlignedLoad (ptid, sizeof ( int16_t ));
1586
+ tbaa_decorate (tbaa_const, tid);
1587
+ return mark_or_box_ccall_result (ctx, tid, retboxed, rt, unionall, static_rt);
1586
1588
}
1587
1589
else if (is_libjulia_func (jl_get_current_task)) {
1588
1590
assert (lrt == T_prjlvalue);
@@ -1591,9 +1593,9 @@ static jl_cgval_t emit_ccall(jl_codectx_t &ctx, jl_value_t **args, size_t nargs)
1591
1593
Value *ptls_pv = emit_bitcast (ctx, ctx.ptlsStates , T_pprjlvalue);
1592
1594
const int ct_offset = offsetof (jl_tls_states_t , current_task);
1593
1595
Value *pct = ctx.builder .CreateGEP (ptls_pv, ConstantInt::get (T_size, ct_offset / sizeof (void *)));
1594
- return mark_or_box_ccall_result ( ctx,
1595
- tbaa_decorate (tbaa_const, ctx. builder . CreateLoad (pct)),
1596
- retboxed, rt, unionall, static_rt);
1596
+ LoadInst *ct = ctx. builder . CreateAlignedLoad (pct, sizeof ( void *));
1597
+ tbaa_decorate (tbaa_const, ct);
1598
+ return mark_or_box_ccall_result (ctx, ct, retboxed, rt, unionall, static_rt);
1597
1599
}
1598
1600
else if (is_libjulia_func (jl_set_next_task)) {
1599
1601
assert (lrt == T_void);
@@ -1612,8 +1614,7 @@ static jl_cgval_t emit_ccall(jl_codectx_t &ctx, jl_value_t **args, size_t nargs)
1612
1614
ctx.builder .CreateCall (prepare_call (gcroot_flush_func));
1613
1615
Value *pdefer_sig = emit_defer_signal (ctx);
1614
1616
Value *defer_sig = ctx.builder .CreateLoad (pdefer_sig);
1615
- defer_sig = ctx.builder .CreateAdd (defer_sig,
1616
- ConstantInt::get (T_sigatomic, 1 ));
1617
+ defer_sig = ctx.builder .CreateAdd (defer_sig, ConstantInt::get (T_sigatomic, 1 ));
1617
1618
ctx.builder .CreateStore (defer_sig, pdefer_sig);
1618
1619
emit_signal_fence (ctx);
1619
1620
return ghostValue (jl_nothing_type);
@@ -1675,7 +1676,9 @@ static jl_cgval_t emit_ccall(jl_codectx_t &ctx, jl_value_t **args, size_t nargs)
1675
1676
idx = ctx.builder .CreateAdd (idx, ConstantInt::get (T_size, ((jl_datatype_t *)ety)->layout ->first_ptr ));
1676
1677
}
1677
1678
Value *slot_addr = ctx.builder .CreateInBoundsGEP (T_prjlvalue, arrayptr, idx);
1678
- Value *load = tbaa_decorate (tbaa_ptrarraybuf, ctx.builder .CreateLoad (T_prjlvalue, slot_addr));
1679
+ LoadInst *load = ctx.builder .CreateAlignedLoad (T_prjlvalue, slot_addr, sizeof (void *));
1680
+ load->setAtomic (AtomicOrdering::Unordered);
1681
+ tbaa_decorate (tbaa_ptrarraybuf, load);
1679
1682
Value *res = ctx.builder .CreateZExt (ctx.builder .CreateICmpNE (load, Constant::getNullValue (T_prjlvalue)), T_int32);
1680
1683
JL_GC_POP ();
1681
1684
return mark_or_box_ccall_result (ctx, res, retboxed, rt, unionall, static_rt);
0 commit comments