~pali/+junk/llvm-toolchain-3.7

%tmp2 = shufflevector <8 x i8> %tmp1, <8 x i8> undef, <16 x i32> < i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1 >

203

ret <16 x i8> %tmp2

204

}

205

206

; Loads a <4 x i16> from %A and splats its lane 1 across all 8 lanes of a
; <8 x i16> result. The directives below expect a vdup.16 in the output.
define <8 x i16> @vduplaneQ16(<4 x i16>* %A) nounwind {
;CHECK-LABEL: vduplaneQ16:
;CHECK: vdup.16
  %tmp1 = load <4 x i16>, <4 x i16>* %A
  ; Every mask index is 1, so each result lane is a copy of %tmp1[1].
  %tmp2 = shufflevector <4 x i16> %tmp1, <4 x i16> undef, <8 x i32> < i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1, i32 1 >
  ret <8 x i16> %tmp2
}

213

214

; Loads a <2 x i32> from %A and splats its lane 1 across all 4 lanes of a
; <4 x i32> result. The directives below expect a vdup.32 in the output.
define <4 x i32> @vduplaneQ32(<2 x i32>* %A) nounwind {
;CHECK-LABEL: vduplaneQ32:
;CHECK: vdup.32
  %tmp1 = load <2 x i32>, <2 x i32>* %A
  ; Every mask index is 1, so each result lane is a copy of %tmp1[1].
  %tmp2 = shufflevector <2 x i32> %tmp1, <2 x i32> undef, <4 x i32> < i32 1, i32 1, i32 1, i32 1 >
  ret <4 x i32> %tmp2
}

221

222

; Loads a <2 x float> from %A and splats its lane 1 across all 4 lanes of a
; <4 x float> result. The directives below expect a vdup.32 in the output.
define <4 x float> @vduplaneQfloat(<2 x float>* %A) nounwind {
;CHECK-LABEL: vduplaneQfloat:
;CHECK: vdup.32
  %tmp1 = load <2 x float>, <2 x float>* %A
  ; Every mask index is 1, so each result lane is a copy of %tmp1[1].
  %tmp2 = shufflevector <2 x float> %tmp1, <2 x float> undef, <4 x i32> < i32 1, i32 1, i32 1, i32 1 >
  ret <4 x float> %tmp2
}

229

230

; Splats lane 1 of the <2 x i64> argument into both lanes of the result.
; No FileCheck directives are attached to this function in the visible source,
; so its generated code is not pattern-matched here.
define <2 x i64> @foo(<2 x i64> %arg0_int64x1_t) nounwind readnone {
entry:
  ; Mask <1, 1>: both result lanes take element 1 of the argument.
  %0 = shufflevector <2 x i64> %arg0_int64x1_t, <2 x i64> undef, <2 x i32> <i32 1, i32 1>
  ret <2 x i64> %0
}

235

236

; Splats lane 0 of the <2 x i64> argument into both lanes of the result.
; No FileCheck directives are attached to this function in the visible source,
; so its generated code is not pattern-matched here.
define <2 x i64> @bar(<2 x i64> %arg0_int64x1_t) nounwind readnone {
entry:
  ; Mask <0, 0>: both result lanes take element 0 of the argument.
  %0 = shufflevector <2 x i64> %arg0_int64x1_t, <2 x i64> undef, <2 x i32> <i32 0, i32 0>
  ret <2 x i64> %0
}

241

242

; Splats lane 1 of the <2 x double> argument into both lanes of the result.
; No FileCheck directives are attached to this function in the visible source,
; so its generated code is not pattern-matched here.
define <2 x double> @baz(<2 x double> %arg0_int64x1_t) nounwind readnone {
entry:
  ; Mask <1, 1>: both result lanes take element 1 of the argument.
  %0 = shufflevector <2 x double> %arg0_int64x1_t, <2 x double> undef, <2 x i32> <i32 1, i32 1>
  ret <2 x double> %0
}

247

248

; Splats lane 0 of the <2 x double> argument into both lanes of the result.
; No FileCheck directives are attached to this function in the visible source,
; so its generated code is not pattern-matched here.
define <2 x double> @qux(<2 x double> %arg0_int64x1_t) nounwind readnone {
entry:
  ; Mask <0, 0>: both result lanes take element 0 of the argument.
  %0 = shufflevector <2 x double> %arg0_int64x1_t, <2 x double> undef, <2 x i32> <i32 0, i32 0>
  ret <2 x double> %0
}

253

254

; Radar 7373643
; Stores a <8 x i8> splat of the constant -128 to %ptr. The directives below
; require a vmov.i8, then no vdup.8 before the vstr that follows.
;CHECK-LABEL: redundantVdup:
;CHECK: vmov.i8
;CHECK-NOT: vdup.8
;CHECK: vstr
define void @redundantVdup(<8 x i8>* %ptr) nounwind {
  ; Place the constant in lane 0, then broadcast lane 0 (all-zero mask).
  %1 = insertelement <8 x i8> undef, i8 -128, i32 0
  %2 = shufflevector <8 x i8> %1, <8 x i8> undef, <8 x i32> zeroinitializer
  store <8 x i8> %2, <8 x i8>* %ptr, align 8
  ret void
}

265

266

; Builds a <4 x i32> whose lanes 0-2 hold %x and whose lane 3 holds %y.
; The directives below expect a vdup.32 in the output.
define <4 x i32> @tdupi(i32 %x, i32 %y) {
;CHECK-LABEL: tdupi:
;CHECK: vdup.32
  %1 = insertelement <4 x i32> undef, i32 %x, i32 0
  %2 = insertelement <4 x i32> %1, i32 %x, i32 1
  %3 = insertelement <4 x i32> %2, i32 %x, i32 2
  ; Only the last lane differs from the repeated %x value.
  %4 = insertelement <4 x i32> %3, i32 %y, i32 3
  ret <4 x i32> %4
}

275

276

; Builds a <4 x float> whose lanes 0-2 hold %x and whose lane 3 holds %y.
; The directives below expect a vdup.32 in the output.
define <4 x float> @tdupf(float %x, float %y) {
;CHECK-LABEL: tdupf:
;CHECK: vdup.32
  %1 = insertelement <4 x float> undef, float %x, i32 0
  %2 = insertelement <4 x float> %1, float %x, i32 1
  %3 = insertelement <4 x float> %2, float %x, i32 2
  ; Only the last lane differs from the repeated %x value.
  %4 = insertelement <4 x float> %3, float %y, i32 3
  ret <4 x float> %4
}

285

286

; This test checks that when splatting an element from a vector into another,
; the value isn't moved out to GPRs first.
; Lane 1 of %invec is extracted and written to lanes 0-2 of the result; lane 3
; is the constant 255. The directives forbid a vmov reading d16[1] before the
; expected vdup.32 from d16[1].
define <4 x i32> @tduplane(<4 x i32> %invec) {
;CHECK-LABEL: tduplane:
;CHECK-NOT: vmov {{.*}}, d16[1]
;CHECK: vdup.32 {{.*}}, d16[1]
  %in = extractelement <4 x i32> %invec, i32 1
  %1 = insertelement <4 x i32> undef, i32 %in, i32 0
  %2 = insertelement <4 x i32> %1, i32 %in, i32 1
  %3 = insertelement <4 x i32> %2, i32 %in, i32 2
  %4 = insertelement <4 x i32> %3, i32 255, i32 3
  ret <4 x i32> %4
}

299

300

; Extracts lane 3 of a <4 x float> and writes it to both lanes of a
; <2 x float> result. The directive expects a vdup.32 sourced from lane [1] of
; a d register (lane 3 of the 128-bit input is lane 1 of its upper 64 bits).
define <2 x float> @check_f32(<4 x float> %v) nounwind {
;CHECK-LABEL: check_f32:
;CHECK: vdup.32 {{.*}}, d{{..}}[1]
  %x = extractelement <4 x float> %v, i32 3
  %1 = insertelement <2 x float> undef, float %x, i32 0
  %2 = insertelement <2 x float> %1, float %x, i32 1
  ret <2 x float> %2
}

308

309

; Extracts lane 3 of a <4 x i32> and writes it to both lanes of a <2 x i32>
; result. The directive expects a vdup.32 sourced from lane [1] of a d
; register (lane 3 of the 128-bit input is lane 1 of its upper 64 bits).
define <2 x i32> @check_i32(<4 x i32> %v) nounwind {
;CHECK-LABEL: check_i32:
;CHECK: vdup.32 {{.*}}, d{{..}}[1]
  %x = extractelement <4 x i32> %v, i32 3
  %1 = insertelement <2 x i32> undef, i32 %x, i32 0
  %2 = insertelement <2 x i32> %1, i32 %x, i32 1
  ret <2 x i32> %2
}

317

318

; Extracts lane 3 of a <8 x i16> and writes it to lanes 0 and 1 of a
; <4 x i16> result; lanes 2 and 3 are never written and stay undef.
; The directive expects a vdup.16 sourced from lane [3] of a d register.
define <4 x i16> @check_i16(<8 x i16> %v) nounwind {
;CHECK-LABEL: check_i16:
;CHECK: vdup.16 {{.*}}, d{{..}}[3]
  %x = extractelement <8 x i16> %v, i32 3
  %1 = insertelement <4 x i16> undef, i16 %x, i32 0
  %2 = insertelement <4 x i16> %1, i16 %x, i32 1
  ret <4 x i16> %2
}

326

327

; Extracts lane 3 of a <16 x i8> and writes it to lanes 0 and 1 of a
; <8 x i8> result; lanes 2-7 are never written and stay undef.
; The directive expects a vdup.8 sourced from lane [3] of a d register.
define <8 x i8> @check_i8(<16 x i8> %v) nounwind {
;CHECK-LABEL: check_i8:
;CHECK: vdup.8 {{.*}}, d{{..}}[3]
  %x = extractelement <16 x i8> %v, i32 3
  %1 = insertelement <8 x i8> undef, i8 %x, i32 0
  %2 = insertelement <8 x i8> %1, i8 %x, i32 1
  ret <8 x i8> %2
}

335

336

; Check that an SPR splat produces a vdup.
; Converts the i16 %q to float, broadcasts it to both lanes of a <2 x float>,
; and returns splat - %p. The directive expects a vdup.32 writing a d register.
define <2 x float> @check_spr_splat2(<2 x float> %p, i16 %q) {
;CHECK-LABEL: check_spr_splat2:
;CHECK: vdup.32 d
  %conv = sitofp i16 %q to float
  ; Insert into lane 0, then broadcast lane 0 with an all-zero mask.
  %splat.splatinsert = insertelement <2 x float> undef, float %conv, i32 0
  %splat.splat = shufflevector <2 x float> %splat.splatinsert, <2 x float> undef, <2 x i32> zeroinitializer
  %sub = fsub <2 x float> %splat.splat, %p
  ret <2 x float> %sub
}

347

348

; Converts the i16 %q to float, broadcasts it to all 4 lanes of a <4 x float>,
; and returns splat - %p. The directive below expects a vld1.16 in the output.
define <4 x float> @check_spr_splat4(<4 x float> %p, i16 %q) {
;CHECK-LABEL: check_spr_splat4:
;CHECK: vld1.16
  %conv = sitofp i16 %q to float
  ; Insert into lane 0, then broadcast lane 0 with an all-zero mask.
  %splat.splatinsert = insertelement <4 x float> undef, float %conv, i32 0
  %splat.splat = shufflevector <4 x float> %splat.splatinsert, <4 x float> undef, <4 x i32> zeroinitializer
  %sub = fsub <4 x float> %splat.splat, %p
  ret <4 x float> %sub
}

357

; Same codegen as above test; scalar is splatted using vld1, so shuffle index is irrelevant.
; Converts the i16 %q to float, inserts it at lane 1, broadcasts lane 1 to all
; 4 lanes of a <4 x float>, and returns splat - %p.
define <4 x float> @check_spr_splat4_lane1(<4 x float> %p, i16 %q) {
;CHECK-LABEL: check_spr_splat4_lane1:
;CHECK: vld1.16
  %conv = sitofp i16 %q to float
  ; Insert and broadcast both use lane 1 rather than lane 0.
  %splat.splatinsert = insertelement <4 x float> undef, float %conv, i32 1
  %splat.splat = shufflevector <4 x float> %splat.splatinsert, <4 x float> undef, <4 x i32> <i32 1, i32 1, i32 1, i32 1>
  %sub = fsub <4 x float> %splat.splat, %p
  ret <4 x float> %sub
}

Older »