| ; RUN: llc < %s | FileCheck %s |
| target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128" |
| target triple = "x86_64-unknown-linux-gnu" |
| |
| ; Load the two i256 operands behind %a and %b, multiply them, and store the |
| ; i256 product (the multiply carries no nuw/nsw flags, so it wraps) to %out. |
| ; i256 is wider than a 64-bit x86-64 general-purpose register, so the |
| ; multiply has to be expanded into several 64-bit multiply instructions. |
| define void @test(i256* %a, i256* %b, i256* %out) #0 { |
| entry: |
|   %lhs = load i256, i256* %a |
|   %rhs = load i256, i256* %b |
|   %product = mul i256 %lhs, %rhs |
|   store i256 %product, i256* %out |
|   ret void |
| } |
| |
| ; CHECK-LABEL: @test |
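| ; There is a lot of inter-register motion, so matching the exact instruction |
| ; sequence would be fragile. Instead, only the multiplies are matched: the |
| ; directives below expect 10 of them (4 imulq and 6 mulq), in this order, |
| ; with no further multiplies before the return. |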
| ; CHECK: imulq |
| ; CHECK: mulq |
| ; CHECK: imulq |
| ; CHECK: imulq |
| ; CHECK: mulq |
| ; CHECK: imulq |
| ; CHECK: mulq |
| ; CHECK: mulq |
| ; CHECK: mulq |
| ; CHECK: mulq |
| ; CHECK-NOT: imulq |
| ; CHECK-NOT: mulq |
| ; CHECK: retq |
| |
| attributes #0 = { norecurse nounwind uwtable "target-cpu"="x86-64" "target-features"="+fxsr,+mmx,+sse,+sse2,+x87" } |
| |