intel
diff --git a/llvm/test/CodeGen/NVPTX/LoadStoreVectorizer.ll b/llvm/test/CodeGen/NVPTX/LoadStoreVectorizer.ll
Lines changed: 3 additions & 0 deletions
diff --git a/llvm/test/CodeGen/NVPTX/MachineSink-call.ll b/llvm/test/CodeGen/NVPTX/MachineSink-call.ll
Lines changed: 2 additions & 0 deletions
diff --git a/llvm/test/CodeGen/NVPTX/MachineSink-convergent.ll b/llvm/test/CodeGen/NVPTX/MachineSink-convergent.ll
Lines changed: 2 additions & 0 deletions
diff --git a/llvm/test/CodeGen/NVPTX/TailDuplication-convergent.ll b/llvm/test/CodeGen/NVPTX/TailDuplication-convergent.ll
Lines changed: 1 addition & 0 deletions
diff --git a/llvm/test/CodeGen/NVPTX/access-non-generic.ll b/llvm/test/CodeGen/NVPTX/access-non-generic.ll
Lines changed: 2 additions & 0 deletions
diff --git a/llvm/test/CodeGen/NVPTX/add-128bit.ll b/llvm/test/CodeGen/NVPTX/add-128bit.ll
Lines changed: 1 addition & 0 deletions
diff --git a/llvm/test/CodeGen/NVPTX/addrspacecast-gvar.ll b/llvm/test/CodeGen/NVPTX/addrspacecast-gvar.ll
Lines changed: 1 addition & 0 deletions
diff --git a/llvm/test/CodeGen/NVPTX/addrspacecast.ll b/llvm/test/CodeGen/NVPTX/addrspacecast.ll
Lines changed: 3 additions & 0 deletions
diff --git a/llvm/test/CodeGen/NVPTX/aggr-param.ll b/llvm/test/CodeGen/NVPTX/aggr-param.ll
Lines changed: 1 addition & 0 deletions
diff --git a/llvm/test/CodeGen/NVPTX/aggregate-return.ll b/llvm/test/CodeGen/NVPTX/aggregate-return.ll
Lines changed: 1 addition & 0 deletions
@@ -1,5 +1,8 @@
 ; RUN: llc < %s | FileCheck -check-prefix=ENABLED %s
 ; RUN: llc -disable-nvptx-load-store-vectorizer < %s | FileCheck -check-prefix=DISABLED %s
+; RUN: %if ptxas %{ llc < %s | %ptxas-verify %}
+; RUN: %if ptxas %{ llc -disable-nvptx-load-store-vectorizer < %s | %ptxas-verify %}
+
 target triple = "nvptx64-nvidia-cuda"
 
 ; Check that the load-store vectorizer is enabled by default for nvptx, and
 
@@ -1,4 +1,6 @@
 ; RUN: llc < %s | FileCheck %s
+; RUN: %if ptxas %{ llc < %s | %ptxas-verify %}
+
 target triple = "nvptx64-nvidia-cuda"
 
 declare void @foo()
 
@@ -1,4 +1,6 @@
 ; RUN: llc < %s | FileCheck %s
+; RUN: %if ptxas %{ llc < %s | %ptxas-verify %}
+
 target triple = "nvptx64-nvidia-cuda"
 
 declare void @llvm.nvvm.barrier0()
 
@@ -1,4 +1,5 @@
 ; RUN: llc -O2 -tail-dup-size=100 -enable-tail-merge=0 < %s | FileCheck %s
+; RUN: %if ptxas %{ llc -O2 -tail-dup-size=100 -enable-tail-merge=0 < %s | %ptxas-verify %}
 target triple = "nvptx64-nvidia-cuda"
 
 declare void @foo()
 
@@ -2,6 +2,8 @@
 ; RUN: llc < %s -march=nvptx64 -mcpu=sm_20 | FileCheck %s --check-prefix PTX
 ; RUN: opt -mtriple=nvptx-- < %s -S -infer-address-spaces | FileCheck %s --check-prefix IR
 ; RUN: opt -mtriple=nvptx64-- < %s -S -infer-address-spaces | FileCheck %s --check-prefix IR
+; RUN: %if ptxas %{ llc < %s -march=nvptx -mcpu=sm_20 | %ptxas-verify %}
+; RUN: %if ptxas %{ llc < %s -march=nvptx64 -mcpu=sm_20 | %ptxas-verify %}
 
 @array = internal addrspace(3) global [10 x float] zeroinitializer, align 4
 @scalar = internal addrspace(3) global float 0.000000e+00, align 4
 
@@ -1,4 +1,5 @@
 ; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s
+; RUN: %if ptxas %{ llc < %s -march=nvptx -mcpu=sm_20 | %ptxas-verify %}
 
 target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v32:32:32-v64:64:64-v128:128:128-n16:32:64"
 
 
@@ -1,4 +1,5 @@
 ; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s
+; RUN: %if ptxas %{ llc < %s -march=nvptx -mcpu=sm_20 | %ptxas-verify %}
 
 ; CHECK: .visible .global .align 4 .u32 g = 42;
 ; CHECK: .visible .global .align 4 .u32 g2 = generic(g);
 
@@ -1,6 +1,9 @@
 ; RUN: llc -O0 < %s -march=nvptx -mcpu=sm_20 | FileCheck %s -check-prefixes=ALL,CLS32,G32
 ; RUN: llc -O0 < %s -march=nvptx64 -mcpu=sm_20 | FileCheck %s -check-prefixes=ALL,NOPTRCONV,CLS64,G64
 ; RUN: llc -O0 < %s -march=nvptx64 -mcpu=sm_20 --nvptx-short-ptr| FileCheck %s -check-prefixes=ALL,PTRCONV,CLS64,G64
+; RUN: %if ptxas %{ llc -O0 < %s -march=nvptx -mcpu=sm_20 | %ptxas-verify %}
+; RUN: %if ptxas %{ llc -O0 < %s -march=nvptx64 -mcpu=sm_20 | %ptxas-verify %}
+; RUN: %if ptxas %{ llc -O0 < %s -march=nvptx64 -mcpu=sm_20 --nvptx-short-ptr | %ptxas-verify %}
 
 ; ALL-LABEL: conv1
 define i32 @conv1(i32 addrspace(1)* %ptr) {
 
@@ -1,4 +1,5 @@
 ; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s
+; RUN: %if ptxas %{ llc < %s -march=nvptx -mcpu=sm_20 | %ptxas-verify %}
 
 ; Make sure aggregate param types get emitted properly.
 
 
@@ -1,4 +1,5 @@
 ; RUN: llc < %s -march=nvptx64 -mcpu=sm_35 | FileCheck %s
+; RUN: %if ptxas %{ llc < %s -march=nvptx64 -mcpu=sm_35 | %ptxas-verify -arch=sm_35 %}
 
 declare <2 x float> @barv(<2 x float> %input)
 declare <3 x float> @barv3(<3 x float> %input)
Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,5 @@`
`1`	`1`	`; RUN: llc -O2 -tail-dup-size=100 -enable-tail-merge=0 < %s \| FileCheck %s`
	`2`	`+; RUN: %if ptxas %{ llc -O2 -tail-dup-size=100 -enable-tail-merge=0 < %s \| %ptxas-verify %}`
`2`	`3`	`target triple = "nvptx64-nvidia-cuda"`
`3`	`4`
`4`	`5`	`declare void @foo()`
Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,5 @@`
`1`	`1`	`; RUN: llc < %s -march=nvptx -mcpu=sm_20 \| FileCheck %s`
	`2`	`+; RUN: %if ptxas %{ llc < %s -march=nvptx -mcpu=sm_20 \| %ptxas-verify %}`
`2`	`3`
`3`	`4`	`target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v32:32:32-v64:64:64-v128:128:128-n16:32:64"`
`4`	`5`
Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,5 @@`
`1`	`1`	`; RUN: llc < %s -march=nvptx64 -mcpu=sm_35 \| FileCheck %s`
	`2`	`+; RUN: %if ptxas %{ llc < %s -march=nvptx64 -mcpu=sm_35 \| %ptxas-verify -arch=sm_35 %}`
`2`	`3`
`3`	`4`	`declare <2 x float> @barv(<2 x float> %input)`
`4`	`5`	`declare <3 x float> @barv3(<3 x float> %input)`