mirror of
https://github.com/autc04/Retro68.git
synced 2025-01-18 20:31:19 +00:00
37 lines
1.0 KiB
C
37 lines
1.0 KiB
C
/* { dg-additional-options "-save-temps" } */
|
|
/* { dg-do run { target openacc_nvidia_accel_selected } }
|
|
{ dg-skip-if "" { *-*-* } { "*" } { "-O2" } } */
|
|
|
|
int
|
|
main (void)
|
|
{
|
|
int v1;
|
|
|
|
#pragma acc parallel
|
|
#pragma acc loop worker
|
|
for (v1 = 0; v1 < 20; v1 += 2)
|
|
;
|
|
|
|
return 0;
|
|
}
|
|
|
|
/* Todo: Boths bar.syncs can be removed.
|
|
Atm we generate this dead code inbetween forked and joining:
|
|
|
|
mov.u32 %r28, %ntid.y;
|
|
mov.u32 %r29, %tid.y;
|
|
add.u32 %r30, %r29, %r29;
|
|
setp.gt.s32 %r31, %r30, 19;
|
|
@%r31 bra $L2;
|
|
add.u32 %r25, %r28, %r28;
|
|
mov.u32 %r24, %r30;
|
|
$L3:
|
|
add.u32 %r24, %r24, %r25;
|
|
setp.le.s32 %r33, %r24, 19;
|
|
@%r33 bra $L3;
|
|
$L2:
|
|
|
|
so the loop is not recognized as empty loop (which we detect by seeing if
|
|
joining immediately follows forked). */
|
|
/* { dg-final { scan-assembler-times "bar.sync" 2 } } */
|