cbe34bb5ed
From-SVN: r243994
359 lines
9.1 KiB
C
359 lines
9.1 KiB
C
/* OpenACC constructs

   Copyright (C) 2014-2017 Free Software Foundation, Inc.

   Contributed by Mentor Embedded.

   This file is part of the GNU Offloading and Multi Processing Library
   (libgomp).

   Libgomp is free software; you can redistribute it and/or modify it
   under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.

   Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
   WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
   FOR A PARTICULAR PURPOSE. See the GNU General Public License for
   more details.

   Under Section 7 of GPL version 3, you are granted additional
   permissions described in the GCC Runtime Library Exception, version
   3.1, as published by the Free Software Foundation.

   You should have received a copy of the GNU General Public License and
   a copy of the GCC Runtime Library Exception along with this program;
   see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
   <http://www.gnu.org/licenses/>. */
|
|
|
|
#include "libgomp_g.h"
|
|
|
|
/* PTX definitions of the GOACC thread-geometry helpers, emitted verbatim
   through a single top-level asm statement.  The statement is one long
   sequence of adjacent string literals; the C comments placed between
   the literals are not part of the emitted PTX.

   Functions defined below:

     GOACC_tid (dim)           read %tid.x / %tid.y / %tid.z
     GOACC_ntid (dim)          read %ntid.x / %ntid.y / %ntid.z
     GOACC_ctaid (dim)         read %ctaid.x / %ctaid.y / %ctaid.z
     GOACC_nctaid (dim)        read %nctaid.x / %nctaid.y / %nctaid.z
     GOACC_get_num_threads ()  GOACC_ntid (0) * GOACC_nctaid (0)
     GOACC_get_thread_num ()   GOACC_ntid (0) * GOACC_ctaid (0)
                               + GOACC_tid (0)

   For the four one-argument functions, dim 0, 1 and 2 select the .x, .y
   and .z component respectively; any other value branches to a
   `call abort'.  All arguments and results are .u32.

   Every function declares a .u64 register %hr10 that none of the
   instructions shown here reference.  */

/* Forward declarations for everything defined below, plus the external
   `abort' used on the bad-dimension paths.  */
__asm__ (".visible .func (.param .u32 %out_retval) GOACC_tid (.param .u32 %in_ar1);\n"
         ".visible .func (.param .u32 %out_retval) GOACC_ntid (.param .u32 %in_ar1);\n"
         ".visible .func (.param .u32 %out_retval) GOACC_ctaid (.param .u32 %in_ar1);\n"
         ".visible .func (.param .u32 %out_retval) GOACC_nctaid (.param .u32 %in_ar1);\n"
         "// BEGIN GLOBAL FUNCTION DECL: GOACC_get_num_threads\n"
         ".visible .func (.param .u32 %out_retval) GOACC_get_num_threads;\n"
         "// BEGIN GLOBAL FUNCTION DECL: GOACC_get_thread_num\n"
         ".visible .func (.param .u32 %out_retval) GOACC_get_thread_num;\n"
         "// BEGIN GLOBAL FUNCTION DECL: abort\n"
         ".extern .func abort;\n"

         /* GOACC_tid (dim): return the %tid component selected by dim.  */
         ".visible .func (.param .u32 %out_retval) GOACC_tid (.param .u32 %in_ar1)\n"
         "{\n"
         ".reg .u32 %ar1;\n"
         ".reg .u32 %retval;\n"
         ".reg .u64 %hr10;\n"
         ".reg .u32 %r22;\n"
         ".reg .u32 %r23;\n"
         ".reg .u32 %r24;\n"
         ".reg .u32 %r25;\n"
         ".reg .u32 %r26;\n"
         ".reg .u32 %r27;\n"
         ".reg .u32 %r28;\n"
         ".reg .u32 %r29;\n"
         ".reg .pred %r30;\n"
         ".reg .u32 %r31;\n"
         ".reg .pred %r32;\n"
         ".reg .u32 %r33;\n"
         ".reg .pred %r34;\n"
         ".local .align 8 .b8 %frame[4];\n"
         /* The argument is spilled to the 4-byte local frame and read
            straight back; %r28 holds dim for the comparisons below.  */
         "ld.param.u32 %ar1,[%in_ar1];\n"
         "mov.u32 %r27,%ar1;\n"
         "st.local.u32 [%frame],%r27;\n"
         "ld.local.u32 %r28,[%frame];\n"
         /* dim == 1 -> $L4 (.y).  */
         "mov.u32 %r29,1;\n"
         "setp.eq.u32 %r30,%r28,%r29;\n"
         "@%r30 bra $L4;\n"
         /* dim == 2 -> $L5 (.z).  */
         "mov.u32 %r31,2;\n"
         "setp.eq.u32 %r32,%r28,%r31;\n"
         "@%r32 bra $L5;\n"
         /* dim != 0 -> $L8 (abort); dim == 0 falls through to .x.  */
         "mov.u32 %r33,0;\n"
         "setp.eq.u32 %r34,%r28,%r33;\n"
         "@!%r34 bra $L8;\n"
         "mov.u32 %r23,%tid.x;\n"
         "mov.u32 %r22,%r23;\n"
         "bra $L7;\n"
         "$L4:\n"
         "mov.u32 %r24,%tid.y;\n"
         "mov.u32 %r22,%r24;\n"
         "bra $L7;\n"
         "$L5:\n"
         "mov.u32 %r25,%tid.z;\n"
         "mov.u32 %r22,%r25;\n"
         "bra $L7;\n"
         /* Bad dimension.  Nothing follows the call, so $L7 is the textual
            successor and %r22 has not been written on this path.
            NOTE(review): presumably abort does not return -- confirm.  */
         "$L8:\n"
         "{\n"
         "{\n"
         "call abort;\n"
         "}\n"
         "}\n"
         /* Common exit: the selected value in %r22 becomes the result.  */
         "$L7:\n"
         "mov.u32 %r26,%r22;\n"
         "mov.u32 %retval,%r26;\n"
         "st.param.u32 [%out_retval],%retval;\n"
         "ret;\n"
         "}\n"

         /* GOACC_ntid (dim): return the %ntid component selected by dim.
            Same instruction sequence as GOACC_tid, with labels
            $L11 (.y), $L12 (.z), $L15 (abort) and $L14 (exit).  */
         ".visible .func (.param .u32 %out_retval) GOACC_ntid (.param .u32 %in_ar1)\n"
         "{\n"
         ".reg .u32 %ar1;\n"
         ".reg .u32 %retval;\n"
         ".reg .u64 %hr10;\n"
         ".reg .u32 %r22;\n"
         ".reg .u32 %r23;\n"
         ".reg .u32 %r24;\n"
         ".reg .u32 %r25;\n"
         ".reg .u32 %r26;\n"
         ".reg .u32 %r27;\n"
         ".reg .u32 %r28;\n"
         ".reg .u32 %r29;\n"
         ".reg .pred %r30;\n"
         ".reg .u32 %r31;\n"
         ".reg .pred %r32;\n"
         ".reg .u32 %r33;\n"
         ".reg .pred %r34;\n"
         ".local .align 8 .b8 %frame[4];\n"
         /* Spill and reload the argument; %r28 = dim.  */
         "ld.param.u32 %ar1,[%in_ar1];\n"
         "mov.u32 %r27,%ar1;\n"
         "st.local.u32 [%frame],%r27;\n"
         "ld.local.u32 %r28,[%frame];\n"
         "mov.u32 %r29,1;\n"
         "setp.eq.u32 %r30,%r28,%r29;\n"
         "@%r30 bra $L11;\n"
         "mov.u32 %r31,2;\n"
         "setp.eq.u32 %r32,%r28,%r31;\n"
         "@%r32 bra $L12;\n"
         "mov.u32 %r33,0;\n"
         "setp.eq.u32 %r34,%r28,%r33;\n"
         "@!%r34 bra $L15;\n"
         "mov.u32 %r23,%ntid.x;\n"
         "mov.u32 %r22,%r23;\n"
         "bra $L14;\n"
         "$L11:\n"
         "mov.u32 %r24,%ntid.y;\n"
         "mov.u32 %r22,%r24;\n"
         "bra $L14;\n"
         "$L12:\n"
         "mov.u32 %r25,%ntid.z;\n"
         "mov.u32 %r22,%r25;\n"
         "bra $L14;\n"
         /* Bad dimension; see the note on the abort path in GOACC_tid.  */
         "$L15:\n"
         "{\n"
         "{\n"
         "call abort;\n"
         "}\n"
         "}\n"
         "$L14:\n"
         "mov.u32 %r26,%r22;\n"
         "mov.u32 %retval,%r26;\n"
         "st.param.u32 [%out_retval],%retval;\n"
         "ret;\n"
         "}\n"

         /* GOACC_ctaid (dim): return the %ctaid component selected by dim.
            Labels: $L18 (.y), $L19 (.z), $L22 (abort), $L21 (exit).  */
         ".visible .func (.param .u32 %out_retval) GOACC_ctaid (.param .u32 %in_ar1)\n"
         "{\n"
         ".reg .u32 %ar1;\n"
         ".reg .u32 %retval;\n"
         ".reg .u64 %hr10;\n"
         ".reg .u32 %r22;\n"
         ".reg .u32 %r23;\n"
         ".reg .u32 %r24;\n"
         ".reg .u32 %r25;\n"
         ".reg .u32 %r26;\n"
         ".reg .u32 %r27;\n"
         ".reg .u32 %r28;\n"
         ".reg .u32 %r29;\n"
         ".reg .pred %r30;\n"
         ".reg .u32 %r31;\n"
         ".reg .pred %r32;\n"
         ".reg .u32 %r33;\n"
         ".reg .pred %r34;\n"
         ".local .align 8 .b8 %frame[4];\n"
         /* Spill and reload the argument; %r28 = dim.  */
         "ld.param.u32 %ar1,[%in_ar1];\n"
         "mov.u32 %r27,%ar1;\n"
         "st.local.u32 [%frame],%r27;\n"
         "ld.local.u32 %r28,[%frame];\n"
         "mov.u32 %r29,1;\n"
         "setp.eq.u32 %r30,%r28,%r29;\n"
         "@%r30 bra $L18;\n"
         "mov.u32 %r31,2;\n"
         "setp.eq.u32 %r32,%r28,%r31;\n"
         "@%r32 bra $L19;\n"
         "mov.u32 %r33,0;\n"
         "setp.eq.u32 %r34,%r28,%r33;\n"
         "@!%r34 bra $L22;\n"
         "mov.u32 %r23,%ctaid.x;\n"
         "mov.u32 %r22,%r23;\n"
         "bra $L21;\n"
         "$L18:\n"
         "mov.u32 %r24,%ctaid.y;\n"
         "mov.u32 %r22,%r24;\n"
         "bra $L21;\n"
         "$L19:\n"
         "mov.u32 %r25,%ctaid.z;\n"
         "mov.u32 %r22,%r25;\n"
         "bra $L21;\n"
         /* Bad dimension; see the note on the abort path in GOACC_tid.  */
         "$L22:\n"
         "{\n"
         "{\n"
         "call abort;\n"
         "}\n"
         "}\n"
         "$L21:\n"
         "mov.u32 %r26,%r22;\n"
         "mov.u32 %retval,%r26;\n"
         "st.param.u32 [%out_retval],%retval;\n"
         "ret;\n"
         "}\n"

         /* GOACC_nctaid (dim): return the %nctaid component selected by
            dim.  Labels: $L25 (.y), $L26 (.z), $L29 (abort), $L28 (exit).  */
         ".visible .func (.param .u32 %out_retval) GOACC_nctaid (.param .u32 %in_ar1)\n"
         "{\n"
         ".reg .u32 %ar1;\n"
         ".reg .u32 %retval;\n"
         ".reg .u64 %hr10;\n"
         ".reg .u32 %r22;\n"
         ".reg .u32 %r23;\n"
         ".reg .u32 %r24;\n"
         ".reg .u32 %r25;\n"
         ".reg .u32 %r26;\n"
         ".reg .u32 %r27;\n"
         ".reg .u32 %r28;\n"
         ".reg .u32 %r29;\n"
         ".reg .pred %r30;\n"
         ".reg .u32 %r31;\n"
         ".reg .pred %r32;\n"
         ".reg .u32 %r33;\n"
         ".reg .pred %r34;\n"
         ".local .align 8 .b8 %frame[4];\n"
         /* Spill and reload the argument; %r28 = dim.  */
         "ld.param.u32 %ar1,[%in_ar1];\n"
         "mov.u32 %r27,%ar1;\n"
         "st.local.u32 [%frame],%r27;\n"
         "ld.local.u32 %r28,[%frame];\n"
         "mov.u32 %r29,1;\n"
         "setp.eq.u32 %r30,%r28,%r29;\n"
         "@%r30 bra $L25;\n"
         "mov.u32 %r31,2;\n"
         "setp.eq.u32 %r32,%r28,%r31;\n"
         "@%r32 bra $L26;\n"
         "mov.u32 %r33,0;\n"
         "setp.eq.u32 %r34,%r28,%r33;\n"
         "@!%r34 bra $L29;\n"
         "mov.u32 %r23,%nctaid.x;\n"
         "mov.u32 %r22,%r23;\n"
         "bra $L28;\n"
         "$L25:\n"
         "mov.u32 %r24,%nctaid.y;\n"
         "mov.u32 %r22,%r24;\n"
         "bra $L28;\n"
         "$L26:\n"
         "mov.u32 %r25,%nctaid.z;\n"
         "mov.u32 %r22,%r25;\n"
         "bra $L28;\n"
         /* Bad dimension; see the note on the abort path in GOACC_tid.  */
         "$L29:\n"
         "{\n"
         "{\n"
         "call abort;\n"
         "}\n"
         "}\n"
         "$L28:\n"
         "mov.u32 %r26,%r22;\n"
         "mov.u32 %retval,%r26;\n"
         "st.param.u32 [%out_retval],%retval;\n"
         "ret;\n"
         "}\n"

         /* GOACC_get_num_threads (): GOACC_ntid (0) * GOACC_nctaid (0),
            keeping the low 32 bits of the product (mul.lo.u32).  */
         "// BEGIN GLOBAL FUNCTION DEF: GOACC_get_num_threads\n"
         ".visible .func (.param .u32 %out_retval) GOACC_get_num_threads\n"
         "{\n"
         ".reg .u32 %retval;\n"
         ".reg .u64 %hr10;\n"
         ".reg .u32 %r22;\n"
         ".reg .u32 %r23;\n"
         ".reg .u32 %r24;\n"
         ".reg .u32 %r25;\n"
         ".reg .u32 %r26;\n"
         ".reg .u32 %r27;\n"
         ".reg .u32 %r28;\n"
         ".reg .u32 %r29;\n"
         /* %r22 = GOACC_ntid (0).  The nested brace scopes hold the
            .param slots for the return value and the outgoing argument.  */
         "mov.u32 %r26,0;\n"
         "{\n"
         ".param .u32 %retval_in;\n"
         "{\n"
         ".param .u32 %out_arg0;\n"
         "st.param.u32 [%out_arg0],%r26;\n"
         "call (%retval_in),GOACC_ntid,(%out_arg0);\n"
         "}\n"
         "ld.param.u32 %r27,[%retval_in];\n"
         "}\n"
         "mov.u32 %r22,%r27;\n"
         /* %r23 = GOACC_nctaid (0).  */
         "mov.u32 %r28,0;\n"
         "{\n"
         ".param .u32 %retval_in;\n"
         "{\n"
         ".param .u32 %out_arg0;\n"
         "st.param.u32 [%out_arg0],%r28;\n"
         "call (%retval_in),GOACC_nctaid,(%out_arg0);\n"
         "}\n"
         "ld.param.u32 %r29,[%retval_in];\n"
         "}\n"
         "mov.u32 %r23,%r29;\n"
         /* Result = %r22 * %r23.  */
         "mul.lo.u32 %r24,%r22,%r23;\n"
         "mov.u32 %r25,%r24;\n"
         "mov.u32 %retval,%r25;\n"
         "st.param.u32 [%out_retval],%retval;\n"
         "ret;\n"
         "}\n"

         /* GOACC_get_thread_num ():
            GOACC_ntid (0) * GOACC_ctaid (0) + GOACC_tid (0), computed
            with 32-bit mul.lo.u32 / add.u32.  */
         "// BEGIN GLOBAL FUNCTION DEF: GOACC_get_thread_num\n"
         ".visible .func (.param .u32 %out_retval) GOACC_get_thread_num\n"
         "{\n"
         ".reg .u32 %retval;\n"
         ".reg .u64 %hr10;\n"
         ".reg .u32 %r22;\n"
         ".reg .u32 %r23;\n"
         ".reg .u32 %r24;\n"
         ".reg .u32 %r25;\n"
         ".reg .u32 %r26;\n"
         ".reg .u32 %r27;\n"
         ".reg .u32 %r28;\n"
         ".reg .u32 %r29;\n"
         ".reg .u32 %r30;\n"
         ".reg .u32 %r31;\n"
         ".reg .u32 %r32;\n"
         ".reg .u32 %r33;\n"
         /* %r22 = GOACC_ntid (0).  */
         "mov.u32 %r28,0;\n"
         "{\n"
         ".param .u32 %retval_in;\n"
         "{\n"
         ".param .u32 %out_arg0;\n"
         "st.param.u32 [%out_arg0],%r28;\n"
         "call (%retval_in),GOACC_ntid,(%out_arg0);\n"
         "}\n"
         "ld.param.u32 %r29,[%retval_in];\n"
         "}\n"
         "mov.u32 %r22,%r29;\n"
         /* %r23 = GOACC_ctaid (0).  */
         "mov.u32 %r30,0;\n"
         "{\n"
         ".param .u32 %retval_in;\n"
         "{\n"
         ".param .u32 %out_arg0;\n"
         "st.param.u32 [%out_arg0],%r30;\n"
         "call (%retval_in),GOACC_ctaid,(%out_arg0);\n"
         "}\n"
         "ld.param.u32 %r31,[%retval_in];\n"
         "}\n"
         "mov.u32 %r23,%r31;\n"
         /* %r24 = %r22 * %r23.  */
         "mul.lo.u32 %r24,%r22,%r23;\n"
         /* %r25 = GOACC_tid (0).  */
         "mov.u32 %r32,0;\n"
         "{\n"
         ".param .u32 %retval_in;\n"
         "{\n"
         ".param .u32 %out_arg0;\n"
         "st.param.u32 [%out_arg0],%r32;\n"
         "call (%retval_in),GOACC_tid,(%out_arg0);\n"
         "}\n"
         "ld.param.u32 %r33,[%retval_in];\n"
         "}\n"
         "mov.u32 %r25,%r33;\n"
         /* Result = %r24 + %r25.  */
         "add.u32 %r26,%r24,%r25;\n"
         "mov.u32 %r27,%r26;\n"
         "mov.u32 %retval,%r27;\n"
         "st.param.u32 [%out_retval],%retval;\n"
         "ret;\n"
         "}\n");
|