mirror of git://gcc.gnu.org/git/gcc.git
nvptx offloading linking
gcc/
* config/nvptx/mkoffload.c (Kind, Vis): Remove enums.
(Token, Stmt): Remove structs.
(decls, vars, fns): Remove variables.
(alloc_comment, append_stmt, is_keyword): Remove macros.
(tokenize, write_token, write_tokens, alloc_stmt, rev_stmts)
(write_stmt, write_stmts, parse_insn, parse_list_nosemi)
(parse_init, parse_file): Remove functions.
(read_file): Accept a pointer to a length and store into it.
(process): Don't try to parse the input file, just write it out as
a string, but looking for maps. Also write out the length.
(main): Don't use "-S" to compile PTX code.

libgomp/
* oacc-ptx.h: Remove file, moving its content into...
* config/nvptx/fortran.c: ... here...
* config/nvptx/oacc-init.c: ..., here...
* config/nvptx/oacc-parallel.c: ..., and here.
* config/nvptx/openacc.f90: New file.
* plugin/plugin-nvptx.c: Don't include "oacc-ptx.h".
(link_ptx): Don't link in predefined bits of PTX code.

Co-Authored-By: Bernd Schmidt <bernds@codesourcery.com>
From-SVN: r228418
This commit is contained in:
parent
7fcdbdd21d
commit
113020dc59
|
|
@ -1,3 +1,18 @@
|
||||||
|
2015-10-02 Thomas Schwinge <thomas@codesourcery.com>
|
||||||
|
Bernd Schmidt <bernds@codesourcery.com>
|
||||||
|
|
||||||
|
* config/nvptx/mkoffload.c (Kind, Vis): Remove enums.
|
||||||
|
(Token, Stmt): Remove structs.
|
||||||
|
(decls, vars, fns): Remove variables.
|
||||||
|
(alloc_comment, append_stmt, is_keyword): Remove macros.
|
||||||
|
(tokenize, write_token, write_tokens, alloc_stmt, rev_stmts)
|
||||||
|
(write_stmt, write_stmts, parse_insn, parse_list_nosemi)
|
||||||
|
(parse_init, parse_file): Remove functions.
|
||||||
|
(read_file): Accept a pointer to a length and store into it.
|
||||||
|
(process): Don't try to parse the input file, just write it out as
|
||||||
|
a string, but looking for maps. Also write out the length.
|
||||||
|
(main): Don't use "-S" to compile PTX code.
|
||||||
|
|
||||||
2015-10-02 Jeff Law <law@redhat.com>
|
2015-10-02 Jeff Law <law@redhat.com>
|
||||||
|
|
||||||
* tree-ssa-dom.c (optimize_stmt): Note when loop structures need
|
* tree-ssa-dom.c (optimize_stmt): Note when loop structures need
|
||||||
|
|
|
||||||
|
|
@ -41,84 +41,12 @@ const char tool_name[] = "nvptx mkoffload";
|
||||||
|
|
||||||
#define COMMENT_PREFIX "#"
|
#define COMMENT_PREFIX "#"
|
||||||
|
|
||||||
typedef enum Kind
|
|
||||||
{
|
|
||||||
/* 0-ff used for single char tokens */
|
|
||||||
K_symbol = 0x100, /* a symbol */
|
|
||||||
K_label, /* a label defn (i.e. symbol:) */
|
|
||||||
K_ident, /* other ident */
|
|
||||||
K_dotted, /* dotted identifier */
|
|
||||||
K_number,
|
|
||||||
K_string,
|
|
||||||
K_comment
|
|
||||||
} Kind;
|
|
||||||
|
|
||||||
typedef struct Token
|
|
||||||
{
|
|
||||||
unsigned short kind : 12;
|
|
||||||
unsigned short space : 1; /* preceded by space */
|
|
||||||
unsigned short end : 1; /* succeeded by end of line */
|
|
||||||
/* Length of token */
|
|
||||||
unsigned short len;
|
|
||||||
|
|
||||||
/* Token itself */
|
|
||||||
char const *ptr;
|
|
||||||
} Token;
|
|
||||||
|
|
||||||
/* statement info */
|
|
||||||
typedef enum Vis
|
|
||||||
{
|
|
||||||
V_dot = 0, /* random pseudo */
|
|
||||||
V_var = 1, /* var decl/defn */
|
|
||||||
V_func = 2, /* func decl/defn */
|
|
||||||
V_insn = 3, /* random insn */
|
|
||||||
V_label = 4, /* label defn */
|
|
||||||
V_comment = 5,
|
|
||||||
V_pred = 6, /* predicate */
|
|
||||||
V_mask = 0x7,
|
|
||||||
V_global = 0x08, /* globalize */
|
|
||||||
V_weak = 0x10, /* weakly globalize */
|
|
||||||
V_no_eol = 0x20, /* no end of line */
|
|
||||||
V_prefix_comment = 0x40 /* prefixed comment */
|
|
||||||
} Vis;
|
|
||||||
|
|
||||||
typedef struct Stmt
|
|
||||||
{
|
|
||||||
struct Stmt *next;
|
|
||||||
Token *tokens;
|
|
||||||
unsigned char vis;
|
|
||||||
unsigned len : 12;
|
|
||||||
unsigned sym : 12;
|
|
||||||
} Stmt;
|
|
||||||
|
|
||||||
struct id_map
|
struct id_map
|
||||||
{
|
{
|
||||||
id_map *next;
|
id_map *next;
|
||||||
char *ptx_name;
|
char *ptx_name;
|
||||||
};
|
};
|
||||||
|
|
||||||
static const char *read_file (FILE *);
|
|
||||||
static Token *tokenize (const char *);
|
|
||||||
|
|
||||||
static void write_token (FILE *, const Token *);
|
|
||||||
static void write_tokens (FILE *, const Token *, unsigned, int);
|
|
||||||
|
|
||||||
static Stmt *alloc_stmt (unsigned, Token *, Token *, const Token *);
|
|
||||||
#define alloc_comment(S,E) alloc_stmt (V_comment, S, E, 0)
|
|
||||||
#define append_stmt(V, S) ((S)->next = *(V), *(V) = (S))
|
|
||||||
static Stmt *rev_stmts (Stmt *);
|
|
||||||
static void write_stmt (FILE *, const Stmt *);
|
|
||||||
static void write_stmts (FILE *, const Stmt *);
|
|
||||||
|
|
||||||
static Token *parse_insn (Token *);
|
|
||||||
static Token *parse_list_nosemi (Token *);
|
|
||||||
static Token *parse_init (Token *);
|
|
||||||
static Token *parse_file (Token *);
|
|
||||||
|
|
||||||
static Stmt *decls;
|
|
||||||
static Stmt *vars;
|
|
||||||
static Stmt *fns;
|
|
||||||
|
|
||||||
static id_map *func_ids, **funcs_tail = &func_ids;
|
static id_map *func_ids, **funcs_tail = &func_ids;
|
||||||
static id_map *var_ids, **vars_tail = &var_ids;
|
static id_map *var_ids, **vars_tail = &var_ids;
|
||||||
|
|
||||||
|
|
@ -183,7 +111,7 @@ record_id (const char *p1, id_map ***where)
|
||||||
remember, there could be a NUL in the file itself. */
|
remember, there could be a NUL in the file itself. */
|
||||||
|
|
||||||
static const char *
|
static const char *
|
||||||
read_file (FILE *stream)
|
read_file (FILE *stream, size_t *plen)
|
||||||
{
|
{
|
||||||
size_t alloc = 16384;
|
size_t alloc = 16384;
|
||||||
size_t base = 0;
|
size_t base = 0;
|
||||||
|
|
@ -213,557 +141,10 @@ read_file (FILE *stream)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
buffer[base] = 0;
|
buffer[base] = 0;
|
||||||
|
*plen = base;
|
||||||
return buffer;
|
return buffer;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* Read a token, advancing ptr.
|
|
||||||
If we read a comment, append it to the comments block. */
|
|
||||||
|
|
||||||
static Token *
|
|
||||||
tokenize (const char *ptr)
|
|
||||||
{
|
|
||||||
unsigned alloc = 1000;
|
|
||||||
unsigned num = 0;
|
|
||||||
Token *toks = XNEWVEC (Token, alloc);
|
|
||||||
int in_comment = 0;
|
|
||||||
int not_comment = 0;
|
|
||||||
|
|
||||||
for (;; num++)
|
|
||||||
{
|
|
||||||
const char *base;
|
|
||||||
unsigned kind;
|
|
||||||
int ws = 0;
|
|
||||||
int eol = 0;
|
|
||||||
|
|
||||||
again:
|
|
||||||
base = ptr;
|
|
||||||
if (in_comment)
|
|
||||||
goto block_comment;
|
|
||||||
switch (kind = *ptr++)
|
|
||||||
{
|
|
||||||
default:
|
|
||||||
break;
|
|
||||||
|
|
||||||
case '\n':
|
|
||||||
eol = 1;
|
|
||||||
/* Fall through */
|
|
||||||
case ' ':
|
|
||||||
case '\t':
|
|
||||||
case '\r':
|
|
||||||
case '\v':
|
|
||||||
/* White space */
|
|
||||||
ws = not_comment;
|
|
||||||
goto again;
|
|
||||||
|
|
||||||
case '/':
|
|
||||||
{
|
|
||||||
if (*ptr == '/')
|
|
||||||
{
|
|
||||||
/* line comment. Do not include trailing \n */
|
|
||||||
base += 2;
|
|
||||||
for (; *ptr; ptr++)
|
|
||||||
if (*ptr == '\n')
|
|
||||||
break;
|
|
||||||
kind = K_comment;
|
|
||||||
}
|
|
||||||
else if (*ptr == '*')
|
|
||||||
{
|
|
||||||
/* block comment */
|
|
||||||
base += 2;
|
|
||||||
ptr++;
|
|
||||||
|
|
||||||
block_comment:
|
|
||||||
eol = in_comment;
|
|
||||||
in_comment = 1;
|
|
||||||
for (; *ptr; ptr++)
|
|
||||||
{
|
|
||||||
if (*ptr == '\n')
|
|
||||||
{
|
|
||||||
ptr++;
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
if (ptr[0] == '*' && ptr[1] == '/')
|
|
||||||
{
|
|
||||||
in_comment = 2;
|
|
||||||
ptr += 2;
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
kind = K_comment;
|
|
||||||
}
|
|
||||||
else
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
break;
|
|
||||||
|
|
||||||
case '"':
|
|
||||||
/* quoted string */
|
|
||||||
kind = K_string;
|
|
||||||
while (*ptr)
|
|
||||||
if (*ptr == '"')
|
|
||||||
{
|
|
||||||
ptr++;
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
else if (*ptr++ == '\\')
|
|
||||||
ptr++;
|
|
||||||
break;
|
|
||||||
|
|
||||||
case '.':
|
|
||||||
if (*ptr < '0' || *ptr > '9')
|
|
||||||
{
|
|
||||||
kind = K_dotted;
|
|
||||||
ws = not_comment;
|
|
||||||
goto ident;
|
|
||||||
}
|
|
||||||
/* FALLTHROUGH */
|
|
||||||
case '0'...'9':
|
|
||||||
kind = K_number;
|
|
||||||
goto ident;
|
|
||||||
break;
|
|
||||||
|
|
||||||
case '$': /* local labels. */
|
|
||||||
case '%': /* register names, pseudoes etc */
|
|
||||||
kind = K_ident;
|
|
||||||
goto ident;
|
|
||||||
|
|
||||||
case 'a'...'z':
|
|
||||||
case 'A'...'Z':
|
|
||||||
case '_':
|
|
||||||
kind = K_symbol; /* possible symbol name */
|
|
||||||
ident:
|
|
||||||
for (; *ptr; ptr++)
|
|
||||||
{
|
|
||||||
if (*ptr >= 'A' && *ptr <= 'Z')
|
|
||||||
continue;
|
|
||||||
if (*ptr >= 'a' && *ptr <= 'z')
|
|
||||||
continue;
|
|
||||||
if (*ptr >= '0' && *ptr <= '9')
|
|
||||||
continue;
|
|
||||||
if (*ptr == '_' || *ptr == '$')
|
|
||||||
continue;
|
|
||||||
if (*ptr == '.' && kind != K_dotted)
|
|
||||||
/* Idents starting with a dot cannot have internal dots. */
|
|
||||||
continue;
|
|
||||||
if ((*ptr == '+' || *ptr == '-')
|
|
||||||
&& kind == K_number
|
|
||||||
&& (ptr[-1] == 'e' || ptr[-1] == 'E'
|
|
||||||
|| ptr[-1] == 'p' || ptr[-1] == 'P'))
|
|
||||||
/* exponent */
|
|
||||||
continue;
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
if (*ptr == ':')
|
|
||||||
{
|
|
||||||
ptr++;
|
|
||||||
kind = K_label;
|
|
||||||
}
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (alloc == num)
|
|
||||||
{
|
|
||||||
alloc *= 2;
|
|
||||||
toks = XRESIZEVEC (Token, toks, alloc);
|
|
||||||
}
|
|
||||||
Token *tok = toks + num;
|
|
||||||
|
|
||||||
tok->kind = kind;
|
|
||||||
tok->space = ws;
|
|
||||||
tok->end = 0;
|
|
||||||
tok->ptr = base;
|
|
||||||
tok->len = ptr - base - in_comment;
|
|
||||||
in_comment &= 1;
|
|
||||||
not_comment = kind != K_comment;
|
|
||||||
if (eol && num)
|
|
||||||
tok[-1].end = 1;
|
|
||||||
if (!kind)
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
|
|
||||||
return toks;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Write an encoded token. */
|
|
||||||
|
|
||||||
static void
|
|
||||||
write_token (FILE *out, Token const *tok)
|
|
||||||
{
|
|
||||||
if (tok->space)
|
|
||||||
fputc (' ', out);
|
|
||||||
|
|
||||||
switch (tok->kind)
|
|
||||||
{
|
|
||||||
case K_string:
|
|
||||||
{
|
|
||||||
const char *c = tok->ptr + 1;
|
|
||||||
size_t len = tok->len - 2;
|
|
||||||
|
|
||||||
fputs ("\\\"", out);
|
|
||||||
while (len)
|
|
||||||
{
|
|
||||||
const char *bs = (const char *)memchr (c, '\\', len);
|
|
||||||
size_t l = bs ? bs - c : len;
|
|
||||||
|
|
||||||
fprintf (out, "%.*s", (int)l, c);
|
|
||||||
len -= l;
|
|
||||||
c += l;
|
|
||||||
if (bs)
|
|
||||||
{
|
|
||||||
fputs ("\\\\", out);
|
|
||||||
len--, c++;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
fputs ("\\\"", out);
|
|
||||||
}
|
|
||||||
break;
|
|
||||||
|
|
||||||
default:
|
|
||||||
/* All other tokens shouldn't have anything magic in them */
|
|
||||||
fprintf (out, "%.*s", tok->len, tok->ptr);
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
if (tok->end)
|
|
||||||
fputs ("\\n", out);
|
|
||||||
}
|
|
||||||
|
|
||||||
static void
|
|
||||||
write_tokens (FILE *out, Token const *toks, unsigned len, int spc)
|
|
||||||
{
|
|
||||||
fputs ("\t\"", out);
|
|
||||||
for (; len--; toks++)
|
|
||||||
write_token (out, toks);
|
|
||||||
if (spc)
|
|
||||||
fputs (" ", out);
|
|
||||||
fputs ("\"", out);
|
|
||||||
}
|
|
||||||
|
|
||||||
static Stmt *
|
|
||||||
alloc_stmt (unsigned vis, Token *tokens, Token *end, Token const *sym)
|
|
||||||
{
|
|
||||||
static unsigned alloc = 0;
|
|
||||||
static Stmt *heap = 0;
|
|
||||||
|
|
||||||
if (!alloc)
|
|
||||||
{
|
|
||||||
alloc = 1000;
|
|
||||||
heap = XNEWVEC (Stmt, alloc);
|
|
||||||
}
|
|
||||||
|
|
||||||
Stmt *stmt = heap++;
|
|
||||||
alloc--;
|
|
||||||
|
|
||||||
tokens->space = 0;
|
|
||||||
stmt->next = 0;
|
|
||||||
stmt->vis = vis;
|
|
||||||
stmt->tokens = tokens;
|
|
||||||
stmt->len = end - tokens;
|
|
||||||
stmt->sym = sym ? sym - tokens : ~0;
|
|
||||||
|
|
||||||
return stmt;
|
|
||||||
}
|
|
||||||
|
|
||||||
static Stmt *
|
|
||||||
rev_stmts (Stmt *stmt)
|
|
||||||
{
|
|
||||||
Stmt *prev = 0;
|
|
||||||
Stmt *next;
|
|
||||||
|
|
||||||
while (stmt)
|
|
||||||
{
|
|
||||||
next = stmt->next;
|
|
||||||
stmt->next = prev;
|
|
||||||
prev = stmt;
|
|
||||||
stmt = next;
|
|
||||||
}
|
|
||||||
|
|
||||||
return prev;
|
|
||||||
}
|
|
||||||
|
|
||||||
static void
|
|
||||||
write_stmt (FILE *out, const Stmt *stmt)
|
|
||||||
{
|
|
||||||
if ((stmt->vis & V_mask) != V_comment)
|
|
||||||
{
|
|
||||||
write_tokens (out, stmt->tokens, stmt->len,
|
|
||||||
(stmt->vis & V_mask) == V_pred);
|
|
||||||
fputs (stmt->vis & V_no_eol ? "\t" : "\n", out);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
static void
|
|
||||||
write_stmts (FILE *out, const Stmt *stmts)
|
|
||||||
{
|
|
||||||
for (; stmts; stmts = stmts->next)
|
|
||||||
write_stmt (out, stmts);
|
|
||||||
}
|
|
||||||
|
|
||||||
static Token *
|
|
||||||
parse_insn (Token *tok)
|
|
||||||
{
|
|
||||||
unsigned depth = 0;
|
|
||||||
|
|
||||||
do
|
|
||||||
{
|
|
||||||
Stmt *stmt;
|
|
||||||
Token *sym = 0;
|
|
||||||
unsigned s = V_insn;
|
|
||||||
Token *start = tok;
|
|
||||||
|
|
||||||
switch (tok++->kind)
|
|
||||||
{
|
|
||||||
case K_comment:
|
|
||||||
while (tok->kind == K_comment)
|
|
||||||
tok++;
|
|
||||||
stmt = alloc_comment (start, tok);
|
|
||||||
append_stmt (&fns, stmt);
|
|
||||||
continue;
|
|
||||||
|
|
||||||
case '{':
|
|
||||||
depth++;
|
|
||||||
break;
|
|
||||||
|
|
||||||
case '}':
|
|
||||||
depth--;
|
|
||||||
break;
|
|
||||||
|
|
||||||
case K_label:
|
|
||||||
if (tok[-1].ptr[0] != '$')
|
|
||||||
sym = tok - 1;
|
|
||||||
tok[-1].end = 1;
|
|
||||||
s = V_label;
|
|
||||||
break;
|
|
||||||
|
|
||||||
case '@':
|
|
||||||
tok->space = 0;
|
|
||||||
if (tok->kind == '!')
|
|
||||||
tok++;
|
|
||||||
if (tok->kind == K_symbol)
|
|
||||||
sym = tok;
|
|
||||||
tok++;
|
|
||||||
s = V_pred;
|
|
||||||
break;
|
|
||||||
|
|
||||||
default:
|
|
||||||
for (; tok->kind != ';'; tok++)
|
|
||||||
{
|
|
||||||
if (tok->kind == ',')
|
|
||||||
tok[1].space = 0;
|
|
||||||
else if (tok->kind == K_symbol)
|
|
||||||
sym = tok;
|
|
||||||
}
|
|
||||||
tok++->end = 1;
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
|
|
||||||
stmt = alloc_stmt (s, start, tok, sym);
|
|
||||||
append_stmt (&fns, stmt);
|
|
||||||
|
|
||||||
if (!tok[-1].end && tok[0].kind == K_comment)
|
|
||||||
{
|
|
||||||
stmt->vis |= V_no_eol;
|
|
||||||
stmt = alloc_comment (tok, tok + 1);
|
|
||||||
append_stmt (&fns, stmt);
|
|
||||||
tok++;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
while (depth);
|
|
||||||
|
|
||||||
return tok;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* comma separated list of tokens */
|
|
||||||
|
|
||||||
static Token *
|
|
||||||
parse_list_nosemi (Token *tok)
|
|
||||||
{
|
|
||||||
Token *start = tok;
|
|
||||||
|
|
||||||
do
|
|
||||||
if (!(++tok)->kind)
|
|
||||||
break;
|
|
||||||
while ((++tok)->kind == ',');
|
|
||||||
|
|
||||||
tok[-1].end = 1;
|
|
||||||
Stmt *stmt = alloc_stmt (V_dot, start, tok, 0);
|
|
||||||
append_stmt (&decls, stmt);
|
|
||||||
|
|
||||||
return tok;
|
|
||||||
}
|
|
||||||
|
|
||||||
#define is_keyword(T,S) \
|
|
||||||
(sizeof (S) == (T)->len && !memcmp ((T)->ptr + 1, (S), (T)->len - 1))
|
|
||||||
|
|
||||||
static Token *
|
|
||||||
parse_init (Token *tok)
|
|
||||||
{
|
|
||||||
for (;;)
|
|
||||||
{
|
|
||||||
Token *start = tok;
|
|
||||||
Token const *sym = 0;
|
|
||||||
Stmt *stmt;
|
|
||||||
|
|
||||||
if (tok->kind == K_comment)
|
|
||||||
{
|
|
||||||
while (tok->kind == K_comment)
|
|
||||||
tok++;
|
|
||||||
stmt = alloc_comment (start, tok);
|
|
||||||
append_stmt (&vars, stmt);
|
|
||||||
start = tok;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (tok->kind == '{')
|
|
||||||
tok[1].space = 0;
|
|
||||||
for (; tok->kind != ',' && tok->kind != ';'; tok++)
|
|
||||||
if (tok->kind == K_symbol)
|
|
||||||
sym = tok;
|
|
||||||
tok[1].space = 0;
|
|
||||||
int end = tok++->kind == ';';
|
|
||||||
stmt = alloc_stmt (V_insn, start, tok, sym);
|
|
||||||
append_stmt (&vars, stmt);
|
|
||||||
if (!tok[-1].end && tok->kind == K_comment)
|
|
||||||
{
|
|
||||||
stmt->vis |= V_no_eol;
|
|
||||||
stmt = alloc_comment (tok, tok + 1);
|
|
||||||
append_stmt (&vars, stmt);
|
|
||||||
tok++;
|
|
||||||
}
|
|
||||||
if (end)
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
return tok;
|
|
||||||
}
|
|
||||||
|
|
||||||
static Token *
|
|
||||||
parse_file (Token *tok)
|
|
||||||
{
|
|
||||||
Stmt *comment = 0;
|
|
||||||
|
|
||||||
if (tok->kind == K_comment)
|
|
||||||
{
|
|
||||||
Token *start = tok;
|
|
||||||
|
|
||||||
while (tok->kind == K_comment)
|
|
||||||
{
|
|
||||||
if (strncmp (tok->ptr, ":VAR_MAP ", 9) == 0)
|
|
||||||
record_id (tok->ptr + 9, &vars_tail);
|
|
||||||
if (strncmp (tok->ptr, ":FUNC_MAP ", 10) == 0)
|
|
||||||
record_id (tok->ptr + 10, &funcs_tail);
|
|
||||||
tok++;
|
|
||||||
}
|
|
||||||
comment = alloc_comment (start, tok);
|
|
||||||
comment->vis |= V_prefix_comment;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (tok->kind == K_dotted)
|
|
||||||
{
|
|
||||||
if (is_keyword (tok, "version")
|
|
||||||
|| is_keyword (tok, "target")
|
|
||||||
|| is_keyword (tok, "address_size"))
|
|
||||||
{
|
|
||||||
if (comment)
|
|
||||||
append_stmt (&decls, comment);
|
|
||||||
tok = parse_list_nosemi (tok);
|
|
||||||
}
|
|
||||||
else
|
|
||||||
{
|
|
||||||
unsigned vis = 0;
|
|
||||||
const Token *def = 0;
|
|
||||||
unsigned is_decl = 0;
|
|
||||||
Token *start;
|
|
||||||
|
|
||||||
for (start = tok;
|
|
||||||
tok->kind && tok->kind != '=' && tok->kind != K_comment
|
|
||||||
&& tok->kind != '{' && tok->kind != ';'; tok++)
|
|
||||||
{
|
|
||||||
if (is_keyword (tok, "global")
|
|
||||||
|| is_keyword (tok, "const"))
|
|
||||||
vis |= V_var;
|
|
||||||
else if (is_keyword (tok, "func")
|
|
||||||
|| is_keyword (tok, "entry"))
|
|
||||||
vis |= V_func;
|
|
||||||
else if (is_keyword (tok, "visible"))
|
|
||||||
vis |= V_global;
|
|
||||||
else if (is_keyword (tok, "extern"))
|
|
||||||
is_decl = 1;
|
|
||||||
else if (is_keyword (tok, "weak"))
|
|
||||||
vis |= V_weak;
|
|
||||||
if (tok->kind == '(')
|
|
||||||
{
|
|
||||||
tok[1].space = 0;
|
|
||||||
tok[0].space = 1;
|
|
||||||
}
|
|
||||||
else if (tok->kind == ')' && tok[1].kind != ';')
|
|
||||||
tok[1].space = 1;
|
|
||||||
|
|
||||||
if (tok->kind == K_symbol)
|
|
||||||
def = tok;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (!tok->kind)
|
|
||||||
{
|
|
||||||
/* end of file */
|
|
||||||
if (comment)
|
|
||||||
append_stmt (&fns, comment);
|
|
||||||
}
|
|
||||||
else if (tok->kind == '{'
|
|
||||||
|| tok->kind == K_comment)
|
|
||||||
{
|
|
||||||
/* function defn */
|
|
||||||
Stmt *stmt = alloc_stmt (vis, start, tok, def);
|
|
||||||
if (comment)
|
|
||||||
{
|
|
||||||
append_stmt (&fns, comment);
|
|
||||||
stmt->vis |= V_prefix_comment;
|
|
||||||
}
|
|
||||||
append_stmt (&fns, stmt);
|
|
||||||
tok = parse_insn (tok);
|
|
||||||
}
|
|
||||||
else
|
|
||||||
{
|
|
||||||
int assign = tok->kind == '=';
|
|
||||||
|
|
||||||
tok++->end = 1;
|
|
||||||
if ((vis & V_mask) == V_var && !is_decl)
|
|
||||||
{
|
|
||||||
/* variable */
|
|
||||||
Stmt *stmt = alloc_stmt (vis, start, tok, def);
|
|
||||||
if (comment)
|
|
||||||
{
|
|
||||||
append_stmt (&vars, comment);
|
|
||||||
stmt->vis |= V_prefix_comment;
|
|
||||||
}
|
|
||||||
append_stmt (&vars, stmt);
|
|
||||||
if (assign)
|
|
||||||
tok = parse_init (tok);
|
|
||||||
}
|
|
||||||
else
|
|
||||||
{
|
|
||||||
/* declaration */
|
|
||||||
Stmt *stmt = alloc_stmt (vis, start, tok, 0);
|
|
||||||
if (comment)
|
|
||||||
{
|
|
||||||
append_stmt (&decls, comment);
|
|
||||||
stmt->vis |= V_prefix_comment;
|
|
||||||
}
|
|
||||||
append_stmt (&decls, stmt);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
else
|
|
||||||
{
|
|
||||||
/* Something strange. Ignore it. */
|
|
||||||
if (comment)
|
|
||||||
append_stmt (&fns, comment);
|
|
||||||
|
|
||||||
do
|
|
||||||
tok++;
|
|
||||||
while (tok->kind && !tok->end);
|
|
||||||
}
|
|
||||||
return tok;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Parse STR, saving found tokens into PVALUES and return their number.
|
/* Parse STR, saving found tokens into PVALUES and return their number.
|
||||||
Tokens are assumed to be delimited by ':'. */
|
Tokens are assumed to be delimited by ':'. */
|
||||||
static unsigned
|
static unsigned
|
||||||
|
|
@ -839,22 +220,55 @@ access_check (const char *name, int mode)
|
||||||
static void
|
static void
|
||||||
process (FILE *in, FILE *out)
|
process (FILE *in, FILE *out)
|
||||||
{
|
{
|
||||||
const char *input = read_file (in);
|
size_t len = 0;
|
||||||
Token *tok = tokenize (input);
|
const char *input = read_file (in, &len);
|
||||||
const char *comma;
|
const char *comma;
|
||||||
id_map const *id;
|
id_map const *id;
|
||||||
unsigned obj_count = 0;
|
unsigned obj_count = 0;
|
||||||
unsigned ix;
|
unsigned ix;
|
||||||
|
|
||||||
do
|
/* Dump out char arrays for each PTX object file. These are
|
||||||
tok = parse_file (tok);
|
terminated by a NUL. */
|
||||||
while (tok->kind);
|
for (size_t i = 0; i != len;)
|
||||||
|
{
|
||||||
|
char c;
|
||||||
|
|
||||||
fprintf (out, "static const char ptx_code_%u[] = \n", obj_count++);
|
fprintf (out, "static const char ptx_code_%u[] =\n\t\"", obj_count++);
|
||||||
write_stmts (out, rev_stmts (decls));
|
while ((c = input[i++]))
|
||||||
write_stmts (out, rev_stmts (vars));
|
{
|
||||||
write_stmts (out, rev_stmts (fns));
|
switch (c)
|
||||||
fprintf (out, ";\n\n");
|
{
|
||||||
|
case '\r':
|
||||||
|
continue;
|
||||||
|
case '\n':
|
||||||
|
fprintf (out, "\\n\"\n\t\"");
|
||||||
|
/* Look for mappings on subsequent lines. */
|
||||||
|
while (strncmp (input + i, "//:", 3) == 0)
|
||||||
|
{
|
||||||
|
i += 3;
|
||||||
|
|
||||||
|
if (strncmp (input + i, "VAR_MAP ", 8) == 0)
|
||||||
|
record_id (input + i + 8, &vars_tail);
|
||||||
|
else if (strncmp (input + i, "FUNC_MAP ", 9) == 0)
|
||||||
|
record_id (input + i + 9, &funcs_tail);
|
||||||
|
else
|
||||||
|
abort ();
|
||||||
|
/* Skip to next line. */
|
||||||
|
while (input[i++] != '\n')
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
continue;
|
||||||
|
case '"':
|
||||||
|
case '\\':
|
||||||
|
putc ('\\', out);
|
||||||
|
break;
|
||||||
|
default:
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
putc (c, out);
|
||||||
|
}
|
||||||
|
fprintf (out, "\";\n\n");
|
||||||
|
}
|
||||||
|
|
||||||
/* Dump out array of pointers to ptx object strings. */
|
/* Dump out array of pointers to ptx object strings. */
|
||||||
fprintf (out, "static const struct ptx_obj {\n"
|
fprintf (out, "static const struct ptx_obj {\n"
|
||||||
|
|
@ -1068,7 +482,6 @@ main (int argc, char **argv)
|
||||||
default:
|
default:
|
||||||
gcc_unreachable ();
|
gcc_unreachable ();
|
||||||
}
|
}
|
||||||
obstack_ptr_grow (&argv_obstack, "-S");
|
|
||||||
|
|
||||||
for (int ix = 1; ix != argc; ix++)
|
for (int ix = 1; ix != argc; ix++)
|
||||||
{
|
{
|
||||||
|
|
|
||||||
|
|
@ -1,3 +1,13 @@
|
||||||
|
2015-10-02 Thomas Schwinge <thomas@codesourcery.com>
|
||||||
|
|
||||||
|
* oacc-ptx.h: Remove file, moving its content into...
|
||||||
|
* config/nvptx/fortran.c: ... here...
|
||||||
|
* config/nvptx/oacc-init.c: ..., here...
|
||||||
|
* config/nvptx/oacc-parallel.c: ..., and here.
|
||||||
|
* config/nvptx/openacc.f90: New file.
|
||||||
|
* plugin/plugin-nvptx.c: Don't include "oacc-ptx.h".
|
||||||
|
(link_ptx): Don't link in predefined bits of PTX code.
|
||||||
|
|
||||||
2015-09-30 Nathan Sidwell <nathan@codesourcery.com>
|
2015-09-30 Nathan Sidwell <nathan@codesourcery.com>
|
||||||
Bernd Schmidt <bernds@codesourcery.com>
|
Bernd Schmidt <bernds@codesourcery.com>
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -0,0 +1,40 @@
|
||||||
|
/* OpenACC Runtime Fortran wrapper routines
|
||||||
|
|
||||||
|
Copyright (C) 2014-2015 Free Software Foundation, Inc.
|
||||||
|
|
||||||
|
Contributed by Mentor Embedded.
|
||||||
|
|
||||||
|
This file is part of the GNU Offloading and Multi Processing Library
|
||||||
|
(libgomp).
|
||||||
|
|
||||||
|
Libgomp is free software; you can redistribute it and/or modify it
|
||||||
|
under the terms of the GNU General Public License as published by
|
||||||
|
the Free Software Foundation; either version 3, or (at your option)
|
||||||
|
any later version.
|
||||||
|
|
||||||
|
Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
|
||||||
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
||||||
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
||||||
|
more details.
|
||||||
|
|
||||||
|
Under Section 7 of GPL version 3, you are granted additional
|
||||||
|
permissions described in the GCC Runtime Library Exception, version
|
||||||
|
3.1, as published by the Free Software Foundation.
|
||||||
|
|
||||||
|
You should have received a copy of the GNU General Public License and
|
||||||
|
a copy of the GCC Runtime Library Exception along with this program;
|
||||||
|
see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
||||||
|
<http://www.gnu.org/licenses/>. */
|
||||||
|
|
||||||
|
/* Temporary hack; this will be provided by libgfortran. */
|
||||||
|
|
||||||
|
extern void _gfortran_abort (void);
|
||||||
|
|
||||||
|
__asm__ ("// BEGIN GLOBAL FUNCTION DECL: _gfortran_abort\n"
|
||||||
|
".visible .func _gfortran_abort;\n"
|
||||||
|
"// BEGIN GLOBAL FUNCTION DEF: _gfortran_abort\n"
|
||||||
|
".visible .func _gfortran_abort\n"
|
||||||
|
"{\n"
|
||||||
|
"trap;\n"
|
||||||
|
"ret;\n"
|
||||||
|
"}\n");
|
||||||
|
|
@ -0,0 +1,42 @@
|
||||||
|
/* OpenACC Runtime initialization routines
|
||||||
|
|
||||||
|
Copyright (C) 2014-2015 Free Software Foundation, Inc.
|
||||||
|
|
||||||
|
Contributed by Mentor Embedded.
|
||||||
|
|
||||||
|
This file is part of the GNU Offloading and Multi Processing Library
|
||||||
|
(libgomp).
|
||||||
|
|
||||||
|
Libgomp is free software; you can redistribute it and/or modify it
|
||||||
|
under the terms of the GNU General Public License as published by
|
||||||
|
the Free Software Foundation; either version 3, or (at your option)
|
||||||
|
any later version.
|
||||||
|
|
||||||
|
Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
|
||||||
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
||||||
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
||||||
|
more details.
|
||||||
|
|
||||||
|
Under Section 7 of GPL version 3, you are granted additional
|
||||||
|
permissions described in the GCC Runtime Library Exception, version
|
||||||
|
3.1, as published by the Free Software Foundation.
|
||||||
|
|
||||||
|
You should have received a copy of the GNU General Public License and
|
||||||
|
a copy of the GCC Runtime Library Exception along with this program;
|
||||||
|
see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
||||||
|
<http://www.gnu.org/licenses/>. */
|
||||||
|
|
||||||
|
#include "openacc.h"
|
||||||
|
|
||||||
|
/* For -O and higher, the compiler always attempts to expand acc_on_device, but
|
||||||
|
if the user disables the builtin, or calls it via a pointer, we'll need this
|
||||||
|
version.
|
||||||
|
|
||||||
|
Compile this with optimization, so that the compiler expands
|
||||||
|
this, rather than generating infinitely recursive code. */
|
||||||
|
|
||||||
|
int __attribute__ ((__optimize__ ("O2")))
|
||||||
|
acc_on_device (acc_device_t dev)
|
||||||
|
{
|
||||||
|
return __builtin_acc_on_device (dev);
|
||||||
|
}
|
||||||
|
|
@ -0,0 +1,358 @@
|
||||||
|
/* OpenACC constructs
|
||||||
|
|
||||||
|
Copyright (C) 2014-2015 Free Software Foundation, Inc.
|
||||||
|
|
||||||
|
Contributed by Mentor Embedded.
|
||||||
|
|
||||||
|
This file is part of the GNU Offloading and Multi Processing Library
|
||||||
|
(libgomp).
|
||||||
|
|
||||||
|
Libgomp is free software; you can redistribute it and/or modify it
|
||||||
|
under the terms of the GNU General Public License as published by
|
||||||
|
the Free Software Foundation; either version 3, or (at your option)
|
||||||
|
any later version.
|
||||||
|
|
||||||
|
Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
|
||||||
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
||||||
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
||||||
|
more details.
|
||||||
|
|
||||||
|
Under Section 7 of GPL version 3, you are granted additional
|
||||||
|
permissions described in the GCC Runtime Library Exception, version
|
||||||
|
3.1, as published by the Free Software Foundation.
|
||||||
|
|
||||||
|
You should have received a copy of the GNU General Public License and
|
||||||
|
a copy of the GCC Runtime Library Exception along with this program;
|
||||||
|
see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
||||||
|
<http://www.gnu.org/licenses/>. */
|
||||||
|
|
||||||
|
#include "libgomp_g.h"
|
||||||
|
|
||||||
|
__asm__ (".visible .func (.param .u32 %out_retval) GOACC_tid (.param .u32 %in_ar1);\n"
|
||||||
|
".visible .func (.param .u32 %out_retval) GOACC_ntid (.param .u32 %in_ar1);\n"
|
||||||
|
".visible .func (.param .u32 %out_retval) GOACC_ctaid (.param .u32 %in_ar1);\n"
|
||||||
|
".visible .func (.param .u32 %out_retval) GOACC_nctaid (.param .u32 %in_ar1);\n"
|
||||||
|
"// BEGIN GLOBAL FUNCTION DECL: GOACC_get_num_threads\n"
|
||||||
|
".visible .func (.param .u32 %out_retval) GOACC_get_num_threads;\n"
|
||||||
|
"// BEGIN GLOBAL FUNCTION DECL: GOACC_get_thread_num\n"
|
||||||
|
".visible .func (.param .u32 %out_retval) GOACC_get_thread_num;\n"
|
||||||
|
"// BEGIN GLOBAL FUNCTION DECL: abort\n"
|
||||||
|
".extern .func abort;\n"
|
||||||
|
".visible .func (.param .u32 %out_retval) GOACC_tid (.param .u32 %in_ar1)\n"
|
||||||
|
"{\n"
|
||||||
|
".reg .u32 %ar1;\n"
|
||||||
|
".reg .u32 %retval;\n"
|
||||||
|
".reg .u64 %hr10;\n"
|
||||||
|
".reg .u32 %r22;\n"
|
||||||
|
".reg .u32 %r23;\n"
|
||||||
|
".reg .u32 %r24;\n"
|
||||||
|
".reg .u32 %r25;\n"
|
||||||
|
".reg .u32 %r26;\n"
|
||||||
|
".reg .u32 %r27;\n"
|
||||||
|
".reg .u32 %r28;\n"
|
||||||
|
".reg .u32 %r29;\n"
|
||||||
|
".reg .pred %r30;\n"
|
||||||
|
".reg .u32 %r31;\n"
|
||||||
|
".reg .pred %r32;\n"
|
||||||
|
".reg .u32 %r33;\n"
|
||||||
|
".reg .pred %r34;\n"
|
||||||
|
".local .align 8 .b8 %frame[4];\n"
|
||||||
|
"ld.param.u32 %ar1,[%in_ar1];\n"
|
||||||
|
"mov.u32 %r27,%ar1;\n"
|
||||||
|
"st.local.u32 [%frame],%r27;\n"
|
||||||
|
"ld.local.u32 %r28,[%frame];\n"
|
||||||
|
"mov.u32 %r29,1;\n"
|
||||||
|
"setp.eq.u32 %r30,%r28,%r29;\n"
|
||||||
|
"@%r30 bra $L4;\n"
|
||||||
|
"mov.u32 %r31,2;\n"
|
||||||
|
"setp.eq.u32 %r32,%r28,%r31;\n"
|
||||||
|
"@%r32 bra $L5;\n"
|
||||||
|
"mov.u32 %r33,0;\n"
|
||||||
|
"setp.eq.u32 %r34,%r28,%r33;\n"
|
||||||
|
"@!%r34 bra $L8;\n"
|
||||||
|
"mov.u32 %r23,%tid.x;\n"
|
||||||
|
"mov.u32 %r22,%r23;\n"
|
||||||
|
"bra $L7;\n"
|
||||||
|
"$L4:\n"
|
||||||
|
"mov.u32 %r24,%tid.y;\n"
|
||||||
|
"mov.u32 %r22,%r24;\n"
|
||||||
|
"bra $L7;\n"
|
||||||
|
"$L5:\n"
|
||||||
|
"mov.u32 %r25,%tid.z;\n"
|
||||||
|
"mov.u32 %r22,%r25;\n"
|
||||||
|
"bra $L7;\n"
|
||||||
|
"$L8:\n"
|
||||||
|
"{\n"
|
||||||
|
"{\n"
|
||||||
|
"call abort;\n"
|
||||||
|
"}\n"
|
||||||
|
"}\n"
|
||||||
|
"$L7:\n"
|
||||||
|
"mov.u32 %r26,%r22;\n"
|
||||||
|
"mov.u32 %retval,%r26;\n"
|
||||||
|
"st.param.u32 [%out_retval],%retval;\n"
|
||||||
|
"ret;\n"
|
||||||
|
"}\n"
|
||||||
|
".visible .func (.param .u32 %out_retval) GOACC_ntid (.param .u32 %in_ar1)\n"
|
||||||
|
"{\n"
|
||||||
|
".reg .u32 %ar1;\n"
|
||||||
|
".reg .u32 %retval;\n"
|
||||||
|
".reg .u64 %hr10;\n"
|
||||||
|
".reg .u32 %r22;\n"
|
||||||
|
".reg .u32 %r23;\n"
|
||||||
|
".reg .u32 %r24;\n"
|
||||||
|
".reg .u32 %r25;\n"
|
||||||
|
".reg .u32 %r26;\n"
|
||||||
|
".reg .u32 %r27;\n"
|
||||||
|
".reg .u32 %r28;\n"
|
||||||
|
".reg .u32 %r29;\n"
|
||||||
|
".reg .pred %r30;\n"
|
||||||
|
".reg .u32 %r31;\n"
|
||||||
|
".reg .pred %r32;\n"
|
||||||
|
".reg .u32 %r33;\n"
|
||||||
|
".reg .pred %r34;\n"
|
||||||
|
".local .align 8 .b8 %frame[4];\n"
|
||||||
|
"ld.param.u32 %ar1,[%in_ar1];\n"
|
||||||
|
"mov.u32 %r27,%ar1;\n"
|
||||||
|
"st.local.u32 [%frame],%r27;\n"
|
||||||
|
"ld.local.u32 %r28,[%frame];\n"
|
||||||
|
"mov.u32 %r29,1;\n"
|
||||||
|
"setp.eq.u32 %r30,%r28,%r29;\n"
|
||||||
|
"@%r30 bra $L11;\n"
|
||||||
|
"mov.u32 %r31,2;\n"
|
||||||
|
"setp.eq.u32 %r32,%r28,%r31;\n"
|
||||||
|
"@%r32 bra $L12;\n"
|
||||||
|
"mov.u32 %r33,0;\n"
|
||||||
|
"setp.eq.u32 %r34,%r28,%r33;\n"
|
||||||
|
"@!%r34 bra $L15;\n"
|
||||||
|
"mov.u32 %r23,%ntid.x;\n"
|
||||||
|
"mov.u32 %r22,%r23;\n"
|
||||||
|
"bra $L14;\n"
|
||||||
|
"$L11:\n"
|
||||||
|
"mov.u32 %r24,%ntid.y;\n"
|
||||||
|
"mov.u32 %r22,%r24;\n"
|
||||||
|
"bra $L14;\n"
|
||||||
|
"$L12:\n"
|
||||||
|
"mov.u32 %r25,%ntid.z;\n"
|
||||||
|
"mov.u32 %r22,%r25;\n"
|
||||||
|
"bra $L14;\n"
|
||||||
|
"$L15:\n"
|
||||||
|
"{\n"
|
||||||
|
"{\n"
|
||||||
|
"call abort;\n"
|
||||||
|
"}\n"
|
||||||
|
"}\n"
|
||||||
|
"$L14:\n"
|
||||||
|
"mov.u32 %r26,%r22;\n"
|
||||||
|
"mov.u32 %retval,%r26;\n"
|
||||||
|
"st.param.u32 [%out_retval],%retval;\n"
|
||||||
|
"ret;\n"
|
||||||
|
"}\n"
|
||||||
|
".visible .func (.param .u32 %out_retval) GOACC_ctaid (.param .u32 %in_ar1)\n"
|
||||||
|
"{\n"
|
||||||
|
".reg .u32 %ar1;\n"
|
||||||
|
".reg .u32 %retval;\n"
|
||||||
|
".reg .u64 %hr10;\n"
|
||||||
|
".reg .u32 %r22;\n"
|
||||||
|
".reg .u32 %r23;\n"
|
||||||
|
".reg .u32 %r24;\n"
|
||||||
|
".reg .u32 %r25;\n"
|
||||||
|
".reg .u32 %r26;\n"
|
||||||
|
".reg .u32 %r27;\n"
|
||||||
|
".reg .u32 %r28;\n"
|
||||||
|
".reg .u32 %r29;\n"
|
||||||
|
".reg .pred %r30;\n"
|
||||||
|
".reg .u32 %r31;\n"
|
||||||
|
".reg .pred %r32;\n"
|
||||||
|
".reg .u32 %r33;\n"
|
||||||
|
".reg .pred %r34;\n"
|
||||||
|
".local .align 8 .b8 %frame[4];\n"
|
||||||
|
"ld.param.u32 %ar1,[%in_ar1];\n"
|
||||||
|
"mov.u32 %r27,%ar1;\n"
|
||||||
|
"st.local.u32 [%frame],%r27;\n"
|
||||||
|
"ld.local.u32 %r28,[%frame];\n"
|
||||||
|
"mov.u32 %r29,1;\n"
|
||||||
|
"setp.eq.u32 %r30,%r28,%r29;\n"
|
||||||
|
"@%r30 bra $L18;\n"
|
||||||
|
"mov.u32 %r31,2;\n"
|
||||||
|
"setp.eq.u32 %r32,%r28,%r31;\n"
|
||||||
|
"@%r32 bra $L19;\n"
|
||||||
|
"mov.u32 %r33,0;\n"
|
||||||
|
"setp.eq.u32 %r34,%r28,%r33;\n"
|
||||||
|
"@!%r34 bra $L22;\n"
|
||||||
|
"mov.u32 %r23,%ctaid.x;\n"
|
||||||
|
"mov.u32 %r22,%r23;\n"
|
||||||
|
"bra $L21;\n"
|
||||||
|
"$L18:\n"
|
||||||
|
"mov.u32 %r24,%ctaid.y;\n"
|
||||||
|
"mov.u32 %r22,%r24;\n"
|
||||||
|
"bra $L21;\n"
|
||||||
|
"$L19:\n"
|
||||||
|
"mov.u32 %r25,%ctaid.z;\n"
|
||||||
|
"mov.u32 %r22,%r25;\n"
|
||||||
|
"bra $L21;\n"
|
||||||
|
"$L22:\n"
|
||||||
|
"{\n"
|
||||||
|
"{\n"
|
||||||
|
"call abort;\n"
|
||||||
|
"}\n"
|
||||||
|
"}\n"
|
||||||
|
"$L21:\n"
|
||||||
|
"mov.u32 %r26,%r22;\n"
|
||||||
|
"mov.u32 %retval,%r26;\n"
|
||||||
|
"st.param.u32 [%out_retval],%retval;\n"
|
||||||
|
"ret;\n"
|
||||||
|
"}\n"
|
||||||
|
".visible .func (.param .u32 %out_retval) GOACC_nctaid (.param .u32 %in_ar1)\n"
|
||||||
|
"{\n"
|
||||||
|
".reg .u32 %ar1;\n"
|
||||||
|
".reg .u32 %retval;\n"
|
||||||
|
".reg .u64 %hr10;\n"
|
||||||
|
".reg .u32 %r22;\n"
|
||||||
|
".reg .u32 %r23;\n"
|
||||||
|
".reg .u32 %r24;\n"
|
||||||
|
".reg .u32 %r25;\n"
|
||||||
|
".reg .u32 %r26;\n"
|
||||||
|
".reg .u32 %r27;\n"
|
||||||
|
".reg .u32 %r28;\n"
|
||||||
|
".reg .u32 %r29;\n"
|
||||||
|
".reg .pred %r30;\n"
|
||||||
|
".reg .u32 %r31;\n"
|
||||||
|
".reg .pred %r32;\n"
|
||||||
|
".reg .u32 %r33;\n"
|
||||||
|
".reg .pred %r34;\n"
|
||||||
|
".local .align 8 .b8 %frame[4];\n"
|
||||||
|
"ld.param.u32 %ar1,[%in_ar1];\n"
|
||||||
|
"mov.u32 %r27,%ar1;\n"
|
||||||
|
"st.local.u32 [%frame],%r27;\n"
|
||||||
|
"ld.local.u32 %r28,[%frame];\n"
|
||||||
|
"mov.u32 %r29,1;\n"
|
||||||
|
"setp.eq.u32 %r30,%r28,%r29;\n"
|
||||||
|
"@%r30 bra $L25;\n"
|
||||||
|
"mov.u32 %r31,2;\n"
|
||||||
|
"setp.eq.u32 %r32,%r28,%r31;\n"
|
||||||
|
"@%r32 bra $L26;\n"
|
||||||
|
"mov.u32 %r33,0;\n"
|
||||||
|
"setp.eq.u32 %r34,%r28,%r33;\n"
|
||||||
|
"@!%r34 bra $L29;\n"
|
||||||
|
"mov.u32 %r23,%nctaid.x;\n"
|
||||||
|
"mov.u32 %r22,%r23;\n"
|
||||||
|
"bra $L28;\n"
|
||||||
|
"$L25:\n"
|
||||||
|
"mov.u32 %r24,%nctaid.y;\n"
|
||||||
|
"mov.u32 %r22,%r24;\n"
|
||||||
|
"bra $L28;\n"
|
||||||
|
"$L26:\n"
|
||||||
|
"mov.u32 %r25,%nctaid.z;\n"
|
||||||
|
"mov.u32 %r22,%r25;\n"
|
||||||
|
"bra $L28;\n"
|
||||||
|
"$L29:\n"
|
||||||
|
"{\n"
|
||||||
|
"{\n"
|
||||||
|
"call abort;\n"
|
||||||
|
"}\n"
|
||||||
|
"}\n"
|
||||||
|
"$L28:\n"
|
||||||
|
"mov.u32 %r26,%r22;\n"
|
||||||
|
"mov.u32 %retval,%r26;\n"
|
||||||
|
"st.param.u32 [%out_retval],%retval;\n"
|
||||||
|
"ret;\n"
|
||||||
|
"}\n"
|
||||||
|
"// BEGIN GLOBAL FUNCTION DEF: GOACC_get_num_threads\n"
|
||||||
|
".visible .func (.param .u32 %out_retval) GOACC_get_num_threads\n"
|
||||||
|
"{\n"
|
||||||
|
".reg .u32 %retval;\n"
|
||||||
|
".reg .u64 %hr10;\n"
|
||||||
|
".reg .u32 %r22;\n"
|
||||||
|
".reg .u32 %r23;\n"
|
||||||
|
".reg .u32 %r24;\n"
|
||||||
|
".reg .u32 %r25;\n"
|
||||||
|
".reg .u32 %r26;\n"
|
||||||
|
".reg .u32 %r27;\n"
|
||||||
|
".reg .u32 %r28;\n"
|
||||||
|
".reg .u32 %r29;\n"
|
||||||
|
"mov.u32 %r26,0;\n"
|
||||||
|
"{\n"
|
||||||
|
".param .u32 %retval_in;\n"
|
||||||
|
"{\n"
|
||||||
|
".param .u32 %out_arg0;\n"
|
||||||
|
"st.param.u32 [%out_arg0],%r26;\n"
|
||||||
|
"call (%retval_in),GOACC_ntid,(%out_arg0);\n"
|
||||||
|
"}\n"
|
||||||
|
"ld.param.u32 %r27,[%retval_in];\n"
|
||||||
|
"}\n"
|
||||||
|
"mov.u32 %r22,%r27;\n"
|
||||||
|
"mov.u32 %r28,0;\n"
|
||||||
|
"{\n"
|
||||||
|
".param .u32 %retval_in;\n"
|
||||||
|
"{\n"
|
||||||
|
".param .u32 %out_arg0;\n"
|
||||||
|
"st.param.u32 [%out_arg0],%r28;\n"
|
||||||
|
"call (%retval_in),GOACC_nctaid,(%out_arg0);\n"
|
||||||
|
"}\n"
|
||||||
|
"ld.param.u32 %r29,[%retval_in];\n"
|
||||||
|
"}\n"
|
||||||
|
"mov.u32 %r23,%r29;\n"
|
||||||
|
"mul.lo.u32 %r24,%r22,%r23;\n"
|
||||||
|
"mov.u32 %r25,%r24;\n"
|
||||||
|
"mov.u32 %retval,%r25;\n"
|
||||||
|
"st.param.u32 [%out_retval],%retval;\n"
|
||||||
|
"ret;\n"
|
||||||
|
"}\n"
|
||||||
|
"// BEGIN GLOBAL FUNCTION DEF: GOACC_get_thread_num\n"
|
||||||
|
".visible .func (.param .u32 %out_retval) GOACC_get_thread_num\n"
|
||||||
|
"{\n"
|
||||||
|
".reg .u32 %retval;\n"
|
||||||
|
".reg .u64 %hr10;\n"
|
||||||
|
".reg .u32 %r22;\n"
|
||||||
|
".reg .u32 %r23;\n"
|
||||||
|
".reg .u32 %r24;\n"
|
||||||
|
".reg .u32 %r25;\n"
|
||||||
|
".reg .u32 %r26;\n"
|
||||||
|
".reg .u32 %r27;\n"
|
||||||
|
".reg .u32 %r28;\n"
|
||||||
|
".reg .u32 %r29;\n"
|
||||||
|
".reg .u32 %r30;\n"
|
||||||
|
".reg .u32 %r31;\n"
|
||||||
|
".reg .u32 %r32;\n"
|
||||||
|
".reg .u32 %r33;\n"
|
||||||
|
"mov.u32 %r28,0;\n"
|
||||||
|
"{\n"
|
||||||
|
".param .u32 %retval_in;\n"
|
||||||
|
"{\n"
|
||||||
|
".param .u32 %out_arg0;\n"
|
||||||
|
"st.param.u32 [%out_arg0],%r28;\n"
|
||||||
|
"call (%retval_in),GOACC_ntid,(%out_arg0);\n"
|
||||||
|
"}\n"
|
||||||
|
"ld.param.u32 %r29,[%retval_in];\n"
|
||||||
|
"}\n"
|
||||||
|
"mov.u32 %r22,%r29;\n"
|
||||||
|
"mov.u32 %r30,0;\n"
|
||||||
|
"{\n"
|
||||||
|
".param .u32 %retval_in;\n"
|
||||||
|
"{\n"
|
||||||
|
".param .u32 %out_arg0;\n"
|
||||||
|
"st.param.u32 [%out_arg0],%r30;\n"
|
||||||
|
"call (%retval_in),GOACC_ctaid,(%out_arg0);\n"
|
||||||
|
"}\n"
|
||||||
|
"ld.param.u32 %r31,[%retval_in];\n"
|
||||||
|
"}\n"
|
||||||
|
"mov.u32 %r23,%r31;\n"
|
||||||
|
"mul.lo.u32 %r24,%r22,%r23;\n"
|
||||||
|
"mov.u32 %r32,0;\n"
|
||||||
|
"{\n"
|
||||||
|
".param .u32 %retval_in;\n"
|
||||||
|
"{\n"
|
||||||
|
".param .u32 %out_arg0;\n"
|
||||||
|
"st.param.u32 [%out_arg0],%r32;\n"
|
||||||
|
"call (%retval_in),GOACC_tid,(%out_arg0);\n"
|
||||||
|
"}\n"
|
||||||
|
"ld.param.u32 %r33,[%retval_in];\n"
|
||||||
|
"}\n"
|
||||||
|
"mov.u32 %r25,%r33;\n"
|
||||||
|
"add.u32 %r26,%r24,%r25;\n"
|
||||||
|
"mov.u32 %r27,%r26;\n"
|
||||||
|
"mov.u32 %retval,%r27;\n"
|
||||||
|
"st.param.u32 [%out_retval],%retval;\n"
|
||||||
|
"ret;\n"
|
||||||
|
"}\n");
|
||||||
|
|
@ -0,0 +1,102 @@
|
||||||
|
! OpenACC Runtime Library Definitions.
|
||||||
|
|
||||||
|
! Copyright (C) 2014-2015 Free Software Foundation, Inc.
|
||||||
|
|
||||||
|
! Contributed by Tobias Burnus <burnus@net-b.de>
|
||||||
|
! and Mentor Embedded.
|
||||||
|
|
||||||
|
! This file is part of the GNU Offloading and Multi Processing Library
|
||||||
|
! (libgomp).
|
||||||
|
|
||||||
|
! Libgomp is free software; you can redistribute it and/or modify it
|
||||||
|
! under the terms of the GNU General Public License as published by
|
||||||
|
! the Free Software Foundation; either version 3, or (at your option)
|
||||||
|
! any later version.
|
||||||
|
|
||||||
|
! Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
|
||||||
|
! WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
||||||
|
! FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
||||||
|
! more details.
|
||||||
|
|
||||||
|
! Under Section 7 of GPL version 3, you are granted additional
|
||||||
|
! permissions described in the GCC Runtime Library Exception, version
|
||||||
|
! 3.1, as published by the Free Software Foundation.
|
||||||
|
|
||||||
|
! You should have received a copy of the GNU General Public License and
|
||||||
|
! a copy of the GCC Runtime Library Exception along with this program;
|
||||||
|
! see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
||||||
|
! <http://www.gnu.org/licenses/>.
|
||||||
|
|
||||||
|
! Wrapper functions will be built from openacc.f90. We use a separate file
|
||||||
|
! here, because for using ../../openacc.f90, implementations are required for
|
||||||
|
! all the functions that it wraps, which we currently don't provide, so linking
|
||||||
|
! would fail.
|
||||||
|
|
||||||
|
module openacc_kinds
|
||||||
|
use iso_fortran_env, only: int32
|
||||||
|
implicit none
|
||||||
|
|
||||||
|
private :: int32
|
||||||
|
public :: acc_device_kind
|
||||||
|
|
||||||
|
integer, parameter :: acc_device_kind = int32
|
||||||
|
|
||||||
|
public :: acc_device_none, acc_device_default, acc_device_host
|
||||||
|
public :: acc_device_not_host, acc_device_nvidia
|
||||||
|
|
||||||
|
! Keep in sync with include/gomp-constants.h.
|
||||||
|
integer (acc_device_kind), parameter :: acc_device_none = 0
|
||||||
|
integer (acc_device_kind), parameter :: acc_device_default = 1
|
||||||
|
integer (acc_device_kind), parameter :: acc_device_host = 2
|
||||||
|
! integer (acc_device_kind), parameter :: acc_device_host_nonshm = 3 removed.
|
||||||
|
integer (acc_device_kind), parameter :: acc_device_not_host = 4
|
||||||
|
integer (acc_device_kind), parameter :: acc_device_nvidia = 5
|
||||||
|
|
||||||
|
end module
|
||||||
|
|
||||||
|
module openacc_internal
|
||||||
|
use openacc_kinds
|
||||||
|
implicit none
|
||||||
|
|
||||||
|
interface
|
||||||
|
function acc_on_device_h (d)
|
||||||
|
import
|
||||||
|
integer (acc_device_kind) d
|
||||||
|
logical acc_on_device_h
|
||||||
|
end function
|
||||||
|
end interface
|
||||||
|
|
||||||
|
interface
|
||||||
|
function acc_on_device_l (d) &
|
||||||
|
bind (C, name = "acc_on_device")
|
||||||
|
use iso_c_binding, only: c_int
|
||||||
|
integer (c_int) :: acc_on_device_l
|
||||||
|
integer (c_int), value :: d
|
||||||
|
end function
|
||||||
|
end interface
|
||||||
|
end module
|
||||||
|
|
||||||
|
module openacc
|
||||||
|
use openacc_kinds
|
||||||
|
use openacc_internal
|
||||||
|
implicit none
|
||||||
|
|
||||||
|
public :: acc_on_device
|
||||||
|
|
||||||
|
interface acc_on_device
|
||||||
|
procedure :: acc_on_device_h
|
||||||
|
end interface
|
||||||
|
|
||||||
|
end module openacc
|
||||||
|
|
||||||
|
function acc_on_device_h (d)
|
||||||
|
use openacc_internal, only: acc_on_device_l
|
||||||
|
use openacc_kinds
|
||||||
|
integer (acc_device_kind) d
|
||||||
|
logical acc_on_device_h
|
||||||
|
if (acc_on_device_l (d) .eq. 1) then
|
||||||
|
acc_on_device_h = .TRUE.
|
||||||
|
else
|
||||||
|
acc_on_device_h = .FALSE.
|
||||||
|
end if
|
||||||
|
end function
|
||||||
|
|
@ -620,7 +620,11 @@ acc_set_device_num (int ord, acc_device_t d)
|
||||||
|
|
||||||
ialias (acc_set_device_num)
|
ialias (acc_set_device_num)
|
||||||
|
|
||||||
/* Compile on_device with optimization, so that the compiler expands
|
/* For -O and higher, the compiler always attempts to expand acc_on_device, but
|
||||||
|
if the user disables the builtin, or calls it via a pointer, we'll need this
|
||||||
|
version.
|
||||||
|
|
||||||
|
Compile this with optimization, so that the compiler expands
|
||||||
this, rather than generating infinitely recursive code. */
|
this, rather than generating infinitely recursive code. */
|
||||||
|
|
||||||
int __attribute__ ((__optimize__ ("O2")))
|
int __attribute__ ((__optimize__ ("O2")))
|
||||||
|
|
|
||||||
|
|
@ -1,426 +0,0 @@
|
||||||
/* Copyright (C) 2014-2015 Free Software Foundation, Inc.
|
|
||||||
|
|
||||||
Contributed by Mentor Embedded.
|
|
||||||
|
|
||||||
This file is part of the GNU Offloading and Multi Processing Library
|
|
||||||
(libgomp).
|
|
||||||
|
|
||||||
Libgomp is free software; you can redistribute it and/or modify it
|
|
||||||
under the terms of the GNU General Public License as published by
|
|
||||||
the Free Software Foundation; either version 3, or (at your option)
|
|
||||||
any later version.
|
|
||||||
|
|
||||||
Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
||||||
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
||||||
FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
||||||
more details.
|
|
||||||
|
|
||||||
Under Section 7 of GPL version 3, you are granted additional
|
|
||||||
permissions described in the GCC Runtime Library Exception, version
|
|
||||||
3.1, as published by the Free Software Foundation.
|
|
||||||
|
|
||||||
You should have received a copy of the GNU General Public License and
|
|
||||||
a copy of the GCC Runtime Library Exception along with this program;
|
|
||||||
see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
|
||||||
<http://www.gnu.org/licenses/>. */
|
|
||||||
|
|
||||||
#define ABORT_PTX \
|
|
||||||
".version 3.1\n" \
|
|
||||||
".target sm_30\n" \
|
|
||||||
".address_size 64\n" \
|
|
||||||
".visible .func abort;\n" \
|
|
||||||
".visible .func abort\n" \
|
|
||||||
"{\n" \
|
|
||||||
"trap;\n" \
|
|
||||||
"ret;\n" \
|
|
||||||
"}\n" \
|
|
||||||
".visible .func _gfortran_abort;\n" \
|
|
||||||
".visible .func _gfortran_abort\n" \
|
|
||||||
"{\n" \
|
|
||||||
"trap;\n" \
|
|
||||||
"ret;\n" \
|
|
||||||
"}\n" \
|
|
||||||
|
|
||||||
/* Generated with:
|
|
||||||
|
|
||||||
$ echo 'int acc_on_device(int d) { return __builtin_acc_on_device(d); } int acc_on_device_h_(int *d) { return acc_on_device(*d); }' | accel-gcc/xgcc -Baccel-gcc -x c - -o - -S -m64 -O3 -fno-builtin-acc_on_device -fno-inline
|
|
||||||
*/
|
|
||||||
#define ACC_ON_DEVICE_PTX \
|
|
||||||
" .version 3.1\n" \
|
|
||||||
" .target sm_30\n" \
|
|
||||||
" .address_size 64\n" \
|
|
||||||
".visible .func (.param.u32 %out_retval)acc_on_device(.param.u32 %in_ar1);\n" \
|
|
||||||
".visible .func (.param.u32 %out_retval)acc_on_device(.param.u32 %in_ar1)\n" \
|
|
||||||
"{\n" \
|
|
||||||
" .reg.u32 %ar1;\n" \
|
|
||||||
".reg.u32 %retval;\n" \
|
|
||||||
" .reg.u64 %hr10;\n" \
|
|
||||||
" .reg.u32 %r24;\n" \
|
|
||||||
" .reg.u32 %r25;\n" \
|
|
||||||
" .reg.pred %r27;\n" \
|
|
||||||
" .reg.u32 %r30;\n" \
|
|
||||||
" ld.param.u32 %ar1, [%in_ar1];\n" \
|
|
||||||
" mov.u32 %r24, %ar1;\n" \
|
|
||||||
" setp.ne.u32 %r27,%r24,4;\n" \
|
|
||||||
" set.u32.eq.u32 %r30,%r24,5;\n" \
|
|
||||||
" neg.s32 %r25, %r30;\n" \
|
|
||||||
" @%r27 bra $L3;\n" \
|
|
||||||
" mov.u32 %r25, 1;\n" \
|
|
||||||
"$L3:\n" \
|
|
||||||
" mov.u32 %retval, %r25;\n" \
|
|
||||||
" st.param.u32 [%out_retval], %retval;\n" \
|
|
||||||
" ret;\n" \
|
|
||||||
" }\n" \
|
|
||||||
".visible .func (.param.u32 %out_retval)acc_on_device_h_(.param.u64 %in_ar1);\n" \
|
|
||||||
".visible .func (.param.u32 %out_retval)acc_on_device_h_(.param.u64 %in_ar1)\n" \
|
|
||||||
"{\n" \
|
|
||||||
" .reg.u64 %ar1;\n" \
|
|
||||||
".reg.u32 %retval;\n" \
|
|
||||||
" .reg.u64 %hr10;\n" \
|
|
||||||
" .reg.u64 %r25;\n" \
|
|
||||||
" .reg.u32 %r26;\n" \
|
|
||||||
" .reg.u32 %r27;\n" \
|
|
||||||
" ld.param.u64 %ar1, [%in_ar1];\n" \
|
|
||||||
" mov.u64 %r25, %ar1;\n" \
|
|
||||||
" ld.u32 %r26, [%r25];\n" \
|
|
||||||
" {\n" \
|
|
||||||
" .param.u32 %retval_in;\n" \
|
|
||||||
" {\n" \
|
|
||||||
" .param.u32 %out_arg0;\n" \
|
|
||||||
" st.param.u32 [%out_arg0], %r26;\n" \
|
|
||||||
" call (%retval_in), acc_on_device, (%out_arg0);\n" \
|
|
||||||
" }\n" \
|
|
||||||
" ld.param.u32 %r27, [%retval_in];\n" \
|
|
||||||
"}\n" \
|
|
||||||
" mov.u32 %retval, %r27;\n" \
|
|
||||||
" st.param.u32 [%out_retval], %retval;\n" \
|
|
||||||
" ret;\n" \
|
|
||||||
" }"
|
|
||||||
|
|
||||||
#define GOACC_INTERNAL_PTX \
|
|
||||||
".version 3.1\n" \
|
|
||||||
".target sm_30\n" \
|
|
||||||
".address_size 64\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_tid (.param .u32 %in_ar1);\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_ntid (.param .u32 %in_ar1);\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_ctaid (.param .u32 %in_ar1);\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_nctaid (.param .u32 %in_ar1);\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_get_num_threads;\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_get_thread_num;\n" \
|
|
||||||
".extern .func abort;\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_tid (.param .u32 %in_ar1)\n" \
|
|
||||||
"{\n" \
|
|
||||||
".reg .u32 %ar1;\n" \
|
|
||||||
".reg .u32 %retval;\n" \
|
|
||||||
".reg .u64 %hr10;\n" \
|
|
||||||
".reg .u32 %r22;\n" \
|
|
||||||
".reg .u32 %r23;\n" \
|
|
||||||
".reg .u32 %r24;\n" \
|
|
||||||
".reg .u32 %r25;\n" \
|
|
||||||
".reg .u32 %r26;\n" \
|
|
||||||
".reg .u32 %r27;\n" \
|
|
||||||
".reg .u32 %r28;\n" \
|
|
||||||
".reg .u32 %r29;\n" \
|
|
||||||
".reg .pred %r30;\n" \
|
|
||||||
".reg .u32 %r31;\n" \
|
|
||||||
".reg .pred %r32;\n" \
|
|
||||||
".reg .u32 %r33;\n" \
|
|
||||||
".reg .pred %r34;\n" \
|
|
||||||
".local .align 8 .b8 %frame[4];\n" \
|
|
||||||
"ld.param.u32 %ar1,[%in_ar1];\n" \
|
|
||||||
"mov.u32 %r27,%ar1;\n" \
|
|
||||||
"st.local.u32 [%frame],%r27;\n" \
|
|
||||||
"ld.local.u32 %r28,[%frame];\n" \
|
|
||||||
"mov.u32 %r29,1;\n" \
|
|
||||||
"setp.eq.u32 %r30,%r28,%r29;\n" \
|
|
||||||
"@%r30 bra $L4;\n" \
|
|
||||||
"mov.u32 %r31,2;\n" \
|
|
||||||
"setp.eq.u32 %r32,%r28,%r31;\n" \
|
|
||||||
"@%r32 bra $L5;\n" \
|
|
||||||
"mov.u32 %r33,0;\n" \
|
|
||||||
"setp.eq.u32 %r34,%r28,%r33;\n" \
|
|
||||||
"@!%r34 bra $L8;\n" \
|
|
||||||
"mov.u32 %r23,%tid.x;\n" \
|
|
||||||
"mov.u32 %r22,%r23;\n" \
|
|
||||||
"bra $L7;\n" \
|
|
||||||
"$L4:\n" \
|
|
||||||
"mov.u32 %r24,%tid.y;\n" \
|
|
||||||
"mov.u32 %r22,%r24;\n" \
|
|
||||||
"bra $L7;\n" \
|
|
||||||
"$L5:\n" \
|
|
||||||
"mov.u32 %r25,%tid.z;\n" \
|
|
||||||
"mov.u32 %r22,%r25;\n" \
|
|
||||||
"bra $L7;\n" \
|
|
||||||
"$L8:\n" \
|
|
||||||
"{\n" \
|
|
||||||
"{\n" \
|
|
||||||
"call abort;\n" \
|
|
||||||
"}\n" \
|
|
||||||
"}\n" \
|
|
||||||
"$L7:\n" \
|
|
||||||
"mov.u32 %r26,%r22;\n" \
|
|
||||||
"mov.u32 %retval,%r26;\n" \
|
|
||||||
"st.param.u32 [%out_retval],%retval;\n" \
|
|
||||||
"ret;\n" \
|
|
||||||
"}\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_ntid (.param .u32 %in_ar1)\n" \
|
|
||||||
"{\n" \
|
|
||||||
".reg .u32 %ar1;\n" \
|
|
||||||
".reg .u32 %retval;\n" \
|
|
||||||
".reg .u64 %hr10;\n" \
|
|
||||||
".reg .u32 %r22;\n" \
|
|
||||||
".reg .u32 %r23;\n" \
|
|
||||||
".reg .u32 %r24;\n" \
|
|
||||||
".reg .u32 %r25;\n" \
|
|
||||||
".reg .u32 %r26;\n" \
|
|
||||||
".reg .u32 %r27;\n" \
|
|
||||||
".reg .u32 %r28;\n" \
|
|
||||||
".reg .u32 %r29;\n" \
|
|
||||||
".reg .pred %r30;\n" \
|
|
||||||
".reg .u32 %r31;\n" \
|
|
||||||
".reg .pred %r32;\n" \
|
|
||||||
".reg .u32 %r33;\n" \
|
|
||||||
".reg .pred %r34;\n" \
|
|
||||||
".local .align 8 .b8 %frame[4];\n" \
|
|
||||||
"ld.param.u32 %ar1,[%in_ar1];\n" \
|
|
||||||
"mov.u32 %r27,%ar1;\n" \
|
|
||||||
"st.local.u32 [%frame],%r27;\n" \
|
|
||||||
"ld.local.u32 %r28,[%frame];\n" \
|
|
||||||
"mov.u32 %r29,1;\n" \
|
|
||||||
"setp.eq.u32 %r30,%r28,%r29;\n" \
|
|
||||||
"@%r30 bra $L11;\n" \
|
|
||||||
"mov.u32 %r31,2;\n" \
|
|
||||||
"setp.eq.u32 %r32,%r28,%r31;\n" \
|
|
||||||
"@%r32 bra $L12;\n" \
|
|
||||||
"mov.u32 %r33,0;\n" \
|
|
||||||
"setp.eq.u32 %r34,%r28,%r33;\n" \
|
|
||||||
"@!%r34 bra $L15;\n" \
|
|
||||||
"mov.u32 %r23,%ntid.x;\n" \
|
|
||||||
"mov.u32 %r22,%r23;\n" \
|
|
||||||
"bra $L14;\n" \
|
|
||||||
"$L11:\n" \
|
|
||||||
"mov.u32 %r24,%ntid.y;\n" \
|
|
||||||
"mov.u32 %r22,%r24;\n" \
|
|
||||||
"bra $L14;\n" \
|
|
||||||
"$L12:\n" \
|
|
||||||
"mov.u32 %r25,%ntid.z;\n" \
|
|
||||||
"mov.u32 %r22,%r25;\n" \
|
|
||||||
"bra $L14;\n" \
|
|
||||||
"$L15:\n" \
|
|
||||||
"{\n" \
|
|
||||||
"{\n" \
|
|
||||||
"call abort;\n" \
|
|
||||||
"}\n" \
|
|
||||||
"}\n" \
|
|
||||||
"$L14:\n" \
|
|
||||||
"mov.u32 %r26,%r22;\n" \
|
|
||||||
"mov.u32 %retval,%r26;\n" \
|
|
||||||
"st.param.u32 [%out_retval],%retval;\n" \
|
|
||||||
"ret;\n" \
|
|
||||||
"}\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_ctaid (.param .u32 %in_ar1)\n" \
|
|
||||||
"{\n" \
|
|
||||||
".reg .u32 %ar1;\n" \
|
|
||||||
".reg .u32 %retval;\n" \
|
|
||||||
".reg .u64 %hr10;\n" \
|
|
||||||
".reg .u32 %r22;\n" \
|
|
||||||
".reg .u32 %r23;\n" \
|
|
||||||
".reg .u32 %r24;\n" \
|
|
||||||
".reg .u32 %r25;\n" \
|
|
||||||
".reg .u32 %r26;\n" \
|
|
||||||
".reg .u32 %r27;\n" \
|
|
||||||
".reg .u32 %r28;\n" \
|
|
||||||
".reg .u32 %r29;\n" \
|
|
||||||
".reg .pred %r30;\n" \
|
|
||||||
".reg .u32 %r31;\n" \
|
|
||||||
".reg .pred %r32;\n" \
|
|
||||||
".reg .u32 %r33;\n" \
|
|
||||||
".reg .pred %r34;\n" \
|
|
||||||
".local .align 8 .b8 %frame[4];\n" \
|
|
||||||
"ld.param.u32 %ar1,[%in_ar1];\n" \
|
|
||||||
"mov.u32 %r27,%ar1;\n" \
|
|
||||||
"st.local.u32 [%frame],%r27;\n" \
|
|
||||||
"ld.local.u32 %r28,[%frame];\n" \
|
|
||||||
"mov.u32 %r29,1;\n" \
|
|
||||||
"setp.eq.u32 %r30,%r28,%r29;\n" \
|
|
||||||
"@%r30 bra $L18;\n" \
|
|
||||||
"mov.u32 %r31,2;\n" \
|
|
||||||
"setp.eq.u32 %r32,%r28,%r31;\n" \
|
|
||||||
"@%r32 bra $L19;\n" \
|
|
||||||
"mov.u32 %r33,0;\n" \
|
|
||||||
"setp.eq.u32 %r34,%r28,%r33;\n" \
|
|
||||||
"@!%r34 bra $L22;\n" \
|
|
||||||
"mov.u32 %r23,%ctaid.x;\n" \
|
|
||||||
"mov.u32 %r22,%r23;\n" \
|
|
||||||
"bra $L21;\n" \
|
|
||||||
"$L18:\n" \
|
|
||||||
"mov.u32 %r24,%ctaid.y;\n" \
|
|
||||||
"mov.u32 %r22,%r24;\n" \
|
|
||||||
"bra $L21;\n" \
|
|
||||||
"$L19:\n" \
|
|
||||||
"mov.u32 %r25,%ctaid.z;\n" \
|
|
||||||
"mov.u32 %r22,%r25;\n" \
|
|
||||||
"bra $L21;\n" \
|
|
||||||
"$L22:\n" \
|
|
||||||
"{\n" \
|
|
||||||
"{\n" \
|
|
||||||
"call abort;\n" \
|
|
||||||
"}\n" \
|
|
||||||
"}\n" \
|
|
||||||
"$L21:\n" \
|
|
||||||
"mov.u32 %r26,%r22;\n" \
|
|
||||||
"mov.u32 %retval,%r26;\n" \
|
|
||||||
"st.param.u32 [%out_retval],%retval;\n" \
|
|
||||||
"ret;\n" \
|
|
||||||
"}\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_nctaid (.param .u32 %in_ar1)\n" \
|
|
||||||
"{\n" \
|
|
||||||
".reg .u32 %ar1;\n" \
|
|
||||||
".reg .u32 %retval;\n" \
|
|
||||||
".reg .u64 %hr10;\n" \
|
|
||||||
".reg .u32 %r22;\n" \
|
|
||||||
".reg .u32 %r23;\n" \
|
|
||||||
".reg .u32 %r24;\n" \
|
|
||||||
".reg .u32 %r25;\n" \
|
|
||||||
".reg .u32 %r26;\n" \
|
|
||||||
".reg .u32 %r27;\n" \
|
|
||||||
".reg .u32 %r28;\n" \
|
|
||||||
".reg .u32 %r29;\n" \
|
|
||||||
".reg .pred %r30;\n" \
|
|
||||||
".reg .u32 %r31;\n" \
|
|
||||||
".reg .pred %r32;\n" \
|
|
||||||
".reg .u32 %r33;\n" \
|
|
||||||
".reg .pred %r34;\n" \
|
|
||||||
".local .align 8 .b8 %frame[4];\n" \
|
|
||||||
"ld.param.u32 %ar1,[%in_ar1];\n" \
|
|
||||||
"mov.u32 %r27,%ar1;\n" \
|
|
||||||
"st.local.u32 [%frame],%r27;\n" \
|
|
||||||
"ld.local.u32 %r28,[%frame];\n" \
|
|
||||||
"mov.u32 %r29,1;\n" \
|
|
||||||
"setp.eq.u32 %r30,%r28,%r29;\n" \
|
|
||||||
"@%r30 bra $L25;\n" \
|
|
||||||
"mov.u32 %r31,2;\n" \
|
|
||||||
"setp.eq.u32 %r32,%r28,%r31;\n" \
|
|
||||||
"@%r32 bra $L26;\n" \
|
|
||||||
"mov.u32 %r33,0;\n" \
|
|
||||||
"setp.eq.u32 %r34,%r28,%r33;\n" \
|
|
||||||
"@!%r34 bra $L29;\n" \
|
|
||||||
"mov.u32 %r23,%nctaid.x;\n" \
|
|
||||||
"mov.u32 %r22,%r23;\n" \
|
|
||||||
"bra $L28;\n" \
|
|
||||||
"$L25:\n" \
|
|
||||||
"mov.u32 %r24,%nctaid.y;\n" \
|
|
||||||
"mov.u32 %r22,%r24;\n" \
|
|
||||||
"bra $L28;\n" \
|
|
||||||
"$L26:\n" \
|
|
||||||
"mov.u32 %r25,%nctaid.z;\n" \
|
|
||||||
"mov.u32 %r22,%r25;\n" \
|
|
||||||
"bra $L28;\n" \
|
|
||||||
"$L29:\n" \
|
|
||||||
"{\n" \
|
|
||||||
"{\n" \
|
|
||||||
"call abort;\n" \
|
|
||||||
"}\n" \
|
|
||||||
"}\n" \
|
|
||||||
"$L28:\n" \
|
|
||||||
"mov.u32 %r26,%r22;\n" \
|
|
||||||
"mov.u32 %retval,%r26;\n" \
|
|
||||||
"st.param.u32 [%out_retval],%retval;\n" \
|
|
||||||
"ret;\n" \
|
|
||||||
"}\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_get_num_threads\n" \
|
|
||||||
"{\n" \
|
|
||||||
".reg .u32 %retval;\n" \
|
|
||||||
".reg .u64 %hr10;\n" \
|
|
||||||
".reg .u32 %r22;\n" \
|
|
||||||
".reg .u32 %r23;\n" \
|
|
||||||
".reg .u32 %r24;\n" \
|
|
||||||
".reg .u32 %r25;\n" \
|
|
||||||
".reg .u32 %r26;\n" \
|
|
||||||
".reg .u32 %r27;\n" \
|
|
||||||
".reg .u32 %r28;\n" \
|
|
||||||
".reg .u32 %r29;\n" \
|
|
||||||
"mov.u32 %r26,0;\n" \
|
|
||||||
"{\n" \
|
|
||||||
".param .u32 %retval_in;\n" \
|
|
||||||
"{\n" \
|
|
||||||
".param .u32 %out_arg0;\n" \
|
|
||||||
"st.param.u32 [%out_arg0],%r26;\n" \
|
|
||||||
"call (%retval_in),GOACC_ntid,(%out_arg0);\n" \
|
|
||||||
"}\n" \
|
|
||||||
"ld.param.u32 %r27,[%retval_in];\n" \
|
|
||||||
"}\n" \
|
|
||||||
"mov.u32 %r22,%r27;\n" \
|
|
||||||
"mov.u32 %r28,0;\n" \
|
|
||||||
"{\n" \
|
|
||||||
".param .u32 %retval_in;\n" \
|
|
||||||
"{\n" \
|
|
||||||
".param .u32 %out_arg0;\n" \
|
|
||||||
"st.param.u32 [%out_arg0],%r28;\n" \
|
|
||||||
"call (%retval_in),GOACC_nctaid,(%out_arg0);\n" \
|
|
||||||
"}\n" \
|
|
||||||
"ld.param.u32 %r29,[%retval_in];\n" \
|
|
||||||
"}\n" \
|
|
||||||
"mov.u32 %r23,%r29;\n" \
|
|
||||||
"mul.lo.u32 %r24,%r22,%r23;\n" \
|
|
||||||
"mov.u32 %r25,%r24;\n" \
|
|
||||||
"mov.u32 %retval,%r25;\n" \
|
|
||||||
"st.param.u32 [%out_retval],%retval;\n" \
|
|
||||||
"ret;\n" \
|
|
||||||
"}\n" \
|
|
||||||
".visible .func (.param .u32 %out_retval) GOACC_get_thread_num\n" \
|
|
||||||
"{\n" \
|
|
||||||
".reg .u32 %retval;\n" \
|
|
||||||
".reg .u64 %hr10;\n" \
|
|
||||||
".reg .u32 %r22;\n" \
|
|
||||||
".reg .u32 %r23;\n" \
|
|
||||||
".reg .u32 %r24;\n" \
|
|
||||||
".reg .u32 %r25;\n" \
|
|
||||||
".reg .u32 %r26;\n" \
|
|
||||||
".reg .u32 %r27;\n" \
|
|
||||||
".reg .u32 %r28;\n" \
|
|
||||||
".reg .u32 %r29;\n" \
|
|
||||||
".reg .u32 %r30;\n" \
|
|
||||||
".reg .u32 %r31;\n" \
|
|
||||||
".reg .u32 %r32;\n" \
|
|
||||||
".reg .u32 %r33;\n" \
|
|
||||||
"mov.u32 %r28,0;\n" \
|
|
||||||
"{\n" \
|
|
||||||
".param .u32 %retval_in;\n" \
|
|
||||||
"{\n" \
|
|
||||||
".param .u32 %out_arg0;\n" \
|
|
||||||
"st.param.u32 [%out_arg0],%r28;\n" \
|
|
||||||
"call (%retval_in),GOACC_ntid,(%out_arg0);\n" \
|
|
||||||
"}\n" \
|
|
||||||
"ld.param.u32 %r29,[%retval_in];\n" \
|
|
||||||
"}\n" \
|
|
||||||
"mov.u32 %r22,%r29;\n" \
|
|
||||||
"mov.u32 %r30,0;\n" \
|
|
||||||
"{\n" \
|
|
||||||
".param .u32 %retval_in;\n" \
|
|
||||||
"{\n" \
|
|
||||||
".param .u32 %out_arg0;\n" \
|
|
||||||
"st.param.u32 [%out_arg0],%r30;\n" \
|
|
||||||
"call (%retval_in),GOACC_ctaid,(%out_arg0);\n" \
|
|
||||||
"}\n" \
|
|
||||||
"ld.param.u32 %r31,[%retval_in];\n" \
|
|
||||||
"}\n" \
|
|
||||||
"mov.u32 %r23,%r31;\n" \
|
|
||||||
"mul.lo.u32 %r24,%r22,%r23;\n" \
|
|
||||||
"mov.u32 %r32,0;\n" \
|
|
||||||
"{\n" \
|
|
||||||
".param .u32 %retval_in;\n" \
|
|
||||||
"{\n" \
|
|
||||||
".param .u32 %out_arg0;\n" \
|
|
||||||
"st.param.u32 [%out_arg0],%r32;\n" \
|
|
||||||
"call (%retval_in),GOACC_tid,(%out_arg0);\n" \
|
|
||||||
"}\n" \
|
|
||||||
"ld.param.u32 %r33,[%retval_in];\n" \
|
|
||||||
"}\n" \
|
|
||||||
"mov.u32 %r25,%r33;\n" \
|
|
||||||
"add.u32 %r26,%r24,%r25;\n" \
|
|
||||||
"mov.u32 %r27,%r26;\n" \
|
|
||||||
"mov.u32 %retval,%r27;\n" \
|
|
||||||
"st.param.u32 [%out_retval],%retval;\n" \
|
|
||||||
"ret;\n" \
|
|
||||||
"}\n"
|
|
||||||
|
|
@ -34,7 +34,6 @@
|
||||||
#include "openacc.h"
|
#include "openacc.h"
|
||||||
#include "config.h"
|
#include "config.h"
|
||||||
#include "libgomp-plugin.h"
|
#include "libgomp-plugin.h"
|
||||||
#include "oacc-ptx.h"
|
|
||||||
#include "oacc-plugin.h"
|
#include "oacc-plugin.h"
|
||||||
#include "gomp-constants.h"
|
#include "gomp-constants.h"
|
||||||
|
|
||||||
|
|
@ -750,35 +749,6 @@ link_ptx (CUmodule *module, const struct targ_ptx_obj *ptx_objs,
|
||||||
if (r != CUDA_SUCCESS)
|
if (r != CUDA_SUCCESS)
|
||||||
GOMP_PLUGIN_fatal ("cuLinkCreate error: %s", cuda_error (r));
|
GOMP_PLUGIN_fatal ("cuLinkCreate error: %s", cuda_error (r));
|
||||||
|
|
||||||
char *abort_ptx = ABORT_PTX;
|
|
||||||
r = cuLinkAddData (linkstate, CU_JIT_INPUT_PTX, abort_ptx,
|
|
||||||
strlen (abort_ptx) + 1, 0, 0, 0, 0);
|
|
||||||
if (r != CUDA_SUCCESS)
|
|
||||||
{
|
|
||||||
GOMP_PLUGIN_error ("Link error log %s\n", &elog[0]);
|
|
||||||
GOMP_PLUGIN_fatal ("cuLinkAddData (abort) error: %s", cuda_error (r));
|
|
||||||
}
|
|
||||||
|
|
||||||
char *acc_on_device_ptx = ACC_ON_DEVICE_PTX;
|
|
||||||
r = cuLinkAddData (linkstate, CU_JIT_INPUT_PTX, acc_on_device_ptx,
|
|
||||||
strlen (acc_on_device_ptx) + 1, 0, 0, 0, 0);
|
|
||||||
if (r != CUDA_SUCCESS)
|
|
||||||
{
|
|
||||||
GOMP_PLUGIN_error ("Link error log %s\n", &elog[0]);
|
|
||||||
GOMP_PLUGIN_fatal ("cuLinkAddData (acc_on_device) error: %s",
|
|
||||||
cuda_error (r));
|
|
||||||
}
|
|
||||||
|
|
||||||
char *goacc_internal_ptx = GOACC_INTERNAL_PTX;
|
|
||||||
r = cuLinkAddData (linkstate, CU_JIT_INPUT_PTX, goacc_internal_ptx,
|
|
||||||
strlen (goacc_internal_ptx) + 1, 0, 0, 0, 0);
|
|
||||||
if (r != CUDA_SUCCESS)
|
|
||||||
{
|
|
||||||
GOMP_PLUGIN_error ("Link error log %s\n", &elog[0]);
|
|
||||||
GOMP_PLUGIN_fatal ("cuLinkAddData (goacc_internal_ptx) error: %s",
|
|
||||||
cuda_error (r));
|
|
||||||
}
|
|
||||||
|
|
||||||
for (; num_objs--; ptx_objs++)
|
for (; num_objs--; ptx_objs++)
|
||||||
{
|
{
|
||||||
/* cuLinkAddData's 'data' argument erroneously omits the const
|
/* cuLinkAddData's 'data' argument erroneously omits the const
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue