ソースを参照

Real-time assembler for Cell SPE.

tags/mesa_20090313
Ian Romanick 17年前
コミット
77a1488620
3個のファイルの変更662行の追加0行の削除
  1. 351
    0
      src/mesa/ppc/rtasm/spe_asm.c
  2. 310
    0
      src/mesa/ppc/rtasm/spe_asm.h
  3. 1
    0
      src/mesa/sources

+ 351
- 0
src/mesa/ppc/rtasm/spe_asm.c ファイルの表示

@@ -0,0 +1,351 @@
/*
* (C) Copyright IBM Corporation 2008
* All Rights Reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* on the rights to use, copy, modify, merge, publish, distribute, sub
* license, and/or sell copies of the Software, and to permit persons to whom
* the Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
* AUTHORS, COPYRIGHT HOLDERS, AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
* DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
* OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
* USE OR OTHER DEALINGS IN THE SOFTWARE.
*/

/**
* \file spe_asm.c
* Real-time assembly generation interface for Cell B.E. SPEs.
*
* \author Ian Romanick <idr@us.ibm.com>
*/
#ifdef GALLIUM_CELL
#include <inttypes.h>
#include <imports.h>
#include "spe_asm.h"

/**
* SPE instruction types
*
* There are 6 primary instruction encodings used on the Cell's SPEs. Each of
* the following unions encodes one type.
*
* \bug
* If, at some point, we start generating SPE code from a little-endian host
* these unions will not work.
*/
/*@{*/
/**
* Encode one output register with two input registers
*/
union spe_inst_RR {
uint32_t bits;
struct {
unsigned op:11;
unsigned rB:7;
unsigned rA:7;
unsigned rT:7;
} inst;
};


/**
* Encode one output register with three input registers
*/
union spe_inst_RRR {
uint32_t bits;
struct {
unsigned op:4;
unsigned rT:7;
unsigned rB:7;
unsigned rA:7;
unsigned rC:7;
} inst;
};


/**
* Encode one output register with one input reg. and a 7-bit signed immed
*/
union spe_inst_RI7 {
uint32_t bits;
struct {
unsigned op:11;
unsigned i7:7;
unsigned rA:7;
unsigned rT:7;
} inst;
};


/**
* Encode one output register with one input reg. and a 10-bit signed immed
*/
union spe_inst_RI10 {
uint32_t bits;
struct {
unsigned op:8;
unsigned i10:10;
unsigned rA:7;
unsigned rT:7;
} inst;
};


/**
* Encode one output register with a 16-bit signed immediate
*/
union spe_inst_RI16 {
uint32_t bits;
struct {
unsigned op:9;
unsigned i16:16;
unsigned rT:7;
} inst;
};


/**
* Encode one output register with a 18-bit signed immediate
*/
union spe_inst_RI18 {
uint32_t bits;
struct {
unsigned op:7;
unsigned i18:18;
unsigned rT:7;
} inst;
};
/*@}*/


static void emit_RR(struct spe_function *p, unsigned op, unsigned rT,
unsigned rA, unsigned rB)
{
union spe_inst_RR inst;
inst.inst.op = op;
inst.inst.rB = rB;
inst.inst.rA = rA;
inst.inst.rT = rT;
*p->csr = inst.bits;
p->csr++;
}


static void emit_RRR(struct spe_function *p, unsigned op, unsigned rT,
unsigned rA, unsigned rB, unsigned rC)
{
union spe_inst_RRR inst;
inst.inst.op = op;
inst.inst.rT = rT;
inst.inst.rB = rB;
inst.inst.rA = rA;
inst.inst.rC = rC;
*p->csr = inst.bits;
p->csr++;
}


static void emit_RI7(struct spe_function *p, unsigned op, unsigned rT,
unsigned rA, int imm)
{
union spe_inst_RI7 inst;
inst.inst.op = op;
inst.inst.i7 = imm;
inst.inst.rA = rA;
inst.inst.rT = rT;
*p->csr = inst.bits;
p->csr++;
}



static void emit_RI10(struct spe_function *p, unsigned op, unsigned rT,
unsigned rA, int imm)
{
union spe_inst_RI10 inst;
inst.inst.op = op;
inst.inst.i10 = imm;
inst.inst.rA = rA;
inst.inst.rT = rT;
*p->csr = inst.bits;
p->csr++;
}


static void emit_RI16(struct spe_function *p, unsigned op, unsigned rT,
int imm)
{
union spe_inst_RI16 inst;
inst.inst.op = op;
inst.inst.i16 = imm;
inst.inst.rT = rT;
*p->csr = inst.bits;
p->csr++;
}


static void emit_RI18(struct spe_function *p, unsigned op, unsigned rT,
int imm)
{
union spe_inst_RI18 inst;
inst.inst.op = op;
inst.inst.i18 = imm;
inst.inst.rT = rT;
*p->csr = inst.bits;
p->csr++;
}




#define EMIT_(_name, _op) \
void _name (struct spe_function *p, unsigned rT) \
{ \
emit_RR(p, _op, rT, 0, 0); \
}

#define EMIT_R(_name, _op) \
void _name (struct spe_function *p, unsigned rT, unsigned rA) \
{ \
emit_RR(p, _op, rT, rA, 0); \
}

#define EMIT_RR(_name, _op) \
void _name (struct spe_function *p, unsigned rT, unsigned rA, unsigned rB) \
{ \
emit_RR(p, _op, rT, rA, rB); \
}

#define EMIT_RRR(_name, _op) \
void _name (struct spe_function *p, unsigned rT, unsigned rA, unsigned rB, unsigned rC) \
{ \
emit_RRR(p, _op, rT, rA, rB, rC); \
}

#define EMIT_RI7(_name, _op) \
void _name (struct spe_function *p, unsigned rT, unsigned rA, int imm) \
{ \
emit_RI7(p, _op, rT, rA, imm); \
}

#define EMIT_RI10(_name, _op) \
void _name (struct spe_function *p, unsigned rT, unsigned rA, int imm) \
{ \
emit_RI10(p, _op, rT, rA, imm); \
}

#define EMIT_RI16(_name, _op) \
void _name (struct spe_function *p, unsigned rT, int imm) \
{ \
emit_RI16(p, _op, rT, imm); \
}

#define EMIT_RI18(_name, _op) \
void _name (struct spe_function *p, unsigned rT, int imm) \
{ \
emit_RI18(p, _op, rT, imm); \
}

#define EMIT_I16(_name, _op) \
void _name (struct spe_function *p, int imm) \
{ \
emit_RI16(p, _op, 0, imm); \
}

#include "spe_asm.h"


/*
*/
void spe_init_func(struct spe_function *p, unsigned code_size)
{
p->store = _mesa_align_malloc(code_size, 16);
p->csr = p->store;
}


void spe_release_func(struct spe_function *p)
{
_mesa_align_free(p->store);
p->store = NULL;
p->csr = NULL;
}


void spu_bi(struct spe_function *p, unsigned rA, int d, int e)
{
emit_RI7(p, 0x1a8, 0, rA, (d << 5) | (e << 4));
}

void spu_iret(struct spe_function *p, unsigned rA, int d, int e)
{
emit_RI7(p, 0x1aa, 0, rA, (d << 5) | (e << 4));
}

void spu_bisled(struct spe_function *p, unsigned rT, unsigned rA, int d,
int e)
{
emit_RI7(p, 0x1ab, rT, rA, (d << 5) | (e << 4));
}

void spu_bisl(struct spe_function *p, unsigned rT, unsigned rA, int d,
int e)
{
emit_RI7(p, 0x1a9, rT, rA, (d << 5) | (e << 4));
}

void spu_biz(struct spe_function *p, unsigned rT, unsigned rA, int d,
int e)
{
emit_RI7(p, 0x128, rT, rA, (d << 5) | (e << 4));
}

void spu_binz(struct spe_function *p, unsigned rT, unsigned rA, int d, int e)
{
emit_RI7(p, 0x129, rT, rA, (d << 5) | (e << 4));
}

void spu_bihz(struct spe_function *p, unsigned rT, unsigned rA, int d, int e)
{
emit_RI7(p, 0x12a, rT, rA, (d << 5) | (e << 4));
}

void spu_bihnz(struct spe_function *p, unsigned rT, unsigned rA, int d, int e)
{
emit_RI7(p, 0x12b, rT, rA, (d << 5) | (e << 4));
}


/* Hint-for-branch instructions
*/
#if 0
hbr;
hbra;
hbrr;
#endif


/* Control instructions
*/
#if 0
stop;
EMIT_RR (spu_stopd, 0x140);
EMIT_ (spu_lnop, 0x001);
EMIT_ (spu_nop, 0x201);
sync;
EMIT_ (spu_dsync, 0x003);
EMIT_R (spu_mfspr, 0x00c);
EMIT_R (spu_mtspr, 0x10c);
#endif

#endif /* GALLIUM_CELL */

+ 310
- 0
src/mesa/ppc/rtasm/spe_asm.h ファイルの表示

@@ -0,0 +1,310 @@
/*
* (C) Copyright IBM Corporation 2008
* All Rights Reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* on the rights to use, copy, modify, merge, publish, distribute, sub
* license, and/or sell copies of the Software, and to permit persons to whom
* the Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
* AUTHORS, COPYRIGHT HOLDERS, AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
* DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
* OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
* USE OR OTHER DEALINGS IN THE SOFTWARE.
*/

/**
* \file spe_asm.h
* Real-time assembly generation interface for Cell B.E. SPEs.
*
* \author Ian Romanick <idr@us.ibm.com>
*/

#ifndef SPE_ASM_H
#define SPE_ASM_H

struct spe_function {
/**
*
*/
uint32_t *store;
uint32_t *csr;
const char *fn;
};

extern void spe_init_func(struct spe_function *p, unsigned code_size);
extern void spe_release_func(struct spe_function *p);

#endif /* SPE_ASM_H */

#ifndef EMIT_
#define EMIT_(name, _op) \
extern void _name (struct spe_function *p, unsigned rT)
#define EMIT_R(_name, _op) \
extern void _name (struct spe_function *p, unsigned rT, unsigned rA)
#define EMIT_RR(_name, _op) \
extern void _name (struct spe_function *p, unsigned rT, unsigned rA, \
unsigned rB)
#define EMIT_RRR(_name, _op) \
extern void _name (struct spe_function *p, unsigned rT, unsigned rA, \
unsigned rB, unsigned rC)
#define EMIT_RI7(_name, _op) \
extern void _name (struct spe_function *p, unsigned rT, unsigned rA, \
int imm)
#define EMIT_RI10(_name, _op) \
extern void _name (struct spe_function *p, unsigned rT, unsigned rA, \
int imm)
#define EMIT_RI16(_name, _op) \
extern void _name (struct spe_function *p, unsigned rT, int imm)
#define EMIT_RI18(_name, _op) \
extern void _name (struct spe_function *p, unsigned rT, int imm)
#define EMIT_I16(_name, _op) \
extern void _name (struct spe_function *p, int imm)
#define UNDEF_EMIT_MACROS
#endif /* EMIT_ */


/* Memory load / store instructions
*/
EMIT_RI10(spu_ldq, 0x034);
EMIT_RR (spu_lqx, 0x1c4);
EMIT_RI16(spu_lqa, 0x061);
EMIT_RI16(spu_lqr, 0x067);
EMIT_RI10(spu_stqd, 0x024);
EMIT_RR (spu_stqx, 0x144);
EMIT_RI16(spu_stqa, 0x041);
EMIT_RI16(spu_stqr, 0x047);
EMIT_RI7 (spu_cbd, 0x1f4);
EMIT_RR (spu_cbx, 0x1d4);
EMIT_RI7 (spu_chd, 0x1f5);
EMIT_RI7 (spu_chx, 0x1d5);
EMIT_RI7 (spu_cwd, 0x1f6);
EMIT_RI7 (spu_cwx, 0x1d6);
EMIT_RI7 (spu_cdd, 0x1f7);
EMIT_RI7 (spu_cdx, 0x1d7);


/* Constant formation instructions
*/
EMIT_RI16(spu_ilh, 0x083);
EMIT_RI16(spu_ilhu, 0x082);
EMIT_RI16(spu_il, 0x081);
EMIT_RI18(spu_ila, 0x021);
EMIT_RI16(spu_iohl, 0x0c1);
EMIT_RI16(spu_fsmbi, 0x0c5);


/* Integer and logical instructions
*/
EMIT_RR (spe_ah, 0x0c8);
EMIT_RI10(spe_ahi, 0x01d);
EMIT_RR (spe_a, 0x0c0);
EMIT_RI10(spe_ai, 0x01c);
EMIT_RR (spe_sfh, 0x048);
EMIT_RI10(spe_sfhi, 0x00d);
EMIT_RR (spe_sf, 0x040);
EMIT_RI10(spe_sfi, 0x00c);
EMIT_RR (spe_addx, 0x340);
EMIT_RR (spu_cg, 0x0c2);
EMIT_RR (spu_cgx, 0x342);
EMIT_RR (spe_sfx, 0x341);
EMIT_RR (spu_bg, 0x042);
EMIT_RR (spu_bgx, 0x343);
EMIT_RR (spu_mpy, 0x3c4);
EMIT_RR (spu_mpyu, 0x3cc);
EMIT_RI10(spu_mpyi, 0x074);
EMIT_RI10(spu_mpyui, 0x075);
EMIT_RRR (spy_mpya, 0x00c);
EMIT_RR (spu_mpyh, 0x3c5);
EMIT_RR (spu_mpys, 0x3c7);
EMIT_RR (spu_mpyhh, 0x3c6);
EMIT_RR (spu_mpyhha, 0x346);
EMIT_RR (spu_mpyhhu, 0x3ce);
EMIT_RR (spu_mpyhhau, 0x34e);
EMIT_R (spe_clz, 0x2a5);
EMIT_R (spe_cntb, 0x2b4);
EMIT_R (spe_fsmb, 0x1b6);
EMIT_R (spe_fsmh, 0x1b5);
EMIT_R (spe_fsm, 0x1b4);
EMIT_R (spe_gbb, 0x1b2);
EMIT_R (spe_gbh, 0x1b1);
EMIT_R (spe_gb, 0x1b0);
EMIT_RR (spe_avgb, 0x0d3);
EMIT_RR (spe_absdb, 0x053);
EMIT_RR (spe_sumb, 0x253);
EMIT_R (spe_xsbh, 0x2b6);
EMIT_R (spe_xshw, 0x2ae);
EMIT_R (spe_xswd, 0x2a6);
EMIT_RR (spe_and, 0x0c1);
EMIT_RR (spe_andc, 0x2c1);
EMIT_RI10(spu_andbi, 0x016);
EMIT_RI10(spu_andhi, 0x015);
EMIT_RI10(spu_andi, 0x014);
EMIT_RR (spe_or, 0x041);
EMIT_RR (spe_orc, 0x2c9);
EMIT_RI10(spu_orbi, 0x006);
EMIT_RI10(spu_orhi, 0x005);
EMIT_RI10(spu_ori, 0x004);
EMIT_R (spu_orx, 0x1f0);
EMIT_RR (spu_xor, 0x241);
EMIT_RI10(spu_xorbi, 0x026);
EMIT_RI10(spu_xorhi, 0x025);
EMIT_RI10(spu_xori, 0x024);
EMIT_RR (spe_nand, 0x0c9);
EMIT_RR (spe_nor, 0x049);
EMIT_RR (spe_eqv, 0x249);
EMIT_RRR (spy_selb, 0x008);
EMIT_RRR (spy_shufb, 0x00b);


/* Shift and rotate instructions
*/
EMIT_RR (spe_shlh, 0x05f);
EMIT_RI7 (spe_shlhi, 0x07f);
EMIT_RR (spe_shl, 0x05b);
EMIT_RI7 (spe_shli, 0x07b);
EMIT_RR (spe_shlqbi, 0x1db);
EMIT_RI7 (spe_shlqbii, 0x1fb);
EMIT_RR (spe_shlqby, 0x1df);
EMIT_RI7 (spe_shlqbyi, 0x1ff);
EMIT_RR (spe_shlqbybi, 0x1cf);
EMIT_RR (spe_roth, 0x05c);
EMIT_RI7 (spe_rothi, 0x07c);
EMIT_RR (spe_rot, 0x058);
EMIT_RI7 (spe_roti, 0x078);
EMIT_RR (spe_rotqby, 0x1dc);
EMIT_RI7 (spe_rotqbyi, 0x1fc);
EMIT_RR (spe_rotqbybi, 0x1cc);
EMIT_RR (spe_rotqbi, 0x1d8);
EMIT_RI7 (spe_rotqbii, 0x1f8);
EMIT_RR (spe_rothm, 0x05d);
EMIT_RI7 (spe_rothmi, 0x07d);
EMIT_RR (spe_rotm, 0x059);
EMIT_RI7 (spe_rotmi, 0x079);
EMIT_RR (spe_rotqmby, 0x1dd);
EMIT_RI7 (spe_rotqmbyi, 0x1fd);
EMIT_RR (spe_rotqmbybi, 0x1cd);
EMIT_RR (spe_rotqmbi, 0x1c9);
EMIT_RI7 (spe_rotqmbii, 0x1f9);
EMIT_RR (spe_rotmah, 0x05e);
EMIT_RI7 (spe_rotmahi, 0x07e);
EMIT_RR (spe_rotma, 0x05a);
EMIT_RI7 (spe_rotmai, 0x07a);


/* Compare, branch, and halt instructions
*/
EMIT_RR (spe_heq, 0x3d8);
EMIT_RI10(spe_heqi, 0x07f);
EMIT_RR (spe_hgt, 0x258);
EMIT_RI10(spe_hgti, 0x04f);
EMIT_RR (spe_hlgt, 0x2d8);
EMIT_RI10(spe_hlgti, 0x05f);
EMIT_RR (spe_ceqb, 0x3d0);
EMIT_RI10(spe_ceqbi, 0x07e);
EMIT_RR (spe_ceqh, 0x3c8);
EMIT_RI10(spe_ceqhi, 0x07d);
EMIT_RR (spe_ceq, 0x3c0);
EMIT_RI10(spe_ceqi, 0x07c);
EMIT_RR (spe_cgtb, 0x250);
EMIT_RI10(spe_cgtbi, 0x04e);
EMIT_RR (spe_cgth, 0x248);
EMIT_RI10(spe_cgthi, 0x04d);
EMIT_RR (spe_cgt, 0x240);
EMIT_RI10(spe_cgti, 0x04c);
EMIT_RR (spe_clgtb, 0x2d0);
EMIT_RI10(spe_clgtbi, 0x05e);
EMIT_RR (spe_clgth, 0x2c8);
EMIT_RI10(spe_clgthi, 0x05d);
EMIT_RR (spe_clgt, 0x2c0);
EMIT_RI10(spe_clgti, 0x05c);
EMIT_I16 (spe_br, 0x064);
EMIT_I16 (spe_bra, 0x060);
EMIT_RI16(spu_brsl, 0x066);
EMIT_RI16(spu_brasl, 0x062);
EMIT_RI16(spu_brnz, 0x042);
EMIT_RI16(spu_brz, 0x040);
EMIT_RI16(spu_brhnz, 0x046);
EMIT_RI16(spu_brhz, 0x044);

extern void spu_bi(struct spe_function *p, unsigned rA, int d, int e);
extern void spu_iret(struct spe_function *p, unsigned rA, int d, int e);
extern void spu_bisled(struct spe_function *p, unsigned rT, unsigned rA,
int d, int e);
extern void spu_bisl(struct spe_function *p, unsigned rT, unsigned rA,
int d, int e);
extern void spu_biz(struct spe_function *p, unsigned rT, unsigned rA,
int d, int e);
extern void spu_binz(struct spe_function *p, unsigned rT, unsigned rA,
int d, int e);
extern void spu_bihz(struct spe_function *p, unsigned rT, unsigned rA,
int d, int e);
extern void spu_bihnz(struct spe_function *p, unsigned rT, unsigned rA,
int d, int e);


/* Floating-point instructions
*/
EMIT_RR (spu_fa, 0x2c4);
EMIT_RR (spu_dfa, 0x2cc);
EMIT_RR (spu_fs, 0x2c5);
EMIT_RR (spu_dfs, 0x2cd);
EMIT_RR (spu_fm, 0x2c6);
EMIT_RR (spu_dfm, 0x2ce);
EMIT_RRR (spu_fma, 0x00e);
EMIT_RR (spu_dfma, 0x35c);
EMIT_RRR (spu_fnms, 0x00d);
EMIT_RR (spu_dfnms, 0x35e);
EMIT_RRR (spu_fms, 0x00f);
EMIT_RR (spu_dfms, 0x35d);
EMIT_RR (spu_dfnma, 0x35f);
EMIT_R (spu_frest, 0x1b8);
EMIT_R (spu_frsqest, 0x1b9);
EMIT_RR (spu_fi, 0x3d4);
EMIT_RI7 (spu_csflt, 0x3da);
EMIT_RI7 (spu_cflts, 0x3d8);
EMIT_RI7 (spu_cuflt, 0x3db);
EMIT_RI7 (spu_cfltu, 0x3d9);
EMIT_R (spu_frds, 0x3b9);
EMIT_R (spu_fesd, 0x3b8);
EMIT_RR (spu_dfceq, 0x3c3);
EMIT_RR (spu_dfcmeq, 0x3cb);
EMIT_RR (spu_dfcgt, 0x2c3);
EMIT_RR (spu_dfcmgt, 0x2cb);
EMIT_RI7 (spu_dftsv, 0x3bf);
EMIT_RR (spu_fceq, 0x3c2);
EMIT_RR (spu_fcmeq, 0x3ca);
EMIT_RR (spu_fcgt, 0x2c2);
EMIT_RR (spu_fcmgt, 0x2ca);
EMIT_R (spu_fscrwr, 0x3ba);
EMIT_ (spu_fscrrd, 0x398);


/* Channel instructions
*/
EMIT_R (spu_rdch, 0x00d);
EMIT_R (spu_rdchcnt, 0x00f);
EMIT_R (spu_wrch, 0x10d);


#ifdef UNDEF_EMIT_MACROS
#undef EMIT_
#undef EMIT_R
#undef EMIT_RR
#undef EMIT_RRR
#undef EMIT_RI7
#undef EMIT_RI10
#undef EMIT_RI16
#undef EMIT_RI18
#undef EMIT_I16
#undef UNDEF_EMIT_MACROS
#endif /* EMIT_ */

+ 1
- 0
src/mesa/sources ファイルの表示

@@ -288,6 +288,7 @@ ASM_C_SOURCES = \
x86/rtasm/x86sse.c \
sparc/sparc.c \
ppc/common_ppc.c \
ppc/rtasm/spe_asm.c \
x86-64/x86-64.c

X86_SOURCES = \

読み込み中…
キャンセル
保存