573 lines
18 KiB
C++
573 lines
18 KiB
C++
/* libs/pixelflinger/codeflinger/GGLAssembler.h
|
|
**
|
|
** Copyright 2006, The Android Open Source Project
|
|
**
|
|
** Licensed under the Apache License, Version 2.0 (the "License");
|
|
** you may not use this file except in compliance with the License.
|
|
** You may obtain a copy of the License at
|
|
**
|
|
** http://www.apache.org/licenses/LICENSE-2.0
|
|
**
|
|
** Unless required by applicable law or agreed to in writing, software
|
|
** distributed under the License is distributed on an "AS IS" BASIS,
|
|
** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
** See the License for the specific language governing permissions and
|
|
** limitations under the License.
|
|
*/
|
|
|
|
|
|
#ifndef ANDROID_GGLASSEMBLER_H
|
|
#define ANDROID_GGLASSEMBLER_H
|
|
|
|
#include <stdint.h>
|
|
#include <sys/types.h>
|
|
|
|
#include <private/pixelflinger/ggl_context.h>
|
|
|
|
#include "ARMAssemblerProxy.h"
|
|
|
|
|
|
namespace android {
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
#define CONTEXT_ADDR_LOAD(REG, FIELD) \
|
|
ADDR_LDR(AL, REG, mBuilderContext.Rctx, immed12_pre(GGL_OFFSETOF(FIELD)))
|
|
|
|
#define CONTEXT_ADDR_STORE(REG, FIELD) \
|
|
ADDR_STR(AL, REG, mBuilderContext.Rctx, immed12_pre(GGL_OFFSETOF(FIELD)))
|
|
|
|
#define CONTEXT_LOAD(REG, FIELD) \
|
|
LDR(AL, REG, mBuilderContext.Rctx, immed12_pre(GGL_OFFSETOF(FIELD)))
|
|
|
|
#define CONTEXT_STORE(REG, FIELD) \
|
|
STR(AL, REG, mBuilderContext.Rctx, immed12_pre(GGL_OFFSETOF(FIELD)))
|
|
|
|
|
|
class RegisterAllocator
|
|
{
|
|
public:
|
|
class RegisterFile;
|
|
|
|
RegisterAllocator(int arch); // NOLINT, implicit
|
|
RegisterFile& registerFile();
|
|
int reserveReg(int reg);
|
|
int obtainReg();
|
|
void recycleReg(int reg);
|
|
void reset();
|
|
|
|
class RegisterFile
|
|
{
|
|
public:
|
|
RegisterFile(int arch); // NOLINT, implicit
|
|
RegisterFile(const RegisterFile& rhs, int arch);
|
|
~RegisterFile();
|
|
|
|
void reset();
|
|
|
|
bool operator == (const RegisterFile& rhs) const;
|
|
bool operator != (const RegisterFile& rhs) const {
|
|
return !operator == (rhs);
|
|
}
|
|
|
|
int reserve(int reg);
|
|
void reserveSeveral(uint32_t regMask);
|
|
|
|
void recycle(int reg);
|
|
void recycleSeveral(uint32_t regMask);
|
|
|
|
int obtain();
|
|
inline int isUsed(int reg) const;
|
|
|
|
bool hasFreeRegs() const;
|
|
int countFreeRegs() const;
|
|
|
|
uint32_t touched() const;
|
|
inline uint32_t status() const { return mStatus; }
|
|
|
|
enum {
|
|
OUT_OF_REGISTERS = 0x1
|
|
};
|
|
|
|
private:
|
|
uint32_t mRegs;
|
|
uint32_t mTouched;
|
|
uint32_t mStatus;
|
|
int mArch;
|
|
uint32_t mRegisterOffset; // lets reg alloc use 2..17 for mips
|
|
// while arm uses 0..15
|
|
};
|
|
|
|
class Scratch
|
|
{
|
|
public:
|
|
explicit Scratch(RegisterFile& regFile)
|
|
: mRegFile(regFile), mScratch(0) {
|
|
}
|
|
~Scratch() {
|
|
mRegFile.recycleSeveral(mScratch);
|
|
}
|
|
int obtain() {
|
|
int reg = mRegFile.obtain();
|
|
mScratch |= 1<<reg;
|
|
return reg;
|
|
}
|
|
void recycle(int reg) {
|
|
mRegFile.recycle(reg);
|
|
mScratch &= ~(1<<reg);
|
|
}
|
|
bool isUsed(int reg) {
|
|
return (mScratch & (1<<reg));
|
|
}
|
|
int countFreeRegs() {
|
|
return mRegFile.countFreeRegs();
|
|
}
|
|
private:
|
|
RegisterFile& mRegFile;
|
|
uint32_t mScratch;
|
|
};
|
|
|
|
class Spill
|
|
{
|
|
public:
|
|
Spill(RegisterFile& regFile, ARMAssemblerInterface& gen, uint32_t reglist)
|
|
: mRegFile(regFile), mGen(gen), mRegList(reglist), mCount(0)
|
|
{
|
|
if (reglist) {
|
|
int count = 0;
|
|
while (reglist) {
|
|
count++;
|
|
reglist &= ~(1 << (31 - __builtin_clz(reglist)));
|
|
}
|
|
if (count == 1) {
|
|
int reg = 31 - __builtin_clz(mRegList);
|
|
mGen.STR(mGen.AL, reg, mGen.SP, mGen.immed12_pre(-4, 1));
|
|
} else {
|
|
mGen.STM(mGen.AL, mGen.DB, mGen.SP, 1, mRegList);
|
|
}
|
|
mRegFile.recycleSeveral(mRegList);
|
|
mCount = count;
|
|
}
|
|
}
|
|
~Spill() {
|
|
if (mRegList) {
|
|
if (mCount == 1) {
|
|
int reg = 31 - __builtin_clz(mRegList);
|
|
mGen.LDR(mGen.AL, reg, mGen.SP, mGen.immed12_post(4));
|
|
} else {
|
|
mGen.LDM(mGen.AL, mGen.IA, mGen.SP, 1, mRegList);
|
|
}
|
|
mRegFile.reserveSeveral(mRegList);
|
|
}
|
|
}
|
|
private:
|
|
RegisterFile& mRegFile;
|
|
ARMAssemblerInterface& mGen;
|
|
uint32_t mRegList;
|
|
int mCount;
|
|
};
|
|
|
|
private:
|
|
RegisterFile mRegs;
|
|
};
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
class GGLAssembler : public ARMAssemblerProxy, public RegisterAllocator
|
|
{
|
|
public:
|
|
|
|
explicit GGLAssembler(ARMAssemblerInterface* target);
|
|
virtual ~GGLAssembler();
|
|
|
|
uint32_t* base() const { return 0; } // XXX
|
|
uint32_t* pc() const { return 0; } // XXX
|
|
|
|
void reset(int opt_level);
|
|
|
|
virtual void prolog();
|
|
virtual void epilog(uint32_t touched);
|
|
|
|
// generate scanline code for given needs
|
|
int scanline(const needs_t& needs, context_t const* c);
|
|
int scanline_core(const needs_t& needs, context_t const* c);
|
|
|
|
enum {
|
|
CLEAR_LO = 0x0001,
|
|
CLEAR_HI = 0x0002,
|
|
CORRUPTIBLE = 0x0004,
|
|
FIRST = 0x0008
|
|
};
|
|
|
|
enum { //load/store flags
|
|
WRITE_BACK = 0x0001
|
|
};
|
|
|
|
struct reg_t {
|
|
reg_t() : reg(-1), flags(0) {
|
|
}
|
|
reg_t(int r, int f=0) // NOLINT, implicit
|
|
: reg(r), flags(f) {
|
|
}
|
|
void setTo(int r, int f=0) {
|
|
reg=r; flags=f;
|
|
}
|
|
int reg;
|
|
uint16_t flags;
|
|
};
|
|
|
|
struct integer_t : public reg_t {
|
|
integer_t() : reg_t(), s(0) {
|
|
}
|
|
integer_t(int r, int sz=32, int f=0) // NOLINT, implicit
|
|
: reg_t(r, f), s(sz) {
|
|
}
|
|
void setTo(int r, int sz=32, int f=0) {
|
|
reg_t::setTo(r, f); s=sz;
|
|
}
|
|
int8_t s;
|
|
inline int size() const { return s; }
|
|
};
|
|
|
|
struct pixel_t : public reg_t {
|
|
pixel_t() : reg_t() {
|
|
memset(&format, 0, sizeof(GGLFormat));
|
|
}
|
|
pixel_t(int r, const GGLFormat* fmt, int f=0)
|
|
: reg_t(r, f), format(*fmt) {
|
|
}
|
|
void setTo(int r, const GGLFormat* fmt, int f=0) {
|
|
reg_t::setTo(r, f); format = *fmt;
|
|
}
|
|
GGLFormat format;
|
|
inline int hi(int c) const { return format.c[c].h; }
|
|
inline int low(int c) const { return format.c[c].l; }
|
|
inline int mask(int c) const { return ((1<<size(c))-1) << low(c); }
|
|
inline int size() const { return format.size*8; }
|
|
inline int size(int c) const { return component_size(c); }
|
|
inline int component_size(int c) const { return hi(c) - low(c); }
|
|
};
|
|
|
|
struct component_t : public reg_t {
|
|
component_t() : reg_t(), h(0), l(0) {
|
|
}
|
|
component_t(int r, int f=0) // NOLINT, implicit
|
|
: reg_t(r, f), h(0), l(0) {
|
|
}
|
|
component_t(int r, int lo, int hi, int f=0)
|
|
: reg_t(r, f), h(hi), l(lo) {
|
|
}
|
|
explicit component_t(const integer_t& rhs)
|
|
: reg_t(rhs.reg, rhs.flags), h(rhs.s), l(0) {
|
|
}
|
|
explicit component_t(const pixel_t& rhs, int component) {
|
|
setTo( rhs.reg,
|
|
rhs.format.c[component].l,
|
|
rhs.format.c[component].h,
|
|
rhs.flags|CLEAR_LO|CLEAR_HI);
|
|
}
|
|
void setTo(int r, int lo=0, int hi=0, int f=0) {
|
|
reg_t::setTo(r, f); h=hi; l=lo;
|
|
}
|
|
int8_t h;
|
|
int8_t l;
|
|
inline int size() const { return h-l; }
|
|
};
|
|
|
|
struct pointer_t : public reg_t {
|
|
pointer_t() : reg_t(), size(0) {
|
|
}
|
|
pointer_t(int r, int s, int f=0)
|
|
: reg_t(r, f), size(s) {
|
|
}
|
|
void setTo(int r, int s, int f=0) {
|
|
reg_t::setTo(r, f); size=s;
|
|
}
|
|
int8_t size;
|
|
};
|
|
|
|
|
|
private:
|
|
// GGLAssembler hides RegisterAllocator's and ARMAssemblerProxy's reset
|
|
// methods by providing a reset method with a different parameter set. The
|
|
// intent of GGLAssembler's reset method is to wrap the inherited reset
|
|
// methods, so make these methods private in order to prevent direct calls
|
|
// to these methods from clients.
|
|
using RegisterAllocator::reset;
|
|
using ARMAssemblerProxy::reset;
|
|
|
|
struct tex_coord_t {
|
|
reg_t s;
|
|
reg_t t;
|
|
pointer_t ptr;
|
|
};
|
|
|
|
struct fragment_parts_t {
|
|
uint32_t packed : 1;
|
|
uint32_t reload : 2;
|
|
uint32_t iterated_packed : 1;
|
|
pixel_t iterated;
|
|
pointer_t cbPtr;
|
|
pointer_t covPtr;
|
|
reg_t count;
|
|
reg_t argb[4];
|
|
reg_t argb_dx[4];
|
|
reg_t z;
|
|
reg_t dither;
|
|
pixel_t texel[GGL_TEXTURE_UNIT_COUNT];
|
|
tex_coord_t coords[GGL_TEXTURE_UNIT_COUNT];
|
|
};
|
|
|
|
struct texture_unit_t {
|
|
int format_idx;
|
|
GGLFormat format;
|
|
int bits;
|
|
int swrap;
|
|
int twrap;
|
|
int env;
|
|
int pot;
|
|
int linear;
|
|
uint8_t mask;
|
|
uint8_t replaced;
|
|
};
|
|
|
|
struct texture_machine_t {
|
|
texture_unit_t tmu[GGL_TEXTURE_UNIT_COUNT];
|
|
uint8_t mask;
|
|
uint8_t replaced;
|
|
uint8_t directTexture;
|
|
uint8_t activeUnits;
|
|
};
|
|
|
|
struct component_info_t {
|
|
bool masked : 1;
|
|
bool inDest : 1;
|
|
bool needed : 1;
|
|
bool replaced : 1;
|
|
bool iterated : 1;
|
|
bool smooth : 1;
|
|
bool blend : 1;
|
|
bool fog : 1;
|
|
};
|
|
|
|
struct builder_context_t {
|
|
context_t const* c;
|
|
needs_t needs;
|
|
int Rctx;
|
|
};
|
|
|
|
template <typename T>
|
|
void modify(T& r, Scratch& regs)
|
|
{
|
|
if (!(r.flags & CORRUPTIBLE)) {
|
|
r.reg = regs.obtain();
|
|
r.flags |= CORRUPTIBLE;
|
|
}
|
|
}
|
|
|
|
// helpers
|
|
void base_offset(const pointer_t& d, const pointer_t& b, const reg_t& o);
|
|
|
|
// texture environement
|
|
void modulate( component_t& dest,
|
|
const component_t& incoming,
|
|
const pixel_t& texel, int component);
|
|
|
|
void decal( component_t& dest,
|
|
const component_t& incoming,
|
|
const pixel_t& texel, int component);
|
|
|
|
void blend( component_t& dest,
|
|
const component_t& incoming,
|
|
const pixel_t& texel, int component, int tmu);
|
|
|
|
void add( component_t& dest,
|
|
const component_t& incoming,
|
|
const pixel_t& texel, int component);
|
|
|
|
// load/store stuff
|
|
void store(const pointer_t& addr, const pixel_t& src, uint32_t flags=0);
|
|
void load(const pointer_t& addr, const pixel_t& dest, uint32_t flags=0);
|
|
void extract(integer_t& d, const pixel_t& s, int component);
|
|
void extract(component_t& d, const pixel_t& s, int component);
|
|
void extract(integer_t& d, int s, int h, int l, int bits=32);
|
|
void expand(integer_t& d, const integer_t& s, int dbits);
|
|
void expand(integer_t& d, const component_t& s, int dbits);
|
|
void expand(component_t& d, const component_t& s, int dbits);
|
|
void downshift(pixel_t& d, int component, component_t s, const reg_t& dither);
|
|
|
|
|
|
void mul_factor( component_t& d,
|
|
const integer_t& v,
|
|
const integer_t& f);
|
|
|
|
void mul_factor_add( component_t& d,
|
|
const integer_t& v,
|
|
const integer_t& f,
|
|
const component_t& a);
|
|
|
|
void component_add( component_t& d,
|
|
const integer_t& dst,
|
|
const integer_t& src);
|
|
|
|
void component_sat( const component_t& v);
|
|
|
|
|
|
void build_scanline_prolog( fragment_parts_t& parts,
|
|
const needs_t& needs);
|
|
|
|
void build_smooth_shade(const fragment_parts_t& parts);
|
|
|
|
void build_component( pixel_t& pixel,
|
|
const fragment_parts_t& parts,
|
|
int component,
|
|
Scratch& global_scratches);
|
|
|
|
void build_incoming_component(
|
|
component_t& temp,
|
|
int dst_size,
|
|
const fragment_parts_t& parts,
|
|
int component,
|
|
Scratch& scratches,
|
|
Scratch& global_scratches);
|
|
|
|
void init_iterated_color(fragment_parts_t& parts, const reg_t& x);
|
|
|
|
void build_iterated_color( component_t& fragment,
|
|
const fragment_parts_t& parts,
|
|
int component,
|
|
Scratch& regs);
|
|
|
|
void decodeLogicOpNeeds(const needs_t& needs);
|
|
|
|
void decodeTMUNeeds(const needs_t& needs, context_t const* c);
|
|
|
|
void init_textures( tex_coord_t* coords,
|
|
const reg_t& x,
|
|
const reg_t& y);
|
|
|
|
void build_textures( fragment_parts_t& parts,
|
|
Scratch& regs);
|
|
|
|
void filter8( const fragment_parts_t& parts,
|
|
pixel_t& texel, const texture_unit_t& tmu,
|
|
int U, int V, pointer_t& txPtr,
|
|
int FRAC_BITS);
|
|
|
|
void filter16( const fragment_parts_t& parts,
|
|
pixel_t& texel, const texture_unit_t& tmu,
|
|
int U, int V, pointer_t& txPtr,
|
|
int FRAC_BITS);
|
|
|
|
void filter24( const fragment_parts_t& parts,
|
|
pixel_t& texel, const texture_unit_t& tmu,
|
|
int U, int V, pointer_t& txPtr,
|
|
int FRAC_BITS);
|
|
|
|
void filter32( const fragment_parts_t& parts,
|
|
pixel_t& texel, const texture_unit_t& tmu,
|
|
int U, int V, pointer_t& txPtr,
|
|
int FRAC_BITS);
|
|
|
|
void build_texture_environment( component_t& fragment,
|
|
const fragment_parts_t& parts,
|
|
int component,
|
|
Scratch& regs);
|
|
|
|
void wrapping( int d,
|
|
int coord, int size,
|
|
int tx_wrap, int tx_linear);
|
|
|
|
void build_fog( component_t& temp,
|
|
int component,
|
|
Scratch& parent_scratches);
|
|
|
|
void build_blending( component_t& in_out,
|
|
const pixel_t& pixel,
|
|
int component,
|
|
Scratch& parent_scratches);
|
|
|
|
void build_blend_factor(
|
|
integer_t& factor, int f, int component,
|
|
const pixel_t& dst_pixel,
|
|
integer_t& fragment,
|
|
integer_t& fb,
|
|
Scratch& scratches);
|
|
|
|
void build_blendFOneMinusF( component_t& temp,
|
|
const integer_t& factor,
|
|
const integer_t& fragment,
|
|
const integer_t& fb);
|
|
|
|
void build_blendOneMinusFF( component_t& temp,
|
|
const integer_t& factor,
|
|
const integer_t& fragment,
|
|
const integer_t& fb);
|
|
|
|
void build_coverage_application(component_t& fragment,
|
|
const fragment_parts_t& parts,
|
|
Scratch& regs);
|
|
|
|
void build_alpha_test(component_t& fragment, const fragment_parts_t& parts);
|
|
|
|
enum { Z_TEST=1, Z_WRITE=2 };
|
|
void build_depth_test(const fragment_parts_t& parts, uint32_t mask);
|
|
void build_iterate_z(const fragment_parts_t& parts);
|
|
void build_iterate_f(const fragment_parts_t& parts);
|
|
void build_iterate_texture_coordinates(const fragment_parts_t& parts);
|
|
|
|
void build_logic_op(pixel_t& pixel, Scratch& regs);
|
|
|
|
void build_masking(pixel_t& pixel, Scratch& regs);
|
|
|
|
void build_and_immediate(int d, int s, uint32_t mask, int bits);
|
|
|
|
bool isAlphaSourceNeeded() const;
|
|
|
|
enum {
|
|
FACTOR_SRC=1, FACTOR_DST=2, BLEND_SRC=4, BLEND_DST=8
|
|
};
|
|
|
|
enum {
|
|
LOGIC_OP=1, LOGIC_OP_SRC=2, LOGIC_OP_DST=4
|
|
};
|
|
|
|
static int blending_codes(int fs, int fd);
|
|
|
|
builder_context_t mBuilderContext;
|
|
texture_machine_t mTextureMachine;
|
|
component_info_t mInfo[4];
|
|
int mBlending;
|
|
int mMasking;
|
|
int mAllMasked;
|
|
int mLogicOp;
|
|
int mAlphaTest;
|
|
int mAA;
|
|
int mDithering;
|
|
int mDepthTest;
|
|
|
|
int mSmooth;
|
|
int mFog;
|
|
pixel_t mDstPixel;
|
|
|
|
GGLFormat mCbFormat;
|
|
|
|
int mBlendFactorCached;
|
|
integer_t mAlphaSource;
|
|
|
|
int mBaseRegister;
|
|
|
|
int mBlendSrc;
|
|
int mBlendDst;
|
|
int mBlendSrcA;
|
|
int mBlendDstA;
|
|
|
|
int mOptLevel;
|
|
};
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
}; // namespace android
|
|
|
|
#endif // ANDROID_GGLASSEMBLER_H
|