GPUOcelot
|
#include <ATIExecutableKernel.h>
Classes | |
struct | cb_t |
Type of the constant buffer (cb) | |
Public Member Functions | |
ATIExecutableKernel (ir::IRKernel &k, CALcontext *context, CALevent *event, CALresource *uav0, CALresource *cb0, CALresource *cb1, Device *d) | |
Constructor. | |
void | launchGrid (int width, int height, int depth) |
Launch a kernel on a 2D grid. | |
void | setKernelShape (int x, int y, int z) |
Sets the shape of a kernel. | |
void | setExternSharedMemorySize (unsigned int bytes) |
Changes the amount of external shared memory. | |
void | setWorkerThreads (unsigned int workerThreadLimit) |
Sets the max number of pthreads this kernel can use. | |
void | updateArgumentMemory () |
Indicate that the kernel's arguments have been updated. | |
void | updateMemory () |
Indicate that other memory has been updated. | |
TextureVector | textureReferences () const |
Get a vector of all textures referenced by the kernel. | |
void | addTraceGenerator (trace::TraceGenerator *generator) |
Adds a trace generator to the EmulatedKernel. | |
void | removeTraceGenerator (trace::TraceGenerator *generator) |
Removes a trace generator from an EmulatedKernel. | |
void | setExternalFunctionSet (const ir::ExternalFunctionSet &s) |
void | clearExternalFunctionSet () |
void | updateGlobals () |
Copies data from global objects into const and global memory. | |
Public Attributes | |
ir::PTXKernel::RegisterMap | registerMap |
executive::ATIExecutableKernel::ATIExecutableKernel | ( | ir::IRKernel & | k, |
CALcontext * | context, | ||
CALevent * | event, | ||
CALresource * | uav0, | ||
CALresource * | cb0, | ||
CALresource * | cb1, | ||
Device * | d | ||
) |
Constructor.
void executive::ATIExecutableKernel::addTraceGenerator | ( | trace::TraceGenerator * | generator | ) | [virtual] |
Adds a trace generator to the EmulatedKernel.
Reimplemented from executive::ExecutableKernel.
void executive::ATIExecutableKernel::clearExternalFunctionSet | ( | ) | [virtual] |
Clears the external function table for the emulated kernel.
Implements executive::ExecutableKernel.
void executive::ATIExecutableKernel::launchGrid | ( | int | width, |
int | height, | ||
int | depth | ||
) | [virtual] |
Launch a kernel on a 2D grid.
Implements executive::ExecutableKernel.
void executive::ATIExecutableKernel::removeTraceGenerator | ( | trace::TraceGenerator * | generator | ) | [virtual] |
Removes a trace generator from an EmulatedKernel.
Reimplemented from executive::ExecutableKernel.
void executive::ATIExecutableKernel::setExternalFunctionSet | ( | const ir::ExternalFunctionSet & | s | ) | [virtual] |
Sets an external function table for the emulated kernel.
Implements executive::ExecutableKernel.
void executive::ATIExecutableKernel::setExternSharedMemorySize | ( | unsigned int | bytes | ) | [virtual] |
Changes the amount of external shared memory.
Implements executive::ExecutableKernel.
void executive::ATIExecutableKernel::setKernelShape | ( | int | x, |
int | y, | ||
int | z | ||
) | [virtual] |
Sets the shape of a kernel.
Implements executive::ExecutableKernel.
void executive::ATIExecutableKernel::setWorkerThreads | ( | unsigned int | workerThreadLimit | ) | [virtual] |
Sets the max number of pthreads this kernel can use.
Implements executive::ExecutableKernel.
ExecutableKernel::TextureVector executive::ATIExecutableKernel::textureReferences | ( | ) | const [virtual] |
Get a vector of all textures referenced by the kernel.
Implements executive::ExecutableKernel.
void executive::ATIExecutableKernel::updateArgumentMemory | ( | ) | [virtual] |
Indicate that the kernel's arguments have been updated.
Implements executive::ExecutableKernel.
void executive::ATIExecutableKernel::updateGlobals | ( | ) |
Copies data from global objects into const and global memory.
void executive::ATIExecutableKernel::updateMemory | ( | ) | [virtual] |
Indicate that other memory has been updated.
Implements executive::ExecutableKernel.
registerMap: a map from register name to register number.