OpenCL-TTL/html/dir_efd9e86757b3bd5f887d318858fcf15e.html

#include "TTL/TTL.h"


/**
 * Example kernel: walk a 2D tensor tile by tile using TTL double buffering.
 *
 * The width x height tensor is split into tile_width x tile_height tiles.
 * Each tile is imported from the external input tensor into one of two local
 * input buffers, handed to compute(), and the result is exported to the
 * external output tensor from one of two local output buffers.
 *
 * @param ext_base_in          Base pointer of the external input tensor.
 * @param external_stride_in   Stride forwarded to TTL_create_layout() for the input.
 * @param ext_base_out         Base pointer of the external output tensor.
 * @param external_stride_out  Stride forwarded to TTL_create_layout() for the output.
 * @param width                Width of the whole tensor.
 * @param height               Height of the whole tensor.
 * @param tile_width           Width of one tile.
 * @param tile_height          Height of one tile.
 *
 * NOTE(review): MEMSZ and compute() are not defined in this snippet; MEMSZ
 * presumably has to be large enough to hold one tile - confirm against the
 * code that provides them.
 */
__kernel void TTL_double_buffering(__global uchar *restrict ext_base_in, int external_stride_in,
                                   __global uchar *restrict ext_base_out, int external_stride_out, int width,
                                   int height, int tile_width, int tile_height) {
    // Two local buffers per direction: one is being transferred while the
    // other is available to compute().
    __local uchar in_buf_a[MEMSZ];
    __local uchar in_buf_b[MEMSZ];
    __local uchar out_buf_a[MEMSZ];
    __local uchar out_buf_b[MEMSZ];

    // Logical tiling: the full tensor shape, the shape of one tile, and the
    // tiler that maps a tile index onto a tile.
    const TTL_shape_t tensor_shape = TTL_create_shape(width, height);
    const TTL_shape_t one_tile_shape = TTL_create_shape(tile_width, tile_height);
    const TTL_tiler_t tiler = TTL_create_tiler(tensor_shape, one_tile_shape);

    // External input tensor (read only) and its layout.
    const TTL_layout_t in_layout = TTL_create_layout(external_stride_in);
    const TTL_const_ext_tensor_t in_tensor = TTL_create_const_ext_tensor(ext_base_in, tensor_shape, in_layout);

    // External output tensor and its layout.
    const TTL_layout_t out_layout = TTL_create_layout(external_stride_out);
    const TTL_ext_tensor_t out_tensor = TTL_create_ext_tensor(ext_base_out, tensor_shape, out_layout);

    // TTL_start_import_double_buffering will begin the import of the first tile.
    TTL_event_t import_event = TTL_get_event();
    TTL_import_double_buffering_t import_db =
        TTL_start_import_double_buffering(in_buf_a, in_buf_b, in_tensor, &import_event, TTL_get_tile(0, tiler));

    TTL_event_t export_event = TTL_get_event();
    TTL_export_double_buffering_t export_db =
        TTL_start_export_double_buffering(out_buf_a, out_buf_b, out_tensor, &export_event);

    for (int tile_id = 0; tile_id < TTL_number_of_tiles(tiler); ++tile_id) {
        // The import runs one tile ahead of the export.
        // NOTE(review): on the last iteration tile_id + 1 is past the final
        // tile; presumably TTL_get_tile() yields an empty tile there - confirm
        // in TTL_tiles.h.
        TTL_tile_t upcoming_import_tile = TTL_get_tile(tile_id + 1, tiler);
        TTL_tile_t current_export_tile = TTL_get_tile(tile_id, tiler);

        // Each step waits for the transfer in flight to complete and starts
        // the next one.
        TTL_int_sub_tensor_t tile_in = TTL_step_buffering(&import_db, upcoming_import_tile);
        TTL_int_sub_tensor_t tile_out = TTL_step_buffering(&export_db, current_export_tile);

        // Compute while the transfers are taking place (on separate buffers).
        compute(tile_in, tile_out);
    }

    // Wait for the last transfers to complete.
    TTL_finish_buffering(&import_db);
    TTL_finish_buffering(&export_db);
}

TTL.h

TTL_finish_buffering
static void TTL_finish_buffering(TTL_import_double_const_void_tensor_buffering_t *import_double_buffering)
Definition TTL_double_scheme.h:104

TTL_step_buffering
static TTL_int_void_sub_tensor_t TTL_step_buffering(TTL_import_double_const_void_tensor_buffering_t *const db, const TTL_tile_t next_tile)
Wait for the previous import operation to complete before beginning an import of the next tile.
Definition TTL_double_scheme.h:34

TTL_start_export_double_buffering
static TTL_export_double_const_void_tensor_buffering_t TTL_start_export_double_buffering(__local void *int_base1, __local void *int_base2, TTL_ext_void_tensor_t ext_tensor, TTL_event_t *event)
Create a TTL_export_double_buffering_t and begin the buffering process.
Definition TTL_double_scheme_template.h:243

TTL_start_import_double_buffering
static TTL_import_double_const_void_tensor_buffering_t TTL_start_import_double_buffering(__local void *int_base1, __local void *int_base2, TTL_const_ext_void_tensor_t ext_tensor, TTL_event_t *event, TTL_tile_t first_tile)
Create a TTL_import_double_buffering_t and begin the buffering process.
Definition TTL_double_scheme_template.h:111

TTL_const_ext_tensor_t
TTL_const_ext_void_tensor_t TTL_const_ext_tensor_t
Definition TTL_ext_tensors.h:25

TTL_ext_tensor_t
TTL_ext_void_tensor_t TTL_ext_tensor_t
Definition TTL_ext_tensors.h:24

TTL_create_ext_tensor
static TTL_ext_void_tensor_t TTL_create_ext_tensor(__global void *base, const TTL_shape_t shape, const TTL_layout_t layout, const TTL_offset_t offset, const TTL_dim_t elem_size)
const and non-const tensor creation functions.
Definition TTL_int_ext_typed_tensors.h:76

TTL_create_const_ext_tensor
static TTL_const_ext_void_tensor_t TTL_create_const_ext_tensor(__global const void *base, const TTL_shape_t shape, const TTL_layout_t layout, const TTL_offset_t offset, const TTL_dim_t elem_size)
create TTL_create_int_tensor_impl
Definition TTL_int_ext_typed_tensors.h:173

TTL_int_sub_tensor_t
TTL_int_void_sub_tensor_t TTL_int_sub_tensor_t
Definition TTL_int_tensors.h:26

TTL_create_layout
static TTL_layout_t TTL_create_layout(void)
Create a 1D Description of a Tensor layout in memory.
Definition TTL_tensors_common.h:96

TTL_get_tile
static TTL_tile_t TTL_get_tile(const int tile_id, const TTL_tiler_t tiler)
Return the tile_id'th tile of a tile array in row-major order.
Definition TTL_tiles.h:319

TTL_number_of_tiles
static int TTL_number_of_tiles(TTL_tiler_t tiler)
Return the number of tiles that this tiler can produce.
Definition TTL_tiles.h:161

TTL_create_tiler
static TTL_tiler_t TTL_create_tiler(const TTL_shape_t shape, const TTL_shape_t tile)
Definition TTL_tiles.h:229

TTL_event_t
event_t TTL_event_t
TTL_event_t is a pseudonym for OpenCL event_t.
Definition c/TTL_import_export.h:33

__global
#define __global
The opencl __global namespace is not supported in C.
Definition c/TTL_types.h:26

__local
#define __local
The opencl __local namespace is not supported in C.
Definition c/TTL_types.h:27

uchar
unsigned char uchar
OpenCL, and therefore TTL, supports a type called uchar, which is not part of C.
Definition c/TTL_types.h:25

TTL_get_event
static TTL_event_t TTL_get_event()
Return an empty event of type TTL_event_t.
Definition opencl/TTL_import_export.h:32

TTL_layout_t
Description of a Tensor layout in memory.
Definition TTL_tensors_common.h:50

TTL_shape_t
Description of a Shape.
Definition tensors/TTL_types.h:30

TTL_tile_t
Definition TTL_tiles.h:124

TTL_tiler_t
TTL_tiler_t is the basic unit that describes how a tile is subdivided.
Definition TTL_tiles.h:135

TTL_create_shape
static TTL_shape_t TTL_create_shape(TTL_dim_t width, TTL_dim_t height, TTL_dim_t depth)
Create a description of a Shape.
Definition tensors/TTL_types.h:48
Files
	TTL.h

	TTL_core.h

	TTL_create_type.h

	TTL_create_types.h

	TTL_debug.h

	TTL_import_export.h

	TTL_macros.h

	TTL_pipeline_schemes.h

	TTL_tensors.h

	TTL_tiles.h

	TTL_trace_macros.h

	TTL_types.h