Tensor Tiling Library
p/pipelines/TTL_double_scheme.h
/*
 * TTL_double_scheme.h
 *
 * Copyright (c) 2025 Mobileye
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

// This file presumes that the following have been pre-included.
// This is not done here for path reasons.
// #include "TTL_core.h"
// #include "TTL_import_export.h"
// #include TTL_IMPORT_EXPORT_INCLUDE_H

#include "TTL_schemes_common.h"

/**
 * @brief Double-buffered import scheme: while the caller works on the tile in
 * one local buffer, the import of the next tile proceeds into the other.
 */
template <typename TENSORTYPE>
struct TTL_import_double_buffering {
    /**
     * @brief Create a TTL_import_double_buffering and begin the buffering process
     *
     * @param int_base1 A pointer to the 1st local buffer
     * @param int_base2 A pointer to the 2nd local buffer
     * @param ext_tensor A tensor describing the input in global memory
     * @param event A pointer to the event to use for the inward (external to
     * internal) transfer completion
     * @param first_tile The first tile to fetch for the scheme
     *
     * @return The TTL_import_double_buffering created from the input parameters.
     *
     * Example:
     * @code
     * TTL_event import_DB_e = TTL_get_event();
     * TTL_import_double_buffering import_db(
     *     l_in1, l_in2, ext_tensor_in, &import_DB_e, first_tile);
     * @endcode
     * \n
     *
     * This can be optimized and standardized using the TTL_step_buffering
     * call.
     *
     * @startuml
     *
     * start
     *
     * stop
     *
     * @enduml
     */
    TTL_import_double_buffering(TTL_local(TENSORTYPE *) int_base1, TTL_local(TENSORTYPE *) int_base2,
                                TTL_tensor<TENSORTYPE> ext_tensor, TTL_event *event, TTL_tile first_tile) {
        m_common.int_base[0] = int_base1;
        m_common.int_base[1] = int_base2;

        m_common.ext_tensor_in = ext_tensor;
        m_event = event;
        m_common.index = 0;
        m_prev_tile = TTL_tile();  // Empty, so the first step_buffering returns an empty result.

        step_buffering(first_tile);
    }

    /**
     * @brief Wait for the previous import operation to complete before
     * beginning an import of the next tile.
     *
     * @param next_tile A description of the tile to begin importing.
     */
    TTL_sub_tensor<TENSORTYPE> step_buffering(const TTL_tile next_tile) {
        // For performance, compute everything possible before waiting for the
        // previous operations to finish.
        const TTL_layout int_layout(next_tile.shape.width, next_tile.shape.height);
        const TTL_sub_tensor<TENSORTYPE> import_to(
            m_common.int_base[m_common.index], next_tile.shape, int_layout, m_common.ext_tensor_in, next_tile.offset);

        const TTL_tensor<TENSORTYPE> import_from(m_common.ext_tensor_in.base,
                                                 next_tile.shape,
                                                 m_common.ext_tensor_in.layout,
                                                 next_tile.offset,
                                                 m_common.ext_tensor_in.elem_size);

        // Wait for the import started on the previous call before reusing the
        // event for the next transfer.
        TTL_wait(1, m_event);

        if (next_tile.empty() == false) {
            TTL_import_sub_tensor(import_to, import_from, m_event);
        }

        // Flip to the other local buffer: it holds the tile imported on the
        // previous call, which the wait above has just completed.
        m_common.index = (m_common.index + 1) % 2;

        const TTL_layout prev_int_layout(m_prev_tile.shape.width, m_prev_tile.shape.height);
        const TTL_sub_tensor<TENSORTYPE> result(m_common.int_base[m_common.index],
                                                m_prev_tile.shape,
                                                prev_int_layout,
                                                m_common.ext_tensor_in,
                                                m_prev_tile.offset);

        m_prev_tile = next_tile;

        return result;
    }

    /**
     * @brief Complete any transfers required to finish the buffering process.
     *
     * Any transfers that are still in progress will be completed, and any
     * transfers that still need to be started will be started and completed,
     * before finish_buffering returns.
     */
    void finish_buffering() {
        // Nothing to do.
    }
125
126 TTL_event *m_event; ///< A pointer to the event that is used to
127 ///< track the progress of the transfer
128 TTL_tile m_prev_tile; ///< Store of the previous imported tile */
129
130 TTL_common_buffering<TENSORTYPE, 2> m_common; ///< The information that is m_common to all pipeline schemes
131};
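
For orientation, here is a minimal usage sketch of the import scheme. It is not part of this header: the tile_at() helper, NUMBER_OF_TILES, compute_tile() and the buffer and tensor names are illustrative assumptions; only the TTL_import_double_buffering members are the API documented above. tile_at(i) is assumed to return an empty TTL_tile once i is past the last tile, so the final iteration simply drains the pipeline.

    // Double-buffered import loop: the fetch of tile i + 1 overlaps the
    // compute on tile i.
    TTL_event import_event = TTL_get_event();
    TTL_import_double_buffering import_db(l_in1, l_in2, ext_input_tensor, &import_event, tile_at(0));

    for (int i = 0; i < NUMBER_OF_TILES; ++i) {
        // Waits for the import of tile i, starts the import of tile i + 1
        // into the other buffer, and returns the sub-tensor holding tile i.
        const auto input = import_db.step_buffering(tile_at(i + 1));
        compute_tile(input);  // Hypothetical per-tile work.
    }
    import_db.finish_buffering();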

/**
 * @brief Double-buffered export scheme: while the caller fills one local
 * buffer, the export of the previously produced tile proceeds from the other.
 */
template <typename TENSORTYPE>
struct TTL_export_double_buffering {
    /**
     * @brief Create a TTL_export_double_buffering and begin the buffering process
     *
     * @param int_base1 A pointer to the 1st local buffer
     * @param int_base2 A pointer to the 2nd local buffer
     * @param ext_tensor A tensor describing the output in global memory
     * @param event A pointer to the event to use for the outward (internal to
     * external) transfer completion
     *
     * @return The TTL_export_double_buffering created from the input parameters.
     *
     * Example:
     * @code
     * TTL_event export_DB_e = TTL_get_event();
     * TTL_export_double_buffering export_db(
     *     l_out1, l_out2, ext_tensor_out, &export_DB_e);
     * @endcode
     * \n
     *
     * This can be optimized and standardized using the TTL_step_buffering
     * call.
     *
     * @startuml
     *
     * start
     *
     * stop
     *
     * @enduml
     */
    TTL_export_double_buffering(TTL_local(TENSORTYPE *) int_base1, TTL_local(TENSORTYPE *) int_base2,
                                TTL_tensor<TENSORTYPE> ext_tensor, TTL_event *event) {
        m_common.int_base[0] = int_base1;
        m_common.int_base[1] = int_base2;

        m_common.ext_tensor_in = ext_tensor;
        m_event = event;
        m_common.index = 0;
        m_prev_tile = TTL_tile();  // Empty, so the first step_buffering exports nothing.
    }

    /**
     * @brief Wait for the previous export operation to complete before beginning an
     * export of the next tile.
     *
     * @param tile_current A description of the tile to begin exporting.
     */
    TTL_sub_tensor<TENSORTYPE> step_buffering(TTL_tile tile_current) {
        const TTL_layout int_layout(m_prev_tile.shape.width, m_prev_tile.shape.height);
        const TTL_tensor export_from(
            m_common.int_base[m_common.index], m_prev_tile.shape, int_layout, m_common.ext_tensor_in.elem_size);
        const TTL_tensor export_to(m_common.ext_tensor_in.base,
                                   m_prev_tile.shape,
                                   m_common.ext_tensor_in.layout,
                                   m_prev_tile.offset,
                                   m_common.ext_tensor_in.elem_size);

        // Wait for the export started on the previous call before reusing the
        // event for the next transfer.
        TTL_wait(1, m_event);

        if (m_prev_tile.empty() == false) TTL_export(export_from, export_to, m_event);

        // Flip to the other local buffer and return it for the caller to fill
        // with tile_current; it will be exported on the next call.
        m_common.index = (m_common.index + 1) % 2;  // TTL_ARRAYSIZE(m_common.int_base);
        const TTL_layout curr_int_layout(tile_current.shape.width, tile_current.shape.height);
        const TTL_sub_tensor result(m_common.int_base[m_common.index],
                                    tile_current.shape,
                                    curr_int_layout,
                                    m_common.ext_tensor_in,
                                    tile_current.offset);
        m_prev_tile = tile_current;

        return result;
    }

    /**
     * @brief Complete any transfers required to finish the buffering process.
     *
     * Any transfers that are still in progress will be completed, and any
     * transfers that still need to be started will be started and completed,
     * before finish_buffering returns.
     */
    void finish_buffering() {
        // Drain the pipeline: the first empty step starts the export of the
        // final tile, the second waits for that export to complete.
        step_buffering(TTL_tile());
        step_buffering(TTL_tile());
    }

    TTL_event *m_event;    ///< A pointer to the event that is used to
                           ///< track the progress of the transfer
    TTL_tile m_prev_tile;  ///< Store of the previous tile given to
                           ///< step_buffering, pending export

    TTL_common_buffering<TENSORTYPE, 2> m_common;  ///< The information that is common to all pipeline schemes
};
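
The import and export schemes are designed to be stepped together. The sketch below shows one way a complete tile pipeline can be driven; it is again illustrative, not library code: tile_at(), NUMBER_OF_TILES, compute() and the buffer and tensor names are assumptions. The export naturally lags one tile behind the compute, because each export step_buffering call writes out the tile produced on the previous iteration.

    TTL_event import_event = TTL_get_event();
    TTL_event export_event = TTL_get_event();
    TTL_import_double_buffering import_db(l_in1, l_in2, ext_input_tensor, &import_event, tile_at(0));
    TTL_export_double_buffering export_db(l_out1, l_out2, ext_output_tensor, &export_event);

    for (int i = 0; i < NUMBER_OF_TILES; ++i) {
        // Fetch of tile i + 1 overlaps this iteration's compute.
        const auto input = import_db.step_buffering(tile_at(i + 1));
        // Starts the export of the tile computed on the previous iteration
        // and returns the local buffer to fill for tile i.
        const auto output = export_db.step_buffering(tile_at(i));
        compute(input, output);  // Hypothetical per-tile kernel.
    }
    import_db.finish_buffering();
    export_db.finish_buffering();  // Starts and completes the final export.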