doxygen/openfpm/device__spmv_8cuh_source.html

/******************************************************************************

 * Copyright (c) 2011, Duane Merrill.  All rights reserved.

 * Copyright (c) 2011-2018, NVIDIA CORPORATION.  All rights reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are met:

 *     * Redistributions of source code must retain the above copyright

 *       notice, this list of conditions and the following disclaimer.

 *     * Redistributions in binary form must reproduce the above copyright

 *       notice, this list of conditions and the following disclaimer in the

 *       documentation and/or other materials provided with the distribution.

 *     * Neither the name of the NVIDIA CORPORATION nor the

 *       names of its contributors may be used to endorse or promote products

 *       derived from this software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND

 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED

 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

 * DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY

 * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES

 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND

 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS

 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 *

 ******************************************************************************/


#pragma once


#include <stdio.h>

#include <iterator>

#include <limits>


#include "dispatch/dispatch_spmv_orig.cuh"

#include "../util_namespace.cuh"


CUB_NS_PREFIX


namespace cub {


/**
 * \brief DeviceSpmv groups device-wide entry points for sparse-matrix *
 *        dense-vector multiplication (SpMV).
 *
 * The only entry point visible here is CsrMV(), which packs its arguments
 * into an SpmvParams bundle and forwards the work to DispatchSpmv.
 */
struct DeviceSpmv
{
    /******************************************************************/

    /**
     * \brief Performs the matrix-vector operation y = A*x for a matrix A
     *        described by separate value / row-offset / column-index arrays.
     *
     * All arguments are copied into an SpmvParams<ValueT, int> bundle and the
     * call is handed to DispatchSpmv<ValueT, int>::Dispatch; its return value
     * is returned unchanged.
     *
     * NOTE(review): the temp-storage arguments are forwarded untouched.  They
     * presumably follow the usual "query size first, then run" convention of
     * the dispatch layer -- confirm against DispatchSpmv::Dispatch.
     *
     * \tparam ValueT  Matrix and vector element type.
     */
    template <typename ValueT>
    CUB_RUNTIME_FUNCTION
    static cudaError_t CsrMV(
        void*               d_temp_storage,                 ///< [in] Temporary storage pointer, forwarded to the dispatch layer
        size_t&             temp_storage_bytes,             ///< [in,out] Size in bytes of \p d_temp_storage, forwarded by reference to the dispatch layer
        ValueT*             d_values,                       ///< [in] Pointer to the array of \p num_nonzeros values of the nonzero elements of matrix A
        int*                d_row_offsets,                  ///< [in] Pointer to the row-offset array; the element after the first is used as the start of the row-end offsets
        int*                d_column_indices,               ///< [in] Pointer to the column-index array (presumably one entry per nonzero -- confirm against SpmvParams)
        ValueT*             d_vector_x,                     ///< [in] Pointer to the dense input vector x
        ValueT*             d_vector_y,                     ///< [out] Pointer to the dense output vector y
        int                 num_rows,                       ///< [in] Number of rows of matrix A
        int                 num_cols,                       ///< [in] Number of columns of matrix A
        int                 num_nonzeros,                   ///< [in] Number of nonzero elements of matrix A
        cudaStream_t        stream              = 0,        ///< [in] Stream handed to the dispatch layer; defaults to stream 0
        bool                debug_synchronous   = false)    ///< [in] Debug flag handed to the dispatch layer; defaults to false
    {
        typedef SpmvParams<ValueT, int>     ParamsT;
        typedef DispatchSpmv<ValueT, int>   DispatchT;

        ParamsT params;

        // Problem dimensions.
        params.num_rows             = num_rows;
        params.num_cols             = num_cols;
        params.num_nonzeros         = num_nonzeros;

        // Matrix storage.  The dispatch layer works on row *end* offsets, so
        // it is given the caller's offset array advanced by one element.
        params.d_values             = d_values;
        params.d_column_indices     = d_column_indices;
        params.d_row_end_offsets    = d_row_offsets + 1;

        // Dense input and output vectors.
        params.d_vector_x           = d_vector_x;
        params.d_vector_y           = d_vector_y;

        // Fixed scaling factors (presumably selecting the plain y = A*x
        // product -- confirm against the SpmvParams field documentation).
        params.alpha                = 1.0;
        params.beta                 = 0.0;

        cudaError_t status = DispatchT::Dispatch(
            d_temp_storage,
            temp_storage_bytes,
            params,
            stream,
            debug_synchronous);

        return status;
    }
};


}               // CUB namespace

CUB_NS_POSTFIX  // Optional outer namespace(s)


dispatch_spmv_orig.cuh

cub
Optional outer namespace(s)
Definition agent_histogram.cuh:48

cub::spmv_params
OffsetT spmv_params
[in] SpMV input parameter bundle
Definition dispatch_spmv_orig.cuh:159

cub::num_rows
ArrayWrapper< int, NUM_ACTIVE_CHANNELS > ArrayWrapper< int, NUM_ACTIVE_CHANNELS > ArrayWrapper< CounterT *, NUM_ACTIVE_CHANNELS > ArrayWrapper< CounterT *, NUM_ACTIVE_CHANNELS > ArrayWrapper< OutputDecodeOpT, NUM_ACTIVE_CHANNELS > ArrayWrapper< PrivatizedDecodeOpT, NUM_ACTIVE_CHANNELS > OffsetT OffsetT num_rows
The number of rows in the region of interest.
Definition dispatch_histogram.cuh:109

cub::DeviceSpmv
DeviceSpmv provides device-wide parallel operations for performing sparse-matrix * dense-vector multiplication (SpMV).
Definition device_spmv.cuh:71

cub::DeviceSpmv::CsrMV
static CUB_RUNTIME_FUNCTION cudaError_t CsrMV(void *d_temp_storage, size_t &temp_storage_bytes, ValueT *d_values, int *d_row_offsets, int *d_column_indices, ValueT *d_vector_x, ValueT *d_vector_y, int num_rows, int num_cols, int num_nonzeros, cudaStream_t stream=0, bool debug_synchronous=false)
This function performs the matrix-vector operation y = A*x.
Definition device_spmv.cuh:132

cub::DispatchSpmv::Dispatch
CUB_RUNTIME_FUNCTION static __forceinline__ cudaError_t Dispatch(void *d_temp_storage, size_t &temp_storage_bytes, SpmvParamsT &spmv_params, cudaStream_t stream, bool debug_synchronous, Spmv1ColKernelT spmv_1col_kernel, SpmvSearchKernelT spmv_search_kernel, SpmvKernelT spmv_kernel, SegmentFixupKernelT segment_fixup_kernel, KernelConfig spmv_config, KernelConfig segment_fixup_config)
Function type of cub::DeviceSegmentFixupKernelT
Definition dispatch_spmv_orig.cuh:578

cub::SpmvParams
Signed integer type for sequence offsets
Definition agent_spmv_orig.cuh:100

cub::SpmvParams::d_values
ValueT * d_values
Pointer to the array of num_nonzeros values of the corresponding nonzero elements of matrix A.
Definition agent_spmv_orig.cuh:101