亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频

? 歡迎來到蟲蟲下載站! | ?? 資源下載 ?? 資源專輯 ?? 關于我們
? 蟲蟲下載站

?? marsscan.cu

?? GPU實現的MapReduce framework,對于學習并行編程和cuda平臺的編程方面有著極好的參考價值
?? CU
?? 第 1 頁 / 共 2 頁
字號(hào):
/*
 * Copyright 1993-2006 NVIDIA Corporation.  All rights reserved.
 *
 * NOTICE TO USER:   
 *
 * This source code is subject to NVIDIA ownership rights under U.S. and 
 * international Copyright laws.  
 * 
 * NVIDIA MAKES NO REPRESENTATION ABOUT THE SUITABILITY OF THIS SOURCE 
 * CODE FOR ANY PURPOSE.  IT IS PROVIDED "AS IS" WITHOUT EXPRESS OR 
 * IMPLIED WARRANTY OF ANY KIND.  NVIDIA DISCLAIMS ALL WARRANTIES WITH 
 * REGARD TO THIS SOURCE CODE, INCLUDING ALL IMPLIED WARRANTIES OF 
 * MERCHANTABILITY, NONINFRINGEMENT, AND FITNESS FOR A PARTICULAR PURPOSE.   
 * IN NO EVENT SHALL NVIDIA BE LIABLE FOR ANY SPECIAL, INDIRECT, INCIDENTAL, 
 * OR CONSEQUENTIAL DAMAGES, OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS 
 * OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE 
 * OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE 
 * OR PERFORMANCE OF THIS SOURCE CODE.  
 *
 * U.S. Government End Users.  This source code is a "commercial item" as 
 * that term is defined at 48 C.F.R. 2.101 (OCT 1995), consisting  of 
 * "commercial computer software" and "commercial computer software 
 * documentation" as such terms are used in 48 C.F.R. 12.212 (SEPT 1995) 
 * and is provided to the U.S. Government only as a commercial end item.  
 * Consistent with 48 C.F.R.12.212 and 48 C.F.R. 227.7202-1 through 
 * 227.7202-4 (JUNE 1995), all U.S. Government End Users acquire the 
 * source code with only those rights set forth herein.
 */

#include "MarsInc.h"
#include "MarsInc/MarsConfig.h"

// Define this to more rigorously avoid bank conflicts, 
// even at the lower (root) levels of the tree
// Note that due to the higher addressing overhead, performance 
// is lower with ZERO_BANK_CONFLICTS enabled.  It is provided
// as an example.
//#define ZERO_BANK_CONFLICTS 

// 16 banks on G80
#define NUM_BANKS 16
#define LOG_NUM_BANKS 4

// CONFLICT_FREE_OFFSET(index) yields the number of padding elements to add to
// a logical shared-memory index:
//   - default:              index / NUM_BANKS
//   - ZERO_BANK_CONFLICTS:  index / NUM_BANKS + index / (NUM_BANKS * NUM_BANKS)
//
// Each shift is parenthesized explicitly because binary '+' binds tighter
// than '>>'; without the inner parentheses the two-term form would be parsed
// as ((index) >> (LOG_NUM_BANKS + (index))) >> (2*LOG_NUM_BANKS).
//
// NOTE(review): with ZERO_BANK_CONFLICTS defined, the shared-memory buffer
// must hold n + n/NUM_BANKS + n/(NUM_BANKS*NUM_BANKS) elements; the launch
// code that sizes it is not visible here -- confirm before enabling.
#ifdef ZERO_BANK_CONFLICTS
#define CONFLICT_FREE_OFFSET(index) \
    (((index) >> LOG_NUM_BANKS) + ((index) >> (2 * LOG_NUM_BANKS)))
#else
#define CONFLICT_FREE_OFFSET(index) ((index) >> LOG_NUM_BANKS)
#endif

///////////////////////////////////////////////////////////////////////////////
// Work-efficient compute implementation of scan, one thread per 2 elements
// Work-efficient: O(log(n)) steps, and O(n) adds.
// Also shared storage efficient: Uses n + n/NUM_BANKS shared memory -- no ping-ponging
// Also avoids most bank conflicts using single-element offsets every NUM_BANKS elements.
//
// In addition, if ZERO_BANK_CONFLICTS is defined, uses
//     n + n/NUM_BANKS + n/(NUM_BANKS*NUM_BANKS)
// elements of shared memory, and avoids ALL bank conflicts by using
// single-element offsets every NUM_BANKS elements, plus additional single-element offsets
// after every NUM_BANKS^2 elements.
//
// Uses a balanced tree type algorithm.  See Blelloch, 1990 "Prefix Sums 
// and Their Applications", or Prins and Chatterjee PRAM course notes:
// http://www.cs.unc.edu/~prins/Classes/203/Handouts/pram.pdf
// 
// This work-efficient version is based on the algorithm presented in Guy Blelloch's
// excellent paper "Prefix sums and their applications".
// http://www-2.cs.cmu.edu/afs/cs.cmu.edu/project/scandal/public/papers/CMU-CS-90-190.html
//
// Pro: Work Efficient, very few bank conflicts (or zero if ZERO_BANK_CONFLICTS is defined)
// Con: More instructions to compute bank-conflict-free shared memory addressing,
// and slightly more shared memory storage used.
//

// Copies this thread's two input elements from g_idata into the padded
// s_data buffer and reports the indices it used back to the caller.
//
//   s_data       destination buffer (padded with CONFLICT_FREE_OFFSET)
//   g_idata      source array
//   n            element count used to bound the second element when isNP2
//   baseIndex    offset into g_idata of this block's first element
//   ai, bi       [out] logical buffer indices: threadIdx.x and
//                threadIdx.x + blockDim.x
//   mem_ai/bi    [out] matching indices into g_idata
//   bankOffsetA/B[out] padding added to ai / bi when addressing s_data
//
// When isNP2 is true, a second element whose logical index is >= n is
// stored as 0 instead of being read from g_idata. The first element is
// always read without a bounds check.
template <bool isNP2>
__device__ void loadSharedChunkFromMem(int *s_data,
                                       const int *g_idata, 
                                       int n, int baseIndex,
                                       int& ai, int& bi, 
                                       int& mem_ai, int& mem_bi, 
                                       int& bankOffsetA, int& bankOffsetB)
{
    const unsigned int tid       = threadIdx.x;
    const unsigned int halfWidth = blockDim.x;

    // logical positions of this thread's two elements inside the block
    ai = tid;
    bi = tid + halfWidth;

    // positions of the same two elements in the input array
    mem_ai = baseIndex + tid;
    mem_bi = mem_ai + halfWidth;

    // padding that spreads accesses across banks
    bankOffsetA = CONFLICT_FREE_OFFSET(ai);
    bankOffsetB = CONFLICT_FREE_OFFSET(bi);

    // first element: always loaded
    s_data[ai + bankOffsetA] = g_idata[mem_ai];

    // second element: zero-padded past n in the non-power-of-two case
    // (isNP2 is a template argument, so the test folds at compile time)
    int secondValue = 0;
    if (!isNP2 || bi < n)
    {
        secondValue = g_idata[mem_bi];
    }
    s_data[bi + bankOffsetB] = secondValue;
}

// Writes this thread's two elements from the padded s_data buffer back to
// g_odata, using the indices and bank offsets computed at load time.
//
//   g_odata      destination array
//   s_data       padded source buffer
//   n            element count used to bound the second write when isNP2
//   ai, bi       logical buffer indices of the two elements
//   mem_ai/bi    matching indices into g_odata
//   bankOffsetA/B padding to add to ai / bi when addressing s_data
//
// When isNP2 is true the second element is written only if bi < n; the
// first element is always written.
template <bool isNP2>
__device__ void storeSharedChunkToMem(int* g_odata, 
                                      const int* s_data,
                                      int n, 
                                      int ai, int bi, 
                                      int mem_ai, int mem_bi,
                                      int bankOffsetA, int bankOffsetB)
{
    // block-wide barrier before any thread reads s_data
    __syncthreads();

    g_odata[mem_ai] = s_data[ai + bankOffsetA];

    // isNP2 is a template argument, so this reduces to a plain bounds test
    // (or to "always") at compile time
    const bool writeSecond = !isNP2 || (bi < n);
    if (writeSecond)
    {
        g_odata[mem_bi] = s_data[bi + bankOffsetB];
    }
}

// Thread 0 only: optionally saves the last element of the block's buffer
// (logical index 2*blockDim.x - 1, which the original comment calls the
// block's total sum) into g_blockSums[blockIndex], then overwrites that
// element with 0. All other threads do nothing.
//
//   s_data       padded per-block buffer
//   g_blockSums  destination for the saved value; touched only if storeSum
//   blockIndex   slot of g_blockSums to write
template <bool storeSum>
__device__ void clearLastElement(int* s_data, 
                                 int *g_blockSums, 
                                 int blockIndex)
{
    if (threadIdx.x != 0)
    {
        return;
    }

    // padded position of the final element of the block
    const int lastLogical = (blockDim.x << 1) - 1;
    const int lastSlot    = lastLogical + CONFLICT_FREE_OFFSET(lastLogical);

    if (storeSum) // resolved at compile time
    {
        g_blockSums[blockIndex] = s_data[lastSlot];
    }

    // zero the final element so the following down-sweep propagates it
    // back toward the front
    s_data[lastSlot] = 0;
}



// Up-sweep phase: accumulates partial sums in place, level by level.
// At each level the number of active threads halves (starting at
// blockDim.x) while the distance between the paired elements doubles
// (starting at 1). Every thread of the block must call this function,
// because each level begins with __syncthreads().
//
// Returns the stride value left after the final level; the caller passes
// it on to scanRootToLeaves.
__device__ unsigned int buildSum(int *s_data)
{
    const unsigned int tid = threadIdx.x;
    unsigned int span = 1;

    int active = blockDim.x;
    while (active > 0)
    {
        // make the previous level's writes visible to the whole block
        __syncthreads();

        if (tid < active)
        {
            // logical indices of the pair handled by this thread
            const int left  = __mul24(__mul24(2, span), tid) + span - 1;
            const int right = left + span;

            // apply bank-conflict padding
            const int src = left  + CONFLICT_FREE_OFFSET(left);
            const int dst = right + CONFLICT_FREE_OFFSET(right);

            s_data[dst] += s_data[src];
        }

        span <<= 1;
        active >>= 1;
    }

    return span;
}

// Down-sweep phase: walks the levels in the opposite order to buildSum.
// The number of active threads doubles each level (1, 2, ..., blockDim.x)
// while stride is halved before each level. For every pair, the lower
// element receives the upper element's value and the upper element
// receives the sum of both. Every thread of the block must call this
// function, because each level contains a __syncthreads().
//
//   s_data  padded per-block buffer, modified in place
//   stride  starting stride; prescanBlock passes the value returned by
//           buildSum
__device__ void scanRootToLeaves(int *s_data, unsigned int stride)
{
    const unsigned int tid = threadIdx.x;

    int active = 1;
    while (active <= blockDim.x)
    {
        stride >>= 1;

        // wait for the previous level to finish
        __syncthreads();

        if (tid < active)
        {
            // logical indices of the pair handled by this thread
            const int left  = __mul24(__mul24(2, stride), tid) + stride - 1;
            const int right = left + stride;

            // apply bank-conflict padding
            const int lo = left  + CONFLICT_FREE_OFFSET(left);
            const int hi = right + CONFLICT_FREE_OFFSET(right);

            // lower slot takes the upper value; upper slot takes the sum
            const int carried = s_data[lo];
            s_data[lo] = s_data[hi];
            s_data[hi] += carried;
        }

        active *= 2;
    }
}

// Runs the three in-place stages on one block's buffer: the up-sweep
// (buildSum), saving/zeroing of the last element (clearLastElement), and
// the down-sweep (scanRootToLeaves).
//
//   data        padded per-block buffer
//   blockIndex  slot of blockSums to write; a value of 0 selects
//               blockIdx.x instead
//   blockSums   receives the block total when storeSum is true
template <bool storeSum>
__device__ void prescanBlock(int *data, int blockIndex, int *blockSums)
{
    // blockIndex == 0 means "use this block's own index"
    const int sumSlot = (blockIndex == 0) ? blockIdx.x : blockIndex;

    // up-sweep: build the sums in place up the tree
    const unsigned int topStride = buildSum(data);

    // save (optionally) and clear the root
    clearLastElement<storeSum>(data, blockSums, sumSlot);

    // down-sweep: traverse back down the tree to produce the scan
    scanRootToLeaves(data, topStride);
}

// Kernel: each block loads 2*blockDim.x elements (two per thread) into
// dynamically sized shared memory, scans them in place, and writes the
// result out.
//
//   g_odata      output array
//   g_idata      input array
//   g_blockSums  per-block totals; written only when storeSum is true
//   n            element count used for bounds handling when isNP2 is true
//   blockIndex   slot of g_blockSums to use; 0 selects blockIdx.x
//   baseIndex    offset of this block's first element; 0 selects
//                blockIdx.x * 2 * blockDim.x
//
// The launch must supply enough dynamic shared memory for the padded
// buffer (see CONFLICT_FREE_OFFSET).
template <bool storeSum, bool isNP2>
__global__ void prescan(int *g_odata, 
                        const int *g_idata, 
                        int *g_blockSums, 
                        int n, 
                        int blockIndex, 
                        int baseIndex)
{
    extern __shared__ int s_data[];

    // filled in by the load step and reused unchanged by the store step
    int ai, bi;
    int mem_ai, mem_bi;
    int bankOffsetA, bankOffsetB;

    // baseIndex == 0 means "derive the offset from the block index"
    int chunkBase;
    if (baseIndex == 0)
    {
        chunkBase = __mul24(blockIdx.x, (blockDim.x << 1));
    }
    else
    {
        chunkBase = baseIndex;
    }

    // stage 1: global -> shared
    loadSharedChunkFromMem<isNP2>(s_data, g_idata, n, chunkBase,
                                  ai, bi, mem_ai, mem_bi,
                                  bankOffsetA, bankOffsetB);

    // stage 2: scan the block in shared memory
    prescanBlock<storeSum>(s_data, blockIndex, g_blockSums);

    // stage 3: shared -> global
    storeSharedChunkToMem<isNP2>(g_odata, s_data, n,
                                 ai, bi, mem_ai, mem_bi,
                                 bankOffsetA, bankOffsetB);
}


__global__ void uniformAdd(int *g_data, 
                           int *uniforms, 
                           int n, 
                           int blockOffset, 
                           int baseIndex)
{
    __shared__ int uni;
    if (threadIdx.x == 0)
        uni = uniforms[blockIdx.x + blockOffset];
    

?? 快捷鍵說明

復制代碼 Ctrl + C
搜索代碼 Ctrl + F
全屏模式 F11
切換主題 Ctrl + Shift + D
顯示快捷鍵 ?
增大字號(hào) Ctrl + =
減小字號(hào) Ctrl + -
亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频
亚洲精品日韩专区silk| 免费一级欧美片在线观看| 欧美日韩成人在线| 国产精品亚洲午夜一区二区三区 | va亚洲va日韩不卡在线观看| 亚洲大片在线观看| 国产精品你懂的在线欣赏| 欧美成人猛片aaaaaaa| 欧美在线视频全部完| 国产精品1024| 日韩成人精品在线| 亚洲自拍偷拍网站| 中文av一区二区| 久久精品视频在线看| 5566中文字幕一区二区电影| 日本久久精品电影| 成人av资源站| 国产一区二区精品久久| 爽好久久久欧美精品| 夜夜嗨av一区二区三区网页| 亚洲欧洲日韩在线| 欧美激情资源网| 久久―日本道色综合久久| 日韩免费高清av| 日韩一区二区影院| 欧美一区二区三区在线视频| 欧美日韩免费不卡视频一区二区三区| 成人免费高清在线| 国产精品一区二区久久精品爱涩| 捆绑调教美女网站视频一区| 日日夜夜免费精品| 日韩精品电影一区亚洲| 亚洲妇熟xx妇色黄| 亚洲成在线观看| 亚洲va欧美va天堂v国产综合| 亚洲欧洲日韩综合一区二区| 亚洲欧洲精品一区二区三区| 欧美—级在线免费片| 国产免费久久精品| 中文字幕一区二区三区四区不卡| 国产精品丝袜91| 国产精品传媒在线| 亚洲日本成人在线观看| 亚洲欧美二区三区| 一区二区三区在线不卡| 亚洲一区二区高清| 亚洲成人你懂的| 日本va欧美va欧美va精品| 另类中文字幕网| 国产成a人无v码亚洲福利| 丁香婷婷综合网| 97成人超碰视| 欧美在线一二三| 欧美一区二区三区喷汁尤物| 精品国产伦一区二区三区观看方式 | 午夜国产精品一区| 丝袜美腿成人在线| 国产一区二区精品久久99| 成人h动漫精品一区二| 色婷婷亚洲综合| 欧美日韩成人激情| 亚洲精品一区二区三区香蕉| 国产色91在线| 亚洲综合无码一区二区| 日韩精品每日更新| 国产在线视视频有精品| av在线播放一区二区三区| 欧美影视一区在线| 精品成人一区二区三区四区| 国产精品久久久久四虎| 亚洲综合网站在线观看| 久草在线在线精品观看| 国产不卡免费视频| 欧美日韩日本视频| 久久久久久久免费视频了| 亚洲欧美视频在线观看| 人人狠狠综合久久亚洲| 成人国产一区二区三区精品| 欧美亚洲综合网| 欧美精品一区二区三区久久久| 国产精品毛片久久久久久| 亚洲成av人片在线| 粉嫩aⅴ一区二区三区四区| 欧美日韩亚洲综合在线 欧美亚洲特黄一级 | 久久久精品人体av艺术| 亚洲综合丁香婷婷六月香| 久久99国产精品久久99| 91视频免费观看| 欧美精品一区二区三区蜜臀 | 中文字幕一区日韩精品欧美| 日韩不卡免费视频| 99精品视频在线观看| 日韩一区二区中文字幕| 亚洲精品乱码久久久久久日本蜜臀| 麻豆精品久久久| 日本韩国一区二区三区视频| 日韩女优av电影| 亚洲自拍欧美精品| 成人理论电影网| 日韩小视频在线观看专区| 亚洲精品高清视频在线观看| 久久国产精品色婷婷| 欧美亚洲尤物久久| 国产精品福利一区| 国产在线播精品第三| 欧美久久久久久久久久| 国产精品二三区| 国产风韵犹存在线视精品| 日韩欧美亚洲国产精品字幕久久久| 亚洲欧美激情插| 成人黄页毛片网站| 久久网站最新地址| 青青草97国产精品免费观看| 色一区在线观看| 亚洲欧洲日韩在线| 成人看片黄a免费看在线| 久久综合国产精品| 免费美女久久99| 7777精品伊人久久久大香线蕉经典版下载 | 91精品国产入口在线| 亚洲激情自拍视频| eeuss鲁片一区二区三区在线看| 日韩精品中文字幕一区| 视频在线观看国产精品| 91黄色免费看| 亚洲人成网站在线| 成人97人人超碰人人99| 国产亚洲1区2区3区| 国产一区二区在线影院| 精品少妇一区二区| 毛片不卡一区二区| 精品美女被调教视频大全网站| 蜜桃av一区二区| 欧美成人a∨高清免费观看| 视频一区二区三区入口| 欧美日韩精品一区二区三区四区| 亚洲综合清纯丝袜自拍| 欧美三级三级三级爽爽爽| 亚洲成人1区2区| 91精品国产色综合久久不卡电影| 青青青伊人色综合久久| 日韩午夜小视频| 麻豆国产91在线播放| 欧美不卡一区二区三区| 黄页视频在线91| 久久久久国产成人精品亚洲午夜| 国产成人av电影免费在线观看| 亚洲国产高清在线观看视频| 不卡一区中文字幕| 夜夜嗨av一区二区三区四季av| 欧美日韩成人在线| 激情文学综合网| 国产午夜精品久久久久久免费视| 成人av综合在线| 亚洲一区二区三区爽爽爽爽爽| 久久97超碰色| 国产精品久久久久影院亚瑟| 色哟哟精品一区| 日韩不卡免费视频| 国产色综合久久| 色激情天天射综合网| 天天操天天色综合| 欧美变态tickling挠脚心| 高清成人免费视频| 亚洲区小说区图片区qvod| 
欧美人动与zoxxxx乱| 国内成人免费视频| 1024成人网| 日韩视频免费直播| 成人理论电影网| 亚洲成a人片综合在线| 精品国产伦一区二区三区观看方式| 成人午夜免费视频| 亚洲午夜精品一区二区三区他趣| 精品美女一区二区| 91国产福利在线| 激情五月播播久久久精品| 亚洲日韩欧美一区二区在线| 欧美人伦禁忌dvd放荡欲情| 国产精品自拍毛片| 亚洲国产精品欧美一二99| 久久久噜噜噜久久中文字幕色伊伊 | 亚洲欧美偷拍另类a∨色屁股| 欧美一区二区三区不卡| 成人精品电影在线观看| 午夜精品久久久久久久久久| 日本一区二区三区免费乱视频| 欧美视频在线观看一区二区| 国产精品主播直播| 午夜视频一区在线观看| 日本一区二区成人在线| 91麻豆精品国产91久久久久久久久 | 精品欧美一区二区在线观看| 91丨porny丨国产入口| 久久99国产精品麻豆| 一区二区三区在线观看视频| 国产日韩精品一区二区三区| 欧美高清视频在线高清观看mv色露露十八| 国产精品一区专区| 日本最新不卡在线|