亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频

? 歡迎來到蟲蟲下載站! | ?? 資源下載 ?? 資源專輯 ?? 關于我們
? 蟲蟲下載站

?? marsgpulib.cu

?? GPU實現的MapReduce framework,對于學習并行編程和cuda平臺的編程方面有著極好的參考價值
?? CU
?? 第 1 頁 / 共 2 頁
字號:
/**
 *This is the source code for Mars, a MapReduce framework on graphics
 *processors.
 *Author: Wenbin Fang (HKUST), Bingsheng He (HKUST)
 *Mentor: Naga K. Govindaraju (Microsoft Corp.), Qiong Luo (HKUST), Tuyong
 *Wang (Sina.com).
 *If you have any question on the code, please contact us at {saven,
 *wenbin, luo}@cse.ust.hk.
 *The copyright is held by HKUST. Mars is provided "as is" without any 
 *guarantees of any kind.
 */
 
#undef __CPU_MAP__
#undef __CPU_REDUCE__
#undef __COMPARE__
#define __GPU_MAP__
#define __GPU_REDUCE__
#include "MarsInc.h"
#include "MarsInc/MarsConfig.h"
#include "MarsGPUEmit.cu"

//------------------------------------------------------
// Resolve the address of one record's key or value.
//
// buf         : base pointer the computed offset is applied to
// offsetSizes : per-record int4 entries; .x is read when a key is
//               requested and .z when a value is requested
// index       : which entry of offsetSizes to use
// type        : 0 selects the key offset (.x); any other value selects
//               the value offset (.z)
// keyOffset   : subtracted from .x before it is applied to buf
// valOffset   : subtracted from .z before it is applied to buf
// returns     : buf advanced by the adjusted offset
//------------------------------------------------------
__device__ char *gpuGetRecordFromBuf(char *buf,
			int4 *offsetSizes, int index, char type,
			size_t keyOffset, size_t valOffset)
{
	const int4 *entry = &offsetSizes[index];

	// The subtraction is carried out in size_t and then narrowed to int.
	int relative;
	if (type == 0)
		relative = entry->x - keyOffset;
	else
		relative = entry->z - valOffset;

	return &buf[relative];
}
 
//------------------------------------------------------
// Copy data inside a gpu kernel function.
//
// des  : destination buffer; must have room for `size` bytes
// src  : source buffer; must hold at least `size` bytes
// size : number of BYTES to copy (not a count of char4 elements)
//
// Exactly `size` bytes are written. The copy goes through char
// pointers on purpose: assigning whole char4 elements would write in
// units of 4 bytes (running past the end of des whenever size is not a
// multiple of 4) and would require both pointers to be 4-byte aligned.
//------------------------------------------------------
__device__ void copyData(char4 *des, char4 *src, size_t size)
{
	char *pDes = (char*)des;
	const char *pSrc = (const char*)src;

	// size_t index so that large sizes are not truncated
	for (size_t i = 0; i < size; i++)
		pDes[i] = pSrc[i];
}

//------------------------------------------------------
// Return a pointer to the i-th value of a run of values.
//
// vals          : base pointer of the run
// index         : int4 entries; only the .z field is read here
// valStartIndex : entry of `index` that corresponds to the start of vals
// valCount      : number of values in the run
// i             : position inside the run, 0-based
// returns       : vals advanced by the difference between the .z field
//                 of entry (valStartIndex + i) and that of entry
//                 valStartIndex, or NULL when i >= valCount
//------------------------------------------------------
__device__ char *gpuGetVal(void *vals, int4 *index, size_t valStartIndex,
				size_t valCount, size_t i)
{
	if (i < valCount)
	{
		const int4 *first = index + valStartIndex;
		char *base = (char*)vals;
		return base + first[i].z - first[0].z;
	}

	return NULL;
}
 
//------------------------------------------------------
// Return the size of the i-th value of a run of values.
//
// vals          : unused; kept so the signature parallels gpuGetVal
// index         : int4 entries; only the .w field is read here
// valStartIndex : entry of `index` that corresponds to the first value
// valCount      : number of values in the run
// i             : position inside the run, 0-based
// returns       : the .w field of entry (valStartIndex + i), or 0 when
//                 i >= valCount
//------------------------------------------------------
__device__ size_t gpuGetValSize(void *vals, int4 *index, size_t valStartIndex,
				size_t valCount, size_t i)
{
	// The return type is an integer, so report "no such value" as 0
	// rather than the pointer constant NULL.
	if (i >= valCount) return 0;
	return index[valStartIndex+i].w;
}
//----------------------------------------------------
// Account for one intermediate key/value pair emitted by the calling
// thread.
// NOTE(review): presumably called from the user-supplied gpu_map_count
// during the counting pass -- confirm against the caller.
//
// keySize              : added to the thread's entry of interKeysSizePerTask
// valSize              : added to the thread's entry of interValsSizePerTask
// interKeysSizePerTask : per-thread key byte totals
// interValsSizePerTask : per-thread value byte totals
// interCountPerTask    : per-thread record counts (incremented by one)
//
// The entry used is blockIdx.x * blockDim.x + threadIdx.x. The arrays
// are only accumulated into, never initialised, by this function.
//----------------------------------------------------
__device__ void gpuEmitInterCount(size_t	keySize,
						       size_t	valSize,
						       size_t*	interKeysSizePerTask,
						       size_t*	interValsSizePerTask,
						       size_t*	interCountPerTask)
{
	const size_t slot = (blockIdx.x * blockDim.x + threadIdx.x);

	interCountPerTask[slot] += 1;
	interKeysSizePerTask[slot] += keySize;
	interValsSizePerTask[slot] += valSize;
}

//-------------------------------------------------------
// gpu kernel function, called by StartGPUMap
//
// Counting pass of the map stage: for every input record assigned to
// the calling thread, gpu_map_count is invoked with the record's key,
// value and their sizes plus the three per-thread accumulator arrays.
//
// inputKeys / inputVals  : input key and value buffers
// inputOffsetSizes       : per-record int4; .x/.z are used as key/value
//                          offsets (via gpuGetRecordFromBuf), .y/.w are
//                          passed on as key/value sizes
// interKeysSizePerTask,
// interValsSizePerTask,
// interCountPerTask      : forwarded untouched to gpu_map_count
// recordNum              : total number of input records
// recordsPerTask         : the loop runs recordsPerTask + 1 times at most;
//                          the extra pass picks up leftover records
// taskNum                : distance between two consecutive records of
//                          the same thread
// keyOffset / valOffset  : forwarded to gpuGetRecordFromBuf
//
// A thread with flat index t visits records t, t + taskNum,
// t + 2*taskNum, ... and stops at the first one that is >= recordNum.
//-------------------------------------------------------
__global__ void gpuMapCount(char*	inputKeys,
			char*	inputVals,
			int4*	inputOffsetSizes,
			size_t*	interKeysSizePerTask,
			size_t*	interValsSizePerTask,
			size_t*	interCountPerTask,
			size_t recordNum, 
			size_t recordsPerTask,
			size_t taskNum,
			size_t keyOffset,
			size_t valOffset)
{
	const size_t tid = (blockIdx.x * blockDim.x + threadIdx.x);

	int pass = 0;
	while (pass <= recordsPerTask)
	{
		// record handled by this thread in the current pass
		const int rec = pass*taskNum+tid;
		if (rec >= recordNum) return;

		int4 *entry = &inputOffsetSizes[rec];

		char *key = gpuGetRecordFromBuf(inputKeys,
			inputOffsetSizes, rec, 0, keyOffset, valOffset);
		char *val = gpuGetRecordFromBuf(inputVals,
			inputOffsetSizes, rec, 1, keyOffset, valOffset);

		gpu_map_count(key,
				  val,
				  entry->y,
				  entry->w,
				  interKeysSizePerTask,
				  interValsSizePerTask,
				  interCountPerTask);

		pass++;
	}
}
 
//-------------------------------------------------------
// gpu kernel function, called by StartGPUMap
//
// Emitting pass of the map stage: for every input record assigned to
// the calling thread, gpu_map is invoked with the record's key, value
// and their sizes plus the output buffers and per-thread bookkeeping.
//
// inputKeys / inputVals : input key and value buffers
// inputOffsetSizes      : per-record int4; .x/.z are used as key/value
//                         offsets (via gpuGetRecordFromBuf), .y/.w are
//                         passed on as key/value sizes
// psKeySizes, psValSizes,
// psCounts              : per-thread entries; StartGPUMap fills them
//                         with the results of prefexSum over the
//                         per-thread totals of the counting pass
// keyValOffsets,
// curIndex              : per-thread scratch, forwarded to gpu_map and
//                         not accessed here
// interKeys / interVals : output key and value buffers
// interOffsetSizes      : output per-record int4 entries
// recordNum             : total number of input records
// recordsPerTask        : the loop runs recordsPerTask + 1 times at most;
//                         the extra pass picks up leftover records
// taskNum               : distance between two consecutive records of
//                         the same thread
// keyOffset / valOffset : forwarded to gpuGetRecordFromBuf
//-------------------------------------------------------
__global__ void gpuMap(char*	inputKeys,
					   char*	inputVals,
					   int4*	inputOffsetSizes,
					   size_t*	psKeySizes,
					   size_t*	psValSizes,
					   size_t*	psCounts,
					   int2*	keyValOffsets,
					   char*	interKeys,
					   char*	interVals,
					   int4*	interOffsetSizes,
					   size_t*	curIndex,
					   size_t	recordNum, 
					   size_t	recordsPerTask,
					   size_t	taskNum,
					   size_t	keyOffset,
					   size_t	valOffset)
{
	size_t index = (blockIdx.x * blockDim.x + threadIdx.x);

	// A thread whose first record (== index) is already past the end has
	// nothing to map and therefore emits nothing. It must not seed an
	// output slot: for such a thread psCounts[index] is expected to be
	// the total number of emitted records (assuming prefexSum yields a
	// running sum of the per-thread counts -- TODO confirm), i.e. one
	// past the last element of interOffsetSizes.
	// NOTE(review): a thread that does own records but emits none for
	// all of them can still hit the same slot; guarding that case needs
	// the per-thread count or the total, neither of which is passed in.
	if (index >= recordNum) return;

	// Seed this thread's first output entry with its starting key and
	// value offsets.
	interOffsetSizes[psCounts[index]].x = psKeySizes[index];
	interOffsetSizes[psCounts[index]].z = psValSizes[index];

	for (int i = 0; i <= recordsPerTask; i++)
	{
		int cindex = i*taskNum+index;
		if (cindex >= recordNum) return;
		char *key = gpuGetRecordFromBuf(inputKeys, 
			inputOffsetSizes, cindex, 0, keyOffset, valOffset);
		char *val = gpuGetRecordFromBuf(inputVals, 
			inputOffsetSizes, cindex, 1, keyOffset, valOffset);
		
		gpu_map(key,
			val,
			inputOffsetSizes[cindex].y,
			inputOffsetSizes[cindex].w,
			psKeySizes,
			psValSizes,
			psCounts,
			keyValOffsets,
			interKeys,
			interVals,
			interOffsetSizes,
			curIndex);
	}	
}

//----------------------------------------------------
// Mark sched->outputSmallChunk as holding no records, so that a map run
// which produces nothing does not leave the description of an earlier
// chunk behind.
//----------------------------------------------------
static void clearGPUMapOutput(Schedule_t *sched)
{
	sched->outputSmallChunk.keys = NULL;
	sched->outputSmallChunk.vals = NULL;
	sched->outputSmallChunk.index = NULL;
	sched->outputSmallChunk.keySize = 0;
	sched->outputSmallChunk.valSize = 0;
	sched->outputSmallChunk.indexSize = 0;
	sched->outputSmallChunk.rangeSize = 0;
	sched->outputSmallChunk.recCount = 0;
}

//----------------------------------------------------
// main gpu map procedure
//
// sched : schedule whose inputSmallChunk is mapped and whose
//         outputSmallChunk receives the result
// mode  : not used by this function
//
// Steps:
//   1. upload the input chunk (keys, vals, index) to the device
//   2. run gpuMapCount to obtain per-thread key bytes, value bytes and
//      record counts
//   3. run prefexSum over each of the three arrays; its return value is
//      used as the total (buffer size / record count)
//   4. allocate the intermediate buffers and run gpuMap
//   5. describe the intermediate buffers in sched->outputSmallChunk
//
// On return outputSmallChunk.keys/vals/index are the pointers obtained
// from D_MALLOC in step 4; they are not released here. When the input
// is empty or the map emits no record, outputSmallChunk is reset to an
// empty chunk (NULL pointers, zero sizes).
//----------------------------------------------------
void StartGPUMap(Schedule_t *sched, char mode)
{
	BEN_ASSERT(sched != NULL);

	//-------------------------------------------------------
	//get map input data (must be the small chunk)
	//-------------------------------------------------------
	size_t	inputRecCount = sched->inputSmallChunk.recCount;
	size_t	inputKeySize = sched->inputSmallChunk.keySize;
	size_t	inputValSize = sched->inputSmallChunk.valSize;
	size_t	inputKeyOffset = sched->inputSmallChunk.keyOffset;
	size_t	inputValOffset = sched->inputSmallChunk.valOffset;

	if (inputRecCount == 0)
	{
		clearGPUMapOutput(sched);
		return;
	}

	char *inputKeys = sched->inputSmallChunk.keys;
	char *inputVals = sched->inputSmallChunk.vals;
	int4 *inputIndex = sched->inputSmallChunk.index;

	//----------------------------------------------
	//determine the number of threads to run
	//----------------------------------------------
	size_t mapGridDim = sched->gpuMapGridDim;
	size_t mapBlockDim = sched->gpuMapBlockDim;
	size_t sharedMemSize = sched->gpuMapSharedMemSize;
	size_t threadNum = sched->gpuMapGridDim*sched->gpuMapBlockDim;

	// threadNum is used as a divisor and as the launch size
	BEN_ASSERT(threadNum > 0);

	// Rounded down; the kernels run one extra pass to pick up the
	// remainder and stop at the first record index >= inputRecCount.
	size_t recPerThread = inputRecCount / threadNum;
	if (0 == recPerThread)
		recPerThread = 1;

	//-------------------------------------------------------
	//upload map input data onto device memory
	//-------------------------------------------------------
	char*	d_inputKeys = D_MALLOC(inputKeySize);
	D_MEMCPY_H2D(d_inputKeys, inputKeys, inputKeySize);

	char*	d_inputVals = D_MALLOC(inputValSize);
	D_MEMCPY_H2D(d_inputVals, inputVals, inputValSize);

	int4*	d_inputIndex = (int4*)D_MALLOC(sizeof(int4)*inputRecCount);
	D_MEMCPY_H2D(d_inputIndex, inputIndex, sizeof(int4)*inputRecCount);

	//----------------------------------------------
	//calculate intermediate data keys' buf size 
	//	 and values' buf size
	//----------------------------------------------
	// NOTE(review): gpuEmitInterCount only accumulates into these
	// arrays, so they must start out zeroed -- presumably D_MALLOC
	// clears the allocation; confirm.
	size_t*	d_interKeySizePerThread = (size_t*)D_MALLOC(sizeof(size_t)*threadNum);
	size_t*	d_interValSizePerThread = (size_t*)D_MALLOC(sizeof(size_t)*threadNum);
	size_t*	d_interCountPerThread = (size_t*)D_MALLOC(sizeof(size_t)*threadNum);

	gpuMapCount<<<mapGridDim, mapBlockDim, sharedMemSize>>>(d_inputKeys,
					   d_inputVals,
					   d_inputIndex,
					   d_interKeySizePerThread,
					   d_interValSizePerThread,
					   d_interCountPerThread,
					   inputRecCount, 
					   recPerThread,
					   threadNum,
					   inputKeyOffset,
					   inputValOffset);

	//----------------------------------------------
	//do prefix sum
	//----------------------------------------------
	// NOTE(review): the size_t arrays are handed to prefexSum as int*.
	// That is only layout-compatible when sizeof(size_t) == sizeof(int);
	// confirm for the target build.
	size_t *d_psKeySizes = (size_t*)D_MALLOC(sizeof(size_t)*threadNum);
	size_t allKeySize = prefexSum((int*)d_interKeySizePerThread, (int*)d_psKeySizes, threadNum);

	size_t *d_psValSizes = (size_t*)D_MALLOC(sizeof(size_t)*threadNum);
	size_t allValSize = prefexSum((int*)d_interValSizePerThread, (int*)d_psValSizes, threadNum);

	size_t *d_psCounts = (size_t*)D_MALLOC(sizeof(size_t)*threadNum);
	size_t allCounts = prefexSum((int*)d_interCountPerThread, (int*)d_psCounts, threadNum);

	if (allCounts > 0)
	{
		//-----------------------------------------------
		//allocate intermediate memory on device memory
		//-----------------------------------------------
		char*	d_interKeys = D_MALLOC(allKeySize);
		char*	d_interVals = D_MALLOC(allValSize);
		int4*	d_interIndex = (int4*)D_MALLOC(sizeof(int4)*allCounts);

		//--------------------------------------------------
		// start map
		//--------------------------------------------------
		int2*	d_keyValOffsets = (int2*)D_MALLOC(sizeof(int2)*threadNum);
		size_t*	d_curIndex = (size_t*)D_MALLOC(sizeof(size_t)*threadNum);

		gpuMap<<<mapGridDim, mapBlockDim, sharedMemSize>>>(d_inputKeys,
						  d_inputVals,
						  d_inputIndex,
						  d_psKeySizes,
						  d_psValSizes,
						  d_psCounts,
						  d_keyValOffsets,
						  d_interKeys,
						  d_interVals,
						  d_interIndex,
						  d_curIndex,
						  inputRecCount, 
						  recPerThread,
						  threadNum,
						  inputKeyOffset,
						  inputValOffset);

		// Hand the intermediate buffers over to the schedule; they are
		// deliberately not freed in this function.
		sched->outputSmallChunk.keys = d_interKeys;
		sched->outputSmallChunk.vals = d_interVals;
		sched->outputSmallChunk.index = d_interIndex;
		sched->outputSmallChunk.keySize = allKeySize;
		sched->outputSmallChunk.valSize = allValSize;
		sched->outputSmallChunk.indexSize = allCounts*sizeof(int4);
		sched->outputSmallChunk.rangeSize = 0;
		sched->outputSmallChunk.recCount = allCounts;

		// Scratch buffers exist only on this path, so release them here
		// and never pass an unallocated pointer/size pair to D_FREE.
		D_FREE(d_keyValOffsets, sizeof(int2)*threadNum);
		D_FREE(d_curIndex, sizeof(size_t)*threadNum);
	}
	else
	{
		// Nothing was emitted: publish an empty chunk instead of
		// leaving whatever an earlier run stored there.
		clearGPUMapOutput(sched);
	}

	//---------------------------------------------
	//clean
	//---------------------------------------------
	D_FREE(d_interKeySizePerThread, sizeof(size_t)*threadNum);
	D_FREE(d_interValSizePerThread, sizeof(size_t)*threadNum);
	D_FREE(d_interCountPerThread, sizeof(size_t)*threadNum);

	D_FREE(d_inputKeys, inputKeySize);
	D_FREE(d_inputVals, inputValSize);
	D_FREE(d_inputIndex, sizeof(int4)*inputRecCount);

	D_FREE(d_psKeySizes, sizeof(size_t)*threadNum);
	D_FREE(d_psValSizes, sizeof(size_t)*threadNum);
	D_FREE(d_psCounts, sizeof(size_t)*threadNum);
}
 
//----------------------------------------------------
// Move the records described by sched->outputSmallChunk into host
// memory and, if requested, sort and group them on the CPU.
//
// sched : schedule whose outputSmallChunk is processed. Its keys, vals
//         and index pointers are used as the source of D_MEMCPY_D2H and
//         are released with D_FREE at the end; on return the chunk
//         points at freshly BenMalloc'ed copies instead.
// mode  : when MAP_SORT or MAP_SORT_REDUCE is set, QuickSortMem and
//         GroupByMem are run on the chunk and rangeSize is set to
//         diffKeyCount * sizeof(int2); when USE_FILE is set as well,
//         keyOffset is reset to 0 before sorting.
//----------------------------------------------------
void StartGPUSort_cpu(Schedule_t *sched, char mode)
{
	const size_t keyBytes = sched->outputSmallChunk.keySize;
	const size_t valBytes = sched->outputSmallChunk.valSize;
	const size_t recCount = sched->outputSmallChunk.recCount;
	const size_t indexBytes = sizeof(int4)*recCount;

	// remember the buffers being copied from so they can be released later
	char *devKeys = sched->outputSmallChunk.keys;
	char *devVals = sched->outputSmallChunk.vals;
	int4 *devIndex = (int4*)sched->outputSmallChunk.index;

	// keys
	char *hostKeys = (char*)BenMalloc(keyBytes);
	D_MEMCPY_D2H(hostKeys, devKeys, keyBytes);
	sched->outputSmallChunk.keys = hostKeys;

	// values
	char *hostVals = (char*)BenMalloc(valBytes);
	D_MEMCPY_D2H(hostVals, devVals, valBytes);
	sched->outputSmallChunk.vals = hostVals;

	// index
	int4 *hostIndex = (int4*)BenMalloc(indexBytes);
	D_MEMCPY_D2H(hostIndex, devIndex, indexBytes);
	sched->outputSmallChunk.index = hostIndex;

	const bool sortRequested = (mode & MAP_SORT) || (mode & MAP_SORT_REDUCE);
	if (sortRequested)
	{
		if (mode & USE_FILE)
		{
			sched->outputSmallChunk.keyOffset = 0;
		}

		QuickSortMem(&sched->outputSmallChunk);
		GroupByMem(&sched->outputSmallChunk);
		sched->outputSmallChunk.rangeSize = sched->outputSmallChunk.diffKeyCount*sizeof(int2);
	}

	// the source buffers are no longer referenced by the chunk
	D_FREE(devKeys, keyBytes);
	D_FREE(devVals, valBytes);
	D_FREE(devIndex, indexBytes);
}

?? 快捷鍵說明

復制代碼 Ctrl + C
搜索代碼 Ctrl + F
全屏模式 F11
切換主題 Ctrl + Shift + D
顯示快捷鍵 ?
增大字號 Ctrl + =
減小字號 Ctrl + -
亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频
欧美一级片在线| 欧美精品一级二级三级| 亚洲免费观看在线视频| 日韩写真欧美这视频| 99精品视频中文字幕| 日韩国产欧美视频| 亚洲视频在线观看三级| 日韩一区二区免费在线电影 | 樱花影视一区二区| 亚洲精品在线网站| 欧美高清www午色夜在线视频| 国产成人免费视频网站| 久色婷婷小香蕉久久| 亚洲一区精品在线| 国产精品久久久久久久久免费相片 | 日韩免费观看高清完整版| 91亚洲大成网污www| 国产一区二区美女| 欧美aaaaa成人免费观看视频| 亚洲免费在线视频一区 二区| 精品免费一区二区三区| 91精品国产综合久久福利| 色av一区二区| 99在线精品一区二区三区| 国产二区国产一区在线观看| 免费高清在线视频一区·| 亚洲成人动漫av| 亚洲国产精品久久人人爱蜜臀| 成人免费在线视频观看| 国产精品国产三级国产a| 国产亚洲欧美色| 久久免费视频色| 久久免费的精品国产v∧| 欧美v亚洲v综合ⅴ国产v| 日韩欧美一区二区视频| 91精品国产免费久久综合| 欧美丰满一区二区免费视频| 欧美日韩一区二区三区在线 | 一区二区不卡在线播放| 亚洲女爱视频在线| 亚洲欧美日韩在线播放| 国产精品卡一卡二卡三| 中文字幕一区二区三区在线观看 | 99精品国产99久久久久久白柏| 国产白丝精品91爽爽久久 | 欧美日韩免费观看一区三区| 在线观看国产91| 欧美体内she精高潮| 欧美三级电影精品| 欧美三级三级三级爽爽爽| 在线成人小视频| 精品污污网站免费看| 欧美另类变人与禽xxxxx| 欧美一级午夜免费电影| 久久综合色婷婷| 久久精品日韩一区二区三区| 国产精品私人影院| |精品福利一区二区三区| 一区二区三区国产| 性做久久久久久| 国内精品久久久久影院一蜜桃| 国产成人精品午夜视频免费| 99视频一区二区三区| 在线欧美小视频| 日韩精品一区二区三区中文不卡| 久久久久久麻豆| 日韩伦理av电影| 亚洲国产日韩一级| 久久成人综合网| 成人免费视频视频| 欧美日本不卡视频| 久久综合久久鬼色中文字| 日韩毛片精品高清免费| 人人精品人人爱| 国产成人精品免费视频网站| 日本精品一区二区三区四区的功能| 欧美色老头old∨ideo| 久久青草国产手机看片福利盒子 | 麻豆精品精品国产自在97香蕉 | 粗大黑人巨茎大战欧美成人| 91日韩精品一区| 日韩你懂的在线观看| 国产精品卡一卡二卡三| 日本中文在线一区| 成人美女在线观看| 在线播放日韩导航| 国产精品精品国产色婷婷| 青青草国产精品97视觉盛宴| 成人免费视频app| 欧美一区二区三区色| 日韩一区在线播放| 免费成人美女在线观看| 91在线视频网址| 欧美va亚洲va| 一区二区视频在线看| 国产在线播放一区二区三区| 欧美亚洲国产一卡| 国产日韩欧美精品在线| 青青草一区二区三区| 欧洲精品视频在线观看| 国产欧美视频一区二区三区| 视频一区二区三区中文字幕| av一区二区三区黑人| 欧美精品一区二区三区高清aⅴ| 亚洲精品成人少妇| 成人性视频网站| 精品国产a毛片| 天天综合日日夜夜精品| 成人av电影在线| 2024国产精品| 麻豆中文一区二区| 欧美午夜寂寞影院| 成人欧美一区二区三区黑人麻豆| 国产综合色视频| 日韩三级电影网址| 亚洲国产视频一区| 一本色道久久综合亚洲aⅴ蜜桃| 久久婷婷久久一区二区三区| 日韩不卡免费视频| 欧美日韩精品欧美日韩精品一综合| 中文字幕五月欧美| 国产成人av影院| 久久午夜国产精品| 国内精品免费在线观看| 精品免费视频一区二区| 麻豆传媒一区二区三区| 欧美老肥妇做.爰bbww视频| 亚洲午夜视频在线| 欧美色老头old∨ideo| 亚洲午夜av在线| 欧美日韩精品久久久| 一区二区三区 在线观看视频| 99re这里只有精品视频首页| 国产精品伦一区二区三级视频| 国产一区二区三区四| 久久久久久久精| 国产高清不卡一区二区| 久久久精品人体av艺术| 国产69精品久久久久毛片| 中文字幕av一区二区三区| 粉嫩嫩av羞羞动漫久久久| 国产精品青草综合久久久久99| 国产精品18久久久| 中文字幕欧美三区| 色综合久久六月婷婷中文字幕| 国产精品久久久久久久久久久免费看| 成人永久免费视频| 亚洲三级在线免费观看| 欧美综合一区二区| 婷婷中文字幕综合| 日韩精品专区在线| 精品午夜一区二区三区在线观看 | 最新久久zyz资源站| 91网站最新网址| 亚洲午夜私人影院| 欧美成人三级电影在线| 国产精品一区二区视频| 中文字幕欧美一| 欧美性xxxxxxxx| 精品一区二区久久| 中文字幕中文字幕在线一区| 欧美图片一区二区三区| 久久精品国产一区二区三| 欧美精彩视频一区二区三区| 
91免费看`日韩一区二区| 午夜精品福利久久久| 精品久久99ma| 99国产精品99久久久久久| 丝袜诱惑亚洲看片| 久久久精品tv| 在线视频中文字幕一区二区| 蜜桃一区二区三区在线| 国产精品久久久久久亚洲毛片| 欧美亚州韩日在线看免费版国语版| 欧美aaaaaa午夜精品| 国产精品嫩草久久久久| 在线不卡a资源高清| 成人午夜精品一区二区三区| 亚洲美女电影在线| 欧美不卡视频一区| 91麻豆国产自产在线观看| 日韩成人免费电影| 成人欧美一区二区三区黑人麻豆 | 国产欧美一区二区精品性| 色综合久久综合网欧美综合网| 日韩精品91亚洲二区在线观看| 国产亚洲成aⅴ人片在线观看| 欧美伊人久久久久久久久影院 | 国产精品久久免费看| 欧美精品日韩一区| 国产成人小视频| 青草国产精品久久久久久| 亚洲视频中文字幕| 久久久午夜精品| 欧美日韩国产乱码电影| 丁香亚洲综合激情啪啪综合| 天天av天天翘天天综合网色鬼国产| 中文字幕免费观看一区| 日韩一区二区影院| 欧美日韩一卡二卡三卡|