《GPU高性能编程CUDA实战》附录三关于book.h

▶ 本书中用到的公用函数放到了头文件book.h中

 #ifndef __BOOK_H__

 #define __BOOK_H__

 #include <stdio.h>

 #include <stdlib.h>         // 自己加的

 #include "cuda_runtime.h"   // 自己加的

 static void HandleError( cudaError_t err, const char *file, int line )//定义报错函数，通过传入的返回值和文件名、行号来提示信息

 {

     if (err != cudaSuccess)

     {

         printf( "%s in %s at line %d\n", cudaGetErrorString( err ),file, line );

         exit( EXIT_FAILURE );

     }

 }

 #define HANDLE_ERROR( err ) (HandleError( err, __FILE__, __LINE__ ))// 将报错函数包装为宏，自动填塞文件名和行号

 #define HANDLE_NULL( a )/* 空指针报错函数，代码中malloc失败时报错 */              \

 {                                                                             \

     if (a == NULL)                                                            \

     {                                                                         \

         printf( "Host memory failed in %s at line %d\n", __FILE__, __LINE__ );\

         exit(EXIT_FAILURE);                                                   \

     }                                                                         \

 }

 template< typename T >// 泛型交换（全书都没用到？）

 void swap( T& a, T& b )

 {

     T t = a;

     a = b;

     b = t;

 }

 void* big_random_block( int size )//在主机中生成随机数组，无符号字符型

 {

     unsigned char *data = (unsigned char*)malloc( size );

     HANDLE_NULL( data );

     for (int i = ; i < size; data[i] = rand(), i++);

     return data;

 }

 int* big_random_block_int( int size )//在主机中生成随机数组，整型

 {

     int *data = (int*)malloc( size * sizeof(int) );

     HANDLE_NULL( data );

     for (int i = ; i < size; data[i] = rand(), i++);

     return data;

 }

 // 公用设备函数

 __device__ unsigned char value(float n1, float n2, int hue)

 {

     if (hue > )

         hue -= ;

     else if (hue < )

         hue += ;

     if (hue < )

         return (unsigned char)( * (n1 + (n2 - n1)*hue / ));

     if (hue < )

         return (unsigned char)( * n2);

     if (hue < )

         return (unsigned char)( * (n1 + (n2 - n1)*( - hue) / ));

     return (unsigned char)( * n1);

 }

 __global__ void float_to_color(unsigned char *optr, const float *outSrc)

 {

     int x = threadIdx.x + blockIdx.x * blockDim.x;

     int y = threadIdx.y + blockIdx.y * blockDim.y;

     int offset = x + y * blockDim.x * gridDim.x;

     float l = outSrc[offset];

     float s = ;

     int h = ( + (int)(360.0f * outSrc[offset])) % ;

     float m1, m2;

     if (l <= 0.5f)

         m2 = l * ( + s);

     else

         m2 = l + s - l * s;

     m1 =  * l - m2; 

     optr[offset *  + ] = value(m1, m2, h + );

     optr[offset *  + ] = value(m1, m2, h);

     optr[offset *  + ] = value(m1, m2, h - );

     optr[offset *  + ] = ;

 }

 __global__ void float_to_color( uchar4 *optr,const float *outSrc )

 {

     int x = threadIdx.x + blockIdx.x * blockDim.x;

     int y = threadIdx.y + blockIdx.y * blockDim.y;

     int offset = x + y * blockDim.x * gridDim.x;

     float l = outSrc[offset];

     float s = ;

     int h = ( + (int)(360.0f * outSrc[offset])) % ;

     float m1, m2;

     if (l <= 0.5f)

         m2 = l * ( + s);

     else

         m2 = l + s - l * s;

     m1 =  * l - m2;

     optr[offset].x = value(m1, m2, h + );

     optr[offset].y = value(m1, m2, h);

     optr[offset].z = value(m1, m2, h - );

     optr[offset].w = ;

 }

 // 有关线程的设置

 #if _WIN32

     //Windows threads.

     #include <windows.h>

     typedef HANDLE CUTThread;// 统一包装

     typedef unsigned (WINAPI *CUT_THREADROUTINE)(void *);

     #define CUT_THREADPROC unsigned WINAPI

     #define  CUT_THREADEND return 0

 #else

     //POSIX threads.

     #include <pthread.h>

     typedef pthread_t CUTThread;

     typedef void *(*CUT_THREADROUTINE)(void *);

     #define CUT_THREADPROC void

     #define  CUT_THREADEND

 #endif

 // 线程的创造，单线程结束，单线程销毁和多线程等待

 CUTThread start_thread( CUT_THREADROUTINE, void *data );

 void end_thread( CUTThread thread );

 void destroy_thread( CUTThread thread );

 void wait_for_threads( const CUTThread *threads, int num );

 #if _WIN32

     CUTThread start_thread(CUT_THREADROUTINE func, void *data)

     {

         return CreateThread(NULL, , (LPTHREAD_START_ROUTINE)func, data, , NULL);

     }

     void end_thread(CUTThread thread)

     {

         WaitForSingleObject(thread, INFINITE);

         CloseHandle(thread);

     }

     void destroy_thread( CUTThread thread )

     {

         TerminateThread(thread, );

         CloseHandle(thread);

     }

     void wait_for_threads(const CUTThread * threads, int num){

         WaitForMultipleObjects(num, threads, true, INFINITE);

         for(int i = ; i < num; i++)

             CloseHandle(threads[i]);

     }

 #else

     CUTThread start_thread(CUT_THREADROUTINE func, void * data)

     {

         pthread_t thread;

         pthread_create(&thread, NULL, func, data);

         return thread;

     }

     void end_thread(CUTThread thread)

     {

         pthread_join(thread, NULL);

     }

     void destroy_thread( CUTThread thread )

     {

         pthread_cancel(thread);

     }

     void wait_for_threads(const CUTThread * threads, int num)

     {

         for(int i = ; i < num; i++)

             end_thread( threads[i] );

     }

 #endif

 #endif  // __BOOK_H__

《GPU高性能编程CUDA实战》附录三关于book.h的更多相关文章

[问题解决]《GPU高性能编程CUDA实战》中第4章Julia实例“显示器驱动已停止响应，并且已恢复”问题的解决方法
以下问题的出现及解决都基于"WIN7+CUDA7.5". 问题描述:当我编译运行<GPU高性能编程CUDA实战>中第4章所给Julia实例代码时,出现了显示器闪动的现象 ...
《GPU高性能编程CUDA实战》附录二散列表
▶ 使用CPU和GPU分别实现散列表 ● CPU方法 #include <stdio.h> #include <time.h> #include "cuda_runt ...
《GPU高性能编程CUDA实战》第三章 CUDA设备相关
▶ 这章介绍了与CUDA设备相关的参数,并给出了了若干用于查询参数的函数. ● 代码(已合并) #include <stdio.h> #include "cuda_runtime ...
《GPU高性能编程CUDA实战》附录四其他头文件
▶ cpu_bitmap.h #ifndef __CPU_BITMAP_H__ #define __CPU_BITMAP_H__ #include "gl_helper.h" st ...
《GPU高性能编程CUDA实战》附录一高级原子操作
▶ 本章介绍了手动实现原子操作.重构了第五章向量点积的过程.核心是通过定义结构Lock及其运算,实现锁定,读写,解锁的过程. ● 章节代码 #include <stdio.h> #incl ...
《GPU高性能编程CUDA实战》第五章线程并行
▶ 本章介绍了线程并行,并给出四个例子.长向量加法.波纹效果.点积和显示位图. ● 长向量加法(线程块并行 + 线程并行) #include <stdio.h> #include &quo ...
《GPU高性能编程CUDA实战》第十一章多GPU系统的CUDA C
▶ 本章介绍了多设备胸膛下的 CUDA 编程,以及一些特殊存储类型对计算速度的影响 ● 显存和零拷贝内存的拷贝与计算对比 #include <stdio.h> #include " ...
《GPU高性能编程CUDA实战》第四章简单的线程块并行
▶ 本章介绍了线程块并行,并给出两个例子:长向量加法和绘制julia集. ● 长向量加法,中规中矩的GPU加法,包含申请内存和显存,赋值,显存传入,计算,显存传出,处理结果,清理内存和显存.用到了 t ...
《GPU高性能编程CUDA实战》第八章图形互操作性
▶ OpenGL与DirectX,等待填坑. ● basic_interop #include <stdio.h> #include "cuda_runtime.h" ...

随机推荐

51Nod1526 分配笔名
分析在trie树上贪心,将所有串加入trie树中,在深度较深的地方匹配会更优. 由于只需要知道最后的总质量,所以直接取每个点的子树中最大的匹配即可复杂度$O(\sum len)$ 加串的时候把 ...
Ubuntu配置操作总结
一.fstab和mtab的区别 /etc/fstab:是开机自动挂载的配置文件,在开机时起作用.相当于启动linux的时候,自动使用检查分区的fsck命令和挂载分区的mount命令,检查分区和挂载分区 ...
构建一个dbt 数据库适配器
脚手架新的适配器首先,将odbc适配器模板复制到同一目录中的新文件. 更新dbt / adapters / factory.py以将新适配器包含为类型.还要将类型添加到dbt / contracts ...
hasura graphql server event trigger 试用
hasura graphql server 是一个很不错的graphql 引擎,当前版本已经支持event triiger 了使用此功能我们可以方便的集成webhook功能,实现灵活,稳定,快捷的消 ...
smarty学习——内建函数部分
Smarty自带一些内建函数. 内建函数是模板语言的一部分. 用户不能创建名称和内建函数一样的自定义函数,也不能修改内建函数. 一.包含的内建函数 {$var=...}{append}{assign} ...
【转】每天一个linux命令（35）：ln 命令
原文网址:http://www.cnblogs.com/peida/archive/2012/12/11/2812294.html ln是linux中又一个非常重要命令,它的功能是为某一个文件在另外一 ...
poj 2096 Collecting Bugs && ZOJ 3329 One Person Game && hdu 4035 Maze——期望DP
poj 2096 题目:http://poj.org/problem?id=2096 f[ i ][ j ] 表示收集了 i 个 n 的那个. j 个 s 的那个的期望步数. #include< ...
java数组变量
数组变量是一种引用类型的变量,能够指向数组对象.数组对象存储在堆内存中,当数组变量为局部变量时存储在栈内存中. int[] p = new int[]{5, 6, 7, 8, 9}; p是数组变量,指 ...
【python】class之类的内建函数
【python】常用的一些内置函数
1.cmp cmp(A,B)函数,比较A,B的大小,如果A大于B,返回1,A小于B返回-1,A等于B返回0 print cmp(12,33) >>>-1 print cmp(&quo ...

《GPU高性能编程CUDA实战》附录三 关于book.h

《GPU高性能编程CUDA实战》附录三 关于book.h的更多相关文章

随机推荐

热门专题

《GPU高性能编程CUDA实战》附录三关于book.h

《GPU高性能编程CUDA实战》附录三关于book.h的更多相关文章