blob: a7bcd4e48f9c6e181053b04a5a98716a832b1901 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
|
#include <iostream>
#include "file1.h"
#include "file2.h"
// Symbol-visibility helpers for building/consuming shared libraries.
// When _WIN32 is defined, EXPORT/IMPORT expand to the MSVC-style
// __declspec(dllexport)/__declspec(dllimport) attributes; otherwise both
// expand to nothing.
#ifdef _WIN32
#define EXPORT __declspec(dllexport)
#define IMPORT __declspec(dllimport)
#else
#define EXPORT
#define IMPORT
#endif
// Device-side functions used by the kernel in this file. Only declared here;
// their definitions are not visible in this file (presumably they live in
// other translation units and are resolved at device link time — confirm
// against the build setup).
result_type __device__ file1_func(int x);
result_type_dynamic __device__ file2_func(int x);
// Host function declared with IMPORT, i.e. __declspec(dllimport) on _WIN32
// and no attribute elsewhere. Its definition is not visible in this file.
IMPORT void __host__ cuda_dynamic_lib_func();
// Kernel: stores file1_func(x) into *r and also calls file2_func(x).
//
// r must point to device-accessible memory. The kernel does no thread
// indexing, so every launched thread writes the same *r; it is launched as
// <<<1,1>>> by mixed_launch_kernel below. No shared memory is used.
static
__global__
void mixed_kernel(result_type* r, int x)
{
  *r = file1_func(x);
  // The value returned by file2_func is not used; the call is kept so the
  // kernel still references file2_func exactly as before.
  result_type_dynamic rd = file2_func(x);
  (void)rd; // silence the unused-variable warning
}

// Host entry point: calls cuda_dynamic_lib_func(), runs mixed_kernel on a
// single thread and returns the `sum` member of the result it produced.
//
// Parameters:
//   x - value forwarded to the kernel.
// Returns:
//   r.sum computed on the device on success; x if any CUDA call fails (a
//   diagnostic is written to std::cerr in that case).
//
// The result is produced in device memory and copied back to the host: a
// kernel cannot safely write through a reference/pointer to a host stack
// variable.
// NOTE(review): the byte-wise cudaMemcpy assumes result_type (declared
// outside this file) is trivially copyable — confirm.
EXPORT int mixed_launch_kernel(int x)
{
  cuda_dynamic_lib_func();

  // Device-side storage for the kernel's output.
  result_type* d_r = 0;
  cudaError_t err =
    cudaMalloc(reinterpret_cast<void**>(&d_r), sizeof(result_type));
  if(err != cudaSuccess)
  {
    std::cerr << "mixed_kernel [ALLOC] failed: "
              << cudaGetErrorString(err) << std::endl;
    return x;
  }

  mixed_kernel <<<1,1>>> (d_r, x);

  // Launch-time (synchronous) errors, e.g. an invalid configuration.
  err = cudaGetLastError();
  if(err != cudaSuccess)
  {
    std::cerr << "mixed_kernel [SYNC] failed: "
              << cudaGetErrorString(err) << std::endl;
    (void)cudaFree(d_r); // best-effort cleanup on the error path
    return x;
  }

  // Execution-time (asynchronous) errors surface at the next sync point.
  err = cudaDeviceSynchronize();
  if(err != cudaSuccess)
  {
    // Report the error returned by the synchronize call itself.
    std::cerr << "mixed_kernel [ASYNC] failed: "
              << cudaGetErrorString(err) << std::endl;
    (void)cudaFree(d_r); // best-effort cleanup on the error path
    return x;
  }

  // Bring the result back to the host before reading it.
  result_type r;
  err = cudaMemcpy(&r, d_r, sizeof(result_type), cudaMemcpyDeviceToHost);
  (void)cudaFree(d_r); // the device buffer is no longer needed either way
  if(err != cudaSuccess)
  {
    std::cerr << "mixed_kernel [COPY] failed: "
              << cudaGetErrorString(err) << std::endl;
    return x;
  }

  return r.sum;
}
|