-
Notifications
You must be signed in to change notification settings - Fork 9
/
rad.cpp
114 lines (100 loc) · 3.31 KB
/
rad.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
#include "sph/sph_sha2.h"
#include "miner.h"
#include "cuda_helper.h"
extern void rad_cpu_init(int thr_id);
extern void rad_cpu_hash(int thr_id, uint32_t threads, uint32_t startNounce, const uint64_t *const data, uint32_t *const h_nounce);
extern void rad_midstate(const uint32_t *data, uint32_t *midstate);
void rad_hash(uint32_t *output, const uint32_t *data, uint32_t nonce)
{
uint32_t header[20];
for (int i = 0; i < 20; i++) {
header[i] = swab32(data[i]);
}
header[19] = swab32(nonce);
sph_sha512_context ctx;
sph_sha512_256_init(&ctx);
sph_sha512(&ctx, header, 80);
uint32_t hash1[16];
sph_sha512_close(&ctx, hash1);
uint32_t hash2[16];
sph_sha512_256_init(&ctx);
sph_sha512(&ctx, hash1, 32);
sph_sha512_close(&ctx, hash2);
for (int i = 0; i < 8; i++) {
output[i] = hash2[i];
}
}
int scanhash_rad(int thr_id, uint32_t *pdata,
uint32_t *ptarget, uint32_t max_nonce,
uint32_t *hashes_done)
{
static THREAD uint32_t *h_nounce = nullptr;
const uint32_t first_nonce = pdata[19];
uint32_t throughputmax = device_intensity(device_map[thr_id], __func__, 1U << 28);
uint32_t throughput = min(throughputmax, (max_nonce - first_nonce)) & 0xfffffc00;
if (opt_benchmark)
ptarget[7] = 0x0005;
static THREAD volatile bool init = false;
if(!init)
{
if(throughputmax == 1<<28)
applog(LOG_INFO, "GPU #%d: using default intensity 28", device_map[thr_id]);
CUDA_SAFE_CALL(cudaSetDevice(device_map[thr_id]));
CUDA_SAFE_CALL(cudaDeviceReset());
CUDA_SAFE_CALL(cudaSetDeviceFlags(cudaschedule));
CUDA_SAFE_CALL(cudaDeviceSetCacheConfig(cudaFuncCachePreferL1));
CUDA_SAFE_CALL(cudaStreamCreate(&gpustream[thr_id]));
rad_cpu_init(thr_id);
CUDA_SAFE_CALL(cudaMallocHost(&h_nounce, 2 * sizeof(uint32_t)));
mining_has_stopped[thr_id] = false;
init = true;
}
do
{
rad_cpu_hash(thr_id, throughput, pdata[19], (uint64_t *)pdata, h_nounce);
if(stop_mining) {mining_has_stopped[thr_id] = true; cudaStreamDestroy(gpustream[thr_id]); pthread_exit(nullptr);}
if(h_nounce[0] != UINT32_MAX)
{
uint32_t vhash64[8]={0};
rad_hash(vhash64, pdata, h_nounce[0]);
if (!opt_verify || (vhash64[7] == 0 && fulltest(vhash64, ptarget)))
{
int res = 1;
// check if there was some other ones...
*hashes_done = pdata[19] - first_nonce + throughput;
if (h_nounce[1] != 0xffffffff)
{
rad_hash(vhash64, pdata, h_nounce[1]);
if (!opt_verify || (vhash64[7] == 0 && fulltest(vhash64, ptarget)))
{
pdata[21] = h_nounce[1];
res++;
if (opt_benchmark)
applog(LOG_INFO, "GPU #%d Found second nounce %08x", device_map[thr_id], h_nounce[1]);
}
else
{
if (vhash64[7] > 0)
{
applog(LOG_WARNING, "GPU #%d: result for %08x does not validate on CPU!", device_map[thr_id], h_nounce[1]);
}
}
}
pdata[19] = h_nounce[0];
if (opt_benchmark)
applog(LOG_INFO, "GPU #%d Found nounce %08x", device_map[thr_id], h_nounce[0]);
return res;
}
else
{
if (vhash64[7] > 0)
{
applog(LOG_WARNING, "GPU #%d: result for %08x does not validate on CPU!", device_map[thr_id], h_nounce[0]);
}
}
}
pdata[19] += throughput; CUDA_SAFE_CALL(cudaGetLastError());
} while (!work_restart[thr_id].restart && ((uint64_t)max_nonce > ((uint64_t)(pdata[19]) + (uint64_t)throughput)));
*hashes_done = pdata[19] - first_nonce ;
return 0;
}