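Improve and modularize compile-time CPU detection: miner.h now defines WANT_SSE2_4WAY when __SSE2__ is set, and the 4-way SSE2 code paths test that macro instead of testing __SSE2__ directly. Ideally, we should move this detection to autoconf.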
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104
diff --git a/cpu-miner.c b/cpu-miner.c
index abe2a21..f7dc37b 100644
--- a/cpu-miner.c
+++ b/cpu-miner.c
@@ -37,8 +37,8 @@ enum {
};
enum sha256_algos {
- ALGO_C,
- ALGO_4WAY
+ ALGO_C, /* plain C */
+ ALGO_4WAY, /* parallel SSE2 */
};
static bool opt_debug;
@@ -63,7 +63,7 @@ static struct option_help options_help[] = {
{ "algo XXX",
"(-a XXX) Specify sha256 implementation:\n"
"\tc\t\tLinux kernel sha256, implemented in C (default)"
-#ifdef __SSE2__
+#ifdef WANT_SSE2_4WAY
"\n\t4way\t\ttcatm's 4-way SSE2 implementation (EXPERIMENTAL)"
#endif
},
@@ -301,18 +301,23 @@ static void *miner_thread(void *thr_id_int)
gettimeofday(&tv_start, NULL);
/* scan nonces for a proof-of-work hash */
- if (opt_algo == ALGO_C)
+ switch (opt_algo) {
+ case ALGO_C:
rc = scanhash(work.midstate, work.data + 64,
work.hash1, work.hash, &hashes_done);
-#ifdef __SSE2__
- else {
+ break;
+
+#ifdef WANT_SSE2_4WAY
+ case ALGO_4WAY: {
unsigned int rc4 =
ScanHash_4WaySSE2(work.midstate, work.data + 64,
work.hash1, work.hash,
&hashes_done);
rc = (rc4 == -1) ? false : true;
- }
+ }
+ break;
#endif
+ }
hashmeter(thr_id, &tv_start, hashes_done);
@@ -347,7 +352,7 @@ static void parse_arg (int key, char *arg)
case 'a':
if (!strcmp(arg, "c"))
opt_algo = ALGO_C;
-#ifdef __SSE2__
+#ifdef WANT_SSE2_4WAY
else if (!strcmp(arg, "4way"))
opt_algo = ALGO_4WAY;
#endif
diff --git a/miner.h b/miner.h
index 69c56a7..ff5bddc 100644
--- a/miner.h
+++ b/miner.h
@@ -4,6 +4,10 @@
#include <stdbool.h>
#include <jansson.h>
+#ifdef __SSE2__
+#define WANT_SSE2_4WAY 1
+#endif
+
#ifndef ARRAY_SIZE
#define ARRAY_SIZE(arr) (sizeof(arr) / sizeof((arr)[0]))
#endif
diff --git a/sha256_4way.c b/sha256_4way.c
index ae30f76..3fe3114 100644
--- a/sha256_4way.c
+++ b/sha256_4way.c
@@ -4,14 +4,15 @@
// tcatm's 4-way 128-bit SSE2 SHA-256
-#ifdef __SSE2__
-
#include <string.h>
#include <assert.h>
#include <xmmintrin.h>
#include <stdint.h>
#include <stdio.h>
+#include "miner.h"
+
+#ifdef WANT_SSE2_4WAY
#define NPAR 32
@@ -467,4 +468,4 @@ static void DoubleBlockSHA256(const void* pin, void* pad, const void *pre, unsig
}
-#endif /* __SSE2__ */
+#endif /* WANT_SSE2_4WAY */