]> git.proxmox.com Git - ceph.git/blob - ceph/src/spdk/isa-l/examples/ec/ec_piggyback_example.c
eb2d374b9e0fd7d94c1f7f315639dd4c3af37530
[ceph.git] / ceph / src / spdk / isa-l / examples / ec / ec_piggyback_example.c
1 /**********************************************************************
2 Copyright(c) 2011-2018 Intel Corporation All rights reserved.
3
4 Redistribution and use in source and binary forms, with or without
5 modification, are permitted provided that the following conditions
6 are met:
7 * Redistributions of source code must retain the above copyright
8 notice, this list of conditions and the following disclaimer.
9 * Redistributions in binary form must reproduce the above copyright
10 notice, this list of conditions and the following disclaimer in
11 the documentation and/or other materials provided with the
12 distribution.
13 * Neither the name of Intel Corporation nor the names of its
14 contributors may be used to endorse or promote products derived
15 from this software without specific prior written permission.
16
17 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18 "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19 LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20 A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
21 OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
22 SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
23 LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24 DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25 THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26 (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
27 OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28 **********************************************************************/
29
30 #include <stdio.h>
31 #include <stdlib.h>
32 #include <string.h>
33 #include <getopt.h>
34 #include "erasure_code.h" // use <isa-l.h> instead when linking against installed
35 #include "test.h"
36
37 #define MMAX 255
38 #define KMAX 255
39
40 typedef unsigned char u8;
41 int verbose = 0;
42
43 int usage(void)
44 {
45 fprintf(stderr,
46 "Usage: ec_piggyback_example [options]\n"
47 " -h Help\n"
48 " -k <val> Number of source fragments\n"
49 " -p <val> Number of parity fragments\n"
50 " -l <val> Length of fragments\n"
51 " -e <val> Simulate erasure on frag index val. Zero based. Can be repeated.\n"
52 " -v Verbose\n"
53 " -b Run timed benchmark\n"
54 " -s Toggle use of sparse matrix opt\n"
55 " -r <seed> Pick random (k, p) with seed\n");
56 exit(0);
57 }
58
59 // Cauchy-based matrix
60 void gf_gen_full_pb_cauchy_matrix(u8 * a, int m, int k)
61 {
62 int i, j, p = m - k;
63
64 // Identity matrix in top k x k to indicate a symetric code
65 memset(a, 0, k * m);
66 for (i = 0; i < k; i++)
67 a[k * i + i] = 1;
68
69 for (i = k; i < (k + p / 2); i++) {
70 for (j = 0; j < k / 2; j++)
71 a[k * i + j] = gf_inv(i ^ j);
72 for (; j < k; j++)
73 a[k * i + j] = 0;
74 }
75 for (; i < m; i++) {
76 for (j = 0; j < k / 2; j++)
77 a[k * i + j] = 0;
78 for (; j < k; j++)
79 a[k * i + j] = gf_inv((i - p / 2) ^ (j - k / 2));
80 }
81
82 // Fill in mixture of B parity depending on a few localized A sources
83 int r = 0, c = 0;
84 int repeat_len = k / (p - 2);
85 int parity_rows = p / 2;
86
87 for (i = 1 + k + parity_rows; i < m; i++, r++) {
88 if (r == (parity_rows - 1) - ((k / 2 % (parity_rows - 1))))
89 repeat_len++;
90
91 for (j = 0; j < repeat_len; j++, c++)
92 a[k * i + c] = gf_inv((k + 1) ^ c);
93 }
94 }
95
96 // Vandermonde based matrix - not recommended due to limits when invertable
97 void gf_gen_full_pb_vand_matrix(u8 * a, int m, int k)
98 {
99 int i, j, p = m - k;
100 unsigned char q, gen = 1;
101
102 // Identity matrix in top k x k to indicate a symetric code
103 memset(a, 0, k * m);
104 for (i = 0; i < k; i++)
105 a[k * i + i] = 1;
106
107 for (i = k; i < (k + (p / 2)); i++) {
108 q = 1;
109 for (j = 0; j < k / 2; j++) {
110 a[k * i + j] = q;
111 q = gf_mul(q, gen);
112 }
113 for (; j < k; j++)
114 a[k * i + j] = 0;
115 gen = gf_mul(gen, 2);
116 }
117 gen = 1;
118 for (; i < m; i++) {
119 q = 1;
120 for (j = 0; j < k / 2; j++) {
121 a[k * i + j] = 0;
122 }
123 for (; j < k; j++) {
124 a[k * i + j] = q;
125 q = gf_mul(q, gen);
126 }
127 gen = gf_mul(gen, 2);
128 }
129
130 // Fill in mixture of B parity depending on a few localized A sources
131 int r = 0, c = 0;
132 int repeat_len = k / (p - 2);
133 int parity_rows = p / 2;
134
135 for (i = 1 + k + parity_rows; i < m; i++, r++) {
136 if (r == (parity_rows - 1) - ((k / 2 % (parity_rows - 1))))
137 repeat_len++;
138
139 for (j = 0; j < repeat_len; j++)
140 a[k * i + c++] = 1;
141 }
142 }
143
144 void print_matrix(int m, int k, unsigned char *s, const char *msg)
145 {
146 int i, j;
147
148 printf("%s:\n", msg);
149 for (i = 0; i < m; i++) {
150 printf("%3d- ", i);
151 for (j = 0; j < k; j++) {
152 printf(" %2x", 0xff & s[j + (i * k)]);
153 }
154 printf("\n");
155 }
156 printf("\n");
157 }
158
159 void print_list(int n, unsigned char *s, const char *msg)
160 {
161 int i;
162 if (!verbose)
163 return;
164
165 printf("%s: ", msg);
166 for (i = 0; i < n; i++)
167 printf(" %d", s[i]);
168 printf("\n");
169 }
170
171 static int gf_gen_decode_matrix(u8 * encode_matrix,
172 u8 * decode_matrix,
173 u8 * invert_matrix,
174 u8 * temp_matrix,
175 u8 * decode_index,
176 u8 * frag_err_list, int nerrs, int k, int m);
177
178 int main(int argc, char *argv[])
179 {
180 int i, j, m, c, e, ret;
181 int k = 10, p = 4, len = 8 * 1024; // Default params
182 int nerrs = 0;
183 int benchmark = 0;
184 int sparse_matrix_opt = 1;
185
186 // Fragment buffer pointers
187 u8 *frag_ptrs[MMAX];
188 u8 *parity_ptrs[KMAX];
189 u8 *recover_srcs[KMAX];
190 u8 *recover_outp[KMAX];
191 u8 frag_err_list[MMAX];
192
193 // Coefficient matrices
194 u8 *encode_matrix, *decode_matrix;
195 u8 *invert_matrix, *temp_matrix;
196 u8 *g_tbls;
197 u8 decode_index[MMAX];
198
199 if (argc == 1)
200 for (i = 0; i < p; i++)
201 frag_err_list[nerrs++] = rand() % (k + p);
202
203 while ((c = getopt(argc, argv, "k:p:l:e:r:hvbs")) != -1) {
204 switch (c) {
205 case 'k':
206 k = atoi(optarg);
207 break;
208 case 'p':
209 p = atoi(optarg);
210 break;
211 case 'l':
212 len = atoi(optarg);
213 if (len < 0)
214 usage();
215 break;
216 case 'e':
217 e = atoi(optarg);
218 frag_err_list[nerrs++] = e;
219 break;
220 case 'r':
221 srand(atoi(optarg));
222 k = (rand() % MMAX) / 4;
223 k = (k < 2) ? 2 : k;
224 p = (rand() % (MMAX - k)) / 4;
225 p = (p < 2) ? 2 : p;
226 for (i = 0; i < k && nerrs < p; i++)
227 if (rand() & 1)
228 frag_err_list[nerrs++] = i;
229 break;
230 case 'v':
231 verbose++;
232 break;
233 case 'b':
234 benchmark = 1;
235 break;
236 case 's':
237 sparse_matrix_opt = !sparse_matrix_opt;
238 break;
239 case 'h':
240 default:
241 usage();
242 break;
243 }
244 }
245 m = k + p;
246
247 // Check for valid parameters
248 if (m > (MMAX / 2) || k > (KMAX / 2) || m < 0 || p < 2 || k < 1) {
249 printf(" Input test parameter error m=%d, k=%d, p=%d, erasures=%d\n",
250 m, k, p, nerrs);
251 usage();
252 }
253 if (nerrs > p) {
254 printf(" Number of erasures chosen exceeds power of code erasures=%d p=%d\n",
255 nerrs, p);
256 }
257 for (i = 0; i < nerrs; i++) {
258 if (frag_err_list[i] >= m)
259 printf(" fragment %d not in range\n", frag_err_list[i]);
260 }
261
262 printf("ec_piggyback_example:\n");
263
264 /*
265 * One simple way to implement piggyback codes is to keep a 2x wide matrix
266 * that covers the how each parity is related to both A and B sources. This
267 * keeps it easy to generalize in parameters m,k and the resulting sparse
268 * matrix multiplication can be optimized by pre-removal of zero items.
269 */
270
271 int k2 = 2 * k;
272 int p2 = 2 * p;
273 int m2 = k2 + p2;
274 int nerrs2 = nerrs;
275
276 encode_matrix = malloc(m2 * k2);
277 decode_matrix = malloc(m2 * k2);
278 invert_matrix = malloc(m2 * k2);
279 temp_matrix = malloc(m2 * k2);
280 g_tbls = malloc(k2 * p2 * 32);
281
282 if (encode_matrix == NULL || decode_matrix == NULL
283 || invert_matrix == NULL || temp_matrix == NULL || g_tbls == NULL) {
284 printf("Test failure! Error with malloc\n");
285 return -1;
286 }
287 // Allocate the src fragments
288 for (i = 0; i < k; i++) {
289 if (NULL == (frag_ptrs[i] = malloc(len))) {
290 printf("alloc error: Fail\n");
291 return -1;
292 }
293 }
294 // Allocate the parity fragments
295 for (i = 0; i < p2; i++) {
296 if (NULL == (parity_ptrs[i] = malloc(len / 2))) {
297 printf("alloc error: Fail\n");
298 return -1;
299 }
300 }
301
302 // Allocate buffers for recovered data
303 for (i = 0; i < p2; i++) {
304 if (NULL == (recover_outp[i] = malloc(len / 2))) {
305 printf("alloc error: Fail\n");
306 return -1;
307 }
308 }
309
310 // Fill sources with random data
311 for (i = 0; i < k; i++)
312 for (j = 0; j < len; j++)
313 frag_ptrs[i][j] = rand();
314
315 printf(" encode (m,k,p)=(%d,%d,%d) len=%d\n", m, k, p, len);
316
317 // Pick an encode matrix.
318 gf_gen_full_pb_cauchy_matrix(encode_matrix, m2, k2);
319
320 if (verbose)
321 print_matrix(m2, k2, encode_matrix, "encode matrix");
322
323 // Initialize g_tbls from encode matrix
324 ec_init_tables(k2, p2, &encode_matrix[k2 * k2], g_tbls);
325
326 // Fold A and B into single list of fragments
327 for (i = 0; i < k; i++)
328 frag_ptrs[i + k] = &frag_ptrs[i][len / 2];
329
330 if (!sparse_matrix_opt) {
331 // Standard encode using no assumptions on the encode matrix
332
333 // Generate EC parity blocks from sources
334 ec_encode_data(len / 2, k2, p2, g_tbls, frag_ptrs, parity_ptrs);
335
336 if (benchmark) {
337 struct perf start, stop;
338 unsigned long long iterations = (1ull << 32) / (m * len);
339 perf_start(&start);
340 for (i = 0; i < iterations; i++) {
341 ec_encode_data(len / 2, k2, p2, g_tbls, frag_ptrs,
342 parity_ptrs);
343 }
344 perf_stop(&stop);
345 printf("ec_piggyback_encode_std: ");
346 perf_print(stop, start, iterations * m2 * len / 2);
347 }
348 } else {
349 // Sparse matrix optimization - use fact that input matrix is sparse
350
351 // Keep an encode matrix with some zero elements removed
352 u8 *encode_matrix_faster, *g_tbls_faster;
353 encode_matrix_faster = malloc(m * k);
354 g_tbls_faster = malloc(k * p * 32);
355 if (encode_matrix_faster == NULL || g_tbls_faster == NULL) {
356 printf("Test failure! Error with malloc\n");
357 return -1;
358 }
359
360 /*
361 * Pack with only the part that we know are non-zero. Alternatively
362 * we could search and keep track of non-zero elements but for
363 * simplicity we just skip the lower quadrant.
364 */
365 for (i = k, j = k2; i < m; i++, j++)
366 memcpy(&encode_matrix_faster[k * i], &encode_matrix[k2 * j], k);
367
368 if (verbose) {
369 print_matrix(p, k, &encode_matrix_faster[k * k],
370 "encode via sparse-opt");
371 print_matrix(p2 / 2, k2, &encode_matrix[(k2 + p2 / 2) * k2],
372 "encode via sparse-opt");
373 }
374 // Initialize g_tbls from encode matrix
375 ec_init_tables(k, p, &encode_matrix_faster[k * k], g_tbls_faster);
376
377 // Generate EC parity blocks from sources
378 ec_encode_data(len / 2, k, p, g_tbls_faster, frag_ptrs, parity_ptrs);
379 ec_encode_data(len / 2, k2, p, &g_tbls[k2 * p * 32], frag_ptrs,
380 &parity_ptrs[p]);
381
382 if (benchmark) {
383 struct perf start, stop;
384 unsigned long long iterations = (1ull << 32) / (m * len);
385 perf_start(&start);
386 for (i = 0; i < iterations; i++) {
387 ec_encode_data(len / 2, k, p, g_tbls_faster, frag_ptrs,
388 parity_ptrs);
389 ec_encode_data(len / 2, k2, p, &g_tbls[k2 * p * 32], frag_ptrs,
390 &parity_ptrs[p]);
391 }
392 perf_stop(&stop);
393 printf("ec_piggyback_encode_sparse: ");
394 perf_print(stop, start, iterations * m2 * len / 2);
395 }
396 }
397
398 if (nerrs <= 0)
399 return 0;
400
401 printf(" recover %d fragments\n", nerrs);
402
403 // Set frag pointers to correspond to parity
404 for (i = k2; i < m2; i++)
405 frag_ptrs[i] = parity_ptrs[i - k2];
406
407 print_list(nerrs2, frag_err_list, " frag err list");
408
409 // Find a decode matrix to regenerate all erasures from remaining frags
410 ret = gf_gen_decode_matrix(encode_matrix, decode_matrix,
411 invert_matrix, temp_matrix, decode_index, frag_err_list,
412 nerrs2, k2, m2);
413
414 if (ret != 0) {
415 printf("Fail on generate decode matrix\n");
416 return -1;
417 }
418 // Pack recovery array pointers as list of valid fragments
419 for (i = 0; i < k2; i++)
420 if (decode_index[i] < k2)
421 recover_srcs[i] = frag_ptrs[decode_index[i]];
422 else
423 recover_srcs[i] = parity_ptrs[decode_index[i] - k2];
424
425 print_list(k2, decode_index, " decode index");
426
427 // Recover data
428 ec_init_tables(k2, nerrs2, decode_matrix, g_tbls);
429 ec_encode_data(len / 2, k2, nerrs2, g_tbls, recover_srcs, recover_outp);
430
431 if (benchmark) {
432 struct perf start, stop;
433 unsigned long long iterations = (1ull << 32) / (k * len);
434 perf_start(&start);
435 for (i = 0; i < iterations; i++) {
436 ec_encode_data(len / 2, k2, nerrs2, g_tbls, recover_srcs,
437 recover_outp);
438 }
439 perf_stop(&stop);
440 printf("ec_piggyback_decode: ");
441 perf_print(stop, start, iterations * (k2 + nerrs2) * len / 2);
442 }
443 // Check that recovered buffers are the same as original
444 printf(" check recovery of block {");
445 for (i = 0; i < nerrs2; i++) {
446 printf(" %d", frag_err_list[i]);
447 if (memcmp(recover_outp[i], frag_ptrs[frag_err_list[i]], len / 2)) {
448 printf(" Fail erasure recovery %d, frag %d\n", i, frag_err_list[i]);
449 return -1;
450 }
451 }
452 printf(" } done all: Pass\n");
453
454 return 0;
455 }
456
457 // Generate decode matrix from encode matrix and erasure list
458
459 static int gf_gen_decode_matrix(u8 * encode_matrix,
460 u8 * decode_matrix,
461 u8 * invert_matrix,
462 u8 * temp_matrix,
463 u8 * decode_index, u8 * frag_err_list, int nerrs, int k, int m)
464 {
465 int i, j, p, r;
466 int nsrcerrs = 0;
467 u8 s, *b = temp_matrix;
468 u8 frag_in_err[MMAX];
469
470 memset(frag_in_err, 0, sizeof(frag_in_err));
471
472 // Order the fragments in erasure for easier sorting
473 for (i = 0; i < nerrs; i++) {
474 if (frag_err_list[i] < k)
475 nsrcerrs++;
476 frag_in_err[frag_err_list[i]] = 1;
477 }
478
479 // Construct b (matrix that encoded remaining frags) by removing erased rows
480 for (i = 0, r = 0; i < k; i++, r++) {
481 while (frag_in_err[r])
482 r++;
483 for (j = 0; j < k; j++)
484 b[k * i + j] = encode_matrix[k * r + j];
485 decode_index[i] = r;
486 }
487 if (verbose > 1)
488 print_matrix(k, k, b, "matrix to invert");
489
490 // Invert matrix to get recovery matrix
491 if (gf_invert_matrix(b, invert_matrix, k) < 0)
492 return -1;
493
494 if (verbose > 2)
495 print_matrix(k, k, invert_matrix, "matrix inverted");
496
497 // Get decode matrix with only wanted recovery rows
498 for (i = 0; i < nsrcerrs; i++) {
499 for (j = 0; j < k; j++) {
500 decode_matrix[k * i + j] = invert_matrix[k * frag_err_list[i] + j];
501 }
502 }
503
504 // For non-src (parity) erasures need to multiply encode matrix * invert
505 for (p = nsrcerrs; p < nerrs; p++) {
506 for (i = 0; i < k; i++) {
507 s = 0;
508 for (j = 0; j < k; j++)
509 s ^= gf_mul(invert_matrix[j * k + i],
510 encode_matrix[k * frag_err_list[p] + j]);
511
512 decode_matrix[k * p + i] = s;
513 }
514 }
515 if (verbose > 1)
516 print_matrix(nerrs, k, decode_matrix, "decode matrix");
517 return 0;
518 }