NetBSD/sys/dev/raidframe/rf_nwayxor.c
oster 38a3987b69 RAIDframe, version 1.1, from the Parallel Data Laboratory at
Carnegie Mellon University.  Full RAID implementation, including
levels 0, 1, 4, 5, 6, parity logging, and a few other goodies.
Ported to NetBSD by Greg Oster.
1998-11-13 04:20:26 +00:00

454 lines
13 KiB
C

/* $NetBSD: rf_nwayxor.c,v 1.1 1998/11/13 04:20:31 oster Exp $ */
/*
* Copyright (c) 1995 Carnegie-Mellon University.
* All rights reserved.
*
* Author: Mark Holland, Daniel Stodolsky
*
* Permission to use, copy, modify and distribute this software and
* its documentation is hereby granted, provided that both the copyright
* notice and this permission notice appear in all copies of the
* software, derivative works or modified versions, and any portions
* thereof, and that both notices appear in supporting documentation.
*
* CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
* CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
* FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
*
* Carnegie Mellon requests users of this software to return to
*
* Software Distribution Coordinator or Software.Distribution@CS.CMU.EDU
* School of Computer Science
* Carnegie Mellon University
* Pittsburgh PA 15213-3890
*
* any improvements or extensions that they make and grant Carnegie the
* rights to redistribute these changes.
*/
/************************************************************
*
* nwayxor.c -- code to do N-way xors for reconstruction
*
* nWayXorN xors N input buffers into the destination buffer.
* adapted from danner's longword_bxor code.
*
************************************************************/
/* :
* Log: rf_nwayxor.c,v
* Revision 1.6 1996/06/12 03:31:18 jimz
* only print call counts if rf_showXorCallCounts != 0
*
* Revision 1.5 1996/06/10 11:55:47 jimz
* Straightened out some per-array/not-per-array distinctions, fixed
* a couple bugs related to confusion. Added shutdown lists. Removed
* layout shutdown function (now subsumed by shutdown lists).
*
* Revision 1.4 1996/06/02 17:31:48 jimz
* Moved a lot of global stuff into array structure, where it belongs.
* Fixed up paritylogging, pss modules in this manner. Some general
* code cleanup. Removed lots of dead code, some dead files.
*
* Revision 1.3 1996/05/18 19:51:34 jimz
* major code cleanup- fix syntax, make some types consistent,
* add prototypes, clean out dead code, et cetera
*
* Revision 1.2 1995/12/01 19:29:14 root
* added copyright info
*
*/
#include "rf_nwayxor.h"
#include "rf_shutdown.h"
static int callcount[10];
static void rf_ShutdownNWayXor(void *);
static void rf_ShutdownNWayXor(ignored)
void *ignored;
{
int i;
if (rf_showXorCallCounts == 0)
return;
printf("Call counts for n-way xor routines: ");
for (i=0; i<10; i++)
printf("%d ",callcount[i]);
printf("\n");
}
int rf_ConfigureNWayXor(listp)
RF_ShutdownList_t **listp;
{
int i, rc;
for (i=0; i<10; i++)
callcount[i] = 0;
rc = rf_ShutdownCreate(listp, rf_ShutdownNWayXor, NULL);
return(rc);
}
void rf_nWayXor1(src_rbs, dest_rb, len)
RF_ReconBuffer_t **src_rbs;
RF_ReconBuffer_t *dest_rb;
int len;
{
register unsigned long *src = (unsigned long *) src_rbs[0]->buffer;
register unsigned long *dest= (unsigned long *) dest_rb->buffer;
register unsigned long *end = src+len;
register unsigned long d0, d1, d2, d3, s0, s1, s2, s3;
callcount[1]++;
while (len >= 4 )
{
d0 = dest[0];
d1 = dest[1];
d2 = dest[2];
d3 = dest[3];
s0 = src[0];
s1 = src[1];
s2 = src[2];
s3 = src[3];
dest[0] = d0 ^ s0;
dest[1] = d1 ^ s1;
dest[2] = d2 ^ s2;
dest[3] = d3 ^ s3;
src += 4;
dest += 4;
len -= 4;
}
while (src < end) {*dest++ ^= *src++;}
}
void rf_nWayXor2(src_rbs, dest_rb, len)
RF_ReconBuffer_t **src_rbs;
RF_ReconBuffer_t *dest_rb;
int len;
{
register unsigned long *dst = (unsigned long *) dest_rb->buffer;
register unsigned long *a = dst;
register unsigned long *b = (unsigned long *) src_rbs[0]->buffer;
register unsigned long *c = (unsigned long *) src_rbs[1]->buffer;
unsigned long a0,a1,a2,a3, b0,b1,b2,b3;
callcount[2]++;
/* align dest to cache line */
while ((((unsigned long) dst) & 0x1f))
{
*dst++ = *a++ ^ *b++ ^ *c++;
len--;
}
while (len > 4 )
{
a0 = a[0]; len -= 4;
a1 = a[1];
a2 = a[2];
a3 = a[3]; a += 4;
b0 = b[0];
b1 = b[1];
b2 = b[2];
b3 = b[3];
/* start dual issue */
a0 ^= b0; b0 = c[0];
b += 4; a1 ^= b1;
a2 ^= b2; a3 ^= b3;
b1 = c[1]; a0 ^= b0;
b2 = c[2]; a1 ^= b1;
b3 = c[3]; a2 ^= b2;
dst[0] = a0; a3 ^= b3;
dst[1] = a1; c += 4;
dst[2] = a2;
dst[3] = a3; dst += 4;
}
while (len)
{
*dst++ = *a++ ^ *b++ ^ *c++;
len--;
}
}
/* note that first arg is not incremented but 2nd arg is */
#define LOAD_FIRST(_dst,_b) \
a0 = _dst[0]; len -= 4; \
a1 = _dst[1]; \
a2 = _dst[2]; \
a3 = _dst[3]; \
b0 = _b[0]; \
b1 = _b[1]; \
b2 = _b[2]; \
b3 = _b[3]; _b += 4;
/* note: arg is incremented */
#define XOR_AND_LOAD_NEXT(_n) \
a0 ^= b0; b0 = _n[0]; \
a1 ^= b1; b1 = _n[1]; \
a2 ^= b2; b2 = _n[2]; \
a3 ^= b3; b3 = _n[3]; \
_n += 4;
/* arg is incremented */
#define XOR_AND_STORE(_dst) \
a0 ^= b0; _dst[0] = a0; \
a1 ^= b1; _dst[1] = a1; \
a2 ^= b2; _dst[2] = a2; \
a3 ^= b3; _dst[3] = a3; \
_dst += 4;
void rf_nWayXor3(src_rbs, dest_rb, len)
RF_ReconBuffer_t **src_rbs;
RF_ReconBuffer_t *dest_rb;
int len;
{
register unsigned long *dst = (unsigned long *) dest_rb->buffer;
register unsigned long *b = (unsigned long *) src_rbs[0]->buffer;
register unsigned long *c = (unsigned long *) src_rbs[1]->buffer;
register unsigned long *d = (unsigned long *) src_rbs[2]->buffer;
unsigned long a0,a1,a2,a3, b0,b1,b2,b3;
callcount[3]++;
/* align dest to cache line */
while ((((unsigned long) dst) & 0x1f)) {
*dst++ ^= *b++ ^ *c++ ^ *d++;
len--;
}
while (len > 4 ) {
LOAD_FIRST(dst,b);
XOR_AND_LOAD_NEXT(c);
XOR_AND_LOAD_NEXT(d);
XOR_AND_STORE(dst);
}
while (len) {
*dst++ ^= *b++ ^ *c++ ^ *d++;
len--;
}
}
void rf_nWayXor4(src_rbs, dest_rb, len)
RF_ReconBuffer_t **src_rbs;
RF_ReconBuffer_t *dest_rb;
int len;
{
register unsigned long *dst = (unsigned long *) dest_rb->buffer;
register unsigned long *b = (unsigned long *) src_rbs[0]->buffer;
register unsigned long *c = (unsigned long *) src_rbs[1]->buffer;
register unsigned long *d = (unsigned long *) src_rbs[2]->buffer;
register unsigned long *e = (unsigned long *) src_rbs[3]->buffer;
unsigned long a0,a1,a2,a3, b0,b1,b2,b3;
callcount[4]++;
/* align dest to cache line */
while ((((unsigned long) dst) & 0x1f)) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++;
len--;
}
while (len > 4 ) {
LOAD_FIRST(dst,b);
XOR_AND_LOAD_NEXT(c);
XOR_AND_LOAD_NEXT(d);
XOR_AND_LOAD_NEXT(e);
XOR_AND_STORE(dst);
}
while (len) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++;
len--;
}
}
void rf_nWayXor5(src_rbs, dest_rb, len)
RF_ReconBuffer_t **src_rbs;
RF_ReconBuffer_t *dest_rb;
int len;
{
register unsigned long *dst = (unsigned long *) dest_rb->buffer;
register unsigned long *b = (unsigned long *) src_rbs[0]->buffer;
register unsigned long *c = (unsigned long *) src_rbs[1]->buffer;
register unsigned long *d = (unsigned long *) src_rbs[2]->buffer;
register unsigned long *e = (unsigned long *) src_rbs[3]->buffer;
register unsigned long *f = (unsigned long *) src_rbs[4]->buffer;
unsigned long a0,a1,a2,a3, b0,b1,b2,b3;
callcount[5]++;
/* align dest to cache line */
while ((((unsigned long) dst) & 0x1f)) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++ ^ *f++;
len--;
}
while (len > 4 ) {
LOAD_FIRST(dst,b);
XOR_AND_LOAD_NEXT(c);
XOR_AND_LOAD_NEXT(d);
XOR_AND_LOAD_NEXT(e);
XOR_AND_LOAD_NEXT(f);
XOR_AND_STORE(dst);
}
while (len) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++ ^ *f++;
len--;
}
}
void rf_nWayXor6(src_rbs, dest_rb, len)
RF_ReconBuffer_t **src_rbs;
RF_ReconBuffer_t *dest_rb;
int len;
{
register unsigned long *dst = (unsigned long *) dest_rb->buffer;
register unsigned long *b = (unsigned long *) src_rbs[0]->buffer;
register unsigned long *c = (unsigned long *) src_rbs[1]->buffer;
register unsigned long *d = (unsigned long *) src_rbs[2]->buffer;
register unsigned long *e = (unsigned long *) src_rbs[3]->buffer;
register unsigned long *f = (unsigned long *) src_rbs[4]->buffer;
register unsigned long *g = (unsigned long *) src_rbs[5]->buffer;
unsigned long a0,a1,a2,a3, b0,b1,b2,b3;
callcount[6]++;
/* align dest to cache line */
while ((((unsigned long) dst) & 0x1f)) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++ ^ *f++ ^ *g++;
len--;
}
while (len > 4 ) {
LOAD_FIRST(dst,b);
XOR_AND_LOAD_NEXT(c);
XOR_AND_LOAD_NEXT(d);
XOR_AND_LOAD_NEXT(e);
XOR_AND_LOAD_NEXT(f);
XOR_AND_LOAD_NEXT(g);
XOR_AND_STORE(dst);
}
while (len) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++ ^ *f++ ^ *g++;
len--;
}
}
void rf_nWayXor7(src_rbs, dest_rb, len)
RF_ReconBuffer_t **src_rbs;
RF_ReconBuffer_t *dest_rb;
int len;
{
register unsigned long *dst = (unsigned long *) dest_rb->buffer;
register unsigned long *b = (unsigned long *) src_rbs[0]->buffer;
register unsigned long *c = (unsigned long *) src_rbs[1]->buffer;
register unsigned long *d = (unsigned long *) src_rbs[2]->buffer;
register unsigned long *e = (unsigned long *) src_rbs[3]->buffer;
register unsigned long *f = (unsigned long *) src_rbs[4]->buffer;
register unsigned long *g = (unsigned long *) src_rbs[5]->buffer;
register unsigned long *h = (unsigned long *) src_rbs[6]->buffer;
unsigned long a0,a1,a2,a3, b0,b1,b2,b3;
callcount[7]++;
/* align dest to cache line */
while ((((unsigned long) dst) & 0x1f)) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++ ^ *f++ ^ *g++ ^ *h++;
len--;
}
while (len > 4 ) {
LOAD_FIRST(dst,b);
XOR_AND_LOAD_NEXT(c);
XOR_AND_LOAD_NEXT(d);
XOR_AND_LOAD_NEXT(e);
XOR_AND_LOAD_NEXT(f);
XOR_AND_LOAD_NEXT(g);
XOR_AND_LOAD_NEXT(h);
XOR_AND_STORE(dst);
}
while (len) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++ ^ *f++ ^ *g++ ^ *h++;
len--;
}
}
void rf_nWayXor8(src_rbs, dest_rb, len)
RF_ReconBuffer_t **src_rbs;
RF_ReconBuffer_t *dest_rb;
int len;
{
register unsigned long *dst = (unsigned long *) dest_rb->buffer;
register unsigned long *b = (unsigned long *) src_rbs[0]->buffer;
register unsigned long *c = (unsigned long *) src_rbs[1]->buffer;
register unsigned long *d = (unsigned long *) src_rbs[2]->buffer;
register unsigned long *e = (unsigned long *) src_rbs[3]->buffer;
register unsigned long *f = (unsigned long *) src_rbs[4]->buffer;
register unsigned long *g = (unsigned long *) src_rbs[5]->buffer;
register unsigned long *h = (unsigned long *) src_rbs[6]->buffer;
register unsigned long *i = (unsigned long *) src_rbs[7]->buffer;
unsigned long a0,a1,a2,a3, b0,b1,b2,b3;
callcount[8]++;
/* align dest to cache line */
while ((((unsigned long) dst) & 0x1f)) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++ ^ *f++ ^ *g++ ^ *h++ ^ *i++;
len--;
}
while (len > 4 ) {
LOAD_FIRST(dst,b);
XOR_AND_LOAD_NEXT(c);
XOR_AND_LOAD_NEXT(d);
XOR_AND_LOAD_NEXT(e);
XOR_AND_LOAD_NEXT(f);
XOR_AND_LOAD_NEXT(g);
XOR_AND_LOAD_NEXT(h);
XOR_AND_LOAD_NEXT(i);
XOR_AND_STORE(dst);
}
while (len) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++ ^ *f++ ^ *g++ ^ *h++ ^ *i++;
len--;
}
}
void rf_nWayXor9(src_rbs, dest_rb, len)
RF_ReconBuffer_t **src_rbs;
RF_ReconBuffer_t *dest_rb;
int len;
{
register unsigned long *dst = (unsigned long *) dest_rb->buffer;
register unsigned long *b = (unsigned long *) src_rbs[0]->buffer;
register unsigned long *c = (unsigned long *) src_rbs[1]->buffer;
register unsigned long *d = (unsigned long *) src_rbs[2]->buffer;
register unsigned long *e = (unsigned long *) src_rbs[3]->buffer;
register unsigned long *f = (unsigned long *) src_rbs[4]->buffer;
register unsigned long *g = (unsigned long *) src_rbs[5]->buffer;
register unsigned long *h = (unsigned long *) src_rbs[6]->buffer;
register unsigned long *i = (unsigned long *) src_rbs[7]->buffer;
register unsigned long *j = (unsigned long *) src_rbs[8]->buffer;
unsigned long a0,a1,a2,a3, b0,b1,b2,b3;
callcount[9]++;
/* align dest to cache line */
while ((((unsigned long) dst) & 0x1f)) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++ ^ *f++ ^ *g++ ^ *h++ ^ *i++ ^ *j++;
len--;
}
while (len > 4 ) {
LOAD_FIRST(dst,b);
XOR_AND_LOAD_NEXT(c);
XOR_AND_LOAD_NEXT(d);
XOR_AND_LOAD_NEXT(e);
XOR_AND_LOAD_NEXT(f);
XOR_AND_LOAD_NEXT(g);
XOR_AND_LOAD_NEXT(h);
XOR_AND_LOAD_NEXT(i);
XOR_AND_LOAD_NEXT(j);
XOR_AND_STORE(dst);
}
while (len) {
*dst++ ^= *b++ ^ *c++ ^ *d++ ^ *e++ ^ *f++ ^ *g++ ^ *h++ ^ *i++ ^ *j++;
len--;
}
}