void threefish_decrypt_512()

in drivers/staging/skein/threefish_block.c [2100:3359]


/*
 * threefish_decrypt_512() - decrypt one block of eight 64-bit words.
 * @key_ctx: source of key[0..8] and tweak[0..2]; only read by this function
 * @input:   the eight words to decrypt; only read by this function
 * @output:  receives the eight resulting words
 *
 * The work is organised around 19 subkeys, numbered 18 down to 0.  Subkey s
 * is removed from the state by subtracting key[(s + i) % 9] from word i,
 * plus tweak[s % 3] from word 5, tweak[(s + 1) % 3] from word 6 and the
 * number s itself from word 7.  After every subkey except the last, four
 * inverse rounds are run; each round performs four independent "unmix"
 * steps on disjoint word pairs.
 *
 * All arithmetic is modulo 2^64.  input, key and tweak are copied to locals
 * before anything is stored to @output, so @output may alias @input.
 */
void threefish_decrypt_512(struct threefish_key *key_ctx, u64 *input,
			   u64 *output)
{
	/*
	 * Word pairing, indexed [round][mix].  Entry {r, s} means: word r is
	 * replaced by the rotated XOR of the pair, then subtracted from word s.
	 */
	static const unsigned char lane[4][4][2] = {
		{ {3, 4}, {5, 2}, {7, 0}, {1, 6} },
		{ {7, 2}, {5, 0}, {3, 6}, {1, 4} },
		{ {3, 0}, {5, 6}, {7, 4}, {1, 2} },
		{ {7, 6}, {5, 4}, {3, 2}, {1, 0} },
	};
	/*
	 * Right-rotation counts, indexed [subkey parity][round][mix].  Every
	 * count lies strictly between 0 and 64, so both shifts below are
	 * well defined.
	 */
	static const unsigned char rot[2][4][4] = {
		{	/* rounds that follow an even-numbered subkey */
			{22, 56, 35,  8},
			{43, 39, 29, 25},
			{17, 10, 50, 13},
			{24, 34, 30, 39},
		},
		{	/* rounds that follow an odd-numbered subkey */
			{56, 54,  9, 44},
			{39, 36, 49, 17},
			{42, 14, 27, 33},
			{37, 19, 36, 46},
		},
	};
	u64 state[8], key[9], tweak[3];
	u64 mixed;
	unsigned int subkey, round, mix, i;
	unsigned int n, rotated, reduced;

	/* Snapshot every input before touching output (allows in-place use). */
	for (i = 0; i < 8; i++)
		state[i] = input[i];
	for (i = 0; i < 9; i++)
		key[i] = key_ctx->key[i];
	for (i = 0; i < 3; i++)
		tweak[i] = key_ctx->tweak[i];

	subkey = 18;
	for (;;) {
		/* Remove the current subkey from the state. */
		for (i = 0; i < 8; i++)
			state[i] -= key[(subkey + i) % 9];
		state[5] -= tweak[subkey % 3];
		state[6] -= tweak[(subkey + 1) % 3];
		state[7] -= subkey;

		/* Subkey 0 is the final step; no rounds follow it. */
		if (subkey == 0)
			break;

		/* Four inverse rounds; the rotation set alternates by parity. */
		for (round = 0; round < 4; round++) {
			for (mix = 0; mix < 4; mix++) {
				rotated = lane[round][mix][0];
				reduced = lane[round][mix][1];
				n = rot[subkey & 1][round][mix];

				mixed = state[rotated] ^ state[reduced];
				state[rotated] = (mixed >> n) |
						 (mixed << (64 - n));
				state[reduced] -= state[rotated];
			}
		}

		subkey--;
	}

	for (i = 0; i < 8; i++)
		output[i] = state[i];
}