doublecmd/components/dcpcrypt/Hashes/dcblake2.pp
2015-09-06 16:39:22 +00:00

500 lines
14 KiB
ObjectPascal

{
BLAKE2 reference source code package - reference C implementations
Written in 2012 by Samuel Neves <sneves@dei.uc.pt>
Pascal tranlastion in 2014-2015 by Alexander Koblov (alexx2000@mail.ru)
To the extent possible under law, the author(s) have dedicated all copyright
and related and neighboring rights to this software to the public domain
worldwide. This software is distributed without any warranty.
You should have received a copy of the CC0 Public Domain Dedication along with
this software. If not, see <http://creativecommons.org/publicdomain/zero/1.0/>.
}
unit DCblake2;
{$mode objfpc}{$H+}
{$macro on}{$R-}{$Q-}
{$define USE_MTPROCS}
interface
uses
SysUtils, CTypes;
const
PARALLELISM_DEGREE = 8;
BLAKE2S_BLOCKBYTES = 64;
BLAKE2S_OUTBYTES = 32;
BLAKE2S_KEYBYTES = 32;
BLAKE2S_SALTBYTES = 8;
BLAKE2S_PERSONALBYTES = 8;
type
{$packrecords 1}
Pblake2s_param = ^blake2s_param;
blake2s_param = record
digest_length: cuint8; // 1
key_length: cuint8; // 2
fanout: cuint8; // 3
depth: cuint8; // 4
leaf_length: cuint32; // 8
node_offset: array[0..5] of cuint8;// 14
node_depth: cuint8; // 15
inner_length: cuint8; // 16
// uint8_t reserved[0];
salt: array[0..Pred(BLAKE2S_SALTBYTES)] of cuint8; // 24
personal: array[0..Pred(BLAKE2S_PERSONALBYTES)] of cuint8; // 32
end;
{$packrecords 8}
Pblake2s_state = ^blake2s_state;
blake2s_state = record
h: array[0..7] of cuint32;
t: array[0..1] of cuint32;
f: array[0..1] of cuint32;
buf: array[0..Pred(2 * BLAKE2S_BLOCKBYTES)] of cuint8;
buflen: csize_t;
last_node: cuint8;
end;
{$packrecords 1}
Pblake2sp_state = ^blake2sp_state;
blake2sp_state = record
S: array[0..7] of blake2s_state;
R: blake2s_state;
buf: array[0..Pred(8 * BLAKE2S_BLOCKBYTES)] of cuint8;
buflen: csize_t;
inlen: csize_t;
inp: PByte;
end;
{$packrecords default}
function blake2s_init( S: Pblake2s_state; const outlen: cuint8 ): cint;
function blake2s_update( S: Pblake2s_state; inp: pcuint8; inlen: cuint64 ): cint;
function blake2s_final( S: Pblake2s_state; outp: pcuint8; outlen: cuint8 ): cint;
function blake2sp_init( S: Pblake2sp_state; const outlen: cuint8 ): cint;
function blake2sp_update( S: Pblake2sp_state; inp: pcuint8; inlen: cuint64 ): cint;
function blake2sp_final( S: Pblake2sp_state; outp: pcuint8; const outlen: cuint8 ): cint;
implementation
{$IF DEFINED(USE_MTPROCS)}
uses
MTProcs;
{$ELSE}
type
TMultiThreadProcItem = Pointer;
{$ENDIF}
const blake2s_IV: array[0..7] of cuint32 =
(
$6A09E667, $BB67AE85, $3C6EF372, $A54FF53A,
$510E527F, $9B05688C, $1F83D9AB, $5BE0CD19
);
const blake2s_sigma: array[0..9] of array[0..15] of cuint8 =
(
( 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15 ) ,
( 14, 10, 4, 8, 9, 15, 13, 6, 1, 12, 0, 2, 11, 7, 5, 3 ) ,
( 11, 8, 12, 0, 5, 2, 15, 13, 10, 14, 3, 6, 7, 1, 9, 4 ) ,
( 7, 9, 3, 1, 13, 12, 11, 14, 2, 6, 5, 10, 4, 0, 15, 8 ) ,
( 9, 0, 5, 7, 2, 4, 10, 15, 14, 1, 11, 12, 6, 8, 3, 13 ) ,
( 2, 12, 6, 10, 0, 11, 8, 3, 4, 13, 7, 5, 15, 14, 1, 9 ) ,
( 12, 5, 1, 15, 14, 13, 4, 10, 0, 7, 6, 3, 9, 2, 8, 11 ) ,
( 13, 11, 7, 14, 12, 1, 3, 9, 5, 0, 15, 4, 8, 6, 2, 10 ) ,
( 6, 15, 14, 9, 11, 3, 0, 8, 12, 2, 13, 7, 1, 4, 10, 5 ) ,
( 10, 2, 8, 4, 7, 6, 1, 5, 15, 11, 9, 14, 3, 12, 13 , 0 )
);
function load32( const src: Pointer ): cuint32; inline;
begin
Result := NtoLE(pcuint32(src)^);
end;
function load64( const src: pointer ): cuint64; inline;
begin
Result := NtoLE(pcuint64(src)^);
end;
procedure store32( dst: pointer; w: cuint32 ); inline;
begin
pcuint32(dst)^ := LEtoN(w);
end;
procedure store64( dst: pointer; w: cuint64 ); inline;
begin
pcuint64(dst)^ := LEtoN(w);
end;
function load48( const src: pointer ): cuint64; inline;
var
w: cuint64;
p: pcuint8;
begin
p := pcuint8(src);
w := p^; Inc(p);
w := w or cuint64( p^ ) shl 8; inc(p);
w := w or cuint64( p^ ) shl 16; inc(p);
w := w or cuint64( p^ ) shl 24; inc(p);
w := w or cuint64( p^ ) shl 32; inc(p);
w := w or cuint64( p^ ) shl 40; inc(p);
Result := w;
end;
procedure store48( dst: pointer; w: cuint64 ); inline;
var
p: pcuint8;
begin
p := pcuint8(dst);
p^ := cuint8(w); w := w shr 8; inc(p);
p^ := cuint8(w); w := w shr 8; inc(p);
p^ := cuint8(w); w := w shr 8; inc(p);
p^ := cuint8(w); w := w shr 8; inc(p);
p^ := cuint8(w); w := w shr 8; inc(p);
p^ := cuint8(w); inc(p);
end;
function blake2s_set_lastnode( S: Pblake2s_state ): cint; inline;
begin
S^.f[1] := $FFFFFFFF;
Result := 0;
end;
function blake2s_clear_lastnode( S: Pblake2s_state ): cint; inline;
begin
S^.f[1] := 0;
Result := 0;
end;
//* Some helper functions, not necessarily useful */
function blake2s_set_lastblock( S: Pblake2s_state ): cint; inline;
begin
if( S^.last_node <> 0 ) then blake2s_set_lastnode( S );
S^.f[0] := $FFFFFFFF;
Result := 0;
end;
function blake2s_clear_lastblock( S: Pblake2s_state ): cint; inline;
begin
if( S^.last_node <> 0 ) then blake2s_clear_lastnode( S );
S^.f[0] := 0;
Result := 0;
end;
function blake2s_increment_counter( S: Pblake2s_state; const inc: cuint32 ): cint; inline;
begin
S^.t[0] += inc;
S^.t[1] += cuint32( S^.t[0] < inc );
Result := 0;
end;
function blake2s_init0( S: Pblake2s_state ): cint; inline;
var
i: cint;
begin
FillChar( S^, sizeof( blake2s_state ), 0 );
for i := 0 to 8 - 1 do S^.h[i] := blake2s_IV[i];
Result := 0;
end;
//* init2 xors IV with input parameter block */
function blake2s_init_param( S: Pblake2s_state; const P: Pblake2s_param ): cint;
var
i: csize_t;
pp: pcuint32;
begin
blake2s_init0( S );
pp := pcuint32( P );
//* IV XOR ParamBlock */
// for i := 0; i < 8; ++i )
for i := 0 to 8 - 1 do
S^.h[i] := S^.h[i] xor load32( @pp[i] );
Result := 0;
end;
// Sequential blake2s initialization
function blake2s_init( S: Pblake2s_state; const outlen: cuint8 ): cint;
var
P: blake2s_param;
begin
//* Move interval verification here? */
if ( ( outlen = 0 ) or ( outlen > BLAKE2S_OUTBYTES ) ) then Exit(-1);
P.digest_length := outlen;
P.key_length := 0;
P.fanout := 1;
P.depth := 1;
store32( @P.leaf_length, 0 );
store48( @P.node_offset, 0 );
P.node_depth := 0;
P.inner_length := 0;
// memset(P^.reserved, 0, sizeof(P^.reserved) );
FillChar( P.salt, sizeof( P.salt ), 0 );
FillChar( P.personal, sizeof( P.personal ), 0 );
Result := blake2s_init_param( S, @P );
end;
function blake2s_compress( S: Pblake2s_state; const block: pcuint8 ): cint;
var
i: csize_t;
m: array[0..15] of cuint32;
v: array[0..15] of cuint32;
procedure G(r,i: cuint32; var a,b,c,d: cuint32); inline;
begin
a := a + b + m[blake2s_sigma[r][2*i+0]];
d := RorDWord(d xor a, 16);
c := c + d;
b := RorDWord(b xor c, 12);
a := a + b + m[blake2s_sigma[r][2*i+1]];
d := RorDWord(d xor a, 8);
c := c + d;
b := RorDWord(b xor c, 7);
end;
{$define ROUND_MACRO:=
G(r_,0,v[ 0],v[ 4],v[ 8],v[12]);
G(r_,1,v[ 1],v[ 5],v[ 9],v[13]);
G(r_,2,v[ 2],v[ 6],v[10],v[14]);
G(r_,3,v[ 3],v[ 7],v[11],v[15]);
G(r_,4,v[ 0],v[ 5],v[10],v[15]);
G(r_,5,v[ 1],v[ 6],v[11],v[12]);
G(r_,6,v[ 2],v[ 7],v[ 8],v[13]);
G(r_,7,v[ 3],v[ 4],v[ 9],v[14]);
}
begin
for i := 0 to 15 do
m[i] := load32( @block[i * sizeof( m[i] )] );
for i := 0 to 7 do
v[i] := S^.h[i];
v[ 8] := blake2s_IV[0];
v[ 9] := blake2s_IV[1];
v[10] := blake2s_IV[2];
v[11] := blake2s_IV[3];
v[12] := S^.t[0] xor blake2s_IV[4];
v[13] := S^.t[1] xor blake2s_IV[5];
v[14] := S^.f[0] xor blake2s_IV[6];
v[15] := S^.f[1] xor blake2s_IV[7];
{$define r_:= 0} ROUND_MACRO;
{$define r_:= 1} ROUND_MACRO;
{$define r_:= 2} ROUND_MACRO;
{$define r_:= 3} ROUND_MACRO;
{$define r_:= 4} ROUND_MACRO;
{$define r_:= 5} ROUND_MACRO;
{$define r_:= 6} ROUND_MACRO;
{$define r_:= 7} ROUND_MACRO;
{$define r_:= 8} ROUND_MACRO;
{$define r_:= 9} ROUND_MACRO;
for i := 0 to 7 do
S^.h[i] := S^.h[i] xor v[i] xor v[i + 8];
Result := 0;
end;
function blake2s_update( S: Pblake2s_state; inp: pcuint8; inlen: cuint64 ): cint;
var
left, fill: csize_t;
begin
while( inlen > 0 ) do
begin
left := S^.buflen;
fill := 2 * BLAKE2S_BLOCKBYTES - left;
if( inlen > fill ) then
begin
Move( inp^, S^.buf[left], fill ); // Fill buffer
S^.buflen += fill;
blake2s_increment_counter( S, BLAKE2S_BLOCKBYTES );
blake2s_compress( S, S^.buf ); // Compress
Move( S^.buf[BLAKE2S_BLOCKBYTES], S^.buf, BLAKE2S_BLOCKBYTES ); // Shift buffer left
S^.buflen -= BLAKE2S_BLOCKBYTES;
inp += fill;
inlen -= fill;
end
else // inlen <= fill
begin
Move( inp^, S^.buf [left], inlen );
S^.buflen += inlen; // Be lazy, do not compress
inp += inlen;
inlen -= inlen;
end;
end;
Result := 0;
end;
function blake2s_final( S: Pblake2s_state; outp: pcuint8; outlen: cuint8 ): cint;
var
i: cint;
buffer: array[0..Pred(BLAKE2S_OUTBYTES)] of cuint8;
begin
if( S^.buflen > BLAKE2S_BLOCKBYTES ) then
begin
blake2s_increment_counter( S, BLAKE2S_BLOCKBYTES );
blake2s_compress( S, S^.buf);
S^.buflen -= BLAKE2S_BLOCKBYTES;
Move( S^.buf[BLAKE2S_BLOCKBYTES], S^.buf, S^.buflen );
end;
blake2s_increment_counter( S, cuint32(S^.buflen) );
blake2s_set_lastblock( S );
FillChar( S^.buf[S^.buflen], 2 * BLAKE2S_BLOCKBYTES - S^.buflen, 0 ); //* Padding */
blake2s_compress( S, S^.buf );
for i := 0 to 7 do //* Output full hash to temp buffer */
store32( @buffer[sizeof( S^.h[i] ) * i], S^.h[i] );
Move( buffer, outp^, outlen );
Result := 0;
end;
function blake2sp_init_leaf(S: Pblake2s_state; outlen: cuint8; keylen: cuint8; offset: cuint64):cint; inline;
var
P: blake2s_param;
begin
P.digest_length := outlen;
P.key_length := keylen;
P.fanout := PARALLELISM_DEGREE;
P.depth := 2;
store32( @P.leaf_length, 0 );
store48( @P.node_offset[0], offset );
P.node_depth := 0;
P.inner_length := BLAKE2S_OUTBYTES;
FillChar( P.salt, sizeof( P.salt ), 0 );
FillChar( P.personal, sizeof( P.personal ), 0 );
Result:= blake2s_init_param( S, @P );
end;
function blake2sp_init_root( S: Pblake2s_state; outlen: cuint8; keylen: cuint8 ): cint; inline;
var
P: blake2s_param;
begin
P.digest_length := outlen;
P.key_length := keylen;
P.fanout := PARALLELISM_DEGREE;
P.depth := 2;
store32( @P.leaf_length, 0 );
store48( @P.node_offset[0], 0 );
P.node_depth := 1;
P.inner_length := BLAKE2S_OUTBYTES;
FillChar( P.salt, sizeof( P.salt ), 0 );
FillChar( P.personal, sizeof( P.personal ), 0 );
Result:= blake2s_init_param( S, @P );
end;
function blake2sp_init( S: Pblake2sp_state; const outlen: cuint8 ): cint;
var
i: csize_t;
begin
if (outlen = 0) or (outlen > BLAKE2S_OUTBYTES) then Exit(-1);
FillChar( S^.buf, sizeof( S^.buf ), 0 );
S^.buflen := 0;
if( blake2sp_init_root( @S^.R, outlen, 0 ) < 0 ) then Exit(-1);
for i := 0 to PARALLELISM_DEGREE - 1 do
if ( blake2sp_init_leaf( @S^.S[i], outlen, 0, i ) < 0 ) then Exit(-1);
S^.R.last_node := 1;
S^.S[PARALLELISM_DEGREE - 1].last_node := 1;
Result := 0;
end;
procedure MTProcedure(id__: PtrInt; Data: Pointer; Item: TMultiThreadProcItem);
var
in__: pcuint8;
inlen__: cuint64;
S: Pblake2sp_state absolute Data;
begin
in__ := S^.inp;
inlen__ := S^.inlen;
in__ += id__ * BLAKE2S_BLOCKBYTES;
while ( inlen__ >= PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES ) do
begin
blake2s_update( @S^.S[id__], in__, BLAKE2S_BLOCKBYTES );
in__ += PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES;
inlen__ -= PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES;
end;
end;
function blake2sp_update( S: Pblake2sp_state; inp: pcuint8; inlen: cuint64 ): cint;
var
i, left, fill: csize_t;
begin
left := S^.buflen;
fill := sizeof( S^.buf ) - left;
if ( left <> 0) and (inlen >= fill ) then
begin
Move(inp^, S^.buf[left], fill);
for i := 0 to PARALLELISM_DEGREE - 1 do
blake2s_update( @S^.S[i], @S^.buf[ i * BLAKE2S_BLOCKBYTES], BLAKE2S_BLOCKBYTES );
inp += fill;
inlen -= fill;
left := 0;
end;
S^.inp := inp;
S^.inlen := inlen;
{$IF DEFINED(USE_MTPROCS)}
ProcThreadPool.DoParallel(@MTProcedure, 0, PARALLELISM_DEGREE - 1, S);
{$ELSE}
for i := 0 to PARALLELISM_DEGREE - 1 do MTProcedure(i, S, nil);
{$ENDIF}
inp += inlen - inlen mod ( PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES );
inlen := inlen mod (PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES);
if ( inlen > 0 ) then
Move(inp^, S^.buf[left], inlen );
S^.buflen := left + inlen;
Result := 0;
end;
function blake2sp_final( S: Pblake2sp_state; outp: pcuint8; const outlen: cuint8 ): cint;
var
i, left: csize_t;
hash: array[0..Pred(PARALLELISM_DEGREE), 0..Pred(BLAKE2S_OUTBYTES)] of cuint8;
begin
for i := 0 to PARALLELISM_DEGREE - 1 do
begin
if ( S^.buflen > i * BLAKE2S_BLOCKBYTES ) then
begin
left := S^.buflen - i * BLAKE2S_BLOCKBYTES;
if ( left > BLAKE2S_BLOCKBYTES ) then left := BLAKE2S_BLOCKBYTES;
blake2s_update( @S^.S[i], @S^.buf[i * BLAKE2S_BLOCKBYTES], left );
end;
blake2s_final( @S^.S[i], hash[i], BLAKE2S_OUTBYTES );
end;
for i := 0 to PARALLELISM_DEGREE - 1 do
blake2s_update( @S^.R, hash[i], BLAKE2S_OUTBYTES );
blake2s_final( @S^.R, outp, outlen );
Result := 0;
end;
end.