forked from kristapsdz/openrsync
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathhash.c
135 lines (116 loc) · 3.13 KB
/
hash.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
/*
* Copyright (c) 2019 Kristaps Dzonsons <[email protected]>
*
* Permission to use, copy, modify, and distribute this software for any
* purpose with or without fee is hereby granted, provided that the above
* copyright notice and this permission notice appear in all copies.
*
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
*/
#include "config.h"
#include <sys/mman.h>
#include <sys/types.h>
#include <assert.h>
#include COMPAT_ENDIAN_H
#include <stdint.h>
#include <stdlib.h>
#include <errno.h>
#include <fcntl.h>
#include <unistd.h>
#include "md4.h"
#include "extern.h"
/*
* A fast 32-bit hash.
* Described in Tridgell's "Efficient Algorithms for Sorting and
* Synchronization" thesis and the "Rolling checksum" document.
*/
uint32_t
hash_fast(const void *buf, size_t len)
{
size_t i = 0;
uint32_t a = 0, /* part of a(k, l) */
b = 0; /* b(k, l) */
const signed char *dat = buf;
if (len > 4)
for ( ; i < len - 4; i += 4) {
b += 4 * (a + dat[i]) +
3 * dat[i + 1] +
2 * dat[i + 2] +
dat[i + 3];
a += dat[i + 0] +
dat[i + 1] +
dat[i + 2] +
dat[i + 3];
}
for ( ; i < len; i++) {
a += dat[i];
b += a;
}
/* s(k, l) = (eps % M) + 2^16 b(k, l) % M */
return (a & 0xffff) + (b << 16);
}
/*
* Slow MD4-based hash with trailing seed.
*/
void
hash_slow(const void *buf, size_t len,
unsigned char *md, const struct sess *sess)
{
MD4_CTX ctx;
int32_t seed = htole32(sess->seed);
MD4_Init(&ctx);
MD4_Update(&ctx, buf, len);
MD4_Update(&ctx, (unsigned char *)&seed, sizeof(int32_t));
MD4_Final(md, &ctx);
}
/*
* Hash an entire file.
* This is similar to hash_slow() except the seed is hashed at the end
* of the sequence, not the beginning.
* Note that if sess is NULL then the seed is not included (this
* feature is used to compute seedless hashes for --checksum).
*/
void
hash_file(const void *buf, size_t len,
unsigned char *md, const struct sess *sess)
{
MD4_CTX ctx;
MD4_Init(&ctx);
if (sess != NULL) {
int32_t seed = htole32(sess->seed);
MD4_Update(&ctx, &seed, sizeof(int32_t));
}
MD4_Update(&ctx, buf, len);
MD4_Final(md, &ctx);
}
/*
* This function is primarily used to compute whole-file seedless
* checksums for the --checksum option, for contexts in which the
* file is not already open nor mapped.
*/
int
hash_file_by_path(int rootfd, const char *path, size_t len, unsigned char *md)
{
int fd, save;
char *map;
fd = openat(rootfd, path, O_RDONLY | O_NOFOLLOW);
if (fd == -1)
return -1;
map = mmap(NULL, len, PROT_READ, MAP_PRIVATE, fd, 0);
if (map == MAP_FAILED) {
save = errno;
close(fd);
errno = save;
return -1;
}
hash_file(map, len, md, NULL);
munmap(map, len);
close(fd);
return 0;
}