1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
|
// Copyright (C) 2020-2022 Joel Rosdahl and other contributors
//
// See doc/AUTHORS.adoc for a complete list of contributors.
//
// This program is free software; you can redistribute it and/or modify it
// under the terms of the GNU General Public License as published by the Free
// Software Foundation; either version 3 of the License, or (at your option)
// any later version.
//
// This program is distributed in the hope that it will be useful, but WITHOUT
// ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
// FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
// more details.
//
// You should have received a copy of the GNU General Public License along with
// this program; if not, write to the Free Software Foundation, Inc., 51
// Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
#pragma once
#include "Digest.hpp"
#include "third_party/blake3/blake3.h"
#include <third_party/nonstd/expected.hpp>
#include <cstdint>
#include <cstdio>
#include <string_view>
// Holds the state of a hash computation that is fed incrementally.
class Hash
{
public:
  // Controls how a hashed buffer is rendered in the text debug file; see
  // hash(const void*, size_t, HashType) below.
  enum class HashType { binary, text };

  Hash();
  Hash(const Hash&) = default;
  Hash& operator=(const Hash&) = default;

  // Turn on debug logging of everything that is hashed. The hashed input is
  // logged to one binary file (`debug_binary`) and one text file
  // (`debug_text`).
  void enable_debug(std::string_view section_name,
                    FILE* debug_binary,
                    FILE* debug_text);

  // Return the digest.
  Digest digest() const;

  // Feed the hash with data that is unlikely to show up in ordinary input.
  // This serves two purposes:
  //
  // - It separates items such as arguments from each other (for instance,
  //   -I -O2 and -I-O2 must not produce the same hash).
  // - It tags the kind of information being hashed, which makes conditional
  //   hashing safe (for instance, if information X is hashed when CCACHE_A is
  //   set and information Y is hashed when CCACHE_B is set, the two must never
  //   risk colliding).
  Hash& hash_delimiter(std::string_view type);

  // Feed `size` bytes starting at `data` to the hash.
  //
  // When hash debugging is enabled, the text input file receives:
  //
  // - the buffer content in hex format if `hash_type` is `HashType::binary`;
  // - the buffer content verbatim if `hash_type` is `HashType::text`.
  //
  // A newline character is appended in both cases.
  Hash& hash(const void* data,
             size_t size,
             HashType hash_type = HashType::text);

  // Feed a string to the hash.
  //
  // When hash debugging is enabled, the string followed by a newline is
  // written to the text input file.
  Hash& hash(std::string_view data);

  // Feed an integer to the hash.
  //
  // When hash debugging is enabled, the integer in text form followed by a
  // newline is written to the text input file.
  Hash& hash(int64_t x);

  // Feed the contents of the file at `path` to the hash.
  //
  // When hash debugging is enabled, the data is written verbatim to the text
  // input file.
  nonstd::expected<void, std::string> hash_file(const std::string& path);

  // Feed the contents read from the open file descriptor `fd` to the hash.
  //
  // When hash debugging is enabled, the data is written verbatim to the text
  // input file.
  nonstd::expected<void, std::string> hash_fd(int fd);

  // Append `text` to the text debug file.
  void add_debug_text(std::string_view text);

private:
  // Internal helper operating on a raw buffer; its definition is not part of
  // this header.
  void hash_buffer(std::string_view buffer);

  // BLAKE3 hasher state.
  blake3_hasher m_hasher;

  // Debug output files; both are null by default.
  FILE* m_debug_binary{nullptr};
  FILE* m_debug_text{nullptr};
};
|