mirror of
https://github.com/zeek/zeek.git
synced 2025-10-07 00:58:19 +00:00
Refactor HashKey class to support read/write operations
This preserves the optimization of storing values directly in the key_u member union when feasible, and using a variable size buffer otherwise. It also adds bounds-checking for that buffer, moves size arguments to size_t, decouples construction from hash computation, emulates the tagging feature found in SerializationFormat to assist troubleshooting, and switches feasible reinterpret_casts to static_casts.
This commit is contained in:
parent
2585ccd873
commit
82822b1e07
2 changed files with 427 additions and 83 deletions
126
src/Hash.h
126
src/Hash.h
|
@ -1,7 +1,7 @@
|
|||
// See the file "COPYING" in the main distribution directory for copyright.
|
||||
|
||||
/***
|
||||
* This file contains functions to generate hashes used keyed hash functions.
|
||||
* This file contains functions to generate hashes using keyed hash functions.
|
||||
* Keyed hash functions make it difficult/impossible to find information about the
|
||||
* output of a hash when the key is unknown to the attacker. This fact holds, even
|
||||
* when the input value is known.
|
||||
|
@ -10,8 +10,7 @@
|
|||
* It is important that these hashes are not easily guessable to prevent complexity attacks.
|
||||
*
|
||||
* The HashKey class is the actual class that is used to generate Hash keys that are used
|
||||
* internally, e.g. for lookups in hash-tables; the Hashes are also used for connection ID
|
||||
* generation.
|
||||
* internally, e.g. for lookups in hash-tables and connection ID generation.
|
||||
*
|
||||
* This means that the hashes created by most functions in this file will be different each run,
|
||||
* unless a seed file is used. There are a few functions that create hashes that are static over
|
||||
|
@ -228,14 +227,18 @@ constexpr int NUM_HASH_KEYS = HASH_KEY_STRING + 1;
|
|||
class HashKey
|
||||
{
|
||||
public:
|
||||
explicit HashKey(bro_int_t i);
|
||||
explicit HashKey(bro_uint_t u);
|
||||
explicit HashKey() { }
|
||||
explicit HashKey(bool b);
|
||||
explicit HashKey(int i);
|
||||
explicit HashKey(bro_int_t bi);
|
||||
explicit HashKey(bro_uint_t bu);
|
||||
explicit HashKey(uint32_t u);
|
||||
HashKey(const uint32_t u[], int n);
|
||||
HashKey(const uint32_t u[], size_t n);
|
||||
explicit HashKey(double d);
|
||||
explicit HashKey(const void* p);
|
||||
explicit HashKey(const char* s);
|
||||
explicit HashKey(const String* s);
|
||||
explicit HashKey(const char* s); // No copying, no ownership
|
||||
explicit HashKey(const String* s); // No copying, no ownership
|
||||
|
||||
~HashKey()
|
||||
{
|
||||
if ( is_our_dynamic )
|
||||
|
@ -250,19 +253,19 @@ public:
|
|||
// The calling sequence here is unusual (normally key would be
|
||||
// first) to avoid possible ambiguities with the next constructor,
|
||||
// which is the more commonly used one.
|
||||
HashKey(int copy_key, void* key, int size);
|
||||
HashKey(int copy_key, void* key, size_t size);
|
||||
|
||||
// Same, but automatically copies the key.
|
||||
HashKey(const void* key, int size, hash_t hash);
|
||||
HashKey(const void* key, size_t size, hash_t hash);
|
||||
|
||||
// Builds a key from the given chunk of bytes.
|
||||
HashKey(const void* bytes, int size);
|
||||
HashKey(const void* bytes, size_t size);
|
||||
|
||||
// Create a Hashkey given all of its components *without*
|
||||
// copying the key and *without* taking ownership. Note that
|
||||
// "dont_copy" is a type placeholder to differentiate this member
|
||||
// function from the one above; its value is not used.
|
||||
HashKey(const void* key, int size, hash_t hash, bool dont_copy);
|
||||
HashKey(const void* key, size_t size, hash_t hash, bool dont_copy);
|
||||
|
||||
// Hands over the key to the caller. This means that if the
|
||||
// key is our dynamic, we give it to the caller and mark it
|
||||
|
@ -271,8 +274,8 @@ public:
|
|||
void* TakeKey();
|
||||
|
||||
const void* Key() const { return key; }
|
||||
int Size() const { return size; }
|
||||
hash_t Hash() const { return hash; }
|
||||
size_t Size() const { return size; }
|
||||
hash_t Hash() const;
|
||||
|
||||
[[deprecated("Remove in v5.1. MemoryAllocation() is deprecated and will be removed. See "
|
||||
"GHI-572.")]] unsigned int
|
||||
|
@ -281,22 +284,105 @@ public:
|
|||
return padded_sizeof(*this) + util::pad_size(size);
|
||||
}
|
||||
|
||||
static hash_t HashBytes(const void* bytes, int size);
|
||||
static hash_t HashBytes(const void* bytes, size_t size);
|
||||
|
||||
// A HashKey is "allocated" when the underlying key points somewhere
|
||||
// other than our internal key_u union. This is almost like
|
||||
// is_our_dynamic, but remains true also after TakeKey().
|
||||
bool IsAllocated() const
|
||||
{
|
||||
return (key != nullptr && key != reinterpret_cast<const char*>(&key_u));
|
||||
}
|
||||
|
||||
// Buffer size reservation. Repeated calls to these methods
|
||||
// incrementally build up the eventual buffer size to be allocated via
|
||||
// Allocate().
|
||||
template <typename T> void ReserveType(const char* tag) { Reserve(tag, sizeof(T), sizeof(T)); }
|
||||
void Reserve(const char* tag, size_t addl_size, size_t alignment = 0);
|
||||
|
||||
// Allocates the reserved amount of memory
|
||||
void Allocate();
|
||||
|
||||
// Incremental writes into an allocated HashKey. The tags give context
|
||||
// to what's being written and are only used in debug-build log streams.
|
||||
// When true, the alignment boolean will cause write-marker alignment to
|
||||
// the size of the item being written, otherwise writes happen directly
|
||||
// at the current marker.
|
||||
void Write(const char* tag, bool b);
|
||||
void Write(const char* tag, int i, bool align = true);
|
||||
void Write(const char* tag, bro_int_t bi, bool align = true);
|
||||
void Write(const char* tag, bro_uint_t bu, bool align = true);
|
||||
void Write(const char* tag, uint32_t u, bool align = true);
|
||||
void Write(const char* tag, double d, bool align = true);
|
||||
|
||||
void Write(const char* tag, const void* bytes, size_t n, size_t alignment = 0);
|
||||
|
||||
// For writes that copy directly into the allocated buffer, this method
|
||||
// advances the write marker without modifying content.
|
||||
void SkipWrite(const char* tag, size_t n);
|
||||
|
||||
// Aligns the write marker to the next multiple of the given alignment size.
|
||||
void AlignWrite(size_t alignment);
|
||||
|
||||
// Bounds check: if the buffer does not have at least n bytes available
|
||||
// to write into, triggers an InternalError.
|
||||
void EnsureWriteSpace(size_t n) const;
|
||||
|
||||
// Reads don't modify our internal state except for the read offset
|
||||
// pointer. To blend in more seamlessly with the rest of Zeek we keep
|
||||
// reads a const operation.
|
||||
void ResetRead() const { read_size = 0; }
|
||||
|
||||
// Incremental reads from an allocated HashKey. As with writes, the
|
||||
// tags are only used for debug-build logging, and alignment prior
|
||||
// to the read of the item is controlled by the align boolean.
|
||||
void Read(const char* tag, bool& b) const;
|
||||
void Read(const char* tag, int& i, bool align = true) const;
|
||||
void Read(const char* tag, bro_int_t& bi, bool align = true) const;
|
||||
void Read(const char* tag, bro_uint_t& bu, bool align = true) const;
|
||||
void Read(const char* tag, uint32_t& u, bool align = true) const;
|
||||
void Read(const char* tag, double& d, bool align = true) const;
|
||||
|
||||
void Read(const char* tag, void* out, size_t n, size_t alignment = 0) const;
|
||||
|
||||
// These mirror the corresponding write methods above.
|
||||
void SkipRead(const char* tag, size_t n) const;
|
||||
void AlignRead(size_t alignment) const;
|
||||
void EnsureReadSpace(size_t n) const;
|
||||
|
||||
void* KeyAtWrite() { return static_cast<void*>(key + write_size); }
|
||||
const void* KeyAtRead() const { return static_cast<void*>(key + read_size); }
|
||||
const void* KeyEnd() const { return static_cast<void*>(key + size); }
|
||||
|
||||
protected:
|
||||
void* CopyKey(const void* key, int size) const;
|
||||
char* CopyKey(const char* key, size_t size) const;
|
||||
|
||||
// Payload setters for types stored directoly in the key_u union. These
|
||||
// adjust the size and write_size markers to indicate a full buffer, and
|
||||
// use the key_u union for storage.
|
||||
void Set(bool b);
|
||||
void Set(int i);
|
||||
void Set(bro_int_t bi);
|
||||
void Set(bro_uint_t bu);
|
||||
void Set(uint32_t u);
|
||||
void Set(double d);
|
||||
void Set(const void* p);
|
||||
|
||||
union {
|
||||
bro_int_t i;
|
||||
bool b;
|
||||
int i;
|
||||
bro_int_t bi;
|
||||
uint32_t u32;
|
||||
double d;
|
||||
const void* p;
|
||||
} key_u;
|
||||
|
||||
void* key;
|
||||
hash_t hash;
|
||||
int size;
|
||||
char* key = nullptr;
|
||||
mutable hash_t hash = 0;
|
||||
size_t size = 0;
|
||||
bool is_our_dynamic = false;
|
||||
size_t write_size = 0;
|
||||
mutable size_t read_size = 0;
|
||||
};
|
||||
|
||||
extern void init_hash_function();
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue