mirror of
https://github.com/zeek/zeek.git
synced 2025-10-05 08:08:19 +00:00
Initial import of svn+ssh:://svn.icir.org/bro/trunk/bro as of r7088
This commit is contained in:
commit
61757ac78b
1383 changed files with 380824 additions and 0 deletions
193
src/BroString.h
Normal file
193
src/BroString.h
Normal file
|
@ -0,0 +1,193 @@
|
|||
// $Id: BroString.h 6219 2008-10-01 05:39:07Z vern $
|
||||
//
|
||||
// See the file "COPYING" in the main distribution directory for copyright.
|
||||
|
||||
#ifndef brostring_h
|
||||
#define brostring_h
|
||||
|
||||
#include <vector>
|
||||
#include <string>
|
||||
#include <iostream>
|
||||
#include <stdlib.h>
|
||||
#include <sys/types.h>
|
||||
using namespace std;
|
||||
|
||||
#include "util.h"
|
||||
|
||||
typedef u_char* byte_vec;
|
||||
|
||||
// Forward declaration, for helper functions that convert (sub)string vectors
|
||||
// to and from policy-level representations.
|
||||
//
|
||||
class VectorVal;
|
||||
|
||||
class BroString {
|
||||
public:
|
||||
typedef vector<BroString*> Vec;
|
||||
typedef Vec::iterator VecIt;
|
||||
typedef Vec::const_iterator VecCIt;
|
||||
|
||||
typedef vector<const BroString*> CVec;
|
||||
typedef Vec::iterator CVecIt;
|
||||
typedef Vec::const_iterator CVecCIt;
|
||||
|
||||
// IdxVecs are vectors of indices of characters in a string.
|
||||
typedef vector<int> IdxVec;
|
||||
typedef IdxVec::iterator IdxVecIt;
|
||||
typedef IdxVec::const_iterator IdxVecCIt;
|
||||
|
||||
BroString(int arg_final_NUL, byte_vec str, int arg_n);
|
||||
BroString(const u_char* str, int arg_n, int add_NUL);
|
||||
BroString(const char* str);
|
||||
BroString(const string& str);
|
||||
BroString(const BroString& bs);
|
||||
BroString();
|
||||
~BroString() { Reset(); }
|
||||
|
||||
const BroString& operator=(const BroString& bs);
|
||||
bool operator==(const BroString& bs) const;
|
||||
bool operator<(const BroString& bs) const;
|
||||
|
||||
byte_vec Bytes() const { return b; }
|
||||
int Len() const { return n; }
|
||||
|
||||
// Releases the string's current contents, if any, and
|
||||
// adopts the byte vector of given length. The string will
|
||||
// manage the memory occupied by the string afterwards.
|
||||
//
|
||||
void Adopt(byte_vec bytes, int len);
|
||||
|
||||
// Various flavors of methods that release the string's
|
||||
// current contents, if any, and then set the string's
|
||||
// contents to a copy of the string given by the arguments.
|
||||
//
|
||||
void Set(const u_char* str, int len, int add_NUL=1);
|
||||
void Set(const char* str);
|
||||
void Set(const string& str);
|
||||
void Set(const BroString &str);
|
||||
|
||||
void SetUseFreeToDelete(int use_it)
|
||||
{ use_free_to_delete = use_it; }
|
||||
|
||||
const char* CheckString() const;
|
||||
|
||||
enum render_style {
|
||||
ESC_NONE = 0,
|
||||
|
||||
ESC_NULL = (1 << 0), // 0 -> "\0"
|
||||
ESC_DEL = (1 << 1), // DEL -> "^?"
|
||||
ESC_LOW = (1 << 2), // values <= 26 mapped into "^[A-Z]"
|
||||
ESC_ESC = (1 << 3), // '\' -> "\\"
|
||||
ESC_QUOT = (1 << 4), // '"' -> "\"", ''' -> "\'"
|
||||
ESC_HEX = (1 << 5), // Not in [32, 126]? -> "%XX"
|
||||
ESC_DOT = (1 << 6), // Not in [32, 126]? -> "."
|
||||
|
||||
// For serialization: '<string len> <string>'
|
||||
ESC_SER = (1 << 7),
|
||||
};
|
||||
|
||||
static const int EXPANDED_STRING = // the original style
|
||||
ESC_NULL | ESC_DEL | ESC_LOW | ESC_HEX;
|
||||
|
||||
static const int BRO_STRING_LITERAL = // as in a Bro string literal
|
||||
ESC_ESC | ESC_QUOT | ESC_HEX;
|
||||
|
||||
// Renders a string into a newly allocated character array that
|
||||
// you have to delete[]. You can combine the render styles given
|
||||
// above to achieve the representation you desire. If you pass a
|
||||
// pointer to an integer as the final argument, you'll receive the
|
||||
// entire length of the resulting char* in it.
|
||||
//
|
||||
// Note that you need to delete[] the resulting string.
|
||||
//
|
||||
char* Render(int format = EXPANDED_STRING, int* len = 0) const;
|
||||
|
||||
// Similar to the above, but useful for output streams.
|
||||
// Also more useful for debugging purposes since no deallocation
|
||||
// is required on your part here.
|
||||
//
|
||||
ostream& Render(ostream& os, int format = ESC_SER) const;
|
||||
|
||||
// Reads a string from an input stream. Unless you use a render
|
||||
// style combination that uses ESC_SER, note that the streams
|
||||
// will consider whitespace as a field delimiter.
|
||||
//
|
||||
istream& Read(istream& is, int format = ESC_SER);
|
||||
|
||||
// XXX Fix redundancy: strings.bif implements both to_lower
|
||||
// XXX and to_upper; the latter doesn't use BroString::ToUpper().
|
||||
void ToUpper();
|
||||
|
||||
unsigned int MemoryAllocation() const
|
||||
{ return padded_sizeof(*this) + pad_size(n + final_NUL); }
|
||||
|
||||
// Returns new string containing the substring of this string,
|
||||
// starting at @start >= 0 for going up to @length elements,
|
||||
// A negative @length means "until end of string". Other invalid
|
||||
// values result in a return value of 0.
|
||||
//
|
||||
BroString* GetSubstring(int start, int length) const;
|
||||
|
||||
// Returns the start index of s in this string, counting from 0.
|
||||
// If s is not found, -1 is returned.
|
||||
//
|
||||
int FindSubstring(const BroString* s) const;
|
||||
|
||||
// Splits the string into substrings, taking all the indices in
|
||||
// the given vector as cutting points. The vector does not need
|
||||
// to be sorted, and can have multiple entries. Out-of-bounds
|
||||
// indices are ignored. All returned strings are newly allocated.
|
||||
//
|
||||
Vec* Split(const IdxVec& indices) const;
|
||||
|
||||
// Helper functions for vectors:
|
||||
static VectorVal* VecToPolicy(Vec* vec);
|
||||
static Vec* VecFromPolicy(VectorVal* vec);
|
||||
static char* VecToString(const Vec* vec);
|
||||
|
||||
protected:
|
||||
void Reset();
|
||||
|
||||
byte_vec b;
|
||||
int n;
|
||||
unsigned int final_NUL:1; // whether we have added a final NUL
|
||||
unsigned int use_free_to_delete:1; // free() vs. operator delete
|
||||
};
|
||||
|
||||
// A comparison class that sorts pointers to BroString's according to
|
||||
// the length of the pointed-to strings. Sort order can be specified
|
||||
// through the constructor.
|
||||
//
|
||||
class BroStringLenCmp {
|
||||
public:
|
||||
BroStringLenCmp(bool increasing = true) { _increasing = increasing; }
|
||||
bool operator()(BroString*const& bst1, BroString*const& bst2);
|
||||
|
||||
private:
|
||||
unsigned int _increasing;
|
||||
};
|
||||
|
||||
// Default output stream operator, using rendering mode EXPANDED_STRING.
|
||||
ostream& operator<<(ostream& os, const BroString& bs);
|
||||
|
||||
extern int Bstr_eq(const BroString* s1, const BroString* s2);
|
||||
extern int Bstr_cmp(const BroString* s1, const BroString* s2);
|
||||
|
||||
// A data_chunk_t specifies a length-delimited constant string. It is
|
||||
// often used for substrings of other BroString's to avoid memory copy,
|
||||
// which would be necessary if BroString were used. Unlike BroString,
|
||||
// the string should not be deallocated on destruction.
|
||||
//
|
||||
// "BroConstString" might be a better name here.
|
||||
|
||||
struct data_chunk_t {
|
||||
int length;
|
||||
const char* data;
|
||||
};
|
||||
|
||||
extern BroString* concatenate(std::vector<data_chunk_t>& v);
|
||||
extern BroString* concatenate(BroString::Vec& v);
|
||||
extern BroString* concatenate(BroString::CVec& v);
|
||||
extern void delete_strings(std::vector<const BroString*>& v);
|
||||
|
||||
#endif
|
Loading…
Add table
Add a link
Reference in a new issue