2018-05-24 23:33:56 -05:00
|
|
|
// 21 may 2018
|
|
|
|
#ifdef _WIN32
|
|
|
|
#define _CRT_SECURE_CPP_OVERLOAD_STANDARD_NAMES 1
|
|
|
|
#define _CRT_SECURE_CPP_OVERLOAD_STANDARD_NAMES_COUNT 1
|
|
|
|
#include <io.h>
|
|
|
|
#include <sys/stat.h>
|
|
|
|
#define openfunc _open
|
|
|
|
#define openflags (_O_RDONLY | _O_BINARY)
|
|
|
|
#define openmode (_S_IREAD)
|
|
|
|
#define readfunc _read
|
|
|
|
#define readtype int
|
|
|
|
#define closefunc _close
|
|
|
|
#else
|
|
|
|
#endif
|
2018-05-25 20:07:45 -05:00
|
|
|
#include <typeinfo>
|
2018-05-27 14:36:16 -05:00
|
|
|
#include <map>
|
2018-05-26 16:42:11 -05:00
|
|
|
#include <algorithm>
|
2018-05-26 19:09:16 -05:00
|
|
|
#include <string.h>
|
2018-05-27 14:36:16 -05:00
|
|
|
#include <stdint.h>
|
2018-05-25 20:07:45 -05:00
|
|
|
#include "lib.hpp"
|
|
|
|
|
|
|
|
// eofError is the concrete Error type used to signal end of input.
// NewEOF() creates instances and IsEOF() recognizes them by dynamic type.
class eofError : public Error {
public:
	virtual ~eofError();

	// String returns the fixed, human-readable name of this error.
	virtual const char *String() const;
};
|
|
|
|
|
2018-05-26 15:56:53 -05:00
|
|
|
// eofError holds no resources of its own, so the destructor has nothing to do.
eofError::~eofError() = default;
|
|
|
|
|
2018-05-26 15:56:53 -05:00
|
|
|
const char *eofError::String(void) const
|
2018-05-25 20:07:45 -05:00
|
|
|
{
|
|
|
|
return "EOF";
|
|
|
|
}
|
|
|
|
|
|
|
|
// shortWriteError is the concrete Error type describing a short write.
// NewErrShortWrite() creates instances.
class shortWriteError : public Error {
public:
	virtual ~shortWriteError();

	// String returns the fixed, human-readable name of this error.
	virtual const char *String() const;
};
|
|
|
|
|
2018-05-26 15:56:53 -05:00
|
|
|
// shortWriteError holds no resources of its own, so the destructor has nothing to do.
shortWriteError::~shortWriteError() = default;
|
|
|
|
|
2018-05-26 15:56:53 -05:00
|
|
|
const char *shortWriteError::String(void) const
|
2018-05-25 20:07:45 -05:00
|
|
|
{
|
|
|
|
return "short write";
|
|
|
|
}
|
|
|
|
|
|
|
|
Error *NewEOF(void)
|
|
|
|
{
|
|
|
|
return new eofError;
|
|
|
|
}
|
|
|
|
|
|
|
|
Error *NewErrShortWrite(void)
|
|
|
|
{
|
|
|
|
return new shortWriteError;
|
|
|
|
}
|
|
|
|
|
|
|
|
// IsEOF reports whether e is an end-of-file error, that is, whether its
// dynamic type is exactly eofError. A NULL e (no error) is never EOF.
bool IsEOF(Error *e)
{
	// applying typeid to a dereferenced null pointer throws std::bad_typeid,
	// so NULL has to be rejected before the comparison below
	if (e == NULL)
		return false;
	// typeid does not work directly with pointers, alas (see https://stackoverflow.com/questions/4202877/typeid-for-polymorphic-types)
	return typeid (*e) == typeid (eofError);
}
|
2018-05-24 23:33:56 -05:00
|
|
|
|
2018-05-27 14:36:16 -05:00
|
|
|
namespace {

// sliceAlloc is the bookkeeping record for one heap buffer that ByteSlices
// point into.
struct sliceAlloc {
	char *b;		// start of the buffer, as returned by new[]
	size_t n;		// size of the buffer in bytes
	uintmax_t refcount;	// number of outstanding references to the buffer
};

// sliceAllocs maps the start address of every live buffer to its record.
std::map<uintptr_t, struct sliceAlloc> sliceAllocs;

// sliceAlloc allocates a new n-byte buffer, registers it with a reference
// count of 1, and returns its start address.
char *sliceAlloc(size_t n)
{
	struct sliceAlloc sa;

	sa.b = new char[n];
	sa.n = n;
	sa.refcount = 1;
	sliceAllocs[(uintptr_t) (sa.b)] = sa;
	return sa.b;
}

// sliceLookup returns the key (start address) of the registered buffer that
// b points into, or 0 if b does not point into any registered buffer.
// b may point anywhere from the start of the buffer to one past its end.
// NOTE(review): a one-past-the-end pointer is ambiguous if another buffer
// happens to start at exactly that address; the later buffer wins here.
uintptr_t sliceLookup(char *b)
{
	std::map<uintptr_t, struct sliceAlloc>::iterator it;
	uintptr_t addr;

	addr = (uintptr_t) b;
	// the owning buffer is the one with the greatest start address <= addr;
	// upper_bound() yields the first start address > addr, so step back one
	it = sliceAllocs.upper_bound(addr);
	if (it == sliceAllocs.begin())
		return 0;
	--it;
	if (addr - it->first > it->second.n)
		return 0;
	return it->first;
}

// sliceRetain adds one reference to the buffer that b points into.
// NULL and pointers outside every registered buffer are ignored.
void sliceRetain(char *b)
{
	std::map<uintptr_t, struct sliceAlloc>::iterator it;

	if (b == NULL)
		return;
	// find() rather than operator[] so an unknown key is not inserted
	it = sliceAllocs.find(sliceLookup(b));
	if (it == sliceAllocs.end())
		return;
	it->second.refcount++;
}

// sliceRelease drops one reference to the buffer that b points into and
// frees and unregisters the buffer once no references remain.
// NULL and pointers outside every registered buffer are ignored.
void sliceRelease(char *b)
{
	std::map<uintptr_t, struct sliceAlloc>::iterator it;

	if (b == NULL)
		return;
	it = sliceAllocs.find(sliceLookup(b));
	if (it == sliceAllocs.end())
		return;
	it->second.refcount--;
	if (it->second.refcount == 0) {
		delete[] it->second.b;
		sliceAllocs.erase(it);
	}
}

}
|
|
|
|
|
|
|
|
// Constructs an empty slice: no buffer, zero length, zero capacity.
ByteSlice::ByteSlice() :
	data(NULL),
	len(0),
	cap(0)
{
	// nothing else to set up
}
|
|
|
|
|
|
|
|
// Copy constructor: the new slice views the same bytes as b and takes
// its own reference on the underlying buffer.
ByteSlice::ByteSlice(const ByteSlice &b) :
	data(b.data),
	len(b.len),
	cap(b.cap)
{
	sliceRetain(data);
}
|
|
|
|
|
|
|
|
// Move constructor: takes over b's pointer, length, and capacity (and with
// them b's reference on the buffer) and leaves b as an empty slice.
ByteSlice::ByteSlice(ByteSlice &&b) :
	data(b.data),
	len(b.len),
	cap(b.cap)
{
	b.data = NULL;
	b.len = 0;
	b.cap = 0;
}
|
|
|
|
|
|
|
|
// Constructs a slice of length and capacity n backed by a freshly
// allocated buffer holding a copy of the n bytes at b.
ByteSlice::ByteSlice(const char *b, size_t n)
{
	char *fresh = sliceAlloc(n);

	// sizeof (char) is 1 by definition, so n is already the byte count
	memcpy(fresh, b, n);
	this->data = fresh;
	this->cap = n;
	this->len = n;
}
|
|
|
|
|
|
|
|
// Constructs a slice with the given length and capacity backed by a freshly
// allocated buffer; the first len bytes are zeroed.
// If cap is smaller than len, the capacity is raised to len so that the
// zeroing below cannot run past the end of the buffer.
ByteSlice::ByteSlice(size_t len, size_t cap)
{
	if (cap < len)
		cap = len;
	this->data = sliceAlloc(cap);
	memset(this->data, 0, len);
	this->len = len;
	this->cap = cap;
}
|
|
|
|
|
2018-05-27 15:32:33 -05:00
|
|
|
// Convenience overload taking an int length; it converts len to size_t and
// delegates to the (size_t, size_t) constructor.
ByteSlice::ByteSlice(int len, size_t cap) :
	ByteSlice(static_cast<size_t>(len), cap)
{
	// all of the work happens in the delegated constructor
}
|
|
|
|
|
2018-05-27 14:36:16 -05:00
|
|
|
// Drops this slice's reference on its buffer; sliceRelease() ignores NULL,
// so empty and moved-from slices are fine.
ByteSlice::~ByteSlice()
{
	sliceRelease(data);
}
|
|
|
|
|
|
|
|
// Copy assignment: makes this slice view the same bytes as b.
// Takes a reference on b's buffer and drops the reference this slice held
// on its previous buffer, so the previous buffer is not leaked.
ByteSlice &ByteSlice::operator=(const ByteSlice &b)
{
	// retain before release so that self-assignment (or assigning another
	// view of the same buffer) can never drop the count to zero in between
	sliceRetain(b.data);
	sliceRelease(this->data);
	this->data = b.data;
	this->len = b.len;
	this->cap = b.cap;
	return *this;
}
|
|
|
|
|
|
|
|
// Move assignment: takes over b's pointer, length, and capacity (and with
// them b's reference on the buffer) and leaves b as an empty slice.
// The reference this slice held on its previous buffer is dropped first,
// so the previous buffer is not leaked.
ByteSlice &ByteSlice::operator=(ByteSlice &&b)
{
	// self-move must leave the object untouched; without this check the
	// slice would null itself out and leak its reference
	if (this == &b)
		return *this;
	// b still holds its own reference, so releasing ours cannot free the
	// buffer we are about to take over even if both share one buffer
	sliceRelease(this->data);
	this->data = b.data;
	b.data = NULL;
	this->len = b.len;
	b.len = 0;
	this->cap = b.cap;
	b.cap = 0;
	return *this;
}
|
|
|
|
|
|
|
|
char *ByteSlice::Data(void)
|
|
|
|
{
|
|
|
|
return this->data;
|
|
|
|
}
|
|
|
|
|
|
|
|
const char *ByteSlice::Data(void) const
|
|
|
|
{
|
|
|
|
return this->data;
|
|
|
|
}
|
|
|
|
|
|
|
|
size_t ByteSlice::Len(void) const
|
|
|
|
{
|
|
|
|
return this->len;
|
|
|
|
}
|
|
|
|
|
|
|
|
size_t ByteSlice::Cap(void) const
|
|
|
|
{
|
|
|
|
return this->cap;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Slice returns a new slice viewing bytes [start, end) of this slice.
// The result shares this slice's buffer (no bytes are copied) and holds its
// own reference on it; its capacity is this slice's capacity minus start.
// No bounds checking is performed on start or end.
ByteSlice ByteSlice::Slice(size_t start, size_t end)
{
	ByteSlice sub;

	sub.len = end - start;
	sub.cap = this->cap - start;
	sub.data = this->data + start;
	sliceRetain(sub.data);
	return sub;
}
|
|
|
|
|
|
|
|
// Append returns a slice holding this slice's bytes followed by the n bytes
// at b. This slice's own length is not changed.
// If the extra bytes fit within this slice's capacity they are written in
// place and the result shares this slice's buffer; otherwise a new buffer of
// exactly Len() + n bytes is allocated and both parts are copied into it.
ByteSlice ByteSlice::Append(const char *b, size_t n)
{
	ByteSlice s;
	size_t total;

	total = this->len + n;
	// <= rather than <: an append that exactly fills the capacity still fits.
	// A slice with no buffer always takes the allocating path below.
	if (this->data != NULL && total <= this->cap) {
		s.data = this->data;
		sliceRetain(s.data);
		s.len = total;
		s.cap = this->cap;
		// memcpy() must not be given a null pointer, even for zero bytes
		if (n > 0)
			memcpy(s.data + this->len, b, n);
		return s;
	}
	s.data = sliceAlloc(total);
	if (this->len > 0)
		memcpy(s.data, this->data, this->len);
	if (n > 0)
		memcpy(s.data + this->len, b, n);
	s.len = total;
	s.cap = total;
	return s;
}
|
|
|
|
|
|
|
|
// Append returns a slice holding this slice's bytes followed by b's bytes;
// it forwards to the pointer-and-length overload.
ByteSlice ByteSlice::Append(const ByteSlice &b)
{
	const char *src = b.Data();
	const size_t count = b.Len();

	return Append(src, count);
}
|
|
|
|
|
2018-05-27 14:50:00 -05:00
|
|
|
// AppendString appends the characters of the NUL-terminated string str
// (not including the terminator) via Append().
ByteSlice ByteSlice::AppendString(const char *str)
{
	const size_t count = strlen(str);

	return Append(str, count);
}
|
|
|
|
|
2018-05-27 14:36:16 -05:00
|
|
|
void ByteSlice::CopyFrom(const char *b, size_t n)
|
|
|
|
{
|
|
|
|
n = std::min(this->len, n);
|
|
|
|
memcpy(this->data, b, n);
|
|
|
|
}
|
|
|
|
|
|
|
|
void ByteSlice::CopyFrom(const ByteSlice &b)
|
|
|
|
{
|
|
|
|
this->CopyFrom(b.data, b.len);
|
|
|
|
}
|
|
|
|
|
2018-05-24 23:33:56 -05:00
|
|
|
#define nbuf 1024
|
|
|
|
|
2018-05-25 20:07:45 -05:00
|
|
|
// Constructs a Scanner that reads from r.
// buf is the nbuf-byte read buffer, p is the not-yet-consumed part of buf
// (initially empty), line accumulates the current line (initially empty
// with nbuf bytes of capacity), and err starts out as "no error".
Scanner::Scanner(ReadCloser *r) :
	r(r),
	buf(nbuf, nbuf),
	p(),
	line(0, nbuf),
	err(NULL)
{
	// everything is set up by the initializers above
}
|
|
|
|
|
|
|
|
// Frees the stored error, if any. The reader r is not touched here.
Scanner::~Scanner()
{
	// delete on a null pointer is a no-op, so no explicit check is needed
	delete this->err;
}
|
|
|
|
|
|
|
|
bool Scanner::Scan(void)
|
|
|
|
{
|
2018-05-26 15:56:53 -05:00
|
|
|
size_t n;
|
2018-05-24 23:33:56 -05:00
|
|
|
|
2018-05-25 20:07:45 -05:00
|
|
|
if (this->err != NULL)
|
2018-05-24 23:33:56 -05:00
|
|
|
return false;
|
2018-05-27 14:50:00 -05:00
|
|
|
this->line = this->line.Slice(0, 0);
|
2018-05-24 23:33:56 -05:00
|
|
|
for (;;) {
|
2018-05-27 18:48:39 -05:00
|
|
|
if (this->p.Len() > 0) {
|
2018-05-24 23:33:56 -05:00
|
|
|
size_t j;
|
|
|
|
bool haveline;
|
|
|
|
|
|
|
|
haveline = false;
|
2018-05-27 18:48:39 -05:00
|
|
|
for (j = 0; j < this->p.Len(); j++)
|
|
|
|
if (this->p.Data()[j] == '\n') {
|
2018-05-24 23:33:56 -05:00
|
|
|
haveline = true;
|
|
|
|
break;
|
|
|
|
}
|
2018-05-27 18:48:39 -05:00
|
|
|
this->line = this->line.Append(this->p.Slice(0, j));
|
|
|
|
this->p = this->p.Slice(j, this->p.Len());
|
2018-05-24 23:33:56 -05:00
|
|
|
if (haveline) {
|
|
|
|
// swallow the \n for the next time through
|
2018-05-27 18:48:39 -05:00
|
|
|
this->p = this->p.Slice(1, this->p.Len());
|
2018-05-24 23:33:56 -05:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
// otherwise, the buffer was exhausted in the middle of a line, so fall through
|
|
|
|
}
|
|
|
|
// need to refill the buffer
|
2018-05-27 15:32:33 -05:00
|
|
|
this->err = this->r->Read(this->buf, &n);
|
2018-05-25 20:07:45 -05:00
|
|
|
if (this->err != NULL)
|
2018-05-24 23:33:56 -05:00
|
|
|
return false;
|
2018-05-27 18:48:39 -05:00
|
|
|
this->p = this->buf.Slice(0, n);
|
2018-05-24 23:33:56 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-05-27 14:50:00 -05:00
|
|
|
// Bytes returns a copy of the slice holding the most recently scanned line.
// The copy shares its buffer with the scanner's line member.
ByteSlice Scanner::Bytes() const
{
	return line;
}
|
|
|
|
|
2018-05-26 15:56:53 -05:00
|
|
|
// Err returns the error that stopped scanning, or NULL if there is none.
// Reaching the end of the input is not reported as an error, so an EOF
// error is also returned as NULL.
// The returned pointer is the scanner's stored error, which the Scanner
// destructor deletes.
Error *Scanner::Err(void) const
{
	// check for NULL first: IsEOF() applies typeid to *err, which must not
	// be done on a null pointer
	if (this->err == NULL || IsEOF(this->err))
		return NULL;
	return this->err;
}
|
2018-05-26 16:42:11 -05:00
|
|
|
|
2018-05-27 14:50:00 -05:00
|
|
|
// ByteSliceFields splits s into fields separated by runs of spaces and/or
// tabs. Leading and trailing separators are skipped, so no field is empty.
// Each field is produced with s.Slice(), so it shares s's buffer.
std::vector<ByteSlice> ByteSliceFields(ByteSlice s)
{
	std::vector<ByteSlice> fields;
	const char *bytes = s.Data();
	const size_t total = s.Len();
	size_t start = 0;

	for (;;) {
		// skip the separators in front of the next field
		while (start < total && (bytes[start] == ' ' || bytes[start] == '\t'))
			start++;
		if (start >= total)
			break;
		// bytes[start] begins a field; extend it up to the next separator
		size_t stop = start + 1;
		while (stop < total && bytes[stop] != ' ' && bytes[stop] != '\t')
			stop++;
		fields.push_back(s.Slice(start, stop));
		start = stop;
	}
	return fields;
}
|