424 lines
15 KiB
C
424 lines
15 KiB
C
/*
|
|
* Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
|
|
*
|
|
* This program is free software: you can use, redistribute, and/or modify
|
|
* it under the terms of the GNU Affero General Public License, version 3
|
|
* or later ("AGPL"), as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE.
|
|
*
|
|
* You should have received a copy of the GNU Affero General Public License
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
#ifndef _TD_DATA_FORMAT_H_
|
|
#define _TD_DATA_FORMAT_H_
|
|
|
|
#include <stdint.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
|
|
#include "talgo.h"
|
|
#include "ttype.h"
|
|
#include "tutil.h"
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
#define STR_TO_VARSTR(x, str) \
|
|
do { \
|
|
VarDataLenT __len = (VarDataLenT)strlen(str); \
|
|
*(VarDataLenT *)(x) = __len; \
|
|
memcpy(varDataVal(x), (str), __len); \
|
|
} while (0);
|
|
|
|
#define STR_WITH_MAXSIZE_TO_VARSTR(x, str, _maxs) \
|
|
do { \
|
|
char *_e = stpncpy(varDataVal(x), (str), (_maxs)-VARSTR_HEADER_SIZE); \
|
|
varDataSetLen(x, (_e - (x)-VARSTR_HEADER_SIZE)); \
|
|
} while (0)
|
|
|
|
#define STR_WITH_SIZE_TO_VARSTR(x, str, _size) \
|
|
do { \
|
|
*(VarDataLenT *)(x) = (VarDataLenT)(_size); \
|
|
memcpy(varDataVal(x), (str), (_size)); \
|
|
} while (0);
|
|
|
|
// ----------------- TSDB COLUMN DEFINITION
|
|
typedef struct {
|
|
int8_t type; // Column type
|
|
int16_t colId; // column ID
|
|
int16_t bytes; // column bytes
|
|
int16_t offset; // point offset in SDataRow after the header part
|
|
} STColumn;
|
|
|
|
#define colType(col) ((col)->type)
|
|
#define colColId(col) ((col)->colId)
|
|
#define colBytes(col) ((col)->bytes)
|
|
#define colOffset(col) ((col)->offset)
|
|
|
|
#define colSetType(col, t) (colType(col) = (t))
|
|
#define colSetColId(col, id) (colColId(col) = (id))
|
|
#define colSetBytes(col, b) (colBytes(col) = (b))
|
|
#define colSetOffset(col, o) (colOffset(col) = (o))
|
|
|
|
// ----------------- TSDB SCHEMA DEFINITION
|
|
typedef struct {
|
|
int version; // version
|
|
int numOfCols; // Number of columns appended
|
|
int tlen; // maximum length of a SDataRow without the header part (sizeof(VarDataOffsetT) + sizeof(VarDataLenT) + (bytes))
|
|
uint16_t flen; // First part length in a SDataRow after the header part
|
|
uint16_t vlen; // pure value part length, excluded the overhead (bytes only)
|
|
STColumn columns[];
|
|
} STSchema;
|
|
|
|
#define schemaNCols(s) ((s)->numOfCols)
|
|
#define schemaVersion(s) ((s)->version)
|
|
#define schemaTLen(s) ((s)->tlen)
|
|
#define schemaFLen(s) ((s)->flen)
|
|
#define schemaVLen(s) ((s)->vlen)
|
|
#define schemaColAt(s, i) ((s)->columns + i)
|
|
#define tdFreeSchema(s) tfree((s))
|
|
|
|
STSchema *tdDupSchema(STSchema *pSchema);
|
|
int tdEncodeSchema(void **buf, STSchema *pSchema);
|
|
void * tdDecodeSchema(void *buf, STSchema **pRSchema);
|
|
|
|
static FORCE_INLINE int comparColId(const void *key1, const void *key2) {
|
|
if (*(int16_t *)key1 > ((STColumn *)key2)->colId) {
|
|
return 1;
|
|
} else if (*(int16_t *)key1 < ((STColumn *)key2)->colId) {
|
|
return -1;
|
|
} else {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
static FORCE_INLINE STColumn *tdGetColOfID(STSchema *pSchema, int16_t colId) {
|
|
void *ptr = bsearch(&colId, (void *)pSchema->columns, schemaNCols(pSchema), sizeof(STColumn), comparColId);
|
|
if (ptr == NULL) return NULL;
|
|
return (STColumn *)ptr;
|
|
}
|
|
|
|
// ----------------- SCHEMA BUILDER DEFINITION
|
|
typedef struct {
|
|
int tCols;
|
|
int nCols;
|
|
int tlen;
|
|
uint16_t flen;
|
|
uint16_t vlen;
|
|
int version;
|
|
STColumn *columns;
|
|
} STSchemaBuilder;
|
|
|
|
int tdInitTSchemaBuilder(STSchemaBuilder *pBuilder, int32_t version);
|
|
void tdDestroyTSchemaBuilder(STSchemaBuilder *pBuilder);
|
|
void tdResetTSchemaBuilder(STSchemaBuilder *pBuilder, int32_t version);
|
|
int tdAddColToSchema(STSchemaBuilder *pBuilder, int8_t type, int16_t colId, int16_t bytes);
|
|
STSchema *tdGetSchemaFromBuilder(STSchemaBuilder *pBuilder);
|
|
|
|
// ----------------- Semantic timestamp key definition
|
|
typedef uint64_t TKEY;
|
|
|
|
#define TKEY_INVALID UINT64_MAX
|
|
#define TKEY_NULL TKEY_INVALID
|
|
#define TKEY_NEGATIVE_FLAG (((TKEY)1) << 63)
|
|
#define TKEY_DELETE_FLAG (((TKEY)1) << 62)
|
|
#define TKEY_VALUE_FILTER (~(TKEY_NEGATIVE_FLAG | TKEY_DELETE_FLAG))
|
|
|
|
#define TKEY_IS_NEGATIVE(tkey) (((tkey)&TKEY_NEGATIVE_FLAG) != 0)
|
|
#define TKEY_IS_DELETED(tkey) (((tkey)&TKEY_DELETE_FLAG) != 0)
|
|
#define tdSetTKEYDeleted(tkey) ((tkey) | TKEY_DELETE_FLAG)
|
|
#define tdGetTKEY(key) (((TKEY)ABS(key)) | (TKEY_NEGATIVE_FLAG & (TKEY)(key)))
|
|
#define tdGetKey(tkey) (((TSKEY)((tkey)&TKEY_VALUE_FILTER)) * (TKEY_IS_NEGATIVE(tkey) ? -1 : 1))
|
|
|
|
#define MIN_TS_KEY ((TSKEY)0x8000000000000001)
|
|
#define MAX_TS_KEY ((TSKEY)0x3fffffffffffffff)
|
|
|
|
#define TD_TO_TKEY(key) tdGetTKEY(((key) < MIN_TS_KEY) ? MIN_TS_KEY : (((key) > MAX_TS_KEY) ? MAX_TS_KEY : key))
|
|
|
|
static FORCE_INLINE TKEY keyToTkey(TSKEY key) {
|
|
TSKEY lkey = key;
|
|
if (key > MAX_TS_KEY) {
|
|
lkey = MAX_TS_KEY;
|
|
} else if (key < MIN_TS_KEY) {
|
|
lkey = MIN_TS_KEY;
|
|
}
|
|
|
|
return tdGetTKEY(lkey);
|
|
}
|
|
|
|
static FORCE_INLINE int tkeyComparFn(const void *tkey1, const void *tkey2) {
|
|
TSKEY key1 = tdGetKey(*(TKEY *)tkey1);
|
|
TSKEY key2 = tdGetKey(*(TKEY *)tkey2);
|
|
|
|
if (key1 < key2) {
|
|
return -1;
|
|
} else if (key1 > key2) {
|
|
return 1;
|
|
} else {
|
|
return 0;
|
|
}
|
|
}
|
|
// ----------------- Data row structure
|
|
|
|
/* A data row, the format is like below:
|
|
* |<--------------------+--------------------------- len ---------------------------------->|
|
|
* |<-- Head -->|<--------- flen -------------->| |
|
|
* +---------------------+---------------------------------+---------------------------------+
|
|
* | uint16_t | int16_t | | |
|
|
* +----------+----------+---------------------------------+---------------------------------+
|
|
* | len | sversion | First part | Second part |
|
|
* +----------+----------+---------------------------------+---------------------------------+
|
|
*
|
|
* NOTE: timestamp in this row structure is TKEY instead of TSKEY
|
|
*/
|
|
typedef void *SDataRow;
|
|
|
|
#define TD_DATA_ROW_HEAD_SIZE (sizeof(uint16_t) + sizeof(int16_t))
|
|
|
|
#define dataRowLen(r) (*(uint16_t *)(r))
|
|
#define dataRowVersion(r) *(int16_t *)POINTER_SHIFT(r, sizeof(int16_t))
|
|
#define dataRowTuple(r) POINTER_SHIFT(r, TD_DATA_ROW_HEAD_SIZE)
|
|
#define dataRowTKey(r) (*(TKEY *)(dataRowTuple(r)))
|
|
#define dataRowKey(r) tdGetKey(dataRowTKey(r))
|
|
#define dataRowSetLen(r, l) (dataRowLen(r) = (l))
|
|
#define dataRowSetVersion(r, v) (dataRowVersion(r) = (v))
|
|
#define dataRowCpy(dst, r) memcpy((dst), (r), dataRowLen(r))
|
|
#define dataRowMaxBytesFromSchema(s) (schemaTLen(s) + TD_DATA_ROW_HEAD_SIZE)
|
|
#define dataRowDeleted(r) TKEY_IS_DELETED(dataRowTKey(r))
|
|
|
|
SDataRow tdNewDataRowFromSchema(STSchema *pSchema);
|
|
void tdFreeDataRow(SDataRow row);
|
|
void tdInitDataRow(SDataRow row, STSchema *pSchema);
|
|
SDataRow tdDataRowDup(SDataRow row);
|
|
|
|
// offset here not include dataRow header length
|
|
static FORCE_INLINE int tdAppendColVal(SDataRow row, void *value, int8_t type, int32_t bytes, int32_t offset) {
|
|
ASSERT(value != NULL);
|
|
int32_t toffset = offset + TD_DATA_ROW_HEAD_SIZE;
|
|
char * ptr = (char *)POINTER_SHIFT(row, dataRowLen(row));
|
|
|
|
if (IS_VAR_DATA_TYPE(type)) {
|
|
*(VarDataOffsetT *)POINTER_SHIFT(row, toffset) = dataRowLen(row);
|
|
memcpy(ptr, value, varDataTLen(value));
|
|
dataRowLen(row) += varDataTLen(value);
|
|
} else {
|
|
if (offset == 0) {
|
|
ASSERT(type == TSDB_DATA_TYPE_TIMESTAMP);
|
|
TKEY tvalue = tdGetTKEY(*(TSKEY *)value);
|
|
memcpy(POINTER_SHIFT(row, toffset), (void *)(&tvalue), TYPE_BYTES[type]);
|
|
} else {
|
|
memcpy(POINTER_SHIFT(row, toffset), value, TYPE_BYTES[type]);
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
// NOTE: offset here including the header size
|
|
static FORCE_INLINE void *tdGetRowDataOfCol(SDataRow row, int8_t type, int32_t offset) {
|
|
if (IS_VAR_DATA_TYPE(type)) {
|
|
return POINTER_SHIFT(row, *(VarDataOffsetT *)POINTER_SHIFT(row, offset));
|
|
} else {
|
|
return POINTER_SHIFT(row, offset);
|
|
}
|
|
}
|
|
|
|
// ----------------- Data column structure
|
|
typedef struct SDataCol {
|
|
int8_t type; // column type
|
|
int16_t colId; // column ID
|
|
int bytes; // column data bytes defined
|
|
int offset; // data offset in a SDataRow (including the header size)
|
|
int spaceSize; // Total space size for this column
|
|
int len; // column data length
|
|
VarDataOffsetT *dataOff; // For binary and nchar data, the offset in the data column
|
|
void * pData; // Actual data pointer
|
|
} SDataCol;
|
|
|
|
static FORCE_INLINE void dataColReset(SDataCol *pDataCol) { pDataCol->len = 0; }
|
|
|
|
void dataColInit(SDataCol *pDataCol, STColumn *pCol, void **pBuf, int maxPoints);
|
|
void dataColAppendVal(SDataCol *pCol, void *value, int numOfRows, int maxPoints);
|
|
void dataColSetOffset(SDataCol *pCol, int nEle);
|
|
|
|
bool isNEleNull(SDataCol *pCol, int nEle);
|
|
void dataColSetNEleNull(SDataCol *pCol, int nEle, int maxPoints);
|
|
|
|
// Get the data pointer from a column-wised data
|
|
static FORCE_INLINE void *tdGetColDataOfRow(SDataCol *pCol, int row) {
|
|
if (IS_VAR_DATA_TYPE(pCol->type)) {
|
|
return POINTER_SHIFT(pCol->pData, pCol->dataOff[row]);
|
|
} else {
|
|
return POINTER_SHIFT(pCol->pData, TYPE_BYTES[pCol->type] * row);
|
|
}
|
|
}
|
|
|
|
static FORCE_INLINE int32_t dataColGetNEleLen(SDataCol *pDataCol, int rows) {
|
|
ASSERT(rows > 0);
|
|
|
|
if (IS_VAR_DATA_TYPE(pDataCol->type)) {
|
|
return pDataCol->dataOff[rows - 1] + varDataTLen(tdGetColDataOfRow(pDataCol, rows - 1));
|
|
} else {
|
|
return TYPE_BYTES[pDataCol->type] * rows;
|
|
}
|
|
}
|
|
|
|
typedef struct {
|
|
int maxRowSize;
|
|
int maxCols; // max number of columns
|
|
int maxPoints; // max number of points
|
|
int bufSize;
|
|
|
|
int numOfRows;
|
|
int numOfCols; // Total number of cols
|
|
int sversion; // TODO: set sversion
|
|
void * buf;
|
|
SDataCol *cols;
|
|
} SDataCols;
|
|
|
|
#define keyCol(pCols) (&((pCols)->cols[0])) // Key column
|
|
#define dataColsTKeyAt(pCols, idx) ((TKEY *)(keyCol(pCols)->pData))[(idx)]
|
|
#define dataColsKeyAt(pCols, idx) tdGetKey(dataColsTKeyAt(pCols, idx))
|
|
static FORCE_INLINE TKEY dataColsTKeyFirst(SDataCols *pCols) {
|
|
if (pCols->numOfRows) {
|
|
return dataColsTKeyAt(pCols, 0);
|
|
} else {
|
|
return TKEY_INVALID;
|
|
}
|
|
}
|
|
|
|
static FORCE_INLINE TSKEY dataColsKeyFirst(SDataCols *pCols) {
|
|
if (pCols->numOfRows) {
|
|
return dataColsKeyAt(pCols, 0);
|
|
} else {
|
|
return TSDB_DATA_TIMESTAMP_NULL;
|
|
}
|
|
}
|
|
|
|
static FORCE_INLINE TKEY dataColsTKeyLast(SDataCols *pCols) {
|
|
if (pCols->numOfRows) {
|
|
return dataColsTKeyAt(pCols, pCols->numOfRows - 1);
|
|
} else {
|
|
return TKEY_INVALID;
|
|
}
|
|
}
|
|
|
|
static FORCE_INLINE TSKEY dataColsKeyLast(SDataCols *pCols) {
|
|
if (pCols->numOfRows) {
|
|
return dataColsKeyAt(pCols, pCols->numOfRows - 1);
|
|
} else {
|
|
return TSDB_DATA_TIMESTAMP_NULL;
|
|
}
|
|
}
|
|
|
|
SDataCols *tdNewDataCols(int maxRowSize, int maxCols, int maxRows);
|
|
void tdResetDataCols(SDataCols *pCols);
|
|
int tdInitDataCols(SDataCols *pCols, STSchema *pSchema);
|
|
SDataCols *tdDupDataCols(SDataCols *pCols, bool keepData);
|
|
SDataCols *tdFreeDataCols(SDataCols *pCols);
|
|
void tdAppendDataRowToDataCol(SDataRow row, STSchema *pSchema, SDataCols *pCols);
|
|
int tdMergeDataCols(SDataCols *target, SDataCols *src, int rowsToMerge);
|
|
|
|
// ----------------- K-V data row structure
|
|
/*
|
|
* +----------+----------+---------------------------------+---------------------------------+
|
|
* | int16_t | int16_t | | |
|
|
* +----------+----------+---------------------------------+---------------------------------+
|
|
* | len | ncols | cols index | data part |
|
|
* +----------+----------+---------------------------------+---------------------------------+
|
|
*/
|
|
typedef void *SKVRow;
|
|
|
|
typedef struct {
|
|
int16_t colId;
|
|
int16_t offset;
|
|
} SColIdx;
|
|
|
|
#define TD_KV_ROW_HEAD_SIZE (2 * sizeof(int16_t))
|
|
|
|
#define kvRowLen(r) (*(int16_t *)(r))
|
|
#define kvRowNCols(r) (*(int16_t *)POINTER_SHIFT(r, sizeof(int16_t)))
|
|
#define kvRowSetLen(r, len) kvRowLen(r) = (len)
|
|
#define kvRowSetNCols(r, n) kvRowNCols(r) = (n)
|
|
#define kvRowColIdx(r) (SColIdx *)POINTER_SHIFT(r, TD_KV_ROW_HEAD_SIZE)
|
|
#define kvRowValues(r) POINTER_SHIFT(r, TD_KV_ROW_HEAD_SIZE + sizeof(SColIdx) * kvRowNCols(r))
|
|
#define kvRowCpy(dst, r) memcpy((dst), (r), kvRowLen(r))
|
|
#define kvRowColVal(r, colIdx) POINTER_SHIFT(kvRowValues(r), (colIdx)->offset)
|
|
#define kvRowColIdxAt(r, i) (kvRowColIdx(r) + (i))
|
|
#define kvRowFree(r) tfree(r)
|
|
#define kvRowEnd(r) POINTER_SHIFT(r, kvRowLen(r))
|
|
|
|
SKVRow tdKVRowDup(SKVRow row);
|
|
int tdSetKVRowDataOfCol(SKVRow *orow, int16_t colId, int8_t type, void *value);
|
|
int tdEncodeKVRow(void **buf, SKVRow row);
|
|
void * tdDecodeKVRow(void *buf, SKVRow *row);
|
|
void tdSortKVRowByColIdx(SKVRow row);
|
|
|
|
static FORCE_INLINE int comparTagId(const void *key1, const void *key2) {
|
|
if (*(int16_t *)key1 > ((SColIdx *)key2)->colId) {
|
|
return 1;
|
|
} else if (*(int16_t *)key1 < ((SColIdx *)key2)->colId) {
|
|
return -1;
|
|
} else {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
static FORCE_INLINE void *tdGetKVRowValOfCol(SKVRow row, int16_t colId) {
|
|
void *ret = taosbsearch(&colId, kvRowColIdx(row), kvRowNCols(row), sizeof(SColIdx), comparTagId, TD_EQ);
|
|
if (ret == NULL) return NULL;
|
|
return kvRowColVal(row, (SColIdx *)ret);
|
|
}
|
|
|
|
// ----------------- K-V data row builder
|
|
typedef struct {
|
|
int16_t tCols;
|
|
int16_t nCols;
|
|
SColIdx *pColIdx;
|
|
int16_t alloc;
|
|
int16_t size;
|
|
void * buf;
|
|
} SKVRowBuilder;
|
|
|
|
int tdInitKVRowBuilder(SKVRowBuilder *pBuilder);
|
|
void tdDestroyKVRowBuilder(SKVRowBuilder *pBuilder);
|
|
void tdResetKVRowBuilder(SKVRowBuilder *pBuilder);
|
|
SKVRow tdGetKVRowFromBuilder(SKVRowBuilder *pBuilder);
|
|
|
|
static FORCE_INLINE int tdAddColToKVRow(SKVRowBuilder *pBuilder, int16_t colId, int8_t type, void *value) {
|
|
if (pBuilder->nCols >= pBuilder->tCols) {
|
|
pBuilder->tCols *= 2;
|
|
pBuilder->pColIdx = (SColIdx *)realloc((void *)(pBuilder->pColIdx), sizeof(SColIdx) * pBuilder->tCols);
|
|
if (pBuilder->pColIdx == NULL) return -1;
|
|
}
|
|
|
|
pBuilder->pColIdx[pBuilder->nCols].colId = colId;
|
|
pBuilder->pColIdx[pBuilder->nCols].offset = pBuilder->size;
|
|
|
|
pBuilder->nCols++;
|
|
|
|
int tlen = IS_VAR_DATA_TYPE(type) ? varDataTLen(value) : TYPE_BYTES[type];
|
|
if (tlen > pBuilder->alloc - pBuilder->size) {
|
|
while (tlen > pBuilder->alloc - pBuilder->size) {
|
|
pBuilder->alloc *= 2;
|
|
}
|
|
pBuilder->buf = realloc(pBuilder->buf, pBuilder->alloc);
|
|
if (pBuilder->buf == NULL) return -1;
|
|
}
|
|
|
|
memcpy(POINTER_SHIFT(pBuilder->buf, pBuilder->size), value, tlen);
|
|
pBuilder->size += tlen;
|
|
|
|
return 0;
|
|
}
|
|
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
|
|
#endif // _TD_DATA_FORMAT_H_
|