428 lines
14 KiB
C
428 lines
14 KiB
C
/*
|
|
* Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
|
|
*
|
|
* This program is free software: you can use, redistribute, and/or modify
|
|
* it under the terms of the GNU Affero General Public License, version 3
|
|
* or later ("AGPL"), as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE.
|
|
*
|
|
* You should have received a copy of the GNU Affero General Public License
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#ifndef _TD_COMMON_DATA_FORMAT_H_
|
|
#define _TD_COMMON_DATA_FORMAT_H_
|
|
|
|
#include "os.h"
|
|
#include "talgo.h"
|
|
#include "tarray.h"
|
|
#include "tencode.h"
|
|
#include "ttypes.h"
|
|
#include "tutil.h"
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
typedef struct SSchema SSchema;
|
|
typedef struct STColumn STColumn;
|
|
typedef struct STSchema STSchema;
|
|
typedef struct SValue SValue;
|
|
typedef struct SColVal SColVal;
|
|
typedef struct STSRow2 STSRow2;
|
|
typedef struct STSRowBuilder STSRowBuilder;
|
|
typedef struct SColData SColData;
|
|
typedef struct STagVal STagVal;
|
|
typedef struct STag STag;
|
|
|
|
// STSchema
|
|
int32_t tTSchemaCreate(int32_t sver, SSchema *pSchema, int32_t nCols, STSchema **ppTSchema);
|
|
void tTSchemaDestroy(STSchema *pTSchema);
|
|
|
|
// SValue
|
|
int tValueCmprFn(const SValue *pValue1, const SValue *pValue2, int8_t type);
|
|
|
|
// STSRow2
|
|
#define COL_VAL_NONE(CID) ((SColVal){.cid = (CID), .isNone = 1})
|
|
#define COL_VAL_NULL(CID) ((SColVal){.cid = (CID), .isNull = 1})
|
|
#define COL_VAL_VALUE(CID, V) ((SColVal){.cid = (CID), .value = (V)})
|
|
|
|
int32_t tTSRowNew(STSRowBuilder *pBuilder, SArray *pArray, STSchema *pTSchema, STSRow2 **ppRow);
|
|
int32_t tTSRowClone(const STSRow2 *pRow, STSRow2 **ppRow);
|
|
void tTSRowFree(STSRow2 *pRow);
|
|
void tTSRowGet(STSRow2 *pRow, STSchema *pTSchema, int32_t iCol, SColVal *pColVal);
|
|
int32_t tTSRowToArray(STSRow2 *pRow, STSchema *pTSchema, SArray **ppArray);
|
|
int32_t tPutTSRow(uint8_t *p, STSRow2 *pRow);
|
|
int32_t tGetTSRow(uint8_t *p, STSRow2 *pRow);
|
|
|
|
// STSRowBuilder
|
|
#define tsRowBuilderInit() ((STSRowBuilder){0})
|
|
#define tsRowBuilderClear(B) \
|
|
do { \
|
|
if ((B)->pBuf) { \
|
|
taosMemoryFree((B)->pBuf); \
|
|
} \
|
|
} while (0)
|
|
|
|
// STag
|
|
int32_t tTagNew(SArray *pArray, int32_t version, int8_t isJson, STag **ppTag);
|
|
void tTagFree(STag *pTag);
|
|
bool tTagGet(const STag *pTag, STagVal *pTagVal);
|
|
char *tTagValToData(const STagVal *pTagVal, bool isJson);
|
|
int32_t tEncodeTag(SEncoder *pEncoder, const STag *pTag);
|
|
int32_t tDecodeTag(SDecoder *pDecoder, STag **ppTag);
|
|
int32_t tTagToValArray(const STag *pTag, SArray **ppArray);
|
|
void debugPrintSTag(STag *pTag, const char *tag, int32_t ln); // TODO: remove
|
|
void debugCheckTags(STag *pTag); // TODO: remove
|
|
|
|
// STRUCT =================
|
|
struct STColumn {
|
|
col_id_t colId;
|
|
int8_t type;
|
|
int8_t flags;
|
|
int32_t bytes;
|
|
int32_t offset;
|
|
};
|
|
|
|
struct STSchema {
|
|
int32_t numOfCols;
|
|
int32_t version;
|
|
int32_t flen;
|
|
int32_t vlen;
|
|
int32_t tlen;
|
|
STColumn columns[];
|
|
};
|
|
|
|
#define TSROW_HAS_NONE ((uint8_t)0x1)
|
|
#define TSROW_HAS_NULL ((uint8_t)0x2U)
|
|
#define TSROW_HAS_VAL ((uint8_t)0x4U)
|
|
#define TSROW_KV_SMALL ((uint8_t)0x10U)
|
|
#define TSROW_KV_MID ((uint8_t)0x20U)
|
|
#define TSROW_KV_BIG ((uint8_t)0x40U)
|
|
struct STSRow2 {
|
|
TSKEY ts;
|
|
uint8_t flags;
|
|
int32_t sver;
|
|
uint32_t nData;
|
|
uint8_t *pData;
|
|
};
|
|
|
|
struct STSRowBuilder {
|
|
STSRow2 tsRow;
|
|
int32_t szBuf;
|
|
uint8_t *pBuf;
|
|
};
|
|
|
|
struct SValue {
|
|
union {
|
|
int8_t i8; // TSDB_DATA_TYPE_BOOL||TSDB_DATA_TYPE_TINYINT
|
|
uint8_t u8; // TSDB_DATA_TYPE_UTINYINT
|
|
int16_t i16; // TSDB_DATA_TYPE_SMALLINT
|
|
uint16_t u16; // TSDB_DATA_TYPE_USMALLINT
|
|
int32_t i32; // TSDB_DATA_TYPE_INT
|
|
uint32_t u32; // TSDB_DATA_TYPE_UINT
|
|
int64_t i64; // TSDB_DATA_TYPE_BIGINT
|
|
uint64_t u64; // TSDB_DATA_TYPE_UBIGINT
|
|
TSKEY ts; // TSDB_DATA_TYPE_TIMESTAMP
|
|
float f; // TSDB_DATA_TYPE_FLOAT
|
|
double d; // TSDB_DATA_TYPE_DOUBLE
|
|
struct {
|
|
uint32_t nData;
|
|
uint8_t *pData;
|
|
};
|
|
};
|
|
};
|
|
|
|
struct SColVal {
|
|
int16_t cid;
|
|
int8_t isNone;
|
|
int8_t isNull;
|
|
SValue value;
|
|
};
|
|
|
|
#pragma pack(push, 1)
|
|
struct STagVal {
|
|
union {
|
|
int16_t cid;
|
|
char *pKey;
|
|
};
|
|
int8_t type;
|
|
union {
|
|
int64_t i64;
|
|
struct {
|
|
uint32_t nData;
|
|
uint8_t *pData;
|
|
};
|
|
};
|
|
};
|
|
|
|
#define TD_TAG_JSON ((int8_t)0x40) // distinguish JSON string and JSON value with the highest bit
|
|
#define TD_TAG_LARGE ((int8_t)0x20)
|
|
struct STag {
|
|
int8_t flags;
|
|
int16_t len;
|
|
int16_t nTag;
|
|
int32_t ver;
|
|
int8_t idx[];
|
|
};
|
|
#pragma pack(pop)
|
|
|
|
struct SColData {
|
|
int16_t cid;
|
|
uint32_t nData;
|
|
uint8_t *pData;
|
|
};
|
|
|
|
#if 1 //================================================================================================================================================
|
|
// Imported since 3.0 and use bitmap to demonstrate None/Null/Norm, while use Null/Norm below 3.0 without of bitmap.
|
|
#define TD_SUPPORT_BITMAP
|
|
#define TD_SUPPORT_READ2
|
|
#define TD_SUPPORT_BACK2 // suppport back compatibility of 2.0
|
|
|
|
#define TASSERT(x) ASSERT(x)
|
|
|
|
#define STR_TO_VARSTR(x, str) \
|
|
do { \
|
|
VarDataLenT __len = (VarDataLenT)strlen(str); \
|
|
*(VarDataLenT *)(x) = __len; \
|
|
memcpy(varDataVal(x), (str), __len); \
|
|
} while (0);
|
|
|
|
#define STR_TO_NET_VARSTR(x, str) \
|
|
do { \
|
|
VarDataLenT __len = (VarDataLenT)strlen(str); \
|
|
*(VarDataLenT *)(x) = htons(__len); \
|
|
memcpy(varDataVal(x), (str), __len); \
|
|
} while (0);
|
|
|
|
#define STR_WITH_MAXSIZE_TO_VARSTR(x, str, _maxs) \
|
|
do { \
|
|
char *_e = stpncpy(varDataVal(x), (str), (_maxs)-VARSTR_HEADER_SIZE); \
|
|
varDataSetLen(x, (_e - (x)-VARSTR_HEADER_SIZE)); \
|
|
} while (0)
|
|
|
|
#define STR_WITH_SIZE_TO_VARSTR(x, str, _size) \
|
|
do { \
|
|
*(VarDataLenT *)(x) = (VarDataLenT)(_size); \
|
|
memcpy(varDataVal(x), (str), (_size)); \
|
|
} while (0);
|
|
|
|
// ----------------- TSDB COLUMN DEFINITION
|
|
|
|
#define colType(col) ((col)->type)
|
|
#define colFlags(col) ((col)->flags)
|
|
#define colColId(col) ((col)->colId)
|
|
#define colBytes(col) ((col)->bytes)
|
|
#define colOffset(col) ((col)->offset)
|
|
|
|
#define colSetType(col, t) (colType(col) = (t))
|
|
#define colSetFlags(col, f) (colFlags(col) = (f))
|
|
#define colSetColId(col, id) (colColId(col) = (id))
|
|
#define colSetBytes(col, b) (colBytes(col) = (b))
|
|
#define colSetOffset(col, o) (colOffset(col) = (o))
|
|
|
|
// ----------------- TSDB SCHEMA DEFINITION
|
|
|
|
#define schemaNCols(s) ((s)->numOfCols)
|
|
#define schemaVersion(s) ((s)->version)
|
|
#define schemaTLen(s) ((s)->tlen)
|
|
#define schemaFLen(s) ((s)->flen)
|
|
#define schemaVLen(s) ((s)->vlen)
|
|
#define schemaColAt(s, i) ((s)->columns + i)
|
|
#define tdFreeSchema(s) taosMemoryFreeClear((s))
|
|
|
|
STSchema *tdDupSchema(const STSchema *pSchema);
|
|
int32_t tdEncodeSchema(void **buf, STSchema *pSchema);
|
|
void *tdDecodeSchema(void *buf, STSchema **pRSchema);
|
|
|
|
static FORCE_INLINE int32_t comparColId(const void *key1, const void *key2) {
|
|
if (*(int16_t *)key1 > ((STColumn *)key2)->colId) {
|
|
return 1;
|
|
} else if (*(int16_t *)key1 < ((STColumn *)key2)->colId) {
|
|
return -1;
|
|
} else {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
static FORCE_INLINE STColumn *tdGetColOfID(STSchema *pSchema, int16_t colId) {
|
|
void *ptr = bsearch(&colId, (void *)pSchema->columns, schemaNCols(pSchema), sizeof(STColumn), comparColId);
|
|
if (ptr == NULL) return NULL;
|
|
return (STColumn *)ptr;
|
|
}
|
|
|
|
// ----------------- SCHEMA BUILDER DEFINITION
|
|
typedef struct {
|
|
int32_t tCols;
|
|
int32_t nCols;
|
|
schema_ver_t version;
|
|
uint16_t flen;
|
|
int32_t vlen;
|
|
int32_t tlen;
|
|
STColumn *columns;
|
|
} STSchemaBuilder;
|
|
|
|
// use 2 bits for bitmap(default: STSRow/sub block)
|
|
#define TD_VTYPE_BITS 2
|
|
#define TD_VTYPE_PARTS 4 // PARTITIONS: 1 byte / 2 bits
|
|
#define TD_VTYPE_OPTR 3 // OPERATOR: 4 - 1, utilize to get remainder
|
|
#define TD_BITMAP_BYTES(cnt) (((cnt) + TD_VTYPE_OPTR) >> 2)
|
|
|
|
// use 1 bit for bitmap(super block)
|
|
#define TD_VTYPE_BITS_I 1
|
|
#define TD_VTYPE_PARTS_I 8 // PARTITIONS: 1 byte / 1 bit
|
|
#define TD_VTYPE_OPTR_I 7 // OPERATOR: 8 - 1, utilize to get remainder
|
|
#define TD_BITMAP_BYTES_I(cnt) (((cnt) + TD_VTYPE_OPTR_I) >> 3)
|
|
|
|
int32_t tdInitTSchemaBuilder(STSchemaBuilder *pBuilder, schema_ver_t version);
|
|
void tdDestroyTSchemaBuilder(STSchemaBuilder *pBuilder);
|
|
void tdResetTSchemaBuilder(STSchemaBuilder *pBuilder, schema_ver_t version);
|
|
int32_t tdAddColToSchema(STSchemaBuilder *pBuilder, int8_t type, int8_t flags, col_id_t colId, col_bytes_t bytes);
|
|
STSchema *tdGetSchemaFromBuilder(STSchemaBuilder *pBuilder);
|
|
|
|
// ----------------- Semantic timestamp key definition
|
|
// typedef uint64_t TKEY;
|
|
#define TKEY TSKEY
|
|
|
|
#define TKEY_INVALID UINT64_MAX
|
|
#define TKEY_NULL TKEY_INVALID
|
|
#define TKEY_NEGATIVE_FLAG (((TKEY)1) << 63)
|
|
#define TKEY_VALUE_FILTER (~(TKEY_NEGATIVE_FLAG))
|
|
|
|
#define TKEY_IS_NEGATIVE(tkey) (((tkey)&TKEY_NEGATIVE_FLAG) != 0)
|
|
#define TKEY_IS_DELETED(tkey) (false)
|
|
|
|
#define tdGetTKEY(key) (key)
|
|
#define tdGetKey(tskey) (tskey)
|
|
|
|
#define MIN_TS_KEY ((TSKEY)0x8000000000000001)
|
|
#define MAX_TS_KEY ((TSKEY)0x7fffffffffffffff)
|
|
|
|
#define TD_TO_TKEY(key) tdGetTKEY(((key) < MIN_TS_KEY) ? MIN_TS_KEY : (((key) > MAX_TS_KEY) ? MAX_TS_KEY : key))
|
|
|
|
static FORCE_INLINE TKEY keyToTkey(TSKEY key) {
|
|
TSKEY lkey = key;
|
|
if (key > MAX_TS_KEY) {
|
|
lkey = MAX_TS_KEY;
|
|
} else if (key < MIN_TS_KEY) {
|
|
lkey = MIN_TS_KEY;
|
|
}
|
|
|
|
return tdGetTKEY(lkey);
|
|
}
|
|
|
|
static FORCE_INLINE int32_t tkeyComparFn(const void *tkey1, const void *tkey2) {
|
|
TSKEY key1 = tdGetKey(*(TKEY *)tkey1);
|
|
TSKEY key2 = tdGetKey(*(TKEY *)tkey2);
|
|
|
|
if (key1 < key2) {
|
|
return -1;
|
|
} else if (key1 > key2) {
|
|
return 1;
|
|
} else {
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
// ----------------- Data column structure
|
|
// SDataCol arrangement: data => bitmap => dataOffset
|
|
typedef struct SDataCol {
|
|
int8_t type; // column type
|
|
uint8_t bitmap : 1; // 0: no bitmap if all rows are NORM, 1: has bitmap if has NULL/NORM rows
|
|
uint8_t reserve : 7;
|
|
int16_t colId; // column ID
|
|
int32_t bytes; // column data bytes defined
|
|
int32_t offset; // data offset in a SDataRow (including the header size)
|
|
int32_t spaceSize; // Total space size for this column
|
|
int32_t len; // column data length
|
|
VarDataOffsetT *dataOff; // For binary and nchar data, the offset in the data column
|
|
void *pData; // Actual data pointer
|
|
void *pBitmap; // Bitmap pointer
|
|
TSKEY ts; // only used in last NULL column
|
|
} SDataCol;
|
|
|
|
#define isAllRowsNull(pCol) ((pCol)->len == 0)
|
|
#define isAllRowsNone(pCol) ((pCol)->len == 0)
|
|
static FORCE_INLINE void dataColReset(SDataCol *pDataCol) { pDataCol->len = 0; }
|
|
|
|
int32_t tdAllocMemForCol(SDataCol *pCol, int32_t maxPoints);
|
|
|
|
void dataColInit(SDataCol *pDataCol, STColumn *pCol, int32_t maxPoints);
|
|
int32_t dataColAppendVal(SDataCol *pCol, const void *value, int32_t numOfRows, int32_t maxPoints);
|
|
void *dataColSetOffset(SDataCol *pCol, int32_t nEle);
|
|
|
|
bool isNEleNull(SDataCol *pCol, int32_t nEle);
|
|
|
|
typedef struct {
|
|
col_id_t maxCols; // max number of columns
|
|
col_id_t numOfCols; // Total number of cols
|
|
int32_t maxPoints; // max number of points
|
|
int32_t numOfRows;
|
|
int32_t bitmapMode : 1; // default is 0(2 bits), otherwise 1(1 bit)
|
|
int32_t sversion : 31; // TODO: set sversion(not used yet)
|
|
SDataCol *cols;
|
|
} SDataCols;
|
|
|
|
static FORCE_INLINE bool tdDataColsIsBitmapI(SDataCols *pCols) { return pCols->bitmapMode != TSDB_BITMODE_DEFAULT; }
|
|
static FORCE_INLINE void tdDataColsSetBitmapI(SDataCols *pCols) { pCols->bitmapMode = TSDB_BITMODE_ONE_BIT; }
|
|
static FORCE_INLINE bool tdIsBitmapModeI(int8_t bitmapMode) { return bitmapMode != TSDB_BITMODE_DEFAULT; }
|
|
|
|
#define keyCol(pCols) (&((pCols)->cols[0])) // Key column
|
|
#define dataColsTKeyAt(pCols, idx) ((TKEY *)(keyCol(pCols)->pData))[(idx)] // the idx row of column-wised data
|
|
#define dataColsKeyAt(pCols, idx) tdGetKey(dataColsTKeyAt(pCols, idx))
|
|
static FORCE_INLINE TKEY dataColsTKeyFirst(SDataCols *pCols) {
|
|
if (pCols->numOfRows) {
|
|
return dataColsTKeyAt(pCols, 0);
|
|
} else {
|
|
return TKEY_INVALID;
|
|
}
|
|
}
|
|
|
|
static FORCE_INLINE TSKEY dataColsKeyAtRow(SDataCols *pCols, int32_t row) {
|
|
assert(row < pCols->numOfRows);
|
|
return dataColsKeyAt(pCols, row);
|
|
}
|
|
|
|
static FORCE_INLINE TSKEY dataColsKeyFirst(SDataCols *pCols) {
|
|
if (pCols->numOfRows) {
|
|
return dataColsKeyAt(pCols, 0);
|
|
} else {
|
|
return TSDB_DATA_TIMESTAMP_NULL;
|
|
}
|
|
}
|
|
|
|
static FORCE_INLINE TKEY dataColsTKeyLast(SDataCols *pCols) {
|
|
if (pCols->numOfRows) {
|
|
return dataColsTKeyAt(pCols, pCols->numOfRows - 1);
|
|
} else {
|
|
return TKEY_INVALID;
|
|
}
|
|
}
|
|
|
|
static FORCE_INLINE TSKEY dataColsKeyLast(SDataCols *pCols) {
|
|
if (pCols->numOfRows) {
|
|
return dataColsKeyAt(pCols, pCols->numOfRows - 1);
|
|
} else {
|
|
return TSDB_DATA_TIMESTAMP_NULL;
|
|
}
|
|
}
|
|
|
|
SDataCols *tdNewDataCols(int32_t maxCols, int32_t maxRows);
|
|
void tdResetDataCols(SDataCols *pCols);
|
|
int32_t tdInitDataCols(SDataCols *pCols, STSchema *pSchema);
|
|
SDataCols *tdDupDataCols(SDataCols *pCols, bool keepData);
|
|
SDataCols *tdFreeDataCols(SDataCols *pCols);
|
|
int32_t tdMergeDataCols(SDataCols *target, SDataCols *source, int32_t rowsToMerge, int32_t *pOffset, bool update,
|
|
TDRowVerT maxVer);
|
|
|
|
#endif
|
|
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
|
|
#endif /*_TD_COMMON_DATA_FORMAT_H_*/
|