parUtil.c 15.0 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
15

X
Xiaoyu Wang 已提交
16
#include "parUtil.h"
17
#include "cJSON.h"
18

19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45
static char* getSyntaxErrFormat(int32_t errCode) {
  switch (errCode) {
    case TSDB_CODE_PAR_SYNTAX_ERROR:
      return "syntax error near \"%s\"";
    case TSDB_CODE_PAR_INCOMPLETE_SQL:
      return "Incomplete SQL statement";
    case TSDB_CODE_PAR_INVALID_COLUMN:
      return "Invalid column name : %s";
    case TSDB_CODE_PAR_TABLE_NOT_EXIST:
      return "Table does not exist : %s";
    case TSDB_CODE_PAR_AMBIGUOUS_COLUMN:
      return "Column ambiguously defined : %s";
    case TSDB_CODE_PAR_WRONG_VALUE_TYPE:
      return "Invalid value type : %s";
    case TSDB_CODE_PAR_INVALID_FUNTION:
      return "Invalid function name : %s";
    case TSDB_CODE_PAR_ILLEGAL_USE_AGG_FUNCTION:
      return "There mustn't be aggregation";
    case TSDB_CODE_PAR_WRONG_NUMBER_OF_SELECT:
      return "ORDER BY item must be the number of a SELECT-list expression";
    case TSDB_CODE_PAR_GROUPBY_LACK_EXPRESSION:
      return "Not a GROUP BY expression";
    case TSDB_CODE_PAR_NOT_SELECTED_EXPRESSION:
      return "Not SELECTed expression";
    case TSDB_CODE_PAR_NOT_SINGLE_GROUP:
      return "Not a single-group group function";
    case TSDB_CODE_PAR_TAGS_NOT_MATCHED:
46
      return "Tags number not matched";
47
    case TSDB_CODE_PAR_INVALID_TAG_NAME:
48
      return "Invalid tag name : %s";
49
    case TSDB_CODE_PAR_NAME_OR_PASSWD_TOO_LONG:
50
      return "Name or password too long";
51
    case TSDB_CODE_PAR_PASSWD_EMPTY:
52
      return "Password can not be empty";
53
    case TSDB_CODE_PAR_INVALID_PORT:
54
      return "Port should be an integer that is less than 65535 and greater than 0";
55
    case TSDB_CODE_PAR_INVALID_ENDPOINT:
56 57 58
      return "Endpoint should be in the format of 'fqdn:port'";
    case TSDB_CODE_PAR_EXPRIE_STATEMENT:
      return "This statement is no longer supported";
X
Xiaoyu Wang 已提交
59 60
    case TSDB_CODE_PAR_INTER_VALUE_TOO_SMALL:
      return "Interval cannot be less than %d us";
X
Xiaoyu Wang 已提交
61
    case TSDB_CODE_PAR_DB_NOT_SPECIFIED:
62
      return "Database not specified";
X
Xiaoyu Wang 已提交
63 64
    case TSDB_CODE_PAR_INVALID_IDENTIFIER_NAME:
      return "Invalid identifier name : %s";
X
Xiaoyu Wang 已提交
65
    case TSDB_CODE_PAR_CORRESPONDING_STABLE_ERR:
66
      return "Corresponding super table not in this db";
X
Xiaoyu Wang 已提交
67
    case TSDB_CODE_PAR_INVALID_RANGE_OPTION:
68
      return "Invalid option %s: %"PRId64" valid range: [%d, %d]";
X
Xiaoyu Wang 已提交
69
    case TSDB_CODE_PAR_INVALID_STR_OPTION:
70
      return "Invalid option %s: %s";
X
Xiaoyu Wang 已提交
71
    case TSDB_CODE_PAR_INVALID_ENUM_OPTION:
72
      return "Invalid option %s: %"PRId64", only %d, %d allowed";
X
Xiaoyu Wang 已提交
73
    case TSDB_CODE_PAR_INVALID_TTL_OPTION:
74
      return "Invalid option ttl: %"PRId64", should be greater than or equal to %d";
X
Xiaoyu Wang 已提交
75
    case TSDB_CODE_PAR_INVALID_KEEP_NUM:
76
      return "Invalid number of keep options";
X
Xiaoyu Wang 已提交
77
    case TSDB_CODE_PAR_INVALID_KEEP_ORDER:
78
      return "Invalid keep value, should be keep0 <= keep1 <= keep2";
X
Xiaoyu Wang 已提交
79
    case TSDB_CODE_PAR_INVALID_KEEP_VALUE:
80
      return "Invalid option keep: %d, %d, %d valid range: [%d, %d]";
X
Xiaoyu Wang 已提交
81
    case TSDB_CODE_PAR_INVALID_COMMENT_OPTION:
82
      return "Invalid option comment, length cannot exceed %d";
X
Xiaoyu Wang 已提交
83
    case TSDB_CODE_PAR_INVALID_F_RANGE_OPTION:
84
      return "Invalid option %s: %f valid range: [%d, %d]";
X
Xiaoyu Wang 已提交
85
    case TSDB_CODE_PAR_INVALID_ROLLUP_OPTION:
86
      return "Invalid option rollup: only one function is allowed";
X
Xiaoyu Wang 已提交
87
    case TSDB_CODE_PAR_INVALID_RETENTIONS_OPTION:
88
      return "Invalid option retentions";
X
Xiaoyu Wang 已提交
89 90
    case TSDB_CODE_PAR_GROUPBY_WINDOW_COEXIST:
      return "GROUP BY and WINDOW-clause can't be used together";
91 92 93 94
    case TSDB_CODE_PAR_INVALID_OPTION_UNIT:
      return "Invalid option %s unit: %c, only m, h, d allowed";
    case TSDB_CODE_PAR_INVALID_KEEP_UNIT:
      return "Invalid option keep unit: %c, %c, %c, only m, h, d allowed";
X
Xiaoyu Wang 已提交
95 96
    case TSDB_CODE_PAR_AGG_FUNC_NESTING:
      return "Aggregate functions do not support nesting";
X
Xiaoyu Wang 已提交
97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118
    case TSDB_CODE_PAR_INVALID_STATE_WIN_TYPE:
      return "Only support STATE_WINDOW on integer column";
    case TSDB_CODE_PAR_INVALID_STATE_WIN_COL:
      return "Not support STATE_WINDOW on tag column";
    case TSDB_CODE_PAR_INVALID_STATE_WIN_TABLE:
      return "STATE_WINDOW not support for super table query";
    case TSDB_CODE_PAR_INTER_SESSION_GAP:
      return "SESSION gap should be fixed time window, and greater than 0";
    case TSDB_CODE_PAR_INTER_SESSION_COL:
      return "Only support SESSION on primary timestamp column";
    case TSDB_CODE_PAR_INTER_OFFSET_NEGATIVE:
      return "Interval offset cannot be negative";
    case TSDB_CODE_PAR_INTER_OFFSET_UNIT:
      return "Cannot use 'year' as offset when interval is 'month'";
    case TSDB_CODE_PAR_INTER_OFFSET_TOO_BIG:
      return "Interval offset should be shorter than interval";
    case TSDB_CODE_PAR_INTER_SLIDING_UNIT:
      return "Does not support sliding when interval is natural month/year";
    case TSDB_CODE_PAR_INTER_SLIDING_TOO_BIG:
      return "sliding value no larger than the interval value";
    case TSDB_CODE_PAR_INTER_SLIDING_TOO_SMALL:
      return "sliding value can not less than 1% of interval value";
119 120
    case TSDB_CODE_PAR_ONLY_ONE_JSON_TAG:
      return "Only one tag if there is a json tag";
121 122 123 124 125 126 127 128 129 130 131 132
    case TSDB_CODE_OUT_OF_MEMORY:
      return "Out of memory";
    default:
      return "Unknown error";
  }
}

/*
 * Format the message for errCode into pBuf and record the code in terrno.
 *
 * The template comes from getSyntaxErrFormat(errCode); the variadic
 * arguments must match the conversion specifiers of that template.
 * Output is bounded by pBuf->len.
 *
 * Returns errCode unchanged so callers can write
 * `return generateSyntaxErrMsg(...)`.
 */
int32_t generateSyntaxErrMsg(SMsgBuf* pBuf, int32_t errCode, ...) {
  const char* fmt = getSyntaxErrFormat(errCode);

  va_list args;
  va_start(args, errCode);
  vsnprintf(pBuf->buf, pBuf->len, fmt, args);
  va_end(args);

  terrno = errCode;
  return errCode;
}

X
Xiaoyu Wang 已提交
137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152
/*
 * Copy msg into pBuf as the error text for an invalid operation.
 *
 * snprintf is used instead of strncpy so the buffer is always
 * NUL-terminated (for pBuf->len > 0), even when msg is longer than the
 * buffer; the message is truncated in that case.
 *
 * Always returns TSDB_CODE_TSC_INVALID_OPERATION.
 */
int32_t buildInvalidOperationMsg(SMsgBuf* pBuf, const char* msg) {
  snprintf(pBuf->buf, pBuf->len, "%s", msg);
  return TSDB_CODE_TSC_INVALID_OPERATION;
}

/*
 * Write a "syntax error" message into pBuf.
 *
 *   sourceStr == NULL : "syntax error near '<additionalInfo>'"
 *                       (additionalInfo must not be NULL in this case)
 *   both given        : "syntax error near '<source>' (<additionalInfo>)"
 *   only sourceStr    : "syntax error near '<source>'", or <source> verbatim
 *                       when it already begins with "syntax error"
 *
 * At most the first 63 bytes of sourceStr are quoted in the message.
 *
 * Always returns TSDB_CODE_TSC_SQL_SYNTAX_ERROR.
 */
int32_t buildSyntaxErrMsg(SMsgBuf* pBuf, const char* additionalInfo, const char* sourceStr) {
  const char* fmtNear = "syntax error near \'%s\'";
  const char* fmtNearWithInfo = "syntax error near \'%s\' (%s)";
  const char* fmtVerbatim = "%s";
  const char* errPrefix = "syntax error";

  if (NULL == sourceStr) {
    assert(additionalInfo != NULL);
    snprintf(pBuf->buf, pBuf->len, fmtNear, additionalInfo);
    return TSDB_CODE_TSC_SQL_SYNTAX_ERROR;
  }

  // Quote only the leading part of the SQL text; the array is zero-filled,
  // so copying one byte less than its size keeps it NUL-terminated.
  char snippet[64] = {0};
  strncpy(snippet, sourceStr, tListLen(snippet) - 1);

  if (NULL == additionalInfo) {
    if (strncmp(sourceStr, errPrefix, strlen(errPrefix)) == 0) {
      // the text is already a complete syntax-error message
      snprintf(pBuf->buf, pBuf->len, fmtVerbatim, snippet);
    } else {
      snprintf(pBuf->buf, pBuf->len, fmtNear, snippet);
    }
  } else {
    snprintf(pBuf->buf, pBuf->len, fmtNearWithInfo, snippet, additionalInfo);
  }

  return TSDB_CODE_TSC_SQL_SYNTAX_ERROR;
}
166

X
Xiaoyu Wang 已提交
167 168
static uint32_t getTableMetaSize(const STableMeta* pTableMeta) {
  assert(pTableMeta != NULL);
169

X
Xiaoyu Wang 已提交
170 171 172
  int32_t totalCols = 0;
  if (pTableMeta->tableInfo.numOfColumns >= 0) {
    totalCols = pTableMeta->tableInfo.numOfColumns + pTableMeta->tableInfo.numOfTags;
173 174
  }

X
Xiaoyu Wang 已提交
175
  return sizeof(STableMeta) + totalCols * sizeof(SSchema);
176 177
}

X
Xiaoyu Wang 已提交
178 179 180
/*
 * Duplicate a table meta object, including its trailing schema entries
 * (size computed by getTableMetaSize()).
 *
 * Returns a newly allocated copy obtained from taosMemoryMalloc(), which the
 * caller owns, or NULL if the allocation fails.
 */
STableMeta* tableMetaDup(const STableMeta* pTableMeta) {
  assert(pTableMeta != NULL);
  size_t size = getTableMetaSize(pTableMeta);

  STableMeta* p = taosMemoryMalloc(size);
  if (p == NULL) {
    // do not hand a NULL destination to memcpy on allocation failure
    return NULL;
  }

  memcpy(p, pTableMeta, size);
  return p;
}

X
Xiaoyu Wang 已提交
187 188 189
/*
 * Return the start of the schema array stored in pTableMeta.
 * The const qualifier of the input is dropped on the returned pointer.
 */
SSchema *getTableColumnSchema(const STableMeta *pTableMeta) {
  assert(pTableMeta != NULL);

  SSchema *pFirst = (SSchema *)pTableMeta->schema;
  return pFirst;
}

X
Xiaoyu Wang 已提交
192 193
static SSchema* getOneColumnSchema(const STableMeta* pTableMeta, int32_t colIndex) {
  assert(pTableMeta != NULL && pTableMeta->schema != NULL && colIndex >= 0 && colIndex < (getNumOfColumns(pTableMeta) + getNumOfTags(pTableMeta)));
194

X
Xiaoyu Wang 已提交
195 196
  SSchema* pSchema = (SSchema*) pTableMeta->schema;
  return &pSchema[colIndex];
197
}
198

X
Xiaoyu Wang 已提交
199 200 201
/*
 * Return the schema entry at index numOfColumns, i.e. the first entry that
 * follows the column entries in the schema array.
 * Only valid for super tables and child tables (checked by assert).
 */
SSchema* getTableTagSchema(const STableMeta* pTableMeta) {
  assert(pTableMeta != NULL);
  assert(pTableMeta->tableType == TSDB_SUPER_TABLE || pTableMeta->tableType == TSDB_CHILD_TABLE);

  int32_t firstTagIndex = getTableInfo(pTableMeta).numOfColumns;
  return getOneColumnSchema(pTableMeta, firstTagIndex);
}

X
Xiaoyu Wang 已提交
204 205 206 207
int32_t getNumOfColumns(const STableMeta* pTableMeta) {
  assert(pTableMeta != NULL);
  // table created according to super table, use data from super table
  return getTableInfo(pTableMeta).numOfColumns;
208 209
}

X
Xiaoyu Wang 已提交
210 211 212
int32_t getNumOfTags(const STableMeta* pTableMeta) {
  assert(pTableMeta != NULL);
  return getTableInfo(pTableMeta).numOfTags;
213 214
}

X
Xiaoyu Wang 已提交
215
STableComInfo getTableInfo(const STableMeta* pTableMeta) {
216
  assert(pTableMeta != NULL);
X
Xiaoyu Wang 已提交
217
  return pTableMeta->tableInfo;
H
Haojun Liao 已提交
218
}
219 220

/*
 * Strip the enclosing quotes from a quoted literal and resolve escapes.
 *
 * src[0] is taken as the quote character; the first and last byte of src are
 * skipped and the bytes in between are copied to dst with these rewrites:
 *   - a doubled quote character ('' or "") becomes a single one
 *   - \n, \r, \t become the corresponding control character
 *   - \% and \_ are kept as two bytes (backslash included)
 *   - any other \x becomes x
 *
 * dst is always NUL-terminated and never written beyond dst[dlen - 1]. When
 * the result does not fit, the text is truncated to dlen - 1 bytes and dlen
 * is returned. Otherwise strtrim() is applied to dst (presumably trimming
 * surrounding whitespace - confirm against its definition) and the number of
 * bytes copied before that call is returned.
 *
 * Returns 0 without touching dst when len <= 0 or dlen <= 0.
 */
int32_t trimString(const char* src, int32_t len, char* dst, int32_t dlen) {
  if (len <= 0 || dlen <= 0) return 0;

  char    delim = src[0];
  int32_t j = 0;
  for (int32_t k = 1; k < len - 1; ++k) {
    if (j >= dlen) {
      // dst is full: sacrifice the last byte for the terminator
      dst[j - 1] = '\0';
      return j;
    }

    if (src[k] == delim && src[k + 1] == delim) {  // deal with "", ''
      dst[j] = src[k + 1];
      j++;
      k++;
      continue;
    }

    if (src[k] == '\\') {  // deal with escape character
      char next = src[k + 1];
      switch (next) {
        case 'n':
          dst[j] = '\n';
          break;
        case 'r':
          dst[j] = '\r';
          break;
        case 't':
          dst[j] = '\t';
          break;
        case '%':
        case '_':
          // this escape is kept verbatim and needs two bytes of output
          if (j + 1 >= dlen) {
            dst[j] = '\0';
            return dlen;
          }
          dst[j++] = src[k];
          dst[j] = next;
          break;
        default:  // includes \\, \' and \"
          dst[j] = next;
          break;
      }
      j++;
      k++;
      continue;
    }

    dst[j] = src[k];
    j++;
  }

  if (j >= dlen) {
    // the last copied byte filled dst exactly; truncate instead of writing
    // the terminator one past the end of the buffer
    dst[dlen - 1] = '\0';
  } else {
    dst[j] = '\0';
  }
  strtrim(dst);
  return j;
}
268 269 270 271 272 273 274 275 276 277 278

/*
 * Check that input is a non-NULL string made only of printable characters
 * (as defined by isprint()). An empty string is accepted.
 *
 * Each byte is read as unsigned char before being passed to isprint():
 * passing a negative plain char to a <ctype.h> function is undefined.
 */
static bool isValidateTag(char *input) {
  if (!input) return false;

  for (const unsigned char *p = (const unsigned char *)input; *p != '\0'; ++p) {
    if (isprint(*p) == 0) return false;
  }
  return true;
}

/*
 * Parse a JSON object literal and append its members to a KV row as tag data.
 *
 * Column ids start at startColId + 1. The first entry added is a one-byte
 * type marker: TSDB_DATA_TYPE_NULL when json is NULL, equals
 * TSDB_DATA_NULL_STR_L (case-insensitive), or contains no usable key;
 * TSDB_DATA_TYPE_JSON otherwise. Each accepted member is then added as
 *
 *     varstr(key) | 1-byte value type | value
 *
 * where the value is an NCHAR varstr for strings, 8 bytes for numbers
 * (BIGINT when the number has no fractional part, DOUBLE otherwise), 1 byte
 * for booleans and nothing for JSON null. Members with an empty key or a key
 * already seen are skipped. Nested objects/arrays are rejected.
 * NOTE: key length is not limited here; an earlier
 * TSDB_MAX_JSON_KEY_LEN check is disabled.
 *
 * On failure an error text is written to pMsgBuf where applicable and a
 * non-zero error code is returned; entries added to kvRowBuilder before the
 * failure are not rolled back. Returns TSDB_CODE_SUCCESS (0) on success.
 */
int parseJsontoTagData(const char* json, SKVRowBuilder* kvRowBuilder, SMsgBuf* pMsgBuf, int16_t startColId){
  // set json NULL data
  uint8_t jsonNULL = TSDB_DATA_TYPE_NULL;
  int jsonIndex = startColId + 1;
  if (!json || strcasecmp(json, TSDB_DATA_NULL_STR_L) == 0){
    tdAddColToKVRow(kvRowBuilder, jsonIndex, &jsonNULL, CHAR_BYTES);
    return TSDB_CODE_SUCCESS;
  }

  // set json real data
  cJSON *root = cJSON_Parse(json);
  if (root == NULL){
    return buildSyntaxErrMsg(pMsgBuf, "json parse error", json);
  }

  int size = cJSON_GetArraySize(root);
  if(!cJSON_IsObject(root)){
    cJSON_Delete(root);  // the parsed tree must be released on this path too
    return buildSyntaxErrMsg(pMsgBuf, "json error invalide value", json);
  }

  int retCode = 0;
  char *tagKV = NULL;
  SHashObj* keyHash = taosHashInit(8, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, false);
  if (keyHash == NULL) {
    cJSON_Delete(root);
    return TSDB_CODE_TSC_OUT_OF_MEMORY;
  }

  for(int i = 0; i < size; i++) {
    cJSON* item = cJSON_GetArrayItem(root, i);
    if (!item) {
      qError("json inner error:%d", i);
      retCode = buildSyntaxErrMsg(pMsgBuf, "json inner error", json);
      goto end;
    }

    char *jsonKey = item->string;
    if(!isValidateTag(jsonKey)){
      retCode = buildSyntaxErrMsg(pMsgBuf, "json key not validate", jsonKey);
      goto end;
    }

    size_t keyLen = strlen(jsonKey);
    if(keyLen == 0 || taosHashGet(keyHash, jsonKey, keyLen) != NULL){
      continue;  // skip empty and duplicated keys (first occurrence wins)
    }

    // key: keyLen + VARSTR_HEADER_SIZE, value type: CHAR_BYTES, value reserved: LONG_BYTES
    tagKV = taosMemoryCalloc(keyLen + VARSTR_HEADER_SIZE + CHAR_BYTES + LONG_BYTES, 1);
    if(!tagKV) {
      retCode = TSDB_CODE_TSC_OUT_OF_MEMORY;
      goto end;
    }
    strncpy(varDataVal(tagKV), jsonKey, keyLen);
    varDataSetLen(tagKV, keyLen);
    if(taosHashGetSize(keyHash) == 0){
      // first accepted key: emit the "this tag holds json" marker
      uint8_t jsonNotNULL = TSDB_DATA_TYPE_JSON;
      tdAddColToKVRow(kvRowBuilder, jsonIndex++, &jsonNotNULL, CHAR_BYTES);   // add json type
    }
    taosHashPut(keyHash, jsonKey, keyLen, &keyLen, CHAR_BYTES);  // add key to hash to remove duplicates, value is unused

    if(item->type == cJSON_String){     // add json value  format: type|data
      char *jsonValue = item->valuestring;
      int32_t valLen = (int32_t)strlen(jsonValue);
      int32_t totalLen = keyLen + VARSTR_HEADER_SIZE + valLen * TSDB_NCHAR_SIZE + VARSTR_HEADER_SIZE + CHAR_BYTES;
      char *tmp = taosMemoryRealloc(tagKV, totalLen);
      if(!tmp) {
        retCode = TSDB_CODE_TSC_OUT_OF_MEMORY;
        goto end;  // tagKV is still valid here and is released at `end`
      }
      tagKV = tmp;
      char* valueType = POINTER_SHIFT(tagKV, keyLen + VARSTR_HEADER_SIZE);
      char* valueData = POINTER_SHIFT(tagKV, keyLen + VARSTR_HEADER_SIZE + CHAR_BYTES);
      *valueType = TSDB_DATA_TYPE_NCHAR;
      if (valLen > 0 && !taosMbsToUcs4(jsonValue, valLen, (TdUcs4*)varDataVal(valueData),
                                                  (int32_t)(valLen * TSDB_NCHAR_SIZE), &valLen)) {
        qError("charset:%s to %s. val:%s, errno:%s, convert failed.", DEFAULT_UNICODE_ENCODEC, tsCharset, jsonValue, strerror(errno));
        retCode = buildSyntaxErrMsg(pMsgBuf, "charset convert json error", jsonValue);
        goto end;
      }

      varDataSetLen(valueData, valLen);
      tdAddColToKVRow(kvRowBuilder, jsonIndex++, tagKV, totalLen);
    }else if(item->type == cJSON_Number){
      if(!isfinite(item->valuedouble)){
        qError("json value is invalidate");
        retCode =  buildSyntaxErrMsg(pMsgBuf, "json value number is illegal", json);
        goto end;
      }
      char* valueType = POINTER_SHIFT(tagKV, keyLen + VARSTR_HEADER_SIZE);
      char* valueData = POINTER_SHIFT(tagKV, keyLen + VARSTR_HEADER_SIZE + CHAR_BYTES);
      *valueType = (item->valuedouble - (int64_t)(item->valuedouble) == 0) ? TSDB_DATA_TYPE_BIGINT : TSDB_DATA_TYPE_DOUBLE;
      // valueData sits at an arbitrary byte offset, so store through memcpy
      // rather than through a (possibly misaligned) double*/int64_t* cast
      if(*valueType == TSDB_DATA_TYPE_DOUBLE) {
        double dVal = item->valuedouble;
        memcpy(valueData, &dVal, sizeof(dVal));
      } else if(*valueType == TSDB_DATA_TYPE_BIGINT) {
        int64_t iVal = item->valueint;
        memcpy(valueData, &iVal, sizeof(iVal));
      }
      tdAddColToKVRow(kvRowBuilder, jsonIndex++, tagKV, keyLen + VARSTR_HEADER_SIZE + CHAR_BYTES +LONG_BYTES);
    }else if(item->type == cJSON_True || item->type == cJSON_False){
      char* valueType = POINTER_SHIFT(tagKV, keyLen + VARSTR_HEADER_SIZE);
      char* valueData = POINTER_SHIFT(tagKV, keyLen + VARSTR_HEADER_SIZE + CHAR_BYTES);
      *valueType = TSDB_DATA_TYPE_BOOL;
      *valueData = (char)(item->valueint);
      tdAddColToKVRow(kvRowBuilder, jsonIndex++, tagKV, keyLen + VARSTR_HEADER_SIZE + CHAR_BYTES + CHAR_BYTES);
    }else if(item->type == cJSON_NULL){
      char* valueType = POINTER_SHIFT(tagKV, keyLen + VARSTR_HEADER_SIZE);
      *valueType = TSDB_DATA_TYPE_NULL;
      tdAddColToKVRow(kvRowBuilder, jsonIndex++, tagKV, keyLen + VARSTR_HEADER_SIZE + CHAR_BYTES);
    }
    else{
      retCode = buildSyntaxErrMsg(pMsgBuf, "invalidate json value", json);
      goto end;
    }

    // Release this member's scratch buffer before the next iteration
    // allocates a new one; previously only the last buffer was freed. This
    // is the same free-after-add the `end` label already performs for the
    // final member.
    taosMemoryFree(tagKV);
    tagKV = NULL;
  }

  if(taosHashGetSize(keyHash) == 0){  // set json NULL true
    tdAddColToKVRow(kvRowBuilder, jsonIndex, &jsonNULL, CHAR_BYTES);
  }

end:
  taosMemoryFree(tagKV);
  taosHashCleanup(keyHash);
  cJSON_Delete(root);
  return retCode;
}