parUtil.c 15.1 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
15

X
Xiaoyu Wang 已提交
16
#include "parUtil.h"
17
#include "cJSON.h"
18

19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45
static char* getSyntaxErrFormat(int32_t errCode) {
  switch (errCode) {
    case TSDB_CODE_PAR_SYNTAX_ERROR:
      return "syntax error near \"%s\"";
    case TSDB_CODE_PAR_INCOMPLETE_SQL:
      return "Incomplete SQL statement";
    case TSDB_CODE_PAR_INVALID_COLUMN:
      return "Invalid column name : %s";
    case TSDB_CODE_PAR_TABLE_NOT_EXIST:
      return "Table does not exist : %s";
    case TSDB_CODE_PAR_AMBIGUOUS_COLUMN:
      return "Column ambiguously defined : %s";
    case TSDB_CODE_PAR_WRONG_VALUE_TYPE:
      return "Invalid value type : %s";
    case TSDB_CODE_PAR_INVALID_FUNTION:
      return "Invalid function name : %s";
    case TSDB_CODE_PAR_ILLEGAL_USE_AGG_FUNCTION:
      return "There mustn't be aggregation";
    case TSDB_CODE_PAR_WRONG_NUMBER_OF_SELECT:
      return "ORDER BY item must be the number of a SELECT-list expression";
    case TSDB_CODE_PAR_GROUPBY_LACK_EXPRESSION:
      return "Not a GROUP BY expression";
    case TSDB_CODE_PAR_NOT_SELECTED_EXPRESSION:
      return "Not SELECTed expression";
    case TSDB_CODE_PAR_NOT_SINGLE_GROUP:
      return "Not a single-group group function";
    case TSDB_CODE_PAR_TAGS_NOT_MATCHED:
46
      return "Tags number not matched";
47
    case TSDB_CODE_PAR_INVALID_TAG_NAME:
48
      return "Invalid tag name : %s";
49
    case TSDB_CODE_PAR_NAME_OR_PASSWD_TOO_LONG:
50
      return "Name or password too long";
51
    case TSDB_CODE_PAR_PASSWD_EMPTY:
52
      return "Password can not be empty";
53
    case TSDB_CODE_PAR_INVALID_PORT:
54
      return "Port should be an integer that is less than 65535 and greater than 0";
55
    case TSDB_CODE_PAR_INVALID_ENDPOINT:
56 57 58
      return "Endpoint should be in the format of 'fqdn:port'";
    case TSDB_CODE_PAR_EXPRIE_STATEMENT:
      return "This statement is no longer supported";
X
Xiaoyu Wang 已提交
59 60
    case TSDB_CODE_PAR_INTER_VALUE_TOO_SMALL:
      return "Interval cannot be less than %d us";
X
Xiaoyu Wang 已提交
61
    case TSDB_CODE_PAR_DB_NOT_SPECIFIED:
62
      return "Database not specified";
X
Xiaoyu Wang 已提交
63 64
    case TSDB_CODE_PAR_INVALID_IDENTIFIER_NAME:
      return "Invalid identifier name : %s";
X
Xiaoyu Wang 已提交
65
    case TSDB_CODE_PAR_CORRESPONDING_STABLE_ERR:
66
      return "Corresponding super table not in this db";
X
Xiaoyu Wang 已提交
67
    case TSDB_CODE_PAR_INVALID_RANGE_OPTION:
68
      return "Invalid option %s: %"PRId64" valid range: [%d, %d]";
X
Xiaoyu Wang 已提交
69
    case TSDB_CODE_PAR_INVALID_STR_OPTION:
70
      return "Invalid option %s: %s";
X
Xiaoyu Wang 已提交
71
    case TSDB_CODE_PAR_INVALID_ENUM_OPTION:
72
      return "Invalid option %s: %"PRId64", only %d, %d allowed";
X
Xiaoyu Wang 已提交
73
    case TSDB_CODE_PAR_INVALID_TTL_OPTION:
74
      return "Invalid option ttl: %"PRId64", should be greater than or equal to %d";
X
Xiaoyu Wang 已提交
75
    case TSDB_CODE_PAR_INVALID_KEEP_NUM:
76
      return "Invalid number of keep options";
X
Xiaoyu Wang 已提交
77
    case TSDB_CODE_PAR_INVALID_KEEP_ORDER:
78
      return "Invalid keep value, should be keep0 <= keep1 <= keep2";
X
Xiaoyu Wang 已提交
79
    case TSDB_CODE_PAR_INVALID_KEEP_VALUE:
80
      return "Invalid option keep: %d, %d, %d valid range: [%d, %d]";
X
Xiaoyu Wang 已提交
81
    case TSDB_CODE_PAR_INVALID_COMMENT_OPTION:
82
      return "Invalid option comment, length cannot exceed %d";
X
Xiaoyu Wang 已提交
83
    case TSDB_CODE_PAR_INVALID_F_RANGE_OPTION:
84
      return "Invalid option %s: %f valid range: [%d, %d]";
X
Xiaoyu Wang 已提交
85
    case TSDB_CODE_PAR_INVALID_ROLLUP_OPTION:
86
      return "Invalid option rollup: only one function is allowed";
X
Xiaoyu Wang 已提交
87
    case TSDB_CODE_PAR_INVALID_RETENTIONS_OPTION:
88
      return "Invalid option retentions";
X
Xiaoyu Wang 已提交
89 90
    case TSDB_CODE_PAR_GROUPBY_WINDOW_COEXIST:
      return "GROUP BY and WINDOW-clause can't be used together";
91 92 93 94
    case TSDB_CODE_PAR_INVALID_OPTION_UNIT:
      return "Invalid option %s unit: %c, only m, h, d allowed";
    case TSDB_CODE_PAR_INVALID_KEEP_UNIT:
      return "Invalid option keep unit: %c, %c, %c, only m, h, d allowed";
X
Xiaoyu Wang 已提交
95 96
    case TSDB_CODE_PAR_AGG_FUNC_NESTING:
      return "Aggregate functions do not support nesting";
X
Xiaoyu Wang 已提交
97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118
    case TSDB_CODE_PAR_INVALID_STATE_WIN_TYPE:
      return "Only support STATE_WINDOW on integer column";
    case TSDB_CODE_PAR_INVALID_STATE_WIN_COL:
      return "Not support STATE_WINDOW on tag column";
    case TSDB_CODE_PAR_INVALID_STATE_WIN_TABLE:
      return "STATE_WINDOW not support for super table query";
    case TSDB_CODE_PAR_INTER_SESSION_GAP:
      return "SESSION gap should be fixed time window, and greater than 0";
    case TSDB_CODE_PAR_INTER_SESSION_COL:
      return "Only support SESSION on primary timestamp column";
    case TSDB_CODE_PAR_INTER_OFFSET_NEGATIVE:
      return "Interval offset cannot be negative";
    case TSDB_CODE_PAR_INTER_OFFSET_UNIT:
      return "Cannot use 'year' as offset when interval is 'month'";
    case TSDB_CODE_PAR_INTER_OFFSET_TOO_BIG:
      return "Interval offset should be shorter than interval";
    case TSDB_CODE_PAR_INTER_SLIDING_UNIT:
      return "Does not support sliding when interval is natural month/year";
    case TSDB_CODE_PAR_INTER_SLIDING_TOO_BIG:
      return "sliding value no larger than the interval value";
    case TSDB_CODE_PAR_INTER_SLIDING_TOO_SMALL:
      return "sliding value can not less than 1% of interval value";
119 120
    case TSDB_CODE_PAR_ONLY_ONE_JSON_TAG:
      return "Only one tag if there is a json tag";
X
Xiaoyu Wang 已提交
121 122
    case TSDB_CODE_PAR_INCORRECT_NUM_OF_COL:
      return "Query block has incorrect number of result columns";
123 124 125 126 127 128 129 130 131 132 133 134
    case TSDB_CODE_OUT_OF_MEMORY:
      return "Out of memory";
    default:
      return "Unknown error";
  }
}

/*
 * Renders the message template associated with errCode into pBuf, filling
 * the template's placeholders from the variadic arguments.
 *
 * The output is bounded by pBuf->len. errCode is also stored in terrno and
 * is returned unchanged so the call can be used directly in a return
 * statement.
 */
int32_t generateSyntaxErrMsg(SMsgBuf* pBuf, int32_t errCode, ...) {
  const char* pFormat = getSyntaxErrFormat(errCode);

  va_list args;
  va_start(args, errCode);
  vsnprintf(pBuf->buf, pBuf->len, pFormat, args);
  va_end(args);

  terrno = errCode;
  return errCode;
}

X
Xiaoyu Wang 已提交
139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154
/*
 * Copies msg into the message buffer and reports an invalid-operation error.
 *
 * The copy is bounded by pBuf->len and is always NUL-terminated (when
 * pBuf->len is non-zero); a message that does not fit is truncated.
 *
 * Returns TSDB_CODE_TSC_INVALID_OPERATION unconditionally.
 */
int32_t buildInvalidOperationMsg(SMsgBuf* pBuf, const char* msg) {
  // snprintf, unlike strncpy, guarantees a terminating NUL on truncation.
  snprintf(pBuf->buf, pBuf->len, "%s", msg);
  return TSDB_CODE_TSC_INVALID_OPERATION;
}

/*
 * Writes a "syntax error" message into pBuf and returns
 * TSDB_CODE_TSC_SQL_SYNTAX_ERROR.
 *
 *   sourceStr == NULL                : "syntax error near '<additionalInfo>'"
 *                                      (additionalInfo must not be NULL)
 *   sourceStr and additionalInfo set : "syntax error near '<src>' (<additionalInfo>)"
 *   only sourceStr set               : "<src>" if sourceStr already starts with
 *                                      "syntax error", otherwise
 *                                      "syntax error near '<src>'"
 *
 * <src> is at most the first 63 bytes of sourceStr.
 */
int32_t buildSyntaxErrMsg(SMsgBuf* pBuf, const char* additionalInfo, const char* sourceStr) {
  const char* nearFmt = "syntax error near \'%s\'";
  const char* nearWithInfoFmt = "syntax error near \'%s\' (%s)";
  const char* verbatimFmt = "%s";
  const char* errPrefix = "syntax error";

  if (NULL == sourceStr) {
    assert(additionalInfo != NULL);
    snprintf(pBuf->buf, pBuf->len, nearFmt, additionalInfo);
    return TSDB_CODE_TSC_SQL_SYNTAX_ERROR;
  }

  // Only a leading excerpt of the SQL text is echoed back; the buffer is
  // zero-filled so the excerpt stays NUL-terminated after strncpy.
  char excerpt[64] = {0};
  strncpy(excerpt, sourceStr, tListLen(excerpt) - 1);

  if (NULL != additionalInfo) {
    snprintf(pBuf->buf, pBuf->len, nearWithInfoFmt, excerpt, additionalInfo);
    return TSDB_CODE_TSC_SQL_SYNTAX_ERROR;
  }

  // Avoid producing "syntax error near 'syntax error ...'".
  bool alreadyPrefixed = (strncmp(sourceStr, errPrefix, strlen(errPrefix)) == 0);
  snprintf(pBuf->buf, pBuf->len, alreadyPrefixed ? verbatimFmt : nearFmt, excerpt);
  return TSDB_CODE_TSC_SQL_SYNTAX_ERROR;
}
168

X
Xiaoyu Wang 已提交
169 170
static uint32_t getTableMetaSize(const STableMeta* pTableMeta) {
  assert(pTableMeta != NULL);
171

X
Xiaoyu Wang 已提交
172 173 174
  int32_t totalCols = 0;
  if (pTableMeta->tableInfo.numOfColumns >= 0) {
    totalCols = pTableMeta->tableInfo.numOfColumns + pTableMeta->tableInfo.numOfTags;
175 176
  }

X
Xiaoyu Wang 已提交
177
  return sizeof(STableMeta) + totalCols * sizeof(SSchema);
178 179
}

X
Xiaoyu Wang 已提交
180 181 182
/*
 * Creates a byte-for-byte copy of a table meta object, including its
 * trailing schema entries (size determined by getTableMetaSize()).
 *
 * Returns the newly allocated copy, or NULL if the allocation fails.
 * NOTE(review): the copy comes from taosMemoryMalloc, so the caller is
 * presumably expected to release it with taosMemoryFree - confirm.
 */
STableMeta* tableMetaDup(const STableMeta* pTableMeta) {
  assert(pTableMeta != NULL);

  size_t      size = getTableMetaSize(pTableMeta);
  STableMeta* p = taosMemoryMalloc(size);
  if (p == NULL) {
    // Out of memory: report it to the caller instead of crashing in memcpy.
    return NULL;
  }

  memcpy(p, pTableMeta, size);
  return p;
}

X
Xiaoyu Wang 已提交
189 190 191
/*
 * Returns a mutable pointer to the start of the table's schema array
 * (pTableMeta->schema).
 */
SSchema *getTableColumnSchema(const STableMeta *pTableMeta) {
  assert(pTableMeta != NULL);

  SSchema *pFirstSchema = (SSchema *)pTableMeta->schema;
  return pFirstSchema;
}

X
Xiaoyu Wang 已提交
194 195
static SSchema* getOneColumnSchema(const STableMeta* pTableMeta, int32_t colIndex) {
  assert(pTableMeta != NULL && pTableMeta->schema != NULL && colIndex >= 0 && colIndex < (getNumOfColumns(pTableMeta) + getNumOfTags(pTableMeta)));
196

X
Xiaoyu Wang 已提交
197 198
  SSchema* pSchema = (SSchema*) pTableMeta->schema;
  return &pSchema[colIndex];
199
}
200

X
Xiaoyu Wang 已提交
201 202 203
SSchema* getTableTagSchema(const STableMeta* pTableMeta) {
  assert(pTableMeta != NULL && (pTableMeta->tableType == TSDB_SUPER_TABLE || pTableMeta->tableType == TSDB_CHILD_TABLE));
  return getOneColumnSchema(pTableMeta, getTableInfo(pTableMeta).numOfColumns);
204 205
}

X
Xiaoyu Wang 已提交
206 207 208 209
int32_t getNumOfColumns(const STableMeta* pTableMeta) {
  assert(pTableMeta != NULL);
  // table created according to super table, use data from super table
  return getTableInfo(pTableMeta).numOfColumns;
210 211
}

X
Xiaoyu Wang 已提交
212 213 214
int32_t getNumOfTags(const STableMeta* pTableMeta) {
  assert(pTableMeta != NULL);
  return getTableInfo(pTableMeta).numOfTags;
215 216
}

X
Xiaoyu Wang 已提交
217
STableComInfo getTableInfo(const STableMeta* pTableMeta) {
218
  assert(pTableMeta != NULL);
X
Xiaoyu Wang 已提交
219
  return pTableMeta->tableInfo;
H
Haojun Liao 已提交
220
}
221 222

/*
 * Strips the enclosing delimiters from a quoted token and resolves escapes.
 *
 * src[0] is taken as the delimiter; the characters src[1] .. src[len - 2]
 * are decoded into dst as follows:
 *   - a doubled delimiter ('' or "")  -> one delimiter
 *   - \n, \r, \t                      -> the corresponding control character
 *   - \% and \_                       -> kept as two characters (backslash
 *                                        plus the character)
 *   - backslash + any other character -> that character
 *   - anything else                   -> copied unchanged
 *
 * Parameters:
 *   src  - quoted input; need not be NUL-terminated
 *   len  - number of bytes in src, including both delimiters
 *   dst  - output buffer
 *   dlen - capacity of dst in bytes, including the terminating NUL
 *
 * Returns the number of bytes produced. dst is always NUL-terminated and
 * never written beyond dst[dlen - 1]. If the decoded text needs dlen bytes
 * or more, the output is cut to dlen - 1 characters and dlen is returned.
 * Returns 0 without touching dst when len <= 0 or dlen <= 0.
 */
int32_t trimString(const char* src, int32_t len, char* dst, int32_t dlen) {
  if (len <= 0 || dlen <= 0) return 0;

  const char    delim = src[0];
  const int32_t last = len - 1;  // index of the closing delimiter
  int32_t       j = 0;

  for (int32_t k = 1; k < last; ++k) {
    char    out[2];
    int32_t nOut = 1;

    if (src[k] == delim && src[k + 1] == delim) {  // deal with "", ''
      out[0] = delim;
      ++k;
    } else if (src[k] == '\\') {  // deal with escape character
      const char next = src[k + 1];
      switch (next) {
        case 'n':
          out[0] = '\n';
          break;
        case 'r':
          out[0] = '\r';
          break;
        case 't':
          out[0] = '\t';
          break;
        case '%':
        case '_':
          // Keep the backslash in front of these two characters.
          out[0] = '\\';
          out[1] = next;
          nOut = 2;
          break;
        default:
          // Covers \\, \', \" and any unknown escape: drop the backslash.
          out[0] = next;
          break;
      }
      ++k;
    } else {
      out[0] = src[k];
    }

    for (int32_t i = 0; i < nOut; ++i) {
      if (j >= dlen) {
        // Buffer exhausted: sacrifice the last character for the NUL.
        dst[dlen - 1] = '\0';
        return dlen;
      }
      dst[j++] = out[i];
    }
  }

  if (j >= dlen) {
    // Output filled the buffer exactly; there is no room left for the NUL.
    dst[dlen - 1] = '\0';
    return dlen;
  }

  dst[j] = '\0';
  return j;
}
269 270 271 272 273 274 275 276 277 278 279

/*
 * Checks whether a string is usable as a tag key: it must be non-NULL and
 * consist solely of characters for which isprint() is true.
 * An empty string is accepted.
 */
static bool isValidateTag(const char* input) {
  if (input == NULL) return false;

  // <ctype.h> functions require a value representable as unsigned char;
  // walking the string as unsigned char avoids passing negative values.
  for (const unsigned char* p = (const unsigned char*)input; *p != '\0'; ++p) {
    if (!isprint(*p)) return false;
  }
  return true;
}

/*
 * Parses a JSON object literal and appends its members to a KV row builder.
 *
 * Column ids are handed out consecutively, starting at startColId + 1:
 *   - the first column holds a one-byte marker: TSDB_DATA_TYPE_JSON when at
 *     least one key is stored, TSDB_DATA_TYPE_NULL when json is NULL, equals
 *     TSDB_DATA_NULL_STR_L (case-insensitive), or yields no usable key;
 *   - every following column holds one member encoded as
 *       [varstr key][1-byte value type][value]
 *     where the value is a varstr of UCS-4 text (strings), a double or an
 *     int64 (numbers), one byte (booleans) or absent (null).
 *
 * Members with an empty key or a key that was already seen are skipped.
 *
 * Parameters:
 *   json         - JSON text, may be NULL
 *   kvRowBuilder - receives the encoded columns
 *   pMsgBuf      - receives the error text on failure
 *   startColId   - column id preceding the first id to be used
 *
 * Returns TSDB_CODE_SUCCESS (0) on success, TSDB_CODE_TSC_OUT_OF_MEMORY on
 * allocation failure, or the code produced by buildSyntaxErrMsg() for
 * malformed input. On failure kvRowBuilder may already contain the columns
 * added before the error was detected.
 */
int parseJsontoTagData(const char* json, SKVRowBuilder* kvRowBuilder, SMsgBuf* pMsgBuf, int16_t startColId){
  // set json NULL data
  uint8_t jsonNULL = TSDB_DATA_TYPE_NULL;
  int jsonIndex = startColId + 1;
  if (!json || strcasecmp(json, TSDB_DATA_NULL_STR_L) == 0){
    tdAddColToKVRow(kvRowBuilder, jsonIndex, &jsonNULL, CHAR_BYTES);
    return TSDB_CODE_SUCCESS;
  }

  // set json real data
  cJSON *root = cJSON_Parse(json);
  if (root == NULL){
    return buildSyntaxErrMsg(pMsgBuf, "json parse error", json);
  }

  if(!cJSON_IsObject(root)){
    cJSON_Delete(root);  // the parsed tree must be released on this path too
    return buildSyntaxErrMsg(pMsgBuf, "json error invalide value", json);
  }

  SHashObj* keyHash = taosHashInit(8, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, false);
  if (keyHash == NULL) {
    cJSON_Delete(root);
    return TSDB_CODE_TSC_OUT_OF_MEMORY;
  }

  int   retCode = 0;
  char *tagKV = NULL;  // scratch buffer for the member currently being encoded
  int   size = cJSON_GetArraySize(root);
  for(int i = 0; i < size; i++) {
    cJSON* item = cJSON_GetArrayItem(root, i);
    if (!item) {
      qError("json inner error:%d", i);
      retCode = buildSyntaxErrMsg(pMsgBuf, "json inner error", json);
      goto end;
    }

    char *jsonKey = item->string;
    if(!isValidateTag(jsonKey)){
      retCode = buildSyntaxErrMsg(pMsgBuf, "json key not validate", jsonKey);
      goto end;
    }

    size_t keyLen = strlen(jsonKey);
    if(keyLen == 0 || taosHashGet(keyHash, jsonKey, keyLen) != NULL){
      continue;  // skip empty and duplicated keys
    }

    // Offsets of the value-type byte and of the value inside tagKV.
    const size_t typeOffset = keyLen + VARSTR_HEADER_SIZE;
    const size_t dataOffset = typeOffset + CHAR_BYTES;

    // key: keyLen + VARSTR_HEADER_SIZE, value type: CHAR_BYTES, value reserved: LONG_BYTES
    tagKV = taosMemoryCalloc(dataOffset + LONG_BYTES, 1);
    if(!tagKV) {
      retCode = TSDB_CODE_TSC_OUT_OF_MEMORY;
      goto end;
    }
    strncpy(varDataVal(tagKV), jsonKey, keyLen);
    varDataSetLen(tagKV, keyLen);

    if(taosHashGetSize(keyHash) == 0){
      // First accepted key: emit the leading "this is json" marker column.
      uint8_t jsonNotNULL = TSDB_DATA_TYPE_JSON;
      tdAddColToKVRow(kvRowBuilder, jsonIndex++, &jsonNotNULL, CHAR_BYTES);   // add json type
    }
    taosHashPut(keyHash, jsonKey, keyLen, &keyLen, CHAR_BYTES);  // add key to hash to remove duplicates, value is unused

    if(item->type == cJSON_String){     // add json value  format: type|data
      char *jsonValue = item->valuestring;
      int32_t valLen = (int32_t)strlen(jsonValue);
      int32_t totalLen = keyLen + VARSTR_HEADER_SIZE + valLen * TSDB_NCHAR_SIZE + VARSTR_HEADER_SIZE + CHAR_BYTES;
      char *tmp = taosMemoryRealloc(tagKV, totalLen);
      if(!tmp) {
        retCode = TSDB_CODE_TSC_OUT_OF_MEMORY;
        goto end;  // tagKV is still valid here and is released at 'end'
      }
      tagKV = tmp;
      char* valueType = POINTER_SHIFT(tagKV, typeOffset);
      char* valueData = POINTER_SHIFT(tagKV, dataOffset);
      *valueType = TSDB_DATA_TYPE_NCHAR;
      if (valLen > 0 && !taosMbsToUcs4(jsonValue, valLen, (TdUcs4*)varDataVal(valueData),
                                                  (int32_t)(valLen * TSDB_NCHAR_SIZE), &valLen)) {
        qError("charset:%s to %s. val:%s, errno:%s, convert failed.", DEFAULT_UNICODE_ENCODEC, tsCharset, jsonValue, strerror(errno));
        retCode = buildSyntaxErrMsg(pMsgBuf, "charset convert json error", jsonValue);
        goto end;
      }

      varDataSetLen(valueData, valLen);
      tdAddColToKVRow(kvRowBuilder, jsonIndex++, tagKV, totalLen);
    }else if(item->type == cJSON_Number){
      if(!isfinite(item->valuedouble)){
        qError("json value is invalidate");
        retCode =  buildSyntaxErrMsg(pMsgBuf, "json value number is illegal", json);
        goto end;
      }
      char* valueType = POINTER_SHIFT(tagKV, typeOffset);
      char* valueData = POINTER_SHIFT(tagKV, dataOffset);

      // A number is stored as BIGINT only if it is integral and fits into
      // int64_t; the range test keeps the double -> int64_t cast defined.
      const double dval = item->valuedouble;
      const bool   isInteger = dval >= -9223372036854775808.0 && dval < 9223372036854775808.0 &&
                               dval == (double)(int64_t)dval;

      // valueData is not necessarily aligned for 8-byte types, so the value
      // is copied bytewise instead of being stored through a cast pointer.
      if (isInteger) {
        int64_t ival = item->valueint;
        *valueType = TSDB_DATA_TYPE_BIGINT;
        memcpy(valueData, &ival, sizeof(ival));
      } else {
        *valueType = TSDB_DATA_TYPE_DOUBLE;
        memcpy(valueData, &dval, sizeof(dval));
      }
      tdAddColToKVRow(kvRowBuilder, jsonIndex++, tagKV, keyLen + VARSTR_HEADER_SIZE + CHAR_BYTES +LONG_BYTES);
    }else if(item->type == cJSON_True || item->type == cJSON_False){
      char* valueType = POINTER_SHIFT(tagKV, typeOffset);
      char* valueData = POINTER_SHIFT(tagKV, dataOffset);
      *valueType = TSDB_DATA_TYPE_BOOL;
      *valueData = (char)(item->valueint);
      tdAddColToKVRow(kvRowBuilder, jsonIndex++, tagKV, keyLen + VARSTR_HEADER_SIZE + CHAR_BYTES + CHAR_BYTES);
    }else if(item->type == cJSON_NULL){
      char* valueType = POINTER_SHIFT(tagKV, typeOffset);
      *valueType = TSDB_DATA_TYPE_NULL;
      tdAddColToKVRow(kvRowBuilder, jsonIndex++, tagKV, keyLen + VARSTR_HEADER_SIZE + CHAR_BYTES);
    }
    else{
      retCode = buildSyntaxErrMsg(pMsgBuf, "invalidate json value", json);
      goto end;
    }

    // The builder does not keep tagKV (it is freed below after the final
    // add as well), so release it before the next member allocates anew.
    taosMemoryFree(tagKV);
    tagKV = NULL;
  }

  if(taosHashGetSize(keyHash) == 0){  // set json NULL true
    tdAddColToKVRow(kvRowBuilder, jsonIndex, &jsonNULL, CHAR_BYTES);
  }

end:
  taosMemoryFree(tagKV);
  taosHashCleanup(keyHash);
  cJSON_Delete(root);
  return retCode;
}