tmqUpdate-multiCtb.py 13.7 KB
Newer Older
P
plum-lihui 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19

import taos
import sys
import time
import socket
import os
import threading
from enum import Enum

from util.log import *
from util.sql import *
from util.cases import *
from util.dnodes import *
sys.path.append("./7-tmq")
from tmqCommon import *

class TDTestCase:
    def __init__(self):
        self.snapshot   = 0
P
plum-lihui 已提交
20
        self.vgroups    = 4
P
plum-lihui 已提交
21
        self.ctbNum     = 50
P
plum-lihui 已提交
22 23
        self.rowsPerTbl = 1000
        self.autoCtbPrefix = 'aCtb'
G
Ganlin Zhao 已提交
24

25
    def init(self, conn, logSql, replicaVar=1):
P
plum-lihui 已提交
26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41
        tdLog.debug(f"start to excute {__file__}")
        tdSql.init(conn.cursor(), False)

    def prepareTestEnv(self):
        tdLog.printNoPrefix("======== prepare test env include database, stable, ctables, and insert data: ")
        paraDict = {'dbName':     'dbt',
                    'dropFlag':   1,
                    'event':      '',
                    'vgroups':    4,
                    'stbName':    'stb',
                    'colPrefix':  'c',
                    'tagPrefix':  't',
                    'colSchema':   [{'type': 'INT', 'count':1},{'type': 'BIGINT', 'count':1},{'type': 'DOUBLE', 'count':1},{'type': 'BINARY', 'len':32, 'count':1},{'type': 'NCHAR', 'len':32, 'count':1},{'type': 'TIMESTAMP', 'count':1}],
                    'tagSchema':   [{'type': 'INT', 'count':1},{'type': 'BIGINT', 'count':1},{'type': 'DOUBLE', 'count':1},{'type': 'BINARY', 'len':32, 'count':1},{'type': 'NCHAR', 'len':32, 'count':1}],
                    'ctbPrefix':  'ctb',
                    'ctbStartIdx': 0,
P
plum-lihui 已提交
42
                    'ctbNum':     100,
P
plum-lihui 已提交
43
                    'rowsPerTbl': 1000,
P
plum-lihui 已提交
44
                    'batchNum':   1000,
P
plum-lihui 已提交
45 46 47 48 49 50 51 52 53
                    'startTs':    1640966400000,  # 2022-01-01 00:00:00.000
                    'pollDelay':  3,
                    'showMsg':    1,
                    'showRow':    1,
                    'snapshot':   0}

        paraDict['vgroups'] = self.vgroups
        paraDict['ctbNum'] = self.ctbNum
        paraDict['rowsPerTbl'] = self.rowsPerTbl
G
Ganlin Zhao 已提交
54

P
plum-lihui 已提交
55 56 57 58 59 60 61 62 63 64 65
        tmqCom.initConsumerTable()
        tdCom.create_database(tdSql, paraDict["dbName"],paraDict["dropFlag"], vgroups=paraDict["vgroups"],replica=1)
        tdLog.info("create stb")
        tmqCom.create_stable(tdSql, dbName=paraDict["dbName"],stbName=paraDict["stbName"])
        tdLog.info("create ctb")
        tmqCom.create_ctable(tdSql, dbName=paraDict["dbName"],stbName=paraDict["stbName"],ctbPrefix=paraDict['ctbPrefix'],
                             ctbNum=paraDict["ctbNum"],ctbStartIdx=paraDict['ctbStartIdx'])
        tdLog.info("insert data")
        tmqCom.insert_data_interlaceByMultiTbl(tsql=tdSql,dbName=paraDict["dbName"],ctbPrefix=paraDict["ctbPrefix"],
                                               ctbNum=paraDict["ctbNum"],rowsPerTbl=paraDict["rowsPerTbl"],batchNum=paraDict["batchNum"],
                                               startTs=paraDict["startTs"],ctbStartIdx=paraDict['ctbStartIdx'])
P
plum-lihui 已提交
66 67 68
        tmqCom.insert_data_with_autoCreateTbl(tsql=tdSql,dbName=paraDict["dbName"],stbName=paraDict["stbName"],ctbPrefix=self.autoCtbPrefix,
                                              ctbNum=paraDict["ctbNum"],rowsPerTbl=paraDict["rowsPerTbl"],batchNum=paraDict["batchNum"],
                                              startTs=paraDict["startTs"],ctbStartIdx=paraDict['ctbStartIdx'])
G
Ganlin Zhao 已提交
69 70

        # tdLog.info("restart taosd to ensure that the data falls into the disk")
P
plum-lihui 已提交
71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86
        # tdSql.query("flush database %s"%(paraDict['dbName']))
        return

    def tmqCase1(self):
        tdLog.printNoPrefix("======== test case 1: ")
        paraDict = {'dbName':     'dbt',
                    'dropFlag':   1,
                    'event':      '',
                    'vgroups':    4,
                    'stbName':    'stb',
                    'colPrefix':  'c',
                    'tagPrefix':  't',
                    'colSchema':   [{'type': 'INT', 'count':1},{'type': 'BIGINT', 'count':1},{'type': 'DOUBLE', 'count':1},{'type': 'BINARY', 'len':32, 'count':1},{'type': 'NCHAR', 'len':32, 'count':1},{'type': 'TIMESTAMP', 'count':1}],
                    'tagSchema':   [{'type': 'INT', 'count':1},{'type': 'BIGINT', 'count':1},{'type': 'DOUBLE', 'count':1},{'type': 'BINARY', 'len':32, 'count':1},{'type': 'NCHAR', 'len':32, 'count':1}],
                    'ctbPrefix':  'ctb',
                    'ctbStartIdx': 0,
P
plum-lihui 已提交
87
                    'ctbNum':     100,
P
plum-lihui 已提交
88
                    'rowsPerTbl': 1000,
P
plum-lihui 已提交
89
                    'batchNum':   1000,
P
plum-lihui 已提交
90 91 92 93 94 95 96 97 98
                    'startTs':    1640966400000,  # 2022-01-01 00:00:00.000
                    'pollDelay':  5,
                    'showMsg':    1,
                    'showRow':    1,
                    'snapshot':   0}
        paraDict['snapshot'] = self.snapshot
        paraDict['vgroups'] = self.vgroups
        paraDict['ctbNum'] = self.ctbNum
        paraDict['rowsPerTbl'] = self.rowsPerTbl
G
Ganlin Zhao 已提交
99

P
plum-lihui 已提交
100
        # update to half tables
P
plum-lihui 已提交
101
        paraDict['ctbNum'] = int(self.ctbNum/2)
P
plum-lihui 已提交
102
        paraDict['rowsPerTbl'] = int(self.rowsPerTbl / 2)
P
plum-lihui 已提交
103 104 105
        tmqCom.insert_data_with_autoCreateTbl(tsql=tdSql,dbName=paraDict["dbName"],stbName=paraDict["stbName"],ctbPrefix=self.autoCtbPrefix,
                                              ctbNum=paraDict["ctbNum"],rowsPerTbl=paraDict["rowsPerTbl"],batchNum=paraDict["batchNum"],
                                              startTs=paraDict["startTs"],ctbStartIdx=paraDict['ctbStartIdx'])
P
plum-lihui 已提交
106 107
        tmqCom.insert_data_interlaceByMultiTbl(tsql=tdSql,dbName=paraDict["dbName"],ctbPrefix=paraDict["ctbPrefix"],
                                               ctbNum=paraDict["ctbNum"],rowsPerTbl=paraDict["rowsPerTbl"],batchNum=paraDict["batchNum"],
G
Ganlin Zhao 已提交
108 109
                                               startTs=paraDict["startTs"],ctbStartIdx=paraDict['ctbStartIdx'])

P
plum-lihui 已提交
110
        tdLog.info("create topics from stb1")
G
Ganlin Zhao 已提交
111
        topicFromStb1 = 'topic_stb1'
P
plum-lihui 已提交
112 113 114
        queryString = "select ts, c1, c2 from %s.%s"%(paraDict['dbName'], paraDict['stbName'])
        sqlString = "create topic %s as %s" %(topicFromStb1, queryString)
        tdLog.info("create topic sql: %s"%sqlString)
G
Ganlin Zhao 已提交
115 116
        tdSql.execute(sqlString)

P
plum-lihui 已提交
117
        paraDict['ctbNum'] = self.ctbNum
P
plum-lihui 已提交
118 119
        paraDict['rowsPerTbl'] = self.rowsPerTbl
        consumerId     = 0
P
plum-lihui 已提交
120 121 122 123
        if self.snapshot == 0:
            expectrowcnt   = int(paraDict["rowsPerTbl"] * paraDict["ctbNum"] * (2 + 1/2*1/2*2))
        elif self.snapshot == 1:
            expectrowcnt   = int(paraDict["rowsPerTbl"] * paraDict["ctbNum"] * (2))
G
Ganlin Zhao 已提交
124

P
plum-lihui 已提交
125 126 127 128 129 130 131 132 133 134 135 136
        topicList      = topicFromStb1
        ifcheckdata    = 1
        ifManualCommit = 1
        keyList        = 'group.id:cgrp1,\
                        enable.auto.commit:true,\
                        auto.commit.interval.ms:1000,\
                        auto.offset.reset:earliest'
        tmqCom.insertConsumerInfo(consumerId, expectrowcnt,topicList,keyList,ifcheckdata,ifManualCommit)

        tdLog.info("start consume processor")
        tmqCom.startTmqSimProcess(pollDelay=paraDict['pollDelay'],dbName=paraDict["dbName"],showMsg=paraDict['showMsg'], showRow=paraDict['showRow'],snapshot=paraDict['snapshot'])

P
plum-lihui 已提交
137
        tdLog.info("start to check consume result")
P
plum-lihui 已提交
138 139 140 141 142 143 144 145
        expectRows = 1
        resultList = tmqCom.selectConsumeResult(expectRows)
        totalConsumeRows = 0
        for i in range(expectRows):
            totalConsumeRows += resultList[i]

        tdSql.query(queryString)
        totalRowsInserted = tdSql.getRows()
G
Ganlin Zhao 已提交
146

P
plum-lihui 已提交
147 148 149
        tdLog.info("act consume rows: %d, expect consume rows: %d, act insert rows: %d"%(totalConsumeRows, expectrowcnt, totalRowsInserted))
        if totalConsumeRows != expectrowcnt:
            tdLog.exit("tmq consume rows error!")
G
Ganlin Zhao 已提交
150 151

        # tmqCom.checkFileContent(consumerId, queryString)
P
plum-lihui 已提交
152 153 154 155 156

        tdSql.query("drop topic %s"%topicFromStb1)
        tdLog.printNoPrefix("======== test case 1 end ...... ")

    def tmqCase2(self):
G
Ganlin Zhao 已提交
157
        tdLog.printNoPrefix("======== test case 2: ")
P
plum-lihui 已提交
158 159 160 161 162 163 164 165 166 167 168
        paraDict = {'dbName':     'dbt',
                    'dropFlag':   1,
                    'event':      '',
                    'vgroups':    4,
                    'stbName':    'stb',
                    'colPrefix':  'c',
                    'tagPrefix':  't',
                    'colSchema':   [{'type': 'INT', 'count':1},{'type': 'BIGINT', 'count':1},{'type': 'DOUBLE', 'count':1},{'type': 'BINARY', 'len':32, 'count':1},{'type': 'NCHAR', 'len':32, 'count':1},{'type': 'TIMESTAMP', 'count':1}],
                    'tagSchema':   [{'type': 'INT', 'count':1},{'type': 'BIGINT', 'count':1},{'type': 'DOUBLE', 'count':1},{'type': 'BINARY', 'len':32, 'count':1},{'type': 'NCHAR', 'len':32, 'count':1}],
                    'ctbPrefix':  'ctb',
                    'ctbStartIdx': 0,
P
plum-lihui 已提交
169
                    'ctbNum':     100,
P
plum-lihui 已提交
170
                    'rowsPerTbl': 1000,
P
plum-lihui 已提交
171
                    'batchNum':   1000,
P
plum-lihui 已提交
172 173 174 175 176
                    'startTs':    1640966400000,  # 2022-01-01 00:00:00.000
                    'pollDelay':  5,
                    'showMsg':    1,
                    'showRow':    1,
                    'snapshot':   0}
G
Ganlin Zhao 已提交
177

P
plum-lihui 已提交
178 179 180 181
        paraDict['snapshot'] = self.snapshot
        paraDict['vgroups'] = self.vgroups
        paraDict['ctbNum'] = self.ctbNum
        paraDict['rowsPerTbl'] = self.rowsPerTbl
G
Ganlin Zhao 已提交
182 183

        tdLog.info("restart taosd to ensure that the data falls into the disk")
P
plum-lihui 已提交
184
        tdSql.query("flush database %s"%(paraDict['dbName']))
G
Ganlin Zhao 已提交
185

P
plum-lihui 已提交
186
        # update to half tables
P
plum-lihui 已提交
187
        paraDict['ctbNum'] = int(self.ctbNum/2)
P
plum-lihui 已提交
188
        paraDict['rowsPerTbl'] = int(self.rowsPerTbl / 2)
P
plum-lihui 已提交
189 190
        paraDict['startTs'] = paraDict['startTs'] + int(self.rowsPerTbl / 2)
        tmqCom.insert_data_with_autoCreateTbl(tsql=tdSql,dbName=paraDict["dbName"],stbName=paraDict["stbName"],ctbPrefix=self.autoCtbPrefix,
P
plum-lihui 已提交
191
                                              ctbNum=paraDict["ctbNum"],rowsPerTbl=paraDict["rowsPerTbl"],batchNum=paraDict["batchNum"],
P
plum-lihui 已提交
192
                                              startTs=paraDict["startTs"],ctbStartIdx=paraDict['ctbStartIdx']+int(self.ctbNum/2))
G
Ganlin Zhao 已提交
193

P
plum-lihui 已提交
194 195 196
        tmqCom.insert_data_with_autoCreateTbl(tsql=tdSql,dbName=paraDict["dbName"],stbName=paraDict["stbName"],ctbPrefix="aCtby",
                                              ctbNum=paraDict["ctbNum"],rowsPerTbl=paraDict["rowsPerTbl"],batchNum=paraDict["batchNum"],
                                              startTs=paraDict["startTs"],ctbStartIdx=paraDict['ctbStartIdx']+int(self.ctbNum/2))
G
Ganlin Zhao 已提交
197

P
plum-lihui 已提交
198 199 200
        tmqCom.insert_data_interlaceByMultiTbl(tsql=tdSql,dbName=paraDict["dbName"],ctbPrefix=paraDict["ctbPrefix"],
                                               ctbNum=paraDict["ctbNum"],rowsPerTbl=paraDict["rowsPerTbl"],batchNum=paraDict["batchNum"],
                                               startTs=paraDict["startTs"],ctbStartIdx=paraDict['ctbStartIdx']+int(self.ctbNum/2))
P
plum-lihui 已提交
201 202 203

        tmqCom.initConsumerTable()
        tdLog.info("create topics from stb1")
G
Ganlin Zhao 已提交
204
        topicFromStb1 = 'topic_stb1'
P
plum-lihui 已提交
205 206 207 208
        queryString = "select ts, c1, c2 from %s.%s"%(paraDict['dbName'], paraDict['stbName'])
        sqlString = "create topic %s as %s" %(topicFromStb1, queryString)
        tdLog.info("create topic sql: %s"%sqlString)
        tdSql.execute(sqlString)
G
Ganlin Zhao 已提交
209

P
plum-lihui 已提交
210
        # paraDict['ctbNum'] = self.ctbNum
P
plum-lihui 已提交
211
        paraDict['ctbNum'] = self.ctbNum
P
plum-lihui 已提交
212 213
        paraDict['rowsPerTbl'] = self.rowsPerTbl
        consumerId     = 1
P
plum-lihui 已提交
214 215 216 217
        if self.snapshot == 0:
            expectrowcnt   = int(paraDict["rowsPerTbl"] * paraDict["ctbNum"] * (2 + 1/2*1/2*2 + 1/2*1/2))
        elif self.snapshot == 1:
            expectrowcnt   = int(paraDict["rowsPerTbl"] * paraDict["ctbNum"] * (2 + 1/2*1/2))
G
Ganlin Zhao 已提交
218

P
plum-lihui 已提交
219 220 221 222 223 224 225 226 227 228 229
        topicList      = topicFromStb1
        ifcheckdata    = 1
        ifManualCommit = 1
        keyList        = 'group.id:cgrp1,\
                        enable.auto.commit:true,\
                        auto.commit.interval.ms:1000,\
                        auto.offset.reset:earliest'
        tmqCom.insertConsumerInfo(consumerId, expectrowcnt,topicList,keyList,ifcheckdata,ifManualCommit)

        tdLog.info("start consume processor")
        tmqCom.startTmqSimProcess(pollDelay=paraDict['pollDelay'],dbName=paraDict["dbName"],showMsg=paraDict['showMsg'], showRow=paraDict['showRow'],snapshot=paraDict['snapshot'])
G
Ganlin Zhao 已提交
230

P
plum-lihui 已提交
231
        tdLog.info("start to check consume result")
P
plum-lihui 已提交
232 233 234 235 236 237 238 239
        expectRows = 1
        resultList = tmqCom.selectConsumeResult(expectRows)
        totalConsumeRows = 0
        for i in range(expectRows):
            totalConsumeRows += resultList[i]

        tdSql.query(queryString)
        totalRowsInserted = tdSql.getRows()
G
Ganlin Zhao 已提交
240

P
plum-lihui 已提交
241
        tdLog.info("act consume rows: %d, act insert rows: %d, expect consume rows: %d, "%(totalConsumeRows, totalRowsInserted, expectrowcnt))
G
Ganlin Zhao 已提交
242

P
plum-lihui 已提交
243 244
        if totalConsumeRows != expectrowcnt:
            tdLog.exit("tmq consume rows error!")
G
Ganlin Zhao 已提交
245 246

        # tmqCom.checkFileContent(consumerId, queryString)
P
plum-lihui 已提交
247 248 249 250 251 252 253 254 255 256 257 258

        tdSql.query("drop topic %s"%topicFromStb1)

        tdLog.printNoPrefix("======== test case 2 end ...... ")

    def run(self):
        tdSql.prepare()
        self.prepareTestEnv()
        tdLog.printNoPrefix("=============================================")
        tdLog.printNoPrefix("======== snapshot is 0: only consume from wal")
        self.tmqCase1()
        self.tmqCase2()
G
Ganlin Zhao 已提交
259

P
plum-lihui 已提交
260 261 262 263 264 265
        self.prepareTestEnv()
        tdLog.printNoPrefix("====================================================================")
        tdLog.printNoPrefix("======== snapshot is 1: firstly consume from tsbs, and then from wal")
        self.snapshot = 1
        self.tmqCase1()
        self.tmqCase2()
G
Ganlin Zhao 已提交
266

P
plum-lihui 已提交
267 268 269 270 271 272 273 274 275

    def stop(self):
        tdSql.close()
        tdLog.success(f"{__file__} successfully executed")

event = threading.Event()

tdCases.addLinux(__file__, TDTestCase())
tdCases.addWindows(__file__, TDTestCase())