concurrent_inquiry.py 13.7 KB
Newer Older
L
liuyq-617 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
###################################################################
#           Copyright (c) 2016 by TAOS Technologies, Inc.
#                     All rights reserved.
#
#  This file is proprietary and confidential to TAOS Technologies.
#  No part of this file may be reproduced, stored, transmitted,
#  disclosed or used in any form or by any means other than as
#  expressly provided by the written permission from Jianhui Tao
#
###################################################################

# -*- coding: utf-8 -*-
import threading
import taos
L
liuyq-617 已提交
15
import sys
L
liuyq-617 已提交
16 17 18
import json
import time
import random
19 20 21 22 23 24 25 26 27 28 29 30 31
import requests
from requests.auth import HTTPBasicAuth
# Function names the query generator pairs with columns.
func_list = [
    'avg', 'count', 'twa', 'sum', 'stddev', 'leastsquares',
    'min', 'max', 'first', 'last', 'top', 'bottom',
    'percentile', 'apercentile', 'last_row', 'diff', 'spread',
]

# Example clause fragments.
condition_list = [
    "where _c0 > now -10d ",
    'interval(10s)',
    'limit 10',
    'group by',
    'order by',
    'fill(null)',
]

# Predicate fragments used when building where clauses.
where_list = ['_c0>now-10d', ' <50', " like '%a%'"]
L
liuyq-617 已提交
34
class ConcurrentInquiry:
35 36 37
    def __init__(self,n_Therads=25,r_Therads=25):  
        self.n_numOfTherads = n_Therads
        self.r_numOfTherads = r_Therads
L
liuyq-617 已提交
38
        self.ts=1500000001000
39 40 41 42 43 44 45
        self.dbname='test'
        self.stb_list=[]
        self.subtb_list=[]
        self.stb_stru_list=[]
        self.subtb_stru_list=[]
        self.stb_tag_list=[]
        self.subtb_tag_list=[]
46
        self.probabilities = [0.05,0.95]
47
        self.ifjoin = [0,1]
L
liuyq-617 已提交
48 49
    def SetThreadsNum(self,num):
        self.numOfTherads=num
50

51 52 53 54 55 56
    def ret_fcol(self,cl,sql):
        """Execute *sql* on cursor *cl* and return the first field of every row."""
        cl.execute(sql)
        return [row[0] for row in cl]
57 58

    def r_stb_list(self,cl):                    #返回超级表列表
59 60
        sql='show '+self.dbname+'.stables'
        self.stb_list=self.ret_fcol(cl,sql)
61 62

    def r_subtb_list(self,cl,stablename):       #每个超级表返回2个子表
63 64
        sql='select tbname from '+self.dbname+'.'+stablename+' limit 2;'
        self.subtb_list+=self.ret_fcol(cl,sql)
65 66

    def cal_struct(self,cl,tbname):             #查看表结构
67 68 69 70 71 72 73 74 75 76
        tb=[]
        tag=[]
        sql='describe '+self.dbname+'.'+tbname+';'
        cl.execute(sql)
        for data in cl:
            if data[3]:
                tag.append(data[0])
            else:
                tb.append(data[0])
        return tb,tag
77 78

    def r_stb_stru(self,cl):                    #获取所有超级表的表结构
79 80 81 82
        for i in self.stb_list:
            tb,tag=self.cal_struct(cl,i)
            self.stb_stru_list.append(tb)
            self.stb_tag_list.append(tag)
83 84

    def r_subtb_stru(self,cl):                  #返回所有子表的表结构
85 86 87 88
        for i in self.subtb_list:
            tb,tag=self.cal_struct(cl,i)
            self.subtb_stru_list.append(tb)
            self.subtb_tag_list.append(tag)
89 90

    def get_full(self):
        """Load table names and their structures from the local server.

        Connects to 127.0.0.1 as root, refreshes self.stb_list, appends
        child tables to self.subtb_list and appends the matching column
        and tag lists. The cursor and the connection are closed even when
        one of the metadata queries raises.
        """
        host = "127.0.0.1"
        user = "root"
        password = "taosdata"
        conn = taos.connect(
            host,
            user,
            password,
            )
        try:
            cl = conn.cursor()
            try:
                self.r_stb_list(cl)
                for i in self.stb_list:
                    self.r_subtb_list(cl,i)
                self.r_stb_stru(cl)
                self.r_subtb_stru(cl)
            finally:
                cl.close()
        finally:
            conn.close()
        
    #query condition
109
    def con_where(self,tlist,col_list,tag_list):
        """Build a random ``where`` clause.

        Draws between 0 and len(tlist) fragments from where_list. The
        timestamp fragment is used as is; any other fragment is prefixed
        with a random entry of *tlist*. All fragments are joined with one
        randomly chosen connector. *col_list* and *tag_list* are not used.
        """
        fragment_count = random.randint(0, len(tlist))
        predicates = []
        for _ in range(fragment_count):
            fragment = random.choice(where_list)
            if fragment != '_c0>now-10d':
                # Comparison and like fragments need a field name in front.
                fragment = random.choice(tlist) + fragment
            predicates.append(fragment)
        connector = random.choice([' and ',' or '])
        return 'where ' + connector.join(predicates)
118

119
    def con_interval(self,tlist,col_list,tag_list):
        """Return ``interval(<n><unit>)`` with n in 0..100 and a random unit letter."""
        amount = random.randint(0,100)
        unit = random.choice(['a','s','d','w','n','y'])
        return 'interval({}{})'.format(amount, unit)
122

123 124 125
    def con_limit(self,tlist,col_list,tag_list):
        """Return a random limit/offset/slimit/soffset clause.

        Two numbers in 0..1000 are drawn and inserted into one of six
        clause templates. The arguments are not used.
        """
        rand1 = str(random.randint(0,1000))
        rand2 = str(random.randint(0,1000))
        return random.choice([
            'limit ' + rand1,
            'limit ' + rand1 + ' offset ' + rand2,
            ' slimit ' + rand1,
            ' slimit ' + rand1 + ' offset ' + rand2,
            'limit ' + rand1 + ' slimit ' + rand2,
            # The keyword and its number must be separated by a space.
            'limit ' + rand1 + ' offset ' + rand2 + ' slimit ' + rand1 + ' soffset ' + rand2,
        ])
129
    
130
    def con_fill(self,tlist,col_list,tag_list):
        """Return one randomly chosen ``fill(...)`` clause; the arguments are not used."""
        modes = ['null','prev','none','LINEAR']
        return 'fill(' + random.choice(modes) + ')'
132
    
133 134 135 136
    def con_group(self,tlist,col_list,tag_list):
        """Return a ``group by`` clause over random columns and tags.

        Picks at most one column and at most five tags, never more than
        the lists actually contain, and separates every picked name with
        a comma. Returns a bare ``'group by '`` when nothing is picked.
        *tlist* is not used.
        """
        # Cap the sample sizes: random.sample raises ValueError when asked
        # for more items than the population holds.
        col_count = random.randint(0, min(1, len(col_list)))
        tag_count = random.randint(0, min(5, len(tag_list)))
        fields = random.sample(col_list, col_count) + random.sample(tag_list, tag_count)
        return 'group by ' + ','.join(fields)
137
    
138
    def con_order(self,tlist,col_list,tag_list):
        """Return an ``order by`` clause on one random entry of *tlist*."""
        field = random.choice(tlist)
        return 'order by {}'.format(field)
140 141 142
    
    def gen_query_sql(self):
        """Generate one random single-table query and return its text.

        A table is picked uniformly from the super tables and child
        tables cached on the instance. A random subset of its columns is
        each wrapped in a distinct function from func_list, optionally
        aliased, and a random selection of condition clauses is appended
        in random order. The statement is also printed.

        Raises:
            ValueError: if no table is cached yet.
        """
        stb_count = len(self.stb_list)
        table_count = stb_count + len(self.subtb_list)
        if table_count == 0:
            raise ValueError("no tables loaded; call get_full() first")

        # Randomly decide which table to query: super tables come first,
        # child tables after them.
        pick = random.randrange(table_count)
        if pick < stb_count:
            tbname = self.stb_list[pick]
            columns = self.stb_stru_list[pick]
            tag_list = self.stb_tag_list[pick]
        else:
            pick -= stb_count
            tbname = self.subtb_list[pick]
            columns = self.subtb_stru_list[pick]
            tag_list = self.subtb_tag_list[pick]

        # Work on shuffled copies: the cached structure lists and the
        # module-level func_list are shared by every query thread, so
        # shuffling them in place would let threads disturb each other.
        col_list = random.sample(columns, len(columns))
        funcs = random.sample(func_list, len(func_list))

        # 'abc' is a field that does not exist, added on purpose to see
        # whether it triggers new bugs.
        tlist = col_list + tag_list + ['abc']

        col_rand = random.randint(0, len(col_list))
        sel_col_list = []
        # Decide the function applied to each selected column.
        for col, func in zip(col_list[:col_rand], funcs):
            if func == 'leastsquares':
                pick_func = func + '(' + col + ',1,1)'
            elif func in ('top', 'bottom', 'percentile', 'apercentile'):
                pick_func = func + '(' + col + ',1)'
            else:
                pick_func = func + '(' + col + ')'
            if bool(random.getrandbits(1)):
                pick_func += 'as ' + str(col)
            sel_col_list.append(pick_func)

        # Query the table whose columns were selected above.
        sql = 'select ' + ','.join(sel_col_list) + ' from ' + tbname + ' '

        con_func = [self.con_where, self.con_interval, self.con_limit,
                    self.con_group, self.con_order, self.con_fill]
        sel_con = random.sample(con_func, random.randint(0, len(con_func)))
        # Ask each chosen builder for its clause.
        sel_con_list = [build(tlist, col_list, tag_list) for build in sel_con]
        sql += ' '.join(sel_con_list)
        print(sql)
        return sql
190

191
    def gen_query_join(self):                        #生成join查询语句
L
liuyq-617 已提交
192 193 194 195 196
        tbname   = []
        col_list = []
        tag_list = []
        col_intersection = []
        tag_intersection = []
197
        subtable = None
L
liuyq-617 已提交
198 199

        if bool(random.getrandbits(1)):
200
            subtable = True
L
liuyq-617 已提交
201 202 203 204 205 206
            tbname = random.sample(self.subtb_list,2)
            for i in tbname:
                col_list.append(self.subtb_stru_list[self.subtb_list.index(i)])
                tag_list.append(self.subtb_stru_list[self.subtb_list.index(i)])
            col_intersection = list(set(col_list[0]).intersection(set(col_list[1])))
            tag_intersection = list(set(tag_list[0]).intersection(set(tag_list[1])))
207
        else:
L
liuyq-617 已提交
208 209 210 211 212 213 214 215
            tbname = random.sample(self.stb_list,2)
            for i in tbname:
                col_list.append(self.stb_stru_list[self.stb_list.index(i)])
                tag_list.append(self.stb_stru_list[self.stb_list.index(i)])
            col_intersection = list(set(col_list[0]).intersection(set(col_list[1])))
            tag_intersection = list(set(tag_list[0]).intersection(set(tag_list[1])))
        
        
216 217 218
        con_rand=random.randint(0,len(condition_list))
        col_rand=random.randint(0,len(col_list))
        tag_rand=random.randint(0,len(tag_list))
L
liuyq-617 已提交
219
        
220
        sql='select '                                           #select 
L
liuyq-617 已提交
221 222
        
        sel_col_tag=[]
223
        col_rand=random.randint(0,len(col_list))
L
liuyq-617 已提交
224 225 226 227 228 229 230
        if bool(random.getrandbits(1)):
            sql += '*'
        else:
            sel_col_tag.append('t1.' + str(random.choice(col_list[0] + tag_list[0])))
            sel_col_tag.append('t2.' + str(random.choice(col_list[1] + tag_list[1])))
            sql += ','.join(sel_col_tag)

231 232 233 234 235 236 237 238
        sql = sql + ' from '+ str(tbname[0]) +' t1,' + str(tbname[1]) + ' t2 '                        #select col & func
        join_section = None
        if subtable:
            join_section = ''.join(random.choices(col_intersection))
            sql += 'where t1._c0 = t2._c0 and ' + 't1.' + join_section + '=t2.' + join_section
        else:
            join_section = ''.join(random.choices(col_intersection+tag_intersection))
            sql += 'where t1._c0 = t2._c0 and ' + 't1.' + join_section + '=t2.' + join_section
L
liuyq-617 已提交
239
        
240 241 242 243 244 245 246 247 248 249 250 251
        print(sql)
        return sql

    def random_pick(self): 
        x = random.uniform(0,1) 
        cumulative_probability = 0.0 
        for item, item_probability in zip(self.ifjoin, self.probabilities): 
            cumulative_probability += item_probability 
            if x < cumulative_probability:break 
        return item
        

252
    def rest_query(self,sql):
        """Run *sql* through the local REST interface and return the row count.

        Posts ``use <dbname>`` and then *sql* to
        http://127.0.0.1:6041/rest/sql with HTTP basic auth.

        Returns:
            The ``rows`` value of the JSON reply, or 0 when it is absent.

        Raises:
            requests.exceptions.RequestException: the HTTP call failed
                (re-raised after a log line).
            RuntimeError: the reply has no ``status``, an unexpected
                ``status``, or reports an error without ``code``.
            taos.error.ProgrammingError: the server reported an error.
        """
        host = "127.0.0.1"
        user = "root"
        password = "taosdata"
        port = 6041
        url = "http://{}:{}/rest/sql".format(host, port)
        auth = HTTPBasicAuth(user, password)
        try:
            # The reply to the 'use' statement is not inspected.
            requests.post(url, data='use ' + self.dbname, auth=auth)
            r = requests.post(url, data=sql, auth=auth)
        except requests.exceptions.RequestException:
            print("REST API Failure (TODO: more info here)")
            raise
        rj = r.json()
        if 'status' not in rj:
            raise RuntimeError("No status in REST response")

        if rj['status'] == 'error':  # clearly reported error
            if 'code' not in rj:  # error without code
                raise RuntimeError("REST error return without code")
            errno = rj['code']  # May need to massage this in the future
            # An error reply is not guaranteed to carry a description.
            raise taos.error.ProgrammingError(rj.get('desc', ''), errno)

        if rj['status'] != 'succ':  # better be this
            raise RuntimeError(
                "Unexpected REST return status: {}".format(
                    rj['status']))

        return rj.get('rows', 0)
287

288
    
289
    def query_thread_n(self,threadID):
        """Worker loop that runs random queries through the native connector.

        Opens its own connection to 127.0.0.1, selects self.dbname and
        then generates, executes and times queries forever. A failing
        query is logged and the loop continues. The cursor and the
        connection are released if the loop is ever left.

        Args:
            threadID: integer used only in log lines.
        """
        host = "127.0.0.1"
        user = "root"
        password = "taosdata"
        conn = taos.connect(
            host,
            user,
            password,
            )
        try:
            cl = conn.cursor()
            try:
                cl.execute("use " + self.dbname + ";")
                print("Thread %d: starting" % threadID)
                while True:
                    # Reset per iteration so the failure log never hits an
                    # unbound name or reports the previous statement.
                    sql = None
                    try:
                        if self.random_pick():
                            sql=self.gen_query_sql()
                        else:
                            sql=self.gen_query_join()
                        print("sql is ",sql)
                        start = time.time()
                        cl.execute(sql)
                        cl.fetchall()
                        end = time.time()
                        print("time cost :",end-start)
                    except Exception as e:
                        print(
                            "Failure thread%d, sql: %s,exception: %s" %
                            (threadID, str(sql),str(e)))
            finally:
                cl.close()
        finally:
            conn.close()
            print("Thread %d: finishing" % threadID)
L
liuyq-617 已提交
324
          
325
    def query_thread_r(self,threadID):                      #使用rest接口查询
326 327 328
        print("Thread %d: starting" % threadID)
        while True:
                try:
329 330 331 332
                    if self.random_pick():
                        sql=self.gen_query_sql()
                    else:
                        sql=self.gen_query_join()
333 334 335 336 337 338 339 340 341 342 343 344 345
                    print("sql is ",sql)
                    start = time.time()
                    self.rest_query(sql)
                    end = time.time()
                    print("time cost :",end-start)
                except Exception as e:
                    print(
                "Failure thread%d, sql: %s,exception: %s" %
                (threadID, str(sql),str(e)))
                    #exit(-1)
                    
                
        print("Thread %d: finishing" % threadID)    
L
liuyq-617 已提交
346 347

    def run(self):
348
        print(self.n_numOfTherads,self.r_numOfTherads)  
L
liuyq-617 已提交
349
        threads = []
350 351
        for i in range(self.n_numOfTherads):
            thread = threading.Thread(target=self.query_thread_n, args=(i,))
L
liuyq-617 已提交
352 353
            threads.append(thread)
            thread.start()  
354 355 356 357 358 359 360 361 362 363
        for i in range(self.r_numOfTherads):
            thread = threading.Thread(target=self.query_thread_r, args=(i,))
            threads.append(thread)
            thread.start()
# Optional command-line arguments: <native thread count> [<REST thread count>].
if len(sys.argv) > 2:
    q = ConcurrentInquiry(n_Therads=int(sys.argv[1]), r_Therads=int(sys.argv[2]))
elif len(sys.argv) == 2:
    # Only the native count was given; the REST pool keeps its default size.
    q = ConcurrentInquiry(n_Therads=int(sys.argv[1]))
else:
    q = ConcurrentInquiry()
q.get_full()
q.run()