248 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			Python
		
	
	
	
			
		
		
	
	
			248 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			Python
		
	
	
	
###################################################################
#           Copyright (c) 2016 by TAOS Technologies, Inc.
#                     All rights reserved.
#
#  This file is proprietary and confidential to TAOS Technologies.
#  No part of this file may be reproduced, stored, transmitted,
#  disclosed or used in any form or by any means other than as
#  expressly provided by the written permission from Jianhui Tao
#
###################################################################

# -*- coding: utf-8 -*-
 | |
| 
 | |
import argparse
import random
import threading
import time

import requests
 | |
| 
 | |
class RestfulInsert:
    """Multi-threaded load generator that inserts random rows over a REST SQL endpoint.

    Every statement is sent as the body of an HTTP POST to
    ``http://<host>:6041/rest/sql``.  ``run`` creates the database, the
    tagged ``meters`` table and ``tables`` child tables, then writes rows
    to them from ``threads`` worker threads.

    Tables are split into contiguous per-thread ranges.  The last thread
    also owns the remainder when ``tables`` is not a multiple of
    ``threads``.  Table creation and data insertion share this partition,
    so no table is written by two threads and none is left out.
    """

    # Upper bound, in characters, on the SQL text sent in a single request.
    MAX_SQL_LENGTH = 1024 * 1024

    def __init__(self, host, startTimestamp, dbname, threads, tables, records, batchSize, tbNamePerfix, outOfOrder, tablePerbatch):
        """Store the test configuration; performs no network I/O.

        Args:
            host: Host name or address of the REST server.
            startTimestamp: Integer timestamp of the first row of every table.
            dbname: Database to create and write to.
            threads: Number of worker threads (must be >= 1).
            tables: Total number of tables to create.
            records: Rows to insert per table, or -1 to insert forever.
            batchSize: Maximum rows per table in one insert statement (>= 1).
            tbNamePerfix: Prefix of the generated table names.
            outOfOrder: If true, shuffle the rows inside every batch.
            tablePerbatch: Tables written by one insert statement (>= 1).

        Raises:
            ValueError: If threads, batchSize or tablePerbatch is below 1.
        """
        if threads < 1 or batchSize < 1 or tablePerbatch < 1:
            raise ValueError("threads, batchSize and tablePerbatch must all be >= 1")
        # HTTP basic auth; the token is base64 of "root:taosdata".
        self.header = {'Authorization': 'Basic cm9vdDp0YW9zZGF0YQ=='}
        self.url = "http://%s:6041/rest/sql" % host
        self.ts = startTimestamp
        self.dbname = dbname
        self.numOfThreads = threads
        self.numOfTables = tables
        self.recordsPerTable = records
        self.batchSize = batchSize
        self.tableNamePerfix = tbNamePerfix
        self.outOfOrder = outOfOrder
        self.tablePerbatch = tablePerbatch

    def _tableBounds(self, threadID):
        """Return ``(first, stop)``: the half-open range of table IDs owned by a thread."""
        tablesPerThread = self.numOfTables // self.numOfThreads
        first = tablesPerThread * threadID
        if threadID == self.numOfThreads - 1:
            # The last thread also takes the tables left over by the division.
            return first, self.numOfTables
        return first, first + tablesPerThread

    def _batches(self):
        """Yield ``(offset, rows)`` for every insert batch of a single table.

        The final batch is shorter when ``recordsPerTable`` is not a
        multiple of ``batchSize``; nothing is yielded for 0 records.
        """
        for offset in range(0, self.recordsPerTable, self.batchSize):
            yield offset, min(self.batchSize, self.recordsPerTable - offset)

    def _buildInsert(self, tableIDs, firstTs, rows):
        """Build one insert statement writing ``rows`` random rows to each table.

        Row timestamps run from ``firstTs`` to ``firstTs + rows - 1``; the
        three data columns are random integers in [1, 100].
        """
        clauses = []
        for tableID in tableIDs:
            values = [
                "(%d, %d, %d, %d)" % (firstTs + n, random.randint(1, 100), random.randint(1, 100), random.randint(1, 100))
                for n in range(rows)
            ]
            if self.outOfOrder:
                random.shuffle(values)
            clauses.append("%s.%s%d values%s" % (self.dbname, self.tableNamePerfix, tableID, "".join(values)))
        return "insert into " + " ".join(clauses)

    def _post(self, sql):
        """POST one statement and report failures on stdout.

        Returns:
            The request duration in seconds, or None when the request
            raised or the server answered with a status other than 200.
        """
        try:
            startTime = time.time()
            response = requests.post(self.url, sql, headers=self.header)
            elapsed = time.time() - startTime
        except requests.RequestException as e:
            # Best effort: a failed request must not stop the load test.
            print(e)
            return None
        if response.status_code != 200:
            print(response.content)
            return None
        return elapsed

    def _runThreads(self, target):
        """Run ``target(threadID)`` on ``numOfThreads`` threads and wait for all of them."""
        workers = [threading.Thread(target=target, args=(i,)) for i in range(self.numOfThreads)]
        for worker in workers:
            worker.start()
        for worker in workers:
            worker.join()

    def createTable(self, threadID):
        """Create every table owned by thread ``threadID``.

        Each table is tagged with its ID and a location that alternates
        between 'beijing' (even IDs) and 'shanghai' (odd IDs).
        """
        first, stop = self._tableBounds(threadID)
        print("create table %d to %d" % (first, stop - 1))
        for tableID in range(first, stop):
            name = 'beijing' if tableID % 2 == 0 else 'shanghai'
            data = "create table if not exists %s.%s%d using %s.meters tags(%d, '%s')" % (
                self.dbname, self.tableNamePerfix, tableID, self.dbname, tableID, name)
            self._post(data)

    def insertData(self, threadID):
        """Insert ``recordsPerTable`` rows into every table owned by thread ``threadID``.

        Tables are written in groups of ``tablePerbatch`` per statement and
        rows in batches of at most ``batchSize`` per table.  One line is
        printed per successful request.  If a statement would exceed
        ``MAX_SQL_LENGTH`` the thread reports it and stops inserting.
        """
        print("thread %d started" % threadID)
        first, stop = self._tableBounds(threadID)
        for groupStart in range(first, stop, self.tablePerbatch):
            # The last group of a thread may hold fewer than tablePerbatch tables.
            tableIDs = range(groupStart, min(groupStart + self.tablePerbatch, stop))
            for offset, rows in self._batches():
                data = self._buildInsert(tableIDs, self.ts + offset, rows)
                if len(data) > self.MAX_SQL_LENGTH:
                    print('batch size is larger than 1M')
                    # Stop only this worker; exit() in a thread did no more than that.
                    return
                elapsed = self._post(data)
                if elapsed is not None:
                    print("inserted %d records, %d seconds" % (rows * len(tableIDs), elapsed))

    def insertUnlimitedData(self, threadID):
        """Insert ``batchSize``-row batches into the thread's tables forever.

        Each pass over the tables advances the start timestamp by
        ``batchSize``.  Returns immediately when the thread owns no table,
        otherwise never returns.
        """
        print("thread %d started" % threadID)
        first, stop = self._tableBounds(threadID)
        if first >= stop:
            # Nothing to write; avoid spinning in an empty endless loop.
            return

        count = 0
        while True:
            start = self.ts + count * self.batchSize
            count += 1
            for tableID in range(first, stop):
                data = self._buildInsert([tableID], start, self.batchSize)
                elapsed = self._post(data)
                if elapsed is not None:
                    print("inserted %d records, %d seconds" % (self.batchSize, elapsed))

    def run(self):
        """Create the schema, then create tables and insert data in parallel.

        Exceptions raised by the two setup requests propagate to the
        caller; a non-200 answer is printed and the run continues.
        """
        setup = (
            "create database if not exists %s" % self.dbname,
            "create table if not exists %s.meters(ts timestamp, f1 int, f2 int, f3 int) tags(id int, loc nchar(20))" % self.dbname,
        )
        for data in setup:
            response = requests.post(self.url, data, headers=self.header)
            if response.status_code != 200:
                print(response.content)

        startTime = time.time()
        self._runThreads(self.createTable)
        print("createing %d tables takes %d seconds" % (self.numOfTables, (time.time() - startTime)))

        print("inserting data =======")
        startTime = time.time()
        # -1 records selects the endless insert mode.
        if self.recordsPerTable != -1:
            self._runThreads(self.insertData)
        else:
            self._runThreads(self.insertUnlimitedData)
        print("inserting %s records takes %d seconds" % (self.numOfTables * self.recordsPerTable, (time.time() - startTime)))
 | |
| 
 | |
# Command-line interface: every option maps one-to-one onto a
# RestfulInsert constructor argument.
parser = argparse.ArgumentParser()
parser.add_argument(
    '-H',
    '--host-name',
    action='store',
    default='127.0.0.1',
    type=str,
    help='host name to be connected (default: 127.0.0.1)')
parser.add_argument(
    '-S',
    '--start-timestamp',
    action='store',
    default=1500000000000,
    type=int,
    help='insert data from timestamp (default: 1500000000000)')
parser.add_argument(
    '-d',
    '--db-name',
    action='store',
    default='test',
    type=str,
    help='Database name to be created (default: test)')
parser.add_argument(
    '-t',
    '--number-of-threads',
    action='store',
    default=10,
    type=int,
    help='Number of threads to create tables and insert datas (default: 10)')
parser.add_argument(
    '-T',
    '--number-of-tables',
    action='store',
    default=10000,
    type=int,
    help='Number of tables to be created (default: 10000)')
parser.add_argument(
    '-r',
    '--number-of-records',
    action='store',
    default=10000,
    type=int,
    help='Number of record to be created for each table  (default: 10000, -1 for unlimited records)')
parser.add_argument(
    '-s',
    '--batch-size',
    action='store',
    default=1000,
    type=int,
    help='Number of records per table in one insert batch (default: 1000)')
parser.add_argument(
    '-p',
    '--table-name-prefix',
    action='store',
    default='t',
    type=str,
    help='Prefix of the names of the tables to be created (default: t)')
parser.add_argument(
    '-o',
    '--out-of-order',
    action='store_true',
    help='The order of test data (default: False)')
parser.add_argument(
    '-b',
    '--table-per-batch',
    action='store',
    default=1,
    type=int,
    help='the table per batch (default: 1)')

# Parse the command line and start the load test right away.
args = parser.parse_args()
ri = RestfulInsert(
        args.host_name, args.start_timestamp, args.db_name, args.number_of_threads, args.number_of_tables,
        args.number_of_records, args.batch_size, args.table_name_prefix, args.out_of_order, args.table_per_batch)
ri.run()