diff options
Diffstat (limited to 'MSH-PIC/phoenix-hbase/bin/performance.py')
| -rw-r--r-- | MSH-PIC/phoenix-hbase/bin/performance.py | 147 |
1 files changed, 147 insertions, 0 deletions
diff --git a/MSH-PIC/phoenix-hbase/bin/performance.py b/MSH-PIC/phoenix-hbase/bin/performance.py new file mode 100644 index 0000000..16fee48 --- /dev/null +++ b/MSH-PIC/phoenix-hbase/bin/performance.py @@ -0,0 +1,147 @@ +#!/usr/bin/env python +############################################################################ +# +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# +############################################################################ + +from __future__ import print_function +import os +import subprocess +import sys +import tempfile +import phoenix_utils + +def queryex(description, statement): + global statements + print("Query # %s - %s" % (description, statement)) + statements = statements + statement + +def delfile(filename): + if os.path.exists(filename): + os.remove(filename) + +def usage(): + print("Performance script arguments not specified. Usage: performance.py \ +<zookeeper> <row count>") + print("Example: performance.py localhost 100000") + + +def createFileWithContent(filename, content): + fo = open(filename, "w+") + fo.write(content) + fo.close() + +if len(sys.argv) < 3: + usage() + sys.exit() + +# command line arguments +zookeeper = sys.argv[1] +rowcount = sys.argv[2] +table = "PERFORMANCE_" + sys.argv[2] + +# helper variable and functions +ddl = tempfile.mkstemp(prefix='ddl_', suffix='.sql')[1] +data = tempfile.mkstemp(prefix='data_', suffix='.csv')[1] +qry = tempfile.mkstemp(prefix='query_', suffix='.sql')[1] +statements = "" + +phoenix_utils.setPath() + +# HBase configuration folder path (where hbase-site.xml reside) for +# HBase/Phoenix client side property override +hbase_config_path = os.getenv('HBASE_CONF_DIR', phoenix_utils.current_dir) + +java_home = os.getenv('JAVA_HOME') + +# load hbase-env.??? to extract JAVA_HOME, HBASE_PID_DIR, HBASE_LOG_DIR +hbase_env_path = None +hbase_env_cmd = None +if os.name == 'posix': + hbase_env_path = os.path.join(hbase_config_path, 'hbase-env.sh') + hbase_env_cmd = ['bash', '-c', 'source %s && env' % hbase_env_path] +elif os.name == 'nt': + hbase_env_path = os.path.join(hbase_config_path, 'hbase-env.cmd') + hbase_env_cmd = ['cmd.exe', '/c', 'call %s & set' % hbase_env_path] +if not hbase_env_path or not hbase_env_cmd: + sys.stderr.write("hbase-env file unknown on platform {}{}".format(os.name, os.linesep)) + sys.exit(-1) + +hbase_env = {} +if os.path.isfile(hbase_env_path): + p = subprocess.Popen(hbase_env_cmd, stdout = subprocess.PIPE) + for x in p.stdout: + (k, _, v) = x.decode().partition('=') + hbase_env[k.strip()] = v.strip() + +if 'JAVA_HOME' in hbase_env: + java_home = hbase_env['JAVA_HOME'] + +if java_home: + java_cmd = os.path.join(java_home, 'bin', 'java') +else: + java_cmd = 'java' + +execute = ('%s $PHOENIX_OPTS -cp "%s%s%s" -Dlog4j.configuration=file:' + + os.path.join(phoenix_utils.current_dir, "log4j.properties") + + ' org.apache.phoenix.util.PhoenixRuntime -t %s %s ') % \ + (java_cmd, hbase_config_path, os.pathsep, phoenix_utils.phoenix_client_jar, table, zookeeper) + +# Create Table DDL +createtable = "CREATE TABLE IF NOT EXISTS %s (HOST CHAR(2) NOT NULL,\ +DOMAIN VARCHAR NOT NULL, FEATURE VARCHAR NOT NULL,DATE DATE NOT NULL,\ +USAGE.CORE BIGINT,USAGE.DB BIGINT,STATS.ACTIVE_VISITOR \ +INTEGER CONSTRAINT PK PRIMARY KEY (HOST, DOMAIN, FEATURE, DATE)) \ +SPLIT ON ('CSGoogle','CSSalesforce','EUApple','EUGoogle','EUSalesforce',\ +'NAApple','NAGoogle','NASalesforce');" % (table) + +# generate and upsert data +print("Phoenix Performance Evaluation Script 1.0") +print("-----------------------------------------") + +print("\nCreating performance table...") +createFileWithContent(ddl, createtable) + +exitcode = subprocess.call(execute + ddl, shell=True) +if exitcode != 0: + sys.exit(exitcode) + +# Write real,user,sys time on console for the following queries +queryex("1 - Count", "SELECT COUNT(1) FROM %s;" % (table)) +queryex("2 - Group By First PK", "SELECT HOST FROM %s GROUP BY HOST;" % (table)) +queryex("3 - Group By Second PK", "SELECT DOMAIN FROM %s GROUP BY DOMAIN;" % (table)) +queryex("4 - Truncate + Group By", "SELECT TRUNC(DATE,'DAY') DAY FROM %s GROUP BY TRUNC(DATE,'DAY');" % (table)) +queryex("5 - Filter + Count", "SELECT COUNT(1) FROM %s WHERE CORE<10;" % (table)) + +print("\nGenerating and upserting data...") +exitcode = subprocess.call('%s -jar %s %s %s' % (java_cmd, phoenix_utils.testjar, data, rowcount), + shell=True) +if exitcode != 0: + sys.exit(exitcode) + +print("\n") +createFileWithContent(qry, statements) + +exitcode = subprocess.call(execute + data + ' ' + qry, shell=True) +if exitcode != 0: + sys.exit(exitcode) + +# clear temporary files +delfile(ddl) +delfile(data) +delfile(qry) |
