summaryrefslogtreecommitdiff
path: root/TWA-PIC/phoenix-hbase/bin/performance.py
diff options
context:
space:
mode:
Diffstat (limited to 'TWA-PIC/phoenix-hbase/bin/performance.py')
-rw-r--r--TWA-PIC/phoenix-hbase/bin/performance.py147
1 files changed, 147 insertions, 0 deletions
diff --git a/TWA-PIC/phoenix-hbase/bin/performance.py b/TWA-PIC/phoenix-hbase/bin/performance.py
new file mode 100644
index 0000000..16fee48
--- /dev/null
+++ b/TWA-PIC/phoenix-hbase/bin/performance.py
@@ -0,0 +1,147 @@
+#!/usr/bin/env python
+############################################################################
+#
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+############################################################################
+
+from __future__ import print_function
+import os
+import subprocess
+import sys
+import tempfile
+import phoenix_utils
+
+def queryex(description, statement):
+ global statements
+ print("Query # %s - %s" % (description, statement))
+ statements = statements + statement
+
+def delfile(filename):
+ if os.path.exists(filename):
+ os.remove(filename)
+
+def usage():
+ print("Performance script arguments not specified. Usage: performance.py \
+<zookeeper> <row count>")
+ print("Example: performance.py localhost 100000")
+
+
+def createFileWithContent(filename, content):
+ fo = open(filename, "w+")
+ fo.write(content)
+ fo.close()
+
+if len(sys.argv) < 3:
+ usage()
+ sys.exit()
+
+# command line arguments
+zookeeper = sys.argv[1]
+rowcount = sys.argv[2]
+table = "PERFORMANCE_" + sys.argv[2]
+
+# helper variable and functions
+ddl = tempfile.mkstemp(prefix='ddl_', suffix='.sql')[1]
+data = tempfile.mkstemp(prefix='data_', suffix='.csv')[1]
+qry = tempfile.mkstemp(prefix='query_', suffix='.sql')[1]
+statements = ""
+
+phoenix_utils.setPath()
+
+# HBase configuration folder path (where hbase-site.xml reside) for
+# HBase/Phoenix client side property override
+hbase_config_path = os.getenv('HBASE_CONF_DIR', phoenix_utils.current_dir)
+
+java_home = os.getenv('JAVA_HOME')
+
+# load hbase-env.??? to extract JAVA_HOME, HBASE_PID_DIR, HBASE_LOG_DIR
+hbase_env_path = None
+hbase_env_cmd = None
+if os.name == 'posix':
+ hbase_env_path = os.path.join(hbase_config_path, 'hbase-env.sh')
+ hbase_env_cmd = ['bash', '-c', 'source %s && env' % hbase_env_path]
+elif os.name == 'nt':
+ hbase_env_path = os.path.join(hbase_config_path, 'hbase-env.cmd')
+ hbase_env_cmd = ['cmd.exe', '/c', 'call %s & set' % hbase_env_path]
+if not hbase_env_path or not hbase_env_cmd:
+ sys.stderr.write("hbase-env file unknown on platform {}{}".format(os.name, os.linesep))
+ sys.exit(-1)
+
+hbase_env = {}
+if os.path.isfile(hbase_env_path):
+ p = subprocess.Popen(hbase_env_cmd, stdout = subprocess.PIPE)
+ for x in p.stdout:
+ (k, _, v) = x.decode().partition('=')
+ hbase_env[k.strip()] = v.strip()
+
+if 'JAVA_HOME' in hbase_env:
+ java_home = hbase_env['JAVA_HOME']
+
+if java_home:
+ java_cmd = os.path.join(java_home, 'bin', 'java')
+else:
+ java_cmd = 'java'
+
+execute = ('%s $PHOENIX_OPTS -cp "%s%s%s" -Dlog4j.configuration=file:' +
+ os.path.join(phoenix_utils.current_dir, "log4j.properties") +
+ ' org.apache.phoenix.util.PhoenixRuntime -t %s %s ') % \
+ (java_cmd, hbase_config_path, os.pathsep, phoenix_utils.phoenix_client_jar, table, zookeeper)
+
+# Create Table DDL
+createtable = "CREATE TABLE IF NOT EXISTS %s (HOST CHAR(2) NOT NULL,\
+DOMAIN VARCHAR NOT NULL, FEATURE VARCHAR NOT NULL,DATE DATE NOT NULL,\
+USAGE.CORE BIGINT,USAGE.DB BIGINT,STATS.ACTIVE_VISITOR \
+INTEGER CONSTRAINT PK PRIMARY KEY (HOST, DOMAIN, FEATURE, DATE)) \
+SPLIT ON ('CSGoogle','CSSalesforce','EUApple','EUGoogle','EUSalesforce',\
+'NAApple','NAGoogle','NASalesforce');" % (table)
+
+# generate and upsert data
+print("Phoenix Performance Evaluation Script 1.0")
+print("-----------------------------------------")
+
+print("\nCreating performance table...")
+createFileWithContent(ddl, createtable)
+
+exitcode = subprocess.call(execute + ddl, shell=True)
+if exitcode != 0:
+ sys.exit(exitcode)
+
+# Write real,user,sys time on console for the following queries
+queryex("1 - Count", "SELECT COUNT(1) FROM %s;" % (table))
+queryex("2 - Group By First PK", "SELECT HOST FROM %s GROUP BY HOST;" % (table))
+queryex("3 - Group By Second PK", "SELECT DOMAIN FROM %s GROUP BY DOMAIN;" % (table))
+queryex("4 - Truncate + Group By", "SELECT TRUNC(DATE,'DAY') DAY FROM %s GROUP BY TRUNC(DATE,'DAY');" % (table))
+queryex("5 - Filter + Count", "SELECT COUNT(1) FROM %s WHERE CORE<10;" % (table))
+
+print("\nGenerating and upserting data...")
+exitcode = subprocess.call('%s -jar %s %s %s' % (java_cmd, phoenix_utils.testjar, data, rowcount),
+ shell=True)
+if exitcode != 0:
+ sys.exit(exitcode)
+
+print("\n")
+createFileWithContent(qry, statements)
+
+exitcode = subprocess.call(execute + data + ' ' + qry, shell=True)
+if exitcode != 0:
+ sys.exit(exitcode)
+
+# clear temporary files
+delfile(ddl)
+delfile(data)
+delfile(qry)