Skip to content

Commit

Permalink
Merge pull request #14 from qbicsoftware/development
Browse files Browse the repository at this point in the history
[1.0.0] Release
  • Loading branch information
Zethson authored Jul 9, 2019
2 parents 395446d + 0b02c78 commit 8d25279
Show file tree
Hide file tree
Showing 5 changed files with 48 additions and 43 deletions.
3 changes: 2 additions & 1 deletion .travis.yml
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
language: scala

jdk: oraclejdk8
jdk:
- openjdk8

scala:
- 2.12.8
Expand Down
12 changes: 7 additions & 5 deletions README.md
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
[![Build Status](https://travis-ci.com/qbicsoftware/spark-benchmark-cli.svg?branch=development)](https://travis-ci.com/qbicsoftware/spark-benchmark-cli)
[![Scala Steward badge](https://img.shields.io/badge/Scala_Steward-helping-brightgreen.svg?style=flat&logo=data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAA4AAAAQCAMAAAARSr4IAAAAVFBMVEUAAACHjojlOy5NWlrKzcYRKjGFjIbp293YycuLa3pYY2LSqql4f3pCUFTgSjNodYRmcXUsPD/NTTbjRS+2jomhgnzNc223cGvZS0HaSD0XLjbaSjElhIr+AAAAAXRSTlMAQObYZgAAAHlJREFUCNdNyosOwyAIhWHAQS1Vt7a77/3fcxxdmv0xwmckutAR1nkm4ggbyEcg/wWmlGLDAA3oL50xi6fk5ffZ3E2E3QfZDCcCN2YtbEWZt+Drc6u6rlqv7Uk0LdKqqr5rk2UCRXOk0vmQKGfc94nOJyQjouF9H/wCc9gECEYfONoAAAAASUVORK5CYII=)](https://scala-steward.org)

# spark-benchmark-cli
A tool for submitting SQL queries to a Spark Cluster. Various benchmarking statistics will be calculated.
Expand All @@ -9,11 +10,11 @@ SBT assembly plugin is configured. Hence, in the project root:
```bash
sbt assembly
```
will build the fat jar. The result will be written to /target/$scala-version/$name-assembly-$version.jar
will build the fat jar. The result will be written to ```/target/$scala-version/$name-assembly-$version.jar```

## Running
```bash
java -jar spark-benchmark-cli-assembly-$version.jar
java -jar scark-cli-1.0.0.jar
```

## Usage
Expand All @@ -34,7 +35,8 @@ SQL Queries inside Spark!
Required parameters are:
```
-c, --config=<configFilePath>
-q, --query
  -t, --table[=<table>]
-q, --query[=<sqlQuery>]
```
Queries are optionally interactive.
You can either use ```-q``` to get a prompt for your query or supply a full query when running the tool: ```-q[=<sqlQuery>]``` (long form: ```--query[=<sqlQuery>]```).
Expand All @@ -43,13 +45,13 @@ You can either use ```-q``` to get a prompt for your query or supply a full quer
A query can be submitted to spark via:
```bash
/spark/bin/spark-submit --master spark://spark-master:7077 \
/opt/spark-apps/spark-benchmark-cli-assembly-0.1.jar -s -d org.mariadb.jdbc.Driver -c /opt/spark-data/database_properties.txt -t <table> -q <"query">
/opt/spark-apps/scark-cli-1.0.0.jar -s -d org.mariadb.jdbc.Driver -c /opt/spark-data/database_properties.txt -t <table> -q <"query">
```
## Example Query
```bash
/spark/bin/spark-submit --master spark://spark-master:7077 \
/opt/spark-apps/spark-benchmark-cli-assembly-0.1.jar -s -d org.mariadb.jdbc.Driver -c /opt/spark-data/database_properties.txt -t Consequence -q "SELECT id FROM Consequence"
/opt/spark-apps/scark-cli-1.0.0.jar -s -d org.mariadb.jdbc.Driver -c /opt/spark-data/database_properties.txt -t Consequence -q "SELECT id FROM Consequence"
```
## Tests
Expand Down
4 changes: 2 additions & 2 deletions build.sbt
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
name := "spark-benchmark-cli"
name := "scark-cli"

version := "0.1"
version := "1.0.0"

scalaVersion := "2.12.8"

Expand Down
39 changes: 20 additions & 19 deletions src/main/scala/Main.scala
Original file line number Diff line number Diff line change
Expand Up @@ -9,9 +9,17 @@ import com.typesafe.scalalogging.Logger

object Main {

val LOG = Logger("Spark Benchmark CLI")
val LOG = Logger("scark-cli")

def main(args: Array[String]) {
LOG.info(
"""
| _________ __ .__ .__
| / _____/ ____ _____ _______| | __ ____ | | |__|
| \_____ \_/ ___\\__ \\_ __ \ |/ / ______ _/ ___\| | | |
| / \ \___ / __ \| | \/ < /_____/ \ \___| |_| |
|/_______ /\___ >____ /__| |__|_ \ \___ >____/__|
| \/ \/ \/ \/ \/ """.stripMargin)
// parse commandline parameters, get database properties
val commandLineParser = new CommandLineParser()
val commandLineParameters = commandLineParser.parseCommandLineParameters(args)
Expand All @@ -32,16 +40,17 @@ object Main {
val spark =
if (commandLineParameters.localMode) {
LOG.info("Running Spark in local mode!")
LOG.warn("scark-cli assumes that your mariadb-java-client jar is in /opt/spark-apps")
SparkSession
.builder()
.appName("Spark Benchmark CLI")
.config("spark.master", "local")
.config("spark.driver.extraClassPath", "/opt/spark-apps/spark-apps/mariadb-java-client-2.4.1.jar")
.config("spark.driver.extraClassPath", "/opt/spark-apps/mariadb-java-client-2.4.1.jar")
.getOrCreate()
} else {
SparkSession
.builder()
.appName("Spark Benchmark CLI")
.appName("scark-cli")
// .config("spark.some.config.option", "some-value")
.getOrCreate()
}
Expand All @@ -50,14 +59,11 @@ object Main {

Class.forName("org.mariadb.jdbc.Driver")

// test database connection
// connect to the database
try {
val connection = DriverManager.getConnection(databaseProperties.jdbcURL, databaseProperties.user, databaseProperties.password)
if (!connection.isClosed) {
LOG.error("Connection to the database did not close automatically when performing a connection test!")
}
} catch {
case e: Exception => LOG.error("Something went wrong when attempting to connect to the database. %s", e.getMessage)
case e: Exception => LOG.error(s"Unable to connect to the database ${e.getMessage}")
}

// Spark likes working with properties, hence we create a properties object
Expand All @@ -72,7 +78,8 @@ object Main {

// NOTE
// Spark requires a View of a table to allow for SQL queries
// CreateOrReplaceTempView will create a temporary view of the table in memory. It is not persistent at this moment but you can run sql query on top of that.
// CreateOrReplaceTempView will create a temporary view of the table in memory.
// It is not persisted at this point, but you can run SQL queries on top of it.
// If you want to save it you can either persist or use saveAsTable to save.
table.createOrReplaceTempView(commandLineParameters.table)

Expand All @@ -83,9 +90,7 @@ object Main {
LOG.info("Spark support has been disabled!")

// connect
// Class.forName("org.mariadb.jdbc.Driver")
val connection = DriverManager.getConnection(databaseProperties.jdbcURL, databaseProperties.user, databaseProperties.password)
connection.isClosed

// execute query
val statement = connection.createStatement()
Expand All @@ -95,19 +100,15 @@ object Main {
val list = Iterator.from(0).takeWhile(_ => rs.next()).map(_ => rs.getString(1)).toList
println(list)

// while (rs.next()) {
// println(rs.getString(1)) //or rs.getString("column name");
// }

connection.isClosed
}
} catch {
case eie: ExceptionInInitializerError => {
case eie: ExceptionInInitializerError =>
LOG.error("__________________________________________________________________________________________")
LOG.error("Hadoop support is possibly wrongly configured or missing! " + eie.getException.getMessage)
LOG.error(s"Hadoop support is possibly wrongly configured or missing! ${eie.getException.getMessage}")
LOG.error("__________________________________________________________________________________________")
}
case e: Exception => LOG.error("Hadoop support is possibly wrongly configured or missing! " + e.getMessage)
case e: Exception => LOG.error(s"Hadoop support is possibly wrongly configured or missing! ${e.getMessage}")
LOG.error("Don't forget to specify the name of the database driver!")
}

}
Expand Down
33 changes: 17 additions & 16 deletions src/main/scala/io/parser/PropertiesParser.scala
Original file line number Diff line number Diff line change
Expand Up @@ -10,24 +10,25 @@ object PropertiesParser {
val lines = Source.fromFile(propertiesFileName).getLines.toList
val split = for (line <- lines) yield line.split(":")

// TODO Moms' Spaghetti Bolognese
var host = split.head(1) + ":" + split.head(2) + ":" + split.head(3)
.filterNot((x: Char) => x.equals('\"'))
host = host.replaceAll("\\s", "")
val port = split(1)(1)
.filterNot((x: Char) => x.equals('\"'))
.filterNot((x: Char) => x.isWhitespace)
val name = split(2)(1)
.filterNot((x: Char) => x.equals('\"'))
.filterNot((x: Char) => x.isWhitespace)
val password = split(3)(1)
.filterNot((x: Char) => x.equals('\"'))
.filterNot((x: Char) => x.isWhitespace)
val user = split(4)(1)
.filterNot((x: Char) => x.equals('\"'))
.filterNot((x: Char) => x.isWhitespace)
var port = split(1)(1)
var name = split(2)(1)
var password = split(3)(1)
var user = split(4)(1)
val properties = List(host, port, name, password, user)

// remove any backslashes and whitespaces
val formatted_properties = properties
.map(string => string.filterNot((x: Char) => x.equals('\"')))
.map(string => string.filterNot((x: Char) => x.isWhitespace))
host = formatted_properties.head
port = formatted_properties(1)
name = formatted_properties(2)
password = formatted_properties(3)
user = formatted_properties(4)

DatabaseProperties(host, user, password, port, name)
}

}
}

0 comments on commit 8d25279

Please sign in to comment.