/* * Copyright 2018 Alex Tucker * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package uk.org.floop.sparqlTestRunner import java.io._ import java.net.URI import java.nio.charset.StandardCharsets import java.nio.file.{Files, Path} import java.util import org.apache.http.HttpHeaders import org.apache.http.auth.{AuthScope, UsernamePasswordCredentials} import org.apache.http.client.protocol.HttpClientContext import org.apache.http.client.utils.URIUtils import org.apache.http.impl.auth.BasicScheme import org.apache.http.impl.client.{BasicAuthCache, BasicCredentialsProvider, HttpClients} import org.apache.http.message.BasicHeader import org.apache.jena.query._ import org.apache.jena.rdf.model.ModelFactory import org.apache.jena.riot.RDFDataMgr import org.apache.jena.riot.system.RiotLib import org.apache.jena.sparql.engine.http.QueryEngineHTTP import scopt.OptionParser import scala.io.Source import scala.xml.{NodeSeq, PrettyPrinter} case class Config(dir: File = new File("tests/sparql"), report: File = new File("reports/TESTS-sparql-test-runner.xml"), ignoreFail: Boolean = false, endpoint: Option[URI] = None, auth: Option[Either[String, String]] = None, params: Map[String, String] = Map.empty, froms: List[String] = List.empty, data: Seq[File] = Seq()) object Run extends App { val packageVersion: String = getClass.getPackage.getImplementationVersion val parser: OptionParser[Config] = new scopt.OptionParser[Config]("sparql-testrunner") { head("sparql-test-runner", packageVersion) opt[File]('t', "testdir") optional() valueName "<dir>" action { (x, c) => c.copy(dir = x) } text "location of SPARQL queries to run, defaults to tests/sparql" opt[File]('r', "report") optional() valueName "<report>" action { (x, c) => c.copy(report = x) } text "file to output XML test report, defaults to reports/TESTS-sparql-test-runner.xml" opt[Unit]('i', "ignorefail") optional() action { (_, c) => c.copy(ignoreFail = true) } text "exit with success even if there are reported failures" opt[URI]('s', name= "service") optional() valueName "<HTTP URI>" action { (x, c) => c.copy(endpoint = Some(x)) } text "SPARQL endpoint to run the queries against" opt[String]('a', "auth") optional() valueName "<user:pass>" action { (x, c) => c.copy(auth = Some(Left(x))) } text "basic authentication username:password" opt[String]('k', "token") optional() valueName "<user:pass>" action { (x, c) => c.copy(auth = Some(Right(x))) } text "oAuth token" opt[Map[String,String]]('p', name="param") optional() valueName "l=\"somelabel\"@en,n=<some-uri>" action { (x, c) => c.copy(params = x) } text "variables to replace in query" opt[String]('f', name="from") optional() unbounded() valueName "<some-uri>" action { (x, c) => c.copy(froms = c.froms :+ x) } text "graphs to query" arg[File]("<file>...") unbounded() optional() action { (x, c) => c.copy(data = c.data :+ x) } text "data to run the queries against" checkConfig( c => if (!c.dir.exists || !c.dir.isDirectory) { failure("Tests directory (" + c.dir.toString + ") doesn't exist or isn't a directory.") } else if (c.endpoint.isDefined && c.data.nonEmpty) { failure("Specify either a SPARQL endpoint or data files, not both.") } else if (c.endpoint.isEmpty && c.data.isEmpty) { failure("Must specify either a SPARQL endpoint or some data files.") } else success ) } parser.parse(args, Config()) match { case Some(config) => val queryExecution: Query => QueryExecution = (query: Query) => { val exec = config.endpoint match { case Some(uri) => // Querying a remote endpoint; if authentication is required, need to set up pre-emptive auth, // see https://hc.apache.org/httpcomponents-client-ga/tutorial/html/authentication.html config.auth match { case Some(Left(userpass)) => val target = URIUtils.extractHost(uri) // new HttpHost(uri.getHost, uri.getPort) val credsProvider = new BasicCredentialsProvider() credsProvider.setCredentials( new AuthScope(target.getHostName, target.getPort), new UsernamePasswordCredentials(userpass)) val authCache = new BasicAuthCache() authCache.put(target, new BasicScheme()) val context = HttpClientContext.create() context.setCredentialsProvider(credsProvider) context.setAuthCache(authCache) val client = HttpClients.custom.build() QueryExecutionFactory.sparqlService (uri.toString, query, client, context) case Some(Right(token)) => val authHeader = new BasicHeader(HttpHeaders.AUTHORIZATION, "Bearer " + token) val headers = new util.ArrayList[BasicHeader] headers.add(authHeader) val client = HttpClients.custom.setDefaultHeaders(headers).build() QueryExecutionFactory.sparqlService(uri.toString, query, client) case None => QueryExecutionFactory.sparqlService(uri.toString, query) } case None => val dataset = DatasetFactory.create for (d <- config.data) { RDFDataMgr.read(dataset, d.toString) } val union = ModelFactory.createDefaultModel union.add(dataset.getDefaultModel) union.add(dataset.getUnionModel) dataset.close() QueryExecutionFactory.create(query, union) } // if this is an HTTP executor, then we can add the FROM graphs as part of the protocol exec match { case httpExec: QueryEngineHTTP => for (g <- config.froms) { httpExec.addDefaultGraph(g) } httpExec case other => other } } val (error, results) = runTestsUnder(config.dir, config.params, queryExecution, config.dir.toPath) for (dir <- Option(config.report.getParentFile)) { dir.mkdirs } val pp = new PrettyPrinter(80, 2) val pw = new PrintWriter(config.report) pw.write(pp.format(<testsuites>{results}</testsuites>)) pw.close() System.exit(if (error && !config.ignoreFail) 1 else 0) case None => } def runTestsUnder(dir: File, params: Map[String, String], queryExecution: Query => QueryExecution, root: Path): (Boolean, NodeSeq) = { var testSuites = NodeSeq.Empty var testCases = NodeSeq.Empty var overallError = false var errors = 0 var skipped = 0 var tests = 0 val timeSuiteStart = System.currentTimeMillis() var subSuiteTimes = 0L for (f <- dir.listFiles) yield { if (f.isDirectory) { val subSuiteStart = System.currentTimeMillis() val (error, subSuites) = runTestsUnder(f, params, queryExecution, root) testSuites ++= subSuites overallError |= error subSuiteTimes += (System.currentTimeMillis() - subSuiteStart) } else if (f.isFile && f.getName.endsWith(".sparql")) { val timeTestStart = System.currentTimeMillis() val relativePath = root.relativize(f.toPath).toString val className = relativePath.substring(0, relativePath.lastIndexOf('.')).replace(File.pathSeparatorChar, '.') val comment = { val queryLines = Source.fromFile(f).getLines() if (queryLines.hasNext) { val line = queryLines.next() if (line.startsWith("# ")) line.substring(2) else line } else className } tests += 1 val rawQuery = new String(Files.readAllBytes(f.toPath), StandardCharsets.UTF_8) val query = if (params.isEmpty) { QueryFactory.create(rawQuery) } else { val parameterizedSparqlString = new ParameterizedSparqlString(rawQuery) for ( (k, v) <- params ) { parameterizedSparqlString.setParam(k, RiotLib.parse(v)) } parameterizedSparqlString.asQuery } val exec = queryExecution(query) try { if (query.isSelectType) { var results = exec.execSelect() val nonEmptyResults = results.hasNext val timeTaken = (System.currentTimeMillis() - timeTestStart).toFloat / 1000 testCases = testCases ++ <testcase name={comment} class={className} time={timeTaken.toString}> { val out = new ByteArrayOutputStream ResultSetFormatter.outputAsCSV(out, results) val actualResults = out.toString("utf-8") val expect = new File(f.getPath.substring(0, f.getPath.lastIndexOf('.')) + ".expected") if (expect.exists && expect.isFile) { val expectedResults = new String(Files.readAllBytes(expect.toPath), StandardCharsets.UTF_8) if (actualResults != expectedResults) { errors += 1 System.err.println(s"Testcase $comment\nExpected:\n$expectedResults\nActual:\n$actualResults") <error message={"Expected: \n" + expectedResults + "\nGot: \n" + actualResults}/> } } else { // assume there should be no results if (nonEmptyResults) { errors += 1 System.err.println(s"Testcase $comment\nExpected empty result set, got:\n$actualResults") <failure message={s"Expected empty result set, got:\n$actualResults"}/> } } } </testcase> } else if (query.isAskType) { val result = exec.execAsk() val timeTaken = (System.currentTimeMillis() - timeTestStart).toFloat / 1000 testCases = testCases ++ <testcase name={comment} class={className} time={timeTaken.toString}>{ if (result) { errors += 1 System.err.println(s"Testcase $comment\nExpected ASK query to return FALSE") <failure message={"Constraint violated"}/> }}</testcase> } else { skipped += 1 System.out.println(s"Skipped testcase $comment") testCases = testCases ++ <testcase name={comment} class={className}> <skipped/> </testcase> } } catch { case e: Exception => testCases = testCases ++ <testcase name={comment} class={className} time={((System.currentTimeMillis() - timeTestStart).toFloat / 1000).toString}> <error message={"Exception running query: " + e.getMessage}/> </testcase> } } } if (errors > 0) { overallError = true } val testSuiteTime = (System.currentTimeMillis() - timeSuiteStart - subSuiteTimes).toFloat / 1000 val suiteName = { val relativeName = root.toAbsolutePath.getParent.relativize(dir.toPath.toAbsolutePath).toString if (relativeName.length == 0) { "root" } else { relativeName } } (overallError, testSuites ++ <testsuite errors={errors.toString} tests={tests.toString} time={testSuiteTime.toString} name={suiteName} skipped={skipped.toString}> {testCases} </testsuite>) } }