-
Notifications
You must be signed in to change notification settings - Fork 38
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Common: add benchmarking module (close #370)
- Loading branch information
Showing
7 changed files
with
264 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,6 @@ | ||
// Point the Jmh configuration at the Test configuration's source directory, class directory
// and dependency classpath, so Jmh builds against the same values as Test.
sourceDirectory in Jmh := (sourceDirectory in Test).value | ||
classDirectory in Jmh := (classDirectory in Test).value | ||
dependencyClasspath in Jmh := (dependencyClasspath in Test).value | ||
// rewire tasks, so that 'jmh:run' automatically invokes 'jmh:compile' (otherwise a clean 'jmh:run' would fail) | ||
// 'jmh:compile' is in turn made to depend on 'test:compile'.
compile in Jmh := (compile in Jmh).dependsOn(compile in Test).value | ||
run in Jmh := (run in Jmh).dependsOn(Keys.compile in Jmh).evaluated |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,2 @@ | ||
# Set the SLF4J SimpleLogger level to "off" for the Assets and TestEnvironment loggers.
org.slf4j.simpleLogger.log.com.snowplowanalytics.snowplow.enrich.fs2.Assets=off | ||
org.slf4j.simpleLogger.log.com.snowplowanalytics.snowplow.enrich.fs2.test.TestEnvironment=off |
110 changes: 110 additions & 0 deletions
110
modules/bench/src/test/scala/com.snowplowanalytics.snowplow.enrich.bench/EnrichBench.scala
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,110 @@ | ||
/* | ||
* Copyright (c) 2020 Snowplow Analytics Ltd. All rights reserved. | ||
* | ||
* This program is licensed to you under the Apache License Version 2.0, | ||
* and you may not use this file except in compliance with the Apache License Version 2.0. | ||
* You may obtain a copy of the Apache License Version 2.0 at http://www.apache.org/licenses/LICENSE-2.0. | ||
* | ||
* Unless required by applicable law or agreed to in writing, | ||
* software distributed under the Apache License Version 2.0 is distributed on an | ||
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the Apache License Version 2.0 for the specific language governing permissions and limitations there under. | ||
*/ | ||
package com.snowplowanalytics.snowplow.enrich.bench | ||
|
||
import org.openjdk.jmh.annotations._ | ||
|
||
import java.util.concurrent.TimeUnit | ||
|
||
import cats.effect.{ContextShift, IO, Clock, Blocker} | ||
|
||
import fs2.Stream | ||
|
||
import com.snowplowanalytics.iglu.client.Client | ||
|
||
import com.snowplowanalytics.snowplow.enrich.common.enrichments.EnrichmentRegistry | ||
import com.snowplowanalytics.snowplow.enrich.common.loaders.ThriftLoader | ||
import com.snowplowanalytics.snowplow.enrich.fs2.test.TestEnvironment | ||
import com.snowplowanalytics.snowplow.enrich.fs2.{Enrich, Environment, EnrichSpec, Payload} | ||
|
||
import org.apache.http.message.BasicNameValuePair | ||
|
||
|
||
/**
 * JMH benchmarks that call `Enrich.enrichWith`, `ThriftLoader.toCollectorPayload` and
 * `Enrich.run` with the fixtures held in `EnrichBench.BenchState`.
 *
 * @example
 * {{{
 * jmh:run -i 15 -wi 10 -f1 -t1 EnrichBench
 * }}}
 */
@State(Scope.Thread)
@BenchmarkMode(Array(Mode.AverageTime))
@OutputTimeUnit(TimeUnit.MICROSECONDS)
class EnrichBench {

  implicit val ioClock: Clock[IO] = Clock.create[IO]

  /** Runs `Enrich.enrichWith` on the single raw payload, using a default `EnrichmentRegistry()`. */
  @Benchmark
  def measureEnrichWithMinimalPayload(state: EnrichBench.BenchState) = {
    implicit val shift: ContextShift[IO] = state.contextShift
    // Callback that ignores its argument and does nothing
    val noop = (_: Option[Long]) => IO.unit
    Enrich
      .enrichWith[IO](IO.pure(EnrichmentRegistry()), state.blocker, Client.IgluCentral, None, noop)(state.raw)
      .unsafeRunSync()
  }

  /** Runs `ThriftLoader.toCollectorPayload` on the bytes of the raw payload. */
  @Benchmark
  def measureToCollectorPayload(state: EnrichBench.BenchState) =
    ThriftLoader.toCollectorPayload(state.raw.data, Enrich.processor)

  /**
   * Drains the whole `Enrich.run` stream over the test environment.
   *
   * This benchmark was used to check whether running the whole `enrichWith` on a blocking
   * thread pool would improve performance. The results did not confirm it:
   * {{{
   * EnrichBench.measureRunWithNoEnrichments  avgt  15  341.144 ± 18.884  us/op  <- smaller blocker
   * EnrichBench.measureRunWithNoEnrichments  avgt  15  326.608 ± 16.714  us/op  <- wrapping blocker
   * EnrichBench.measureRunWithNoEnrichments  avgt  15  292.907 ± 15.894  us/op  <- no blocker at all
   * }}}
   * The "smaller blocker" was nevertheless kept, in the hope that it pays off once
   * enrichments performing actual IO are involved.
   */
  @Benchmark
  @OperationsPerInvocation(50) // 5 events repeated 10 times
  def measureRunWithNoEnrichments(state: EnrichBench.BenchState) = {
    implicit val shift: ContextShift[IO] = state.contextShift
    val drainPipeline: Environment[IO] => IO[Unit] =
      env => Enrich.run[IO](env).compile.drain
    state.useEnvironment(drainPipeline).unsafeRunSync()
  }
}
|
||
object EnrichBench {

  /**
   * Benchmark-scoped fixtures for the `EnrichBench` measurements.
   *
   * All fields are assigned by `setup()` once per trial. The blocker is allocated there and
   * released by `tearDown()`, so it stays usable for the whole duration of the trial.
   */
  @State(Scope.Benchmark)
  class BenchState {
    var raw: Payload[IO, Array[Byte]] = _
    var useEnvironment: (Environment[IO] => IO[Unit]) => IO[Unit] = _
    var contextShift: ContextShift[IO] = _
    var blocker: Blocker = _

    // Finalizer of the currently allocated blocker; a no-op until `setup()` has run
    private var releaseBlocker: IO[Unit] = IO.unit

    /** Builds the raw payload, the input stream, the environment runner, the context shift and the blocker. */
    @Setup(Level.Trial)
    def setup(): Unit = {
      raw = EnrichSpec.payload[IO]

      // Five collector payloads differing only in the "ip" querystring value (125.12.2.40 .. 125.12.2.44)
      val payloads = List.range(40, 45).map { lastOctet =>
        EnrichSpec.colllectorPayload.copy(
          querystring = new BasicNameValuePair("ip", s"125.12.2.$lastOctet") :: EnrichSpec.querystring
        )
      }
      // 5 payloads x 10 repetitions = 50 elements
      val input = Stream.emits(payloads).repeatN(10).map(cp => Payload(cp.toRaw, IO.unit)).covary[IO]

      useEnvironment = TestEnvironment.make(input).map(_.env).use(_: Environment[IO] => IO[Unit])

      contextShift = IO.contextShift(scala.concurrent.ExecutionContext.global)

      // `Blocker[IO].use(IO.pure)` would run the resource finalizer before handing the blocker
      // back, leaving the benchmarks with an already released blocker. Allocate it explicitly
      // and keep the finalizer for `tearDown()` instead.
      val (allocatedBlocker, release) = Blocker[IO].allocated.unsafeRunSync()
      blocker = allocatedBlocker
      releaseBlocker = release
    }

    /** Releases the blocker allocated by `setup()`. */
    @TearDown(Level.Trial)
    def tearDown(): Unit = {
      releaseBlocker.unsafeRunSync()
      // Reset so a repeated tear-down does not run the finalizer twice
      releaseBlocker = IO.unit
    }
  }
}
85 changes: 85 additions & 0 deletions
85
...s/bench/src/test/scala/com.snowplowanalytics.snowplow.enrich.bench/EtlPipelineBench.scala
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,85 @@ | ||
/* | ||
* Copyright (c) 2020 Snowplow Analytics Ltd. All rights reserved. | ||
* | ||
* This program is licensed to you under the Apache License Version 2.0, | ||
* and you may not use this file except in compliance with the Apache License Version 2.0. | ||
* You may obtain a copy of the Apache License Version 2.0 at http://www.apache.org/licenses/LICENSE-2.0. | ||
* | ||
* Unless required by applicable law or agreed to in writing, | ||
* software distributed under the Apache License Version 2.0 is distributed on an | ||
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the Apache License Version 2.0 for the specific language governing permissions and limitations there under. | ||
*/ | ||
package com.snowplowanalytics.snowplow.enrich.bench | ||
|
||
import org.openjdk.jmh.annotations._ | ||
|
||
import java.util.concurrent.TimeUnit | ||
|
||
import cats.Id | ||
import cats.data.Validated | ||
|
||
import cats.effect.{IO, Clock} | ||
|
||
import io.circe.Json | ||
|
||
import com.snowplowanalytics.iglu.client.{Resolver, Client, CirceValidator} | ||
|
||
import com.snowplowanalytics.snowplow.enrich.common.EtlPipeline | ||
import com.snowplowanalytics.snowplow.enrich.common.adapters.AdapterRegistry | ||
import com.snowplowanalytics.snowplow.enrich.common.enrichments.EnrichmentRegistry | ||
|
||
import com.snowplowanalytics.snowplow.enrich.fs2.{Enrich, EnrichSpec} | ||
|
||
import org.joda.time.DateTime | ||
|
||
/** JMH benchmarks running `EtlPipeline.processEvents` once in `IO` and once in `Id`. */
@State(Scope.Thread)
@BenchmarkMode(Array(Mode.AverageTime, Mode.Throughput))
@OutputTimeUnit(TimeUnit.MICROSECONDS)
class EtlPipelineBench {

  private implicit val ioClock: Clock[IO] = Clock.create[IO]

  // Clock for `Id` that reads the time straight from `System`
  private implicit val idClock: Clock[Id] = new Clock[Id] {
    def realTime(unit: TimeUnit): Id[Long] = {
      val nowMillis = System.currentTimeMillis()
      unit.convert(nowMillis, TimeUnit.MILLISECONDS)
    }

    def monotonic(unit: TimeUnit): Id[Long] = {
      val nowNanos = System.nanoTime()
      unit.convert(nowNanos, TimeUnit.NANOSECONDS)
    }
  }

  /** Processes one valid collector payload in `IO` and runs the effect synchronously. */
  @Benchmark
  def measureProcessEventsIO(state: EtlPipelineBench.BenchState) = {
    val collectorPayload = EnrichSpec.colllectorPayload
    // NOTE(review): this passes Client.IgluCentral, while the Id benchmark passes state.clientId
    // and state.clientIO is never read here - confirm the asymmetry is intended.
    EtlPipeline
      .processEvents[IO](
        state.adapterRegistry,
        state.enrichmentRegistryIo,
        Client.IgluCentral,
        Enrich.processor,
        state.dateTime,
        Validated.Valid(Some(collectorPayload))
      )
      .unsafeRunSync()
  }

  /** Processes one valid collector payload in `Id`. */
  @Benchmark
  def measureProcessEventsId(state: EtlPipelineBench.BenchState) = {
    val collectorPayload = EnrichSpec.colllectorPayload
    EtlPipeline.processEvents[Id](
      state.adapterRegistry,
      state.enrichmentRegistryId,
      state.clientId,
      Enrich.processor,
      state.dateTime,
      Validated.Valid(Some(collectorPayload))
    )
  }
}
|
||
object EtlPipelineBench {

  /** Benchmark-scoped arguments for `EtlPipeline.processEvents`, assigned once per trial by `setup()`. */
  @State(Scope.Benchmark)
  class BenchState {
    var dateTime: DateTime = _
    var adapterRegistry: AdapterRegistry = _
    var enrichmentRegistryId: EnrichmentRegistry[Id] = _
    var enrichmentRegistryIo: EnrichmentRegistry[IO] = _
    var clientId: Client[Id, Json] = _
    var clientIO: Client[IO, Json] = _

    @Setup(Level.Trial)
    def setup(): Unit = {
      // Iglu clients whose resolver is built from an empty list and `None`
      clientId = Client[Id, Json](Resolver(Nil, None), CirceValidator)
      clientIO = Client[IO, Json](Resolver(Nil, None), CirceValidator)

      // Registries created with their default arguments
      enrichmentRegistryId = EnrichmentRegistry[Id]()
      enrichmentRegistryIo = EnrichmentRegistry[IO]()
      adapterRegistry = new AdapterRegistry()

      // Fixed timestamp passed to every `processEvents` call
      dateTime = DateTime.parse("2010-06-30T01:20+02:00")
    }
  }
}
55 changes: 55 additions & 0 deletions
55
.../bench/src/test/scala/com.snowplowanalytics.snowplow.enrich.bench/ThriftLoaderBench.scala
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,55 @@ | ||
/* | ||
* Copyright (c) 2020 Snowplow Analytics Ltd. All rights reserved. | ||
* | ||
* This program is licensed to you under the Apache License Version 2.0, | ||
* and you may not use this file except in compliance with the Apache License Version 2.0. | ||
* You may obtain a copy of the Apache License Version 2.0 at http://www.apache.org/licenses/LICENSE-2.0. | ||
* | ||
* Unless required by applicable law or agreed to in writing, | ||
* software distributed under the Apache License Version 2.0 is distributed on an | ||
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the Apache License Version 2.0 for the specific language governing permissions and limitations there under. | ||
*/ | ||
package com.snowplowanalytics.snowplow.enrich.bench | ||
|
||
import org.openjdk.jmh.annotations._ | ||
import java.util.concurrent.TimeUnit | ||
|
||
import com.snowplowanalytics.snowplow.enrich.common.loaders.ThriftLoader | ||
import com.snowplowanalytics.snowplow.enrich.common.outputs.EnrichedEvent | ||
import com.snowplowanalytics.snowplow.enrich.fs2.{Enrich, EnrichSpec} | ||
|
||
/** JMH benchmarks for `ThriftLoader.toCollectorPayload` and `Enrich.encodeEvent`. */
@State(Scope.Thread)
@BenchmarkMode(Array(Mode.AverageTime))
@OutputTimeUnit(TimeUnit.NANOSECONDS)
class ThriftLoaderBench {

  /** Runs `ThriftLoader.toCollectorPayload` on the raw bytes held in `state`. */
  @Benchmark
  def measureToCollectorPayload(state: ThriftLoaderBench.BenchState) = {
    val rawBytes = state.data
    ThriftLoader.toCollectorPayload(rawBytes, Enrich.processor)
  }

  /** Runs `Enrich.encodeEvent` on the enriched event held in `state`. */
  @Benchmark
  def measureNormalize(state: ThriftLoaderBench.BenchState) =
    Enrich.encodeEvent(state.event)
}
|
||
object ThriftLoaderBench {

  /** Benchmark-scoped inputs: raw collector payload bytes and a partially populated enriched event. */
  @State(Scope.Benchmark)
  class BenchState {
    var data: Array[Byte] = _
    var event: EnrichedEvent = _

    @Setup(Level.Trial)
    def setup(): Unit = {
      // Populate the event on a local reference first, then publish it to the field
      val enriched = new EnrichedEvent()
      enriched.setApp_id("foo")
      enriched.setEvent_id("deadbeef-dead-dead-dead-deaddeafbeef")
      enriched.setUser_ipaddress("128.0.1.2")
      enriched.setUnstruct_event("""{"some": "json"}""")
      event = enriched

      data = EnrichSpec.colllectorPayload.toRaw
    }
  }
}
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters