/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
| |
| package org.apache.wayang.profiler.java; |
| |
| import java.lang.management.ManagementFactory; |
| import java.lang.management.ThreadMXBean; |
| import java.util.Arrays; |
| import java.util.Collection; |
| import java.util.List; |
| import java.util.function.Supplier; |
| import org.apache.logging.log4j.LogManager; |
| import org.apache.logging.log4j.Logger; |
| import org.apache.wayang.core.api.Configuration; |
| import org.apache.wayang.core.optimizer.DefaultOptimizationContext; |
| import org.apache.wayang.core.optimizer.OptimizationContext; |
| import org.apache.wayang.core.plan.executionplan.Channel; |
| import org.apache.wayang.core.platform.ChannelDescriptor; |
| import org.apache.wayang.core.platform.ChannelInstance; |
| import org.apache.wayang.core.util.WayangArrays; |
| import org.apache.wayang.core.util.WayangCollections; |
| import org.apache.wayang.java.channels.CollectionChannel; |
| import org.apache.wayang.java.execution.JavaExecutor; |
| import org.apache.wayang.java.operators.JavaExecutionOperator; |
| import org.apache.wayang.profiler.util.ProfilingUtils; |
| |
| /** |
| * Allows to instrument an {@link JavaExecutionOperator}. |
| */ |
| public abstract class OperatorProfiler { |
| |
| protected final Logger logger = LogManager.getLogger(this.getClass()); |
| |
| public int cpuMhz; |
| |
| protected Supplier<JavaExecutionOperator> operatorGenerator; |
| |
| protected JavaExecutionOperator operator; |
| |
| protected JavaExecutor executor; |
| |
| protected final List<Supplier<?>> dataQuantumGenerators; |
| |
| private List<Long> inputCardinalities; |
| |
| public OperatorProfiler(Supplier<JavaExecutionOperator> operatorGenerator, |
| Supplier<?>... dataQuantumGenerators) { |
| this.operatorGenerator = operatorGenerator; |
| this.dataQuantumGenerators = Arrays.asList(dataQuantumGenerators); |
| this.executor = ProfilingUtils.fakeJavaExecutor(); |
| this.cpuMhz = Integer.parseInt(System.getProperty("wayang.java.cpu.mhz", "2700")); |
| } |
| |
| |
| public void prepare(long... inputCardinalities) { |
| this.operator = this.operatorGenerator.get(); |
| this.inputCardinalities = WayangArrays.asList(inputCardinalities); |
| } |
| |
| |
| /** |
| * Executes and profiles the profiling task. Requires that this instance is prepared. |
| */ |
| public Result run() { |
| final ThreadMXBean threadMXBean = ManagementFactory.getThreadMXBean(); |
| threadMXBean.setThreadCpuTimeEnabled(true); |
| ProfilingUtils.sleep(1000); |
| long startCpuTime = threadMXBean.getCurrentThreadCpuTime(); |
| final long outputCardinality = this.executeOperator(); |
| long endCpuTime = threadMXBean.getCurrentThreadCpuTime(); |
| |
| long cpuCycles = this.calculateCpuCycles(startCpuTime, endCpuTime); |
| return new Result( |
| this.inputCardinalities, |
| outputCardinality, |
| this.provideDiskBytes(), |
| this.provideNetworkBytes(), |
| cpuCycles |
| ); |
| } |
| |
| private long calculateCpuCycles(long startNanos, long endNanos) { |
| long passedNanos = endNanos - startNanos; |
| double cyclesPerNano = (this.cpuMhz * 1e6) / 1e9; |
| return Math.round(cyclesPerNano * passedNanos); |
| } |
| |
| protected long provideNetworkBytes() { |
| return 0L; |
| } |
| |
| protected long provideDiskBytes() { |
| return 0L; |
| } |
| |
| /** |
| * Executes the profiling task. Requires that this instance is prepared. |
| */ |
| protected abstract long executeOperator(); |
| |
| protected static CollectionChannel.Instance createChannelInstance(final Collection<?> collection) { |
| final CollectionChannel.Instance channelInstance = createChannelInstance(); |
| channelInstance.accept(collection); |
| return channelInstance; |
| } |
| |
| protected static CollectionChannel.Instance createChannelInstance() { |
| final ChannelDescriptor channelDescriptor = CollectionChannel.DESCRIPTOR; |
| final Channel channel = channelDescriptor.createChannel(null, new Configuration()); |
| return (CollectionChannel.Instance) channel.createInstance(null, null, -1); |
| } |
| |
| public JavaExecutionOperator getOperator() { |
| return this.operator; |
| } |
| |
| /** |
| * Utility method to invoke |
| * {@link JavaExecutionOperator#evaluate(ChannelInstance[], ChannelInstance[], JavaExecutor, OptimizationContext.OperatorContext)}. |
| */ |
| protected void evaluate(ChannelInstance[] inputs, |
| ChannelInstance[] outputs) { |
| OptimizationContext optimizationContext = new DefaultOptimizationContext(this.executor.getJob()); |
| final OptimizationContext.OperatorContext operatorContext = optimizationContext.addOneTimeOperator(operator); |
| operator.evaluate(inputs, outputs, this.executor, operatorContext); |
| } |
| |
| /** |
| * The result of a single profiling run. |
| */ |
| public static class Result { |
| |
| private final List<Long> inputCardinalities; |
| |
| private final long outputCardinality; |
| |
| private final long diskBytes, networkBytes; |
| |
| private final long cpuCycles; |
| |
| public Result(List<Long> inputCardinalities, long outputCardinality, long diskBytes, long networkBytes, long cpuCycles) { |
| this.inputCardinalities = inputCardinalities; |
| this.outputCardinality = outputCardinality; |
| this.diskBytes = diskBytes; |
| this.networkBytes = networkBytes; |
| this.cpuCycles = cpuCycles; |
| } |
| |
| public List<Long> getInputCardinalities() { |
| return this.inputCardinalities; |
| } |
| |
| public long getOutputCardinality() { |
| return this.outputCardinality; |
| } |
| |
| public long getDiskBytes() { |
| return this.diskBytes; |
| } |
| |
| public long getNetworkBytes() { |
| return this.networkBytes; |
| } |
| |
| public long getCpuCycles() { |
| return this.cpuCycles; |
| } |
| |
| @Override |
| public String toString() { |
| return "Result{" + |
| "inputCardinalities=" + this.inputCardinalities + |
| ", outputCardinality=" + this.outputCardinality + |
| ", diskBytes=" + this.diskBytes + |
| ", networkBytes=" + this.networkBytes + |
| ", cpuCycles=" + this.cpuCycles + |
| '}'; |
| } |
| |
| public String getCsvHeader() { |
| return String.join(",", WayangCollections.map(this.inputCardinalities, (index, card) -> "input_card_" + index)) + "," + |
| "output_card," + |
| "disk," + |
| "network," + |
| "cpu"; |
| } |
| |
| public String toCsvString() { |
| return String.join(",", WayangCollections.map(this.inputCardinalities, Object::toString)) + "," |
| + this.outputCardinality + "," |
| + this.diskBytes + "," |
| + this.networkBytes + "," |
| + this.cpuCycles; |
| } |
| } |
| |
| } |