blob: a559ff80c48d6ce5143a145c3dd7abc635f5a3f8 [file] [log] [blame]
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
using System;
using System.IO;
using System.Linq;
using Org.Apache.REEF.IMRU.API;
using Org.Apache.REEF.IMRU.OnREEF.Parameters;
using Org.Apache.REEF.IMRU.OnREEF.ResultHandler;
using Org.Apache.REEF.IO.FileSystem.Local;
using Org.Apache.REEF.IO.PartitionedData.Random;
using Org.Apache.REEF.Tang.Annotations;
using Org.Apache.REEF.Tang.Implementations.Tang;
using Org.Apache.REEF.Tang.Interface;
using Org.Apache.REEF.Tang.Util;
using Org.Apache.REEF.Wake.StreamingCodec.CommonStreamingCodecs;
namespace Org.Apache.REEF.IMRU.Examples.MapperCount
{
/// <summary>
/// A simple IMRU program that counts the number of map function instances launched.
/// </summary>
public sealed class MapperCount
{
private readonly IIMRUClient _imruClient;
[Inject]
private MapperCount(IIMRUClient imruClient)
{
_imruClient = imruClient;
}
/// <summary>
/// Runs the actual mapper count job
/// </summary>
/// <returns>The number of MapFunction instances that are part of the job.</returns>
public int Run(int numberofMappers, string outputFile, IConfiguration fileSystemConfig)
{
var results = _imruClient.Submit<int, int, int, Stream>(
new IMRUJobDefinitionBuilder()
.SetMapFunctionConfiguration(IMRUMapConfiguration<int, int>.ConfigurationModule
.Set(IMRUMapConfiguration<int, int>.MapFunction, GenericType<IdentityMapFunction>.Class)
.Build())
.SetUpdateFunctionConfiguration(
IMRUUpdateConfiguration<int, int, int>.ConfigurationModule
.Set(IMRUUpdateConfiguration<int, int, int>.UpdateFunction,
GenericType<MapperCountUpdateFunction>.Class)
.Build())
.SetMapInputCodecConfiguration(IMRUCodecConfiguration<int>.ConfigurationModule
.Set(IMRUCodecConfiguration<int>.Codec, GenericType<IntStreamingCodec>.Class)
.Build())
.SetUpdateFunctionCodecsConfiguration(IMRUCodecConfiguration<int>.ConfigurationModule
.Set(IMRUCodecConfiguration<int>.Codec, GenericType<IntStreamingCodec>.Class)
.Build())
.SetReduceFunctionConfiguration(IMRUReduceFunctionConfiguration<int>.ConfigurationModule
.Set(IMRUReduceFunctionConfiguration<int>.ReduceFunction,
GenericType<IntSumReduceFunction>.Class)
.Build())
.SetPartitionedDatasetConfiguration(
RandomInputDataConfiguration.ConfigurationModule.Set(
RandomInputDataConfiguration.NumberOfPartitions,
numberofMappers.ToString()).Build())
.SetResultHandlerConfiguration(
TangFactory.GetTang()
.NewConfigurationBuilder(fileSystemConfig)
.BindImplementation(GenericType<IIMRUResultHandler<int>>.Class,
GenericType<WriteResultHandler<int>>.Class)
.BindNamedParameter(typeof(ResultOutputLocation), outputFile)
.Build())
.SetMapTaskCores(2)
.SetUpdateTaskCores(3)
.SetJobName("MapperCount")
.SetNumberOfMappers(numberofMappers)
.Build());
if (results != null)
{
return results.First();
}
return -1;
}
}
}