001/* 002 * Copyright (c) 2007-2017 Xplenty, Inc. All Rights Reserved. 003 * 004 * Project and contact information: http://www.cascading.org/ 005 * 006 * This file is part of the Cascading project. 007 * 008 * Licensed under the Apache License, Version 2.0 (the "License"); 009 * you may not use this file except in compliance with the License. 010 * You may obtain a copy of the License at 011 * 012 * http://www.apache.org/licenses/LICENSE-2.0 013 * 014 * Unless required by applicable law or agreed to in writing, software 015 * distributed under the License is distributed on an "AS IS" BASIS, 016 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 017 * See the License for the specific language governing permissions and 018 * limitations under the License. 019 */ 020 021package cascading.tuple.hadoop.collect; 022 023import java.util.Collection; 024import java.util.Map; 025 026import cascading.flow.FlowProcess; 027import cascading.tuple.Tuple; 028import cascading.tuple.collect.SpillableProps; 029import cascading.tuple.collect.SpillableTupleList; 030import cascading.tuple.collect.SpillableTupleMap; 031import cascading.tuple.collect.TupleMapFactory; 032import org.apache.hadoop.conf.Configuration; 033 034/** 035 * 036 */ 037public class HadoopTupleMapFactory implements TupleMapFactory<Configuration> 038 { 039 private int capacity; 040 private float loadFactor; 041 private int mapThreshold; 042 private int listThreshold; 043 044 @Override 045 public void initialize( FlowProcess<? extends Configuration> flowProcess ) 046 { 047 capacity = SpillableTupleMap.getMapCapacity( flowProcess, SpillableProps.defaultMapInitialCapacity ); 048 loadFactor = SpillableTupleMap.getMapLoadFactor( flowProcess, SpillableProps.defaultMapLoadFactor ); 049 mapThreshold = SpillableTupleMap.getMapThreshold( flowProcess, SpillableProps.defaultMapThreshold ); 050 listThreshold = SpillableTupleList.getThreshold( flowProcess, SpillableProps.defaultListThreshold ); 051 } 052 053 @Override 054 public Map<Tuple, Collection<Tuple>> create( FlowProcess<? extends Configuration> flowProcess ) 055 { 056 return new HadoopSpillableTupleMap( capacity, loadFactor, mapThreshold, listThreshold, flowProcess ); 057 } 058 }