/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.mapred;
import org.apache.hadoop.fs.BlockLocation;
import org.apache.hadoop.net.NetworkTopology;
import junit.framework.TestCase;
public class TestGetSplitHosts extends TestCase {
public void testGetSplitHosts() throws Exception {
int numBlocks = 3;
int block1Size = 100, block2Size = 150, block3Size = 75;
int fileSize = block1Size + block2Size + block3Size;
int replicationFactor = 3;
NetworkTopology clusterMap = new NetworkTopology();
BlockLocation[] bs = new BlockLocation[numBlocks];
String [] block1Hosts = {"host1","host2","host3"};
String [] block1Names = {"host1:100","host2:100","host3:100"};
String [] block1Racks = {"/rack1/","/rack1/","/rack2/"};
String [] block1Paths = new String[replicationFactor];
for (int i = 0; i < replicationFactor; i++) {
block1Paths[i] = block1Racks[i]+block1Names[i];
}
bs[0] = new BlockLocation(block1Names,block1Hosts,
block1Paths,0,block1Size);
String [] block2Hosts = {"host4","host5","host6"};
String [] block2Names = {"host4:100","host5:100","host6:100"};
String [] block2Racks = {"/rack2/","/rack3/","/rack3/"};
String [] block2Paths = new String[replicationFactor];
for (int i = 0; i < replicationFactor; i++) {
block2Paths[i] = block2Racks[i]+block2Names[i];
}
bs[1] = new BlockLocation(block2Names,block2Hosts,
block2Paths,block1Size,block2Size);
String [] block3Hosts = {"host1","host7","host8"};
String [] block3Names = {"host1:100","host7:100","host8:100"};
String [] block3Racks = {"/rack1/","/rack4/","/rack4/"};
String [] block3Paths = new String[replicationFactor];
for (int i = 0; i < replicationFactor; i++) {
block3Paths[i] = block3Racks[i]+block3Names[i];
}
bs[2] = new BlockLocation(block3Names,block3Hosts,
block3Paths,block1Size+block2Size,
block3Size);
SequenceFileInputFormat< String, String> sif =
new SequenceFileInputFormat<String,String>();
String [] hosts = sif.getSplitHosts(bs, 0, fileSize, clusterMap);
// Contributions By Racks are
// Rack1 175
// Rack2 275
// Rack3 150
// So, Rack2 hosts, host4 and host 3 should be returned
// even if their individual contribution is not the highest
assertTrue (hosts.length == replicationFactor);
assertTrue(hosts[0].equalsIgnoreCase("host4"));
assertTrue(hosts[1].equalsIgnoreCase("host3"));
assertTrue(hosts[2].equalsIgnoreCase("host1"));
// Now Create the blocks without topology information
bs[0] = new BlockLocation(block1Names,block1Hosts,0,block1Size);
bs[1] = new BlockLocation(block2Names,block2Hosts,block1Size,block2Size);
bs[2] = new BlockLocation(block3Names,block3Hosts,block1Size+block2Size,
block3Size);
hosts = sif.getSplitHosts(bs, 0, fileSize, clusterMap);
// host1 makes the highest contribution among all hosts
// So, that should be returned before others
assertTrue (hosts.length == replicationFactor);
assertTrue(hosts[0].equalsIgnoreCase("host1"));
}
}