blob: 53f980bfcf83539d0dbf39b546ed8b2e83c362a2 [file] [log] [blame]
<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
<html lang="en">
<head>
<title>Source code</title>
<link rel="stylesheet" type="text/css" href="../../../../../../stylesheet.css" title="Style">
</head>
<body>
<div class="sourceContainer">
<pre><span class="sourceLineNo">001</span>/*<a name="line.1"></a>
<span class="sourceLineNo">002</span> * Licensed to the Apache Software Foundation (ASF) under one<a name="line.2"></a>
<span class="sourceLineNo">003</span> * or more contributor license agreements. See the NOTICE file<a name="line.3"></a>
<span class="sourceLineNo">004</span> * distributed with this work for additional information<a name="line.4"></a>
<span class="sourceLineNo">005</span> * regarding copyright ownership. The ASF licenses this file<a name="line.5"></a>
<span class="sourceLineNo">006</span> * to you under the Apache License, Version 2.0 (the<a name="line.6"></a>
<span class="sourceLineNo">007</span> * "License"); you may not use this file except in compliance<a name="line.7"></a>
<span class="sourceLineNo">008</span> * with the License. You may obtain a copy of the License at<a name="line.8"></a>
<span class="sourceLineNo">009</span> *<a name="line.9"></a>
<span class="sourceLineNo">010</span> * http://www.apache.org/licenses/LICENSE-2.0<a name="line.10"></a>
<span class="sourceLineNo">011</span> *<a name="line.11"></a>
<span class="sourceLineNo">012</span> * Unless required by applicable law or agreed to in writing, software<a name="line.12"></a>
<span class="sourceLineNo">013</span> * distributed under the License is distributed on an "AS IS" BASIS,<a name="line.13"></a>
<span class="sourceLineNo">014</span> * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.<a name="line.14"></a>
<span class="sourceLineNo">015</span> * See the License for the specific language governing permissions and<a name="line.15"></a>
<span class="sourceLineNo">016</span> * limitations under the License.<a name="line.16"></a>
<span class="sourceLineNo">017</span> */<a name="line.17"></a>
<span class="sourceLineNo">018</span>package org.apache.hadoop.hbase.fs;<a name="line.18"></a>
<span class="sourceLineNo">019</span><a name="line.19"></a>
<span class="sourceLineNo">020</span>import edu.umd.cs.findbugs.annotations.Nullable;<a name="line.20"></a>
<span class="sourceLineNo">021</span>import java.io.Closeable;<a name="line.21"></a>
<span class="sourceLineNo">022</span>import java.io.IOException;<a name="line.22"></a>
<span class="sourceLineNo">023</span>import java.lang.reflect.Field;<a name="line.23"></a>
<span class="sourceLineNo">024</span>import java.lang.reflect.InvocationHandler;<a name="line.24"></a>
<span class="sourceLineNo">025</span>import java.lang.reflect.InvocationTargetException;<a name="line.25"></a>
<span class="sourceLineNo">026</span>import java.lang.reflect.Method;<a name="line.26"></a>
<span class="sourceLineNo">027</span>import java.lang.reflect.Modifier;<a name="line.27"></a>
<span class="sourceLineNo">028</span>import java.lang.reflect.Proxy;<a name="line.28"></a>
<span class="sourceLineNo">029</span>import java.lang.reflect.UndeclaredThrowableException;<a name="line.29"></a>
<span class="sourceLineNo">030</span>import java.net.URI;<a name="line.30"></a>
<span class="sourceLineNo">031</span>import org.apache.hadoop.conf.Configuration;<a name="line.31"></a>
<span class="sourceLineNo">032</span>import org.apache.hadoop.fs.FSDataOutputStream;<a name="line.32"></a>
<span class="sourceLineNo">033</span>import org.apache.hadoop.fs.FileSystem;<a name="line.33"></a>
<span class="sourceLineNo">034</span>import org.apache.hadoop.fs.FilterFileSystem;<a name="line.34"></a>
<span class="sourceLineNo">035</span>import org.apache.hadoop.fs.LocalFileSystem;<a name="line.35"></a>
<span class="sourceLineNo">036</span>import org.apache.hadoop.fs.Path;<a name="line.36"></a>
<span class="sourceLineNo">037</span>import org.apache.hadoop.hbase.ServerName;<a name="line.37"></a>
<span class="sourceLineNo">038</span>import org.apache.hadoop.hbase.util.CommonFSUtils;<a name="line.38"></a>
<span class="sourceLineNo">039</span>import org.apache.hadoop.hbase.util.ReflectionUtils;<a name="line.39"></a>
<span class="sourceLineNo">040</span>import org.apache.hadoop.hbase.wal.AbstractFSWALProvider;<a name="line.40"></a>
<span class="sourceLineNo">041</span>import org.apache.hadoop.hdfs.DFSClient;<a name="line.41"></a>
<span class="sourceLineNo">042</span>import org.apache.hadoop.hdfs.DistributedFileSystem;<a name="line.42"></a>
<span class="sourceLineNo">043</span>import org.apache.hadoop.hdfs.protocol.BlockStoragePolicy;<a name="line.43"></a>
<span class="sourceLineNo">044</span>import org.apache.hadoop.hdfs.protocol.ClientProtocol;<a name="line.44"></a>
<span class="sourceLineNo">045</span>import org.apache.hadoop.hdfs.protocol.DatanodeInfo;<a name="line.45"></a>
<span class="sourceLineNo">046</span>import org.apache.hadoop.hdfs.protocol.HdfsFileStatus;<a name="line.46"></a>
<span class="sourceLineNo">047</span>import org.apache.hadoop.hdfs.protocol.LocatedBlock;<a name="line.47"></a>
<span class="sourceLineNo">048</span>import org.apache.hadoop.hdfs.protocol.LocatedBlocks;<a name="line.48"></a>
<span class="sourceLineNo">049</span>import org.apache.hadoop.hdfs.server.blockmanagement.BlockStoragePolicySuite;<a name="line.49"></a>
<span class="sourceLineNo">050</span>import org.apache.hadoop.ipc.RPC;<a name="line.50"></a>
<span class="sourceLineNo">051</span>import org.apache.hadoop.util.Progressable;<a name="line.51"></a>
<span class="sourceLineNo">052</span>import org.apache.yetus.audience.InterfaceAudience;<a name="line.52"></a>
<span class="sourceLineNo">053</span>import org.slf4j.Logger;<a name="line.53"></a>
<span class="sourceLineNo">054</span>import org.slf4j.LoggerFactory;<a name="line.54"></a>
<span class="sourceLineNo">055</span><a name="line.55"></a>
<span class="sourceLineNo">056</span>/**<a name="line.56"></a>
<span class="sourceLineNo">057</span> * An encapsulation for the FileSystem object that hbase uses to access data. This class allows the<a name="line.57"></a>
<span class="sourceLineNo">058</span> * flexibility of using separate filesystem objects for reading and writing hfiles and wals.<a name="line.58"></a>
<span class="sourceLineNo">059</span> */<a name="line.59"></a>
<span class="sourceLineNo">060</span>@InterfaceAudience.Private<a name="line.60"></a>
<span class="sourceLineNo">061</span>public class HFileSystem extends FilterFileSystem {<a name="line.61"></a>
<span class="sourceLineNo">062</span> public static final Logger LOG = LoggerFactory.getLogger(HFileSystem.class);<a name="line.62"></a>
<span class="sourceLineNo">063</span><a name="line.63"></a>
<span class="sourceLineNo">064</span> private final FileSystem noChecksumFs; // read hfile data from storage<a name="line.64"></a>
<span class="sourceLineNo">065</span> private final boolean useHBaseChecksum;<a name="line.65"></a>
<span class="sourceLineNo">066</span> private static volatile byte unspecifiedStoragePolicyId = Byte.MIN_VALUE;<a name="line.66"></a>
<span class="sourceLineNo">067</span><a name="line.67"></a>
<span class="sourceLineNo">068</span> /**<a name="line.68"></a>
<span class="sourceLineNo">069</span> * Create a FileSystem object for HBase regionservers.<a name="line.69"></a>
<span class="sourceLineNo">070</span> * @param conf The configuration to be used for the filesystem<a name="line.70"></a>
<span class="sourceLineNo">071</span> * @param useHBaseChecksum if true, then use checksum verification in hbase, otherwise delegate<a name="line.71"></a>
<span class="sourceLineNo">072</span> * checksum verification to the FileSystem.<a name="line.72"></a>
<span class="sourceLineNo">073</span> */<a name="line.73"></a>
<span class="sourceLineNo">074</span> public HFileSystem(Configuration conf, boolean useHBaseChecksum) throws IOException {<a name="line.74"></a>
<span class="sourceLineNo">075</span><a name="line.75"></a>
<span class="sourceLineNo">076</span> // Create the default filesystem with checksum verification switched on.<a name="line.76"></a>
<span class="sourceLineNo">077</span> // By default, any operation to this FilterFileSystem occurs on<a name="line.77"></a>
<span class="sourceLineNo">078</span> // the underlying filesystem that has checksums switched on.<a name="line.78"></a>
<span class="sourceLineNo">079</span> // This FS#get(URI, conf) clearly indicates in the javadoc that if the FS is<a name="line.79"></a>
<span class="sourceLineNo">080</span> // not created it will initialize the FS and return that created FS. If it is<a name="line.80"></a>
<span class="sourceLineNo">081</span> // already created it will just return the FS that was already created.<a name="line.81"></a>
<span class="sourceLineNo">082</span> // We take pains to funnel all of our FileSystem instantiation through this call to ensure<a name="line.82"></a>
<span class="sourceLineNo">083</span> // we never need to call FS.initialize ourselves so that we do not have to track any state to<a name="line.83"></a>
<span class="sourceLineNo">084</span> // avoid calling initialize more than once.<a name="line.84"></a>
<span class="sourceLineNo">085</span> this.fs = FileSystem.get(getDefaultUri(conf), conf);<a name="line.85"></a>
<span class="sourceLineNo">086</span> this.useHBaseChecksum = useHBaseChecksum;<a name="line.86"></a>
<span class="sourceLineNo">087</span><a name="line.87"></a>
<span class="sourceLineNo">088</span> // disable checksum verification for local fileSystem, see HBASE-11218<a name="line.88"></a>
<span class="sourceLineNo">089</span> if (fs instanceof LocalFileSystem) {<a name="line.89"></a>
<span class="sourceLineNo">090</span> fs.setWriteChecksum(false);<a name="line.90"></a>
<span class="sourceLineNo">091</span> fs.setVerifyChecksum(false);<a name="line.91"></a>
<span class="sourceLineNo">092</span> }<a name="line.92"></a>
<span class="sourceLineNo">093</span><a name="line.93"></a>
<span class="sourceLineNo">094</span> addLocationsOrderInterceptor(conf);<a name="line.94"></a>
<span class="sourceLineNo">095</span><a name="line.95"></a>
<span class="sourceLineNo">096</span> // If hbase checksum verification is switched on, then create a new<a name="line.96"></a>
<span class="sourceLineNo">097</span> // filesystem object that has cksum verification turned off.<a name="line.97"></a>
<span class="sourceLineNo">098</span> // We will avoid verifying checksums in the fs client, instead do it<a name="line.98"></a>
<span class="sourceLineNo">099</span> // inside of hbase.<a name="line.99"></a>
<span class="sourceLineNo">100</span> // If this is the local file system hadoop has a bug where seeks<a name="line.100"></a>
<span class="sourceLineNo">101</span> // do not go to the correct location if setVerifyChecksum(false) is called.<a name="line.101"></a>
<span class="sourceLineNo">102</span> // This manifests itself in that incorrect data is read and HFileBlocks won't be able to read<a name="line.102"></a>
<span class="sourceLineNo">103</span> // their header magic numbers. See HBASE-5885<a name="line.103"></a>
<span class="sourceLineNo">104</span> if (useHBaseChecksum &amp;&amp; !(fs instanceof LocalFileSystem)) {<a name="line.104"></a>
<span class="sourceLineNo">105</span> conf = new Configuration(conf);<a name="line.105"></a>
<span class="sourceLineNo">106</span> conf.setBoolean("dfs.client.read.shortcircuit.skip.checksum", true);<a name="line.106"></a>
<span class="sourceLineNo">107</span> this.noChecksumFs = maybeWrapFileSystem(newInstanceFileSystem(conf), conf);<a name="line.107"></a>
<span class="sourceLineNo">108</span> this.noChecksumFs.setVerifyChecksum(false);<a name="line.108"></a>
<span class="sourceLineNo">109</span> } else {<a name="line.109"></a>
<span class="sourceLineNo">110</span> this.noChecksumFs = maybeWrapFileSystem(fs, conf);<a name="line.110"></a>
<span class="sourceLineNo">111</span> }<a name="line.111"></a>
<span class="sourceLineNo">112</span><a name="line.112"></a>
<span class="sourceLineNo">113</span> this.fs = maybeWrapFileSystem(this.fs, conf);<a name="line.113"></a>
<span class="sourceLineNo">114</span> }<a name="line.114"></a>
<span class="sourceLineNo">115</span><a name="line.115"></a>
<span class="sourceLineNo">116</span> /**<a name="line.116"></a>
<span class="sourceLineNo">117</span> * Wrap a FileSystem object within a HFileSystem. The noChecksumFs and writefs are both set to be<a name="line.117"></a>
<span class="sourceLineNo">118</span> * the same specified fs. Do not verify hbase-checksums while reading data from filesystem.<a name="line.118"></a>
<span class="sourceLineNo">119</span> * @param fs Set the noChecksumFs and writeFs to this specified filesystem.<a name="line.119"></a>
<span class="sourceLineNo">120</span> */<a name="line.120"></a>
<span class="sourceLineNo">121</span> public HFileSystem(FileSystem fs) {<a name="line.121"></a>
<span class="sourceLineNo">122</span> this.fs = fs;<a name="line.122"></a>
<span class="sourceLineNo">123</span> this.noChecksumFs = fs;<a name="line.123"></a>
<span class="sourceLineNo">124</span> this.useHBaseChecksum = false;<a name="line.124"></a>
<span class="sourceLineNo">125</span> }<a name="line.125"></a>
<span class="sourceLineNo">126</span><a name="line.126"></a>
<span class="sourceLineNo">127</span> /**<a name="line.127"></a>
<span class="sourceLineNo">128</span> * Returns the filesystem that is specially setup for doing reads from storage. This object avoids<a name="line.128"></a>
<span class="sourceLineNo">129</span> * doing checksum verifications for reads.<a name="line.129"></a>
<span class="sourceLineNo">130</span> * @return The FileSystem object that can be used to read data from files.<a name="line.130"></a>
<span class="sourceLineNo">131</span> */<a name="line.131"></a>
<span class="sourceLineNo">132</span> public FileSystem getNoChecksumFs() {<a name="line.132"></a>
<span class="sourceLineNo">133</span> return noChecksumFs;<a name="line.133"></a>
<span class="sourceLineNo">134</span> }<a name="line.134"></a>
<span class="sourceLineNo">135</span><a name="line.135"></a>
<span class="sourceLineNo">136</span> /**<a name="line.136"></a>
<span class="sourceLineNo">137</span> * Returns the underlying filesystem<a name="line.137"></a>
<span class="sourceLineNo">138</span> * @return The underlying FileSystem for this FilterFileSystem object.<a name="line.138"></a>
<span class="sourceLineNo">139</span> */<a name="line.139"></a>
<span class="sourceLineNo">140</span> public FileSystem getBackingFs() throws IOException {<a name="line.140"></a>
<span class="sourceLineNo">141</span> return fs;<a name="line.141"></a>
<span class="sourceLineNo">142</span> }<a name="line.142"></a>
<span class="sourceLineNo">143</span><a name="line.143"></a>
<span class="sourceLineNo">144</span> /**<a name="line.144"></a>
<span class="sourceLineNo">145</span> * Set the source path (directory/file) to the specified storage policy.<a name="line.145"></a>
<span class="sourceLineNo">146</span> * @param path The source path (directory/file).<a name="line.146"></a>
<span class="sourceLineNo">147</span> * @param policyName The name of the storage policy: 'HOT', 'COLD', etc. See hadoop 2.6+<a name="line.147"></a>
<span class="sourceLineNo">148</span> * org.apache.hadoop.hdfs.protocol.HdfsConstants for possible list e.g 'COLD',<a name="line.148"></a>
<span class="sourceLineNo">149</span> * 'WARM', 'HOT', 'ONE_SSD', 'ALL_SSD', 'LAZY_PERSIST'.<a name="line.149"></a>
<span class="sourceLineNo">150</span> */<a name="line.150"></a>
<span class="sourceLineNo">151</span> public void setStoragePolicy(Path path, String policyName) {<a name="line.151"></a>
<span class="sourceLineNo">152</span> CommonFSUtils.setStoragePolicy(this.fs, path, policyName);<a name="line.152"></a>
<span class="sourceLineNo">153</span> }<a name="line.153"></a>
<span class="sourceLineNo">154</span><a name="line.154"></a>
<span class="sourceLineNo">155</span> /**<a name="line.155"></a>
<span class="sourceLineNo">156</span> * Get the storage policy of the source path (directory/file).<a name="line.156"></a>
<span class="sourceLineNo">157</span> * @param path The source path (directory/file).<a name="line.157"></a>
<span class="sourceLineNo">158</span> * @return Storage policy name, or {@code null} if not using {@link DistributedFileSystem} or<a name="line.158"></a>
<span class="sourceLineNo">159</span> * exception thrown when trying to get policy<a name="line.159"></a>
<span class="sourceLineNo">160</span> */<a name="line.160"></a>
<span class="sourceLineNo">161</span> @Nullable<a name="line.161"></a>
<span class="sourceLineNo">162</span> public String getStoragePolicyName(Path path) {<a name="line.162"></a>
<span class="sourceLineNo">163</span> try {<a name="line.163"></a>
<span class="sourceLineNo">164</span> Object blockStoragePolicySpi =<a name="line.164"></a>
<span class="sourceLineNo">165</span> ReflectionUtils.invokeMethod(this.fs, "getStoragePolicy", path);<a name="line.165"></a>
<span class="sourceLineNo">166</span> return (String) ReflectionUtils.invokeMethod(blockStoragePolicySpi, "getName");<a name="line.166"></a>
<span class="sourceLineNo">167</span> } catch (Exception e) {<a name="line.167"></a>
<span class="sourceLineNo">168</span> // May have failed because an old HDFS version is in use; try the old way<a name="line.168"></a>
<span class="sourceLineNo">169</span> if (LOG.isTraceEnabled()) {<a name="line.169"></a>
<span class="sourceLineNo">170</span> LOG.trace("Failed to get policy directly", e);<a name="line.170"></a>
<span class="sourceLineNo">171</span> }<a name="line.171"></a>
<span class="sourceLineNo">172</span> return getStoragePolicyForOldHDFSVersion(path);<a name="line.172"></a>
<span class="sourceLineNo">173</span> }<a name="line.173"></a>
<span class="sourceLineNo">174</span> }<a name="line.174"></a>
<span class="sourceLineNo">175</span><a name="line.175"></a>
<span class="sourceLineNo">176</span> /**<a name="line.176"></a>
<span class="sourceLineNo">177</span> * Before Hadoop 2.8.0, there's no getStoragePolicy method for FileSystem interface, and we need<a name="line.177"></a>
<span class="sourceLineNo">178</span> * to keep compatible with it. See HADOOP-12161 for more details.<a name="line.178"></a>
<span class="sourceLineNo">179</span> * @param path Path to get storage policy against<a name="line.179"></a>
<span class="sourceLineNo">180</span> * @return the storage policy name<a name="line.180"></a>
<span class="sourceLineNo">181</span> */<a name="line.181"></a>
<span class="sourceLineNo">182</span> private String getStoragePolicyForOldHDFSVersion(Path path) {<a name="line.182"></a>
<span class="sourceLineNo">183</span> try {<a name="line.183"></a>
<span class="sourceLineNo">184</span> if (this.fs instanceof DistributedFileSystem) {<a name="line.184"></a>
<span class="sourceLineNo">185</span> DistributedFileSystem dfs = (DistributedFileSystem) this.fs;<a name="line.185"></a>
<span class="sourceLineNo">186</span> HdfsFileStatus status = dfs.getClient().getFileInfo(path.toUri().getPath());<a name="line.186"></a>
<span class="sourceLineNo">187</span> if (null != status) {<a name="line.187"></a>
<span class="sourceLineNo">188</span> if (unspecifiedStoragePolicyId &lt; 0) {<a name="line.188"></a>
<span class="sourceLineNo">189</span> // Get the unspecified id field through reflection to avoid compilation error.<a name="line.189"></a>
<span class="sourceLineNo">190</span> // In later version BlockStoragePolicySuite#ID_UNSPECIFIED is moved to<a name="line.190"></a>
<span class="sourceLineNo">191</span> // HdfsConstants#BLOCK_STORAGE_POLICY_ID_UNSPECIFIED<a name="line.191"></a>
<span class="sourceLineNo">192</span> Field idUnspecified = BlockStoragePolicySuite.class.getField("ID_UNSPECIFIED");<a name="line.192"></a>
<span class="sourceLineNo">193</span> unspecifiedStoragePolicyId = idUnspecified.getByte(BlockStoragePolicySuite.class);<a name="line.193"></a>
<span class="sourceLineNo">194</span> }<a name="line.194"></a>
<span class="sourceLineNo">195</span> byte storagePolicyId = status.getStoragePolicy();<a name="line.195"></a>
<span class="sourceLineNo">196</span> if (storagePolicyId != unspecifiedStoragePolicyId) {<a name="line.196"></a>
<span class="sourceLineNo">197</span> BlockStoragePolicy[] policies = dfs.getStoragePolicies();<a name="line.197"></a>
<span class="sourceLineNo">198</span> for (BlockStoragePolicy policy : policies) {<a name="line.198"></a>
<span class="sourceLineNo">199</span> if (policy.getId() == storagePolicyId) {<a name="line.199"></a>
<span class="sourceLineNo">200</span> return policy.getName();<a name="line.200"></a>
<span class="sourceLineNo">201</span> }<a name="line.201"></a>
<span class="sourceLineNo">202</span> }<a name="line.202"></a>
<span class="sourceLineNo">203</span> }<a name="line.203"></a>
<span class="sourceLineNo">204</span> }<a name="line.204"></a>
<span class="sourceLineNo">205</span> }<a name="line.205"></a>
<span class="sourceLineNo">206</span> } catch (Throwable e) {<a name="line.206"></a>
<span class="sourceLineNo">207</span> LOG.warn("failed to get block storage policy of [" + path + "]", e);<a name="line.207"></a>
<span class="sourceLineNo">208</span> }<a name="line.208"></a>
<span class="sourceLineNo">209</span><a name="line.209"></a>
<span class="sourceLineNo">210</span> return null;<a name="line.210"></a>
<span class="sourceLineNo">211</span> }<a name="line.211"></a>
<span class="sourceLineNo">212</span><a name="line.212"></a>
<span class="sourceLineNo">213</span> /**<a name="line.213"></a>
<span class="sourceLineNo">214</span> * Are we verifying checksums in HBase?<a name="line.214"></a>
<span class="sourceLineNo">215</span> * @return True, if hbase is configured to verify checksums, otherwise false.<a name="line.215"></a>
<span class="sourceLineNo">216</span> */<a name="line.216"></a>
<span class="sourceLineNo">217</span> public boolean useHBaseChecksum() {<a name="line.217"></a>
<span class="sourceLineNo">218</span> return useHBaseChecksum;<a name="line.218"></a>
<span class="sourceLineNo">219</span> }<a name="line.219"></a>
<span class="sourceLineNo">220</span><a name="line.220"></a>
<span class="sourceLineNo">221</span> /**<a name="line.221"></a>
<span class="sourceLineNo">222</span> * Close this filesystem object<a name="line.222"></a>
<span class="sourceLineNo">223</span> */<a name="line.223"></a>
<span class="sourceLineNo">224</span> @Override<a name="line.224"></a>
<span class="sourceLineNo">225</span> public void close() throws IOException {<a name="line.225"></a>
<span class="sourceLineNo">226</span> super.close();<a name="line.226"></a>
<span class="sourceLineNo">227</span> if (this.noChecksumFs != fs) {<a name="line.227"></a>
<span class="sourceLineNo">228</span> this.noChecksumFs.close();<a name="line.228"></a>
<span class="sourceLineNo">229</span> }<a name="line.229"></a>
<span class="sourceLineNo">230</span> }<a name="line.230"></a>
<span class="sourceLineNo">231</span><a name="line.231"></a>
<span class="sourceLineNo">232</span> /**<a name="line.232"></a>
<span class="sourceLineNo">233</span> * Returns a brand new instance of the FileSystem. It does not use the FileSystem.Cache. In newer<a name="line.233"></a>
<span class="sourceLineNo">234</span> * versions of HDFS, we can directly invoke FileSystem.newInstance(Configuration).<a name="line.234"></a>
<span class="sourceLineNo">235</span> * @param conf Configuration<a name="line.235"></a>
<span class="sourceLineNo">236</span> * @return A new instance of the filesystem<a name="line.236"></a>
<span class="sourceLineNo">237</span> */<a name="line.237"></a>
<span class="sourceLineNo">238</span> private static FileSystem newInstanceFileSystem(Configuration conf) throws IOException {<a name="line.238"></a>
<span class="sourceLineNo">239</span> URI uri = FileSystem.getDefaultUri(conf);<a name="line.239"></a>
<span class="sourceLineNo">240</span> FileSystem fs = null;<a name="line.240"></a>
<span class="sourceLineNo">241</span> Class&lt;?&gt; clazz = conf.getClass("fs." + uri.getScheme() + ".impl", null);<a name="line.241"></a>
<span class="sourceLineNo">242</span> if (clazz != null) {<a name="line.242"></a>
<span class="sourceLineNo">243</span> // This will be true for Hadoop 1.0, or 0.20.<a name="line.243"></a>
<span class="sourceLineNo">244</span> fs = (FileSystem) org.apache.hadoop.util.ReflectionUtils.newInstance(clazz, conf);<a name="line.244"></a>
<span class="sourceLineNo">245</span> fs.initialize(uri, conf);<a name="line.245"></a>
<span class="sourceLineNo">246</span> } else {<a name="line.246"></a>
<span class="sourceLineNo">247</span> // For Hadoop 2.0, we have to go through FileSystem for the filesystem<a name="line.247"></a>
<span class="sourceLineNo">248</span> // implementation to be loaded by the service loader in case it has not<a name="line.248"></a>
<span class="sourceLineNo">249</span> // been loaded yet.<a name="line.249"></a>
<span class="sourceLineNo">250</span> Configuration clone = new Configuration(conf);<a name="line.250"></a>
<span class="sourceLineNo">251</span> clone.setBoolean("fs." + uri.getScheme() + ".impl.disable.cache", true);<a name="line.251"></a>
<span class="sourceLineNo">252</span> fs = FileSystem.get(uri, clone);<a name="line.252"></a>
<span class="sourceLineNo">253</span> }<a name="line.253"></a>
<span class="sourceLineNo">254</span> if (fs == null) {<a name="line.254"></a>
<span class="sourceLineNo">255</span> throw new IOException("No FileSystem for scheme: " + uri.getScheme());<a name="line.255"></a>
<span class="sourceLineNo">256</span> }<a name="line.256"></a>
<span class="sourceLineNo">257</span><a name="line.257"></a>
<span class="sourceLineNo">258</span> return fs;<a name="line.258"></a>
<span class="sourceLineNo">259</span> }<a name="line.259"></a>
<span class="sourceLineNo">260</span><a name="line.260"></a>
<span class="sourceLineNo">261</span> /**<a name="line.261"></a>
<span class="sourceLineNo">262</span> * Returns an instance of Filesystem wrapped into the class specified in hbase.fs.wrapper<a name="line.262"></a>
<span class="sourceLineNo">263</span> * property, if one is set in the configuration, returns unmodified FS instance passed in as an<a name="line.263"></a>
<span class="sourceLineNo">264</span> * argument otherwise.<a name="line.264"></a>
<span class="sourceLineNo">265</span> * @param base Filesystem instance to wrap<a name="line.265"></a>
<span class="sourceLineNo">266</span> * @param conf Configuration<a name="line.266"></a>
<span class="sourceLineNo">267</span> * @return wrapped instance of FS, or the same instance if no wrapping configured.<a name="line.267"></a>
<span class="sourceLineNo">268</span> */<a name="line.268"></a>
<span class="sourceLineNo">269</span> private FileSystem maybeWrapFileSystem(FileSystem base, Configuration conf) {<a name="line.269"></a>
<span class="sourceLineNo">270</span> try {<a name="line.270"></a>
<span class="sourceLineNo">271</span> Class&lt;?&gt; clazz = conf.getClass("hbase.fs.wrapper", null);<a name="line.271"></a>
<span class="sourceLineNo">272</span> if (clazz != null) {<a name="line.272"></a>
<span class="sourceLineNo">273</span> return (FileSystem) clazz.getConstructor(FileSystem.class, Configuration.class)<a name="line.273"></a>
<span class="sourceLineNo">274</span> .newInstance(base, conf);<a name="line.274"></a>
<span class="sourceLineNo">275</span> }<a name="line.275"></a>
<span class="sourceLineNo">276</span> } catch (Exception e) {<a name="line.276"></a>
<span class="sourceLineNo">277</span> LOG.error("Failed to wrap filesystem: " + e);<a name="line.277"></a>
<span class="sourceLineNo">278</span> }<a name="line.278"></a>
<span class="sourceLineNo">279</span> return base;<a name="line.279"></a>
<span class="sourceLineNo">280</span> }<a name="line.280"></a>
<span class="sourceLineNo">281</span><a name="line.281"></a>
<span class="sourceLineNo">282</span> public static boolean addLocationsOrderInterceptor(Configuration conf) throws IOException {<a name="line.282"></a>
<span class="sourceLineNo">283</span> return addLocationsOrderInterceptor(conf, new ReorderWALBlocks());<a name="line.283"></a>
<span class="sourceLineNo">284</span> }<a name="line.284"></a>
<span class="sourceLineNo">285</span><a name="line.285"></a>
<span class="sourceLineNo">286</span> /**<a name="line.286"></a>
<span class="sourceLineNo">287</span> * Add an interceptor on the calls to the namenode#getBlockLocations from the DFSClient linked to<a name="line.287"></a>
<span class="sourceLineNo">288</span> * this FileSystem. See HBASE-6435 for the background.<a name="line.288"></a>
<span class="sourceLineNo">289</span> * &lt;p&gt;<a name="line.289"></a>
<span class="sourceLineNo">290</span> * There should be no reason, except testing, to create a specific ReorderBlocks.<a name="line.290"></a>
<span class="sourceLineNo">291</span> * @return true if the interceptor was added, false otherwise.<a name="line.291"></a>
<span class="sourceLineNo">292</span> */<a name="line.292"></a>
<span class="sourceLineNo">293</span> static boolean addLocationsOrderInterceptor(Configuration conf, final ReorderBlocks lrb) {<a name="line.293"></a>
<span class="sourceLineNo">294</span> if (!conf.getBoolean("hbase.filesystem.reorder.blocks", true)) { // activated by default<a name="line.294"></a>
<span class="sourceLineNo">295</span> LOG.debug("addLocationsOrderInterceptor configured to false");<a name="line.295"></a>
<span class="sourceLineNo">296</span> return false;<a name="line.296"></a>
<span class="sourceLineNo">297</span> }<a name="line.297"></a>
<span class="sourceLineNo">298</span><a name="line.298"></a>
<span class="sourceLineNo">299</span> FileSystem fs;<a name="line.299"></a>
<span class="sourceLineNo">300</span> try {<a name="line.300"></a>
<span class="sourceLineNo">301</span> fs = FileSystem.get(conf);<a name="line.301"></a>
<span class="sourceLineNo">302</span> } catch (IOException e) {<a name="line.302"></a>
<span class="sourceLineNo">303</span> LOG.warn("Can't get the file system from the conf.", e);<a name="line.303"></a>
<span class="sourceLineNo">304</span> return false;<a name="line.304"></a>
<span class="sourceLineNo">305</span> }<a name="line.305"></a>
<span class="sourceLineNo">306</span><a name="line.306"></a>
<span class="sourceLineNo">307</span> if (!(fs instanceof DistributedFileSystem)) {<a name="line.307"></a>
<span class="sourceLineNo">308</span> LOG.debug("The file system is not a DistributedFileSystem. "<a name="line.308"></a>
<span class="sourceLineNo">309</span> + "Skipping on block location reordering");<a name="line.309"></a>
<span class="sourceLineNo">310</span> return false;<a name="line.310"></a>
<span class="sourceLineNo">311</span> }<a name="line.311"></a>
<span class="sourceLineNo">312</span><a name="line.312"></a>
<span class="sourceLineNo">313</span> DistributedFileSystem dfs = (DistributedFileSystem) fs;<a name="line.313"></a>
<span class="sourceLineNo">314</span> DFSClient dfsc = dfs.getClient();<a name="line.314"></a>
<span class="sourceLineNo">315</span> if (dfsc == null) {<a name="line.315"></a>
<span class="sourceLineNo">316</span> LOG.warn("The DistributedFileSystem does not contain a DFSClient. Can't add the location "<a name="line.316"></a>
<span class="sourceLineNo">317</span> + "block reordering interceptor. Continuing, but this is unexpected.");<a name="line.317"></a>
<span class="sourceLineNo">318</span> return false;<a name="line.318"></a>
<span class="sourceLineNo">319</span> }<a name="line.319"></a>
<span class="sourceLineNo">320</span><a name="line.320"></a>
<span class="sourceLineNo">321</span> try {<a name="line.321"></a>
<span class="sourceLineNo">322</span> Field nf = DFSClient.class.getDeclaredField("namenode");<a name="line.322"></a>
<span class="sourceLineNo">323</span> nf.setAccessible(true);<a name="line.323"></a>
<span class="sourceLineNo">324</span> Field modifiersField = ReflectionUtils.getModifiersField();<a name="line.324"></a>
<span class="sourceLineNo">325</span> modifiersField.setAccessible(true);<a name="line.325"></a>
<span class="sourceLineNo">326</span> modifiersField.setInt(nf, nf.getModifiers() &amp; ~Modifier.FINAL);<a name="line.326"></a>
<span class="sourceLineNo">327</span><a name="line.327"></a>
<span class="sourceLineNo">328</span> ClientProtocol namenode = (ClientProtocol) nf.get(dfsc);<a name="line.328"></a>
<span class="sourceLineNo">329</span> if (namenode == null) {<a name="line.329"></a>
<span class="sourceLineNo">330</span> LOG.warn("The DFSClient is not linked to a namenode. Can't add the location block"<a name="line.330"></a>
<span class="sourceLineNo">331</span> + " reordering interceptor. Continuing, but this is unexpected.");<a name="line.331"></a>
<span class="sourceLineNo">332</span> return false;<a name="line.332"></a>
<span class="sourceLineNo">333</span> }<a name="line.333"></a>
<span class="sourceLineNo">334</span><a name="line.334"></a>
<span class="sourceLineNo">335</span> ClientProtocol cp1 = createReorderingProxy(namenode, lrb, conf);<a name="line.335"></a>
<span class="sourceLineNo">336</span> nf.set(dfsc, cp1);<a name="line.336"></a>
<span class="sourceLineNo">337</span> LOG.info("Added intercepting call to namenode#getBlockLocations so can do block reordering"<a name="line.337"></a>
<span class="sourceLineNo">338</span> + " using class " + lrb.getClass().getName());<a name="line.338"></a>
<span class="sourceLineNo">339</span> } catch (NoSuchFieldException e) {<a name="line.339"></a>
<span class="sourceLineNo">340</span> LOG.warn("Can't modify the DFSClient#namenode field to add the location reorder.", e);<a name="line.340"></a>
<span class="sourceLineNo">341</span> return false;<a name="line.341"></a>
<span class="sourceLineNo">342</span> } catch (IllegalAccessException e) {<a name="line.342"></a>
<span class="sourceLineNo">343</span> LOG.warn("Can't modify the DFSClient#namenode field to add the location reorder.", e);<a name="line.343"></a>
<span class="sourceLineNo">344</span> return false;<a name="line.344"></a>
<span class="sourceLineNo">345</span> }<a name="line.345"></a>
<span class="sourceLineNo">346</span><a name="line.346"></a>
<span class="sourceLineNo">347</span> return true;<a name="line.347"></a>
<span class="sourceLineNo">348</span> }<a name="line.348"></a>
<span class="sourceLineNo">349</span><a name="line.349"></a>
<span class="sourceLineNo">350</span> /**<a name="line.350"></a>
<span class="sourceLineNo">351</span> * Proxies {@code cp}: calls are forwarded, getBlockLocations results are passed to {@code lrb},<a name="line.351"></a>
<span class="sourceLineNo">352</span> * close() maps to RPC.stopProxy(cp), and exceptions thrown by {@code cp} are rethrown unwrapped.<a name="line.352"></a>
<span class="sourceLineNo">353</span> */<a name="line.353"></a>
<span class="sourceLineNo">354</span> private static ClientProtocol createReorderingProxy(final ClientProtocol cp,<a name="line.354"></a>
<span class="sourceLineNo">355</span> final ReorderBlocks lrb, final Configuration conf) {<a name="line.355"></a>
<span class="sourceLineNo">356</span> return (ClientProtocol) Proxy.newProxyInstance(cp.getClass().getClassLoader(),<a name="line.356"></a>
<span class="sourceLineNo">357</span> new Class[] { ClientProtocol.class, Closeable.class }, new InvocationHandler() {<a name="line.357"></a>
<span class="sourceLineNo">358</span> @Override<a name="line.358"></a>
<span class="sourceLineNo">359</span> public Object invoke(Object proxy, Method method, Object[] args) throws Throwable {<a name="line.359"></a>
<span class="sourceLineNo">360</span> try {<a name="line.360"></a>
<span class="sourceLineNo">361</span> if ((args == null || args.length == 0) &amp;&amp; "close".equals(method.getName())) {<a name="line.361"></a>
<span class="sourceLineNo">362</span> RPC.stopProxy(cp);<a name="line.362"></a>
<span class="sourceLineNo">363</span> return null;<a name="line.363"></a>
<span class="sourceLineNo">364</span> }<a name="line.364"></a>
<span class="sourceLineNo">365</span> Object res = method.invoke(cp, args);<a name="line.365"></a>
<span class="sourceLineNo">366</span> if (args != null &amp;&amp; args.length == 3 &amp;&amp; "getBlockLocations".equals(method.getName())<a name="line.366"></a>
<span class="sourceLineNo">367</span> &amp;&amp; res instanceof LocatedBlocks &amp;&amp; args[0] instanceof String) { // instanceof is false for null<a name="line.367"></a>
<span class="sourceLineNo">368</span> lrb.reorderBlocks(conf, (LocatedBlocks) res, (String) args[0]);<a name="line.368"></a>
<span class="sourceLineNo">369</span> }<a name="line.369"></a>
<span class="sourceLineNo">370</span> return res;<a name="line.370"></a>
<span class="sourceLineNo">371</span> } catch (InvocationTargetException ite) {<a name="line.371"></a>
<span class="sourceLineNo">372</span> // method.invoke wraps whatever the target throws, checked or not, in an<a name="line.372"></a>
<span class="sourceLineNo">373</span> // InvocationTargetException; unwrap it so the caller sees the original exception.<a name="line.373"></a>
<span class="sourceLineNo">374</span> Throwable cause = ite.getCause();<a name="line.374"></a>
<span class="sourceLineNo">375</span> if (cause == null) {<a name="line.375"></a>
<span class="sourceLineNo">376</span> throw new RuntimeException("Proxy invocation failed and getCause is null", ite);<a name="line.376"></a>
<span class="sourceLineNo">377</span> }<a name="line.377"></a>
<span class="sourceLineNo">378</span> if (cause instanceof UndeclaredThrowableException) {<a name="line.378"></a>
<span class="sourceLineNo">379</span> Throwable causeCause = cause.getCause();<a name="line.379"></a>
<span class="sourceLineNo">380</span> if (causeCause == null) { // chain 'cause' so its stack trace is not lost<a name="line.380"></a>
<span class="sourceLineNo">381</span> throw new RuntimeException("UndeclaredThrowableException had null cause!", cause);<a name="line.381"></a>
<span class="sourceLineNo">382</span> }<a name="line.382"></a>
<span class="sourceLineNo">383</span> cause = causeCause;<a name="line.383"></a>
<span class="sourceLineNo">384</span> }<a name="line.384"></a>
<span class="sourceLineNo">385</span> throw cause;<a name="line.385"></a>
<span class="sourceLineNo">386</span> }<a name="line.386"></a>
<span class="sourceLineNo">387</span> }<a name="line.387"></a>
<span class="sourceLineNo">388</span> });<a name="line.388"></a>
<span class="sourceLineNo">389</span> }<a name="line.389"></a>
<span class="sourceLineNo">390</span><a name="line.390"></a>
<span class="sourceLineNo">391</span> /**<a name="line.391"></a>
<span class="sourceLineNo">392</span> * Interface to implement to add specific reordering logic for the block locations returned by hdfs.<a name="line.392"></a>
<span class="sourceLineNo">393</span> */<a name="line.393"></a>
<span class="sourceLineNo">394</span> interface ReorderBlocks {<a name="line.394"></a>
<span class="sourceLineNo">395</span> /** Reorder the block locations held by {@code lbs}; nothing is returned, so {@code lbs} itself is changed.<a name="line.395"></a>
<span class="sourceLineNo">396</span> * @param conf - the conf to use<a name="line.396"></a>
<span class="sourceLineNo">397</span> * @param lbs - the LocatedBlocks to reorder<a name="line.397"></a>
<span class="sourceLineNo">398</span> * @param src - the name of the file currently being read<a name="line.398"></a>
<span class="sourceLineNo">399</span> * @throws IOException - if something went wrong<a name="line.399"></a>
<span class="sourceLineNo">400</span> */<a name="line.400"></a>
<span class="sourceLineNo">401</span> void reorderBlocks(Configuration conf, LocatedBlocks lbs, String src) throws IOException;<a name="line.401"></a>
<span class="sourceLineNo">402</span> }<a name="line.402"></a>
<span class="sourceLineNo">403</span><a name="line.403"></a>
<span class="sourceLineNo">404</span> /**<a name="line.404"></a>
<span class="sourceLineNo">405</span> * Block reordering for WAL files: a replica on the host of the regionserver that created the WAL<a name="line.405"></a>
<span class="sourceLineNo">406</span> * is moved to the end of each block's location list. We fear that this datanode is actually dead,<a name="line.406"></a>
<span class="sourceLineNo">407</span> * so reading from it first would only end in a timeout.<a name="line.407"></a>
<span class="sourceLineNo">408</span> */<a name="line.408"></a>
<span class="sourceLineNo">409</span> static class ReorderWALBlocks implements ReorderBlocks {<a name="line.409"></a>
<span class="sourceLineNo">410</span> @Override<a name="line.410"></a>
<span class="sourceLineNo">411</span> public void reorderBlocks(Configuration conf, LocatedBlocks lbs, String src)<a name="line.411"></a>
<span class="sourceLineNo">412</span> throws IOException {<a name="line.412"></a>
<span class="sourceLineNo">413</span> ServerName walOwner = AbstractFSWALProvider.getServerNameFromWALDirectoryName(conf, src);<a name="line.413"></a>
<span class="sourceLineNo">414</span> if (walOwner == null) {<a name="line.414"></a>
<span class="sourceLineNo">415</span> // Not a WAL path: leave the locations untouched.<a name="line.415"></a>
<span class="sourceLineNo">416</span> return;<a name="line.416"></a>
<span class="sourceLineNo">417</span> }<a name="line.417"></a>
<span class="sourceLineNo">418</span><a name="line.418"></a>
<span class="sourceLineNo">419</span> final String ownerHost = walOwner.getHostname();<a name="line.419"></a>
<span class="sourceLineNo">420</span> if (LOG.isTraceEnabled()) {<a name="line.420"></a>
<span class="sourceLineNo">421</span> LOG.trace(src + " is an WAL file, so reordering blocks, last hostname will be:" + ownerHost);<a name="line.421"></a>
<span class="sourceLineNo">422</span> }<a name="line.422"></a>
<span class="sourceLineNo">423</span><a name="line.423"></a>
<span class="sourceLineNo">424</span> for (LocatedBlock block : lbs.getLocatedBlocks()) {<a name="line.424"></a>
<span class="sourceLineNo">425</span> DatanodeInfo[] locations = block.getLocations();<a name="line.425"></a>
<span class="sourceLineNo">426</span> if (locations == null || locations.length &lt;= 1) {<a name="line.426"></a>
<span class="sourceLineNo">427</span> continue; // nothing to reorder<a name="line.427"></a>
<span class="sourceLineNo">428</span> }<a name="line.428"></a>
<span class="sourceLineNo">429</span> // The last slot is not scanned: a match there is already in its final place.<a name="line.429"></a>
<span class="sourceLineNo">430</span> final int lastIdx = locations.length - 1;<a name="line.430"></a>
<span class="sourceLineNo">431</span> for (int idx = 0; idx &lt; lastIdx; idx++) {<a name="line.431"></a>
<span class="sourceLineNo">432</span> if (!ownerHost.equals(locations[idx].getHostName())) {<a name="line.432"></a>
<span class="sourceLineNo">433</span> continue;<a name="line.433"></a>
<span class="sourceLineNo">434</span> }<a name="line.434"></a>
<span class="sourceLineNo">435</span> // Shift the following entries up by one and park the match in the last slot.<a name="line.435"></a>
<span class="sourceLineNo">436</span> DatanodeInfo demoted = locations[idx];<a name="line.436"></a>
<span class="sourceLineNo">437</span> System.arraycopy(locations, idx + 1, locations, idx, lastIdx - idx);<a name="line.437"></a>
<span class="sourceLineNo">438</span> locations[lastIdx] = demoted;<a name="line.438"></a>
<span class="sourceLineNo">439</span> break; // only the first match is moved<a name="line.439"></a>
<span class="sourceLineNo">440</span> }<a name="line.440"></a>
<span class="sourceLineNo">441</span> }<a name="line.441"></a>
<span class="sourceLineNo">442</span> }<a name="line.442"></a>
<span class="sourceLineNo">443</span> }<a name="line.443"></a>
<span class="sourceLineNo">444</span><a name="line.444"></a>
<span class="sourceLineNo">445</span> /**<a name="line.445"></a>
<span class="sourceLineNo">446</span> * Factory in the spirit of FileSystem.get(): builds a new HFileSystem for {@code conf}. The<a name="line.446"></a>
<span class="sourceLineNo">447</span> * returned filesystem object avoids checksum verification in the filesystem for hfileblock-reads;<a name="line.447"></a>
<span class="sourceLineNo">448</span> * for these blocks, checksum verification is done by HBase.<a name="line.448"></a>
<span class="sourceLineNo">449</span> */<a name="line.449"></a>
<span class="sourceLineNo">450</span> public static FileSystem get(Configuration conf) throws IOException {<a name="line.450"></a>
<span class="sourceLineNo">451</span> return new HFileSystem(conf, true);<a name="line.451"></a>
<span class="sourceLineNo">452</span> }<a name="line.452"></a>
<span class="sourceLineNo">453</span><a name="line.453"></a>
<span class="sourceLineNo">454</span> /**<a name="line.454"></a>
<span class="sourceLineNo">455</span> * FilterFileSystem lacks createNonRecursive (a hadoop bug), so forward to fs until Hadoop fixes it.<a name="line.455"></a>
<span class="sourceLineNo">456</span> */<a name="line.456"></a>
<span class="sourceLineNo">457</span> @Override<a name="line.457"></a>
<span class="sourceLineNo">458</span> @SuppressWarnings("deprecation")<a name="line.458"></a>
<span class="sourceLineNo">459</span> public FSDataOutputStream createNonRecursive(Path f, boolean overwrite, int bufferSize,<a name="line.459"></a>
<span class="sourceLineNo">460</span> short replication, long blockSize, Progressable progress) throws IOException {<a name="line.460"></a>
<span class="sourceLineNo">461</span> FSDataOutputStream out = fs.createNonRecursive(f, overwrite, bufferSize, replication, blockSize, progress);<a name="line.461"></a>
<span class="sourceLineNo">462</span> return out;<a name="line.462"></a>
<span class="sourceLineNo">463</span> }<a name="line.463"></a>
<span class="sourceLineNo">464</span>}<a name="line.464"></a>
</pre>
</div>
</body>
</html>