| <!DOCTYPE HTML> |
| <html lang="en"> |
| <head> |
| <!-- Charset is declared first so the parser sees it before any other head content. --> |
| <meta charset="utf-8"> |
| <!-- Generated by javadoc (17) --> |
| <!-- Page-specific title: this page is the source listing for WALSplitter (see the description meta). --> |
| <title>WALSplitter source code (org.apache.hadoop.hbase.wal)</title> |
| <meta name="viewport" content="width=device-width, initial-scale=1"> |
| <meta name="description" content="source: package: org.apache.hadoop.hbase.wal, class: WALSplitter, class: SplitWALResult"> |
| <meta name="generator" content="javadoc/SourceToHTMLConverter"> |
| <link rel="stylesheet" href="../../../../../../stylesheet.css" title="Style"> |
| </head> |
| <body class="source-page"> |
| <main role="main"> |
| <div class="source-container"> |
| <pre><span class="source-line-no">001</span><span id="line-1">/*</span> |
| <span class="source-line-no">002</span><span id="line-2"> * Licensed to the Apache Software Foundation (ASF) under one</span> |
| <span class="source-line-no">003</span><span id="line-3"> * or more contributor license agreements. See the NOTICE file</span> |
| <span class="source-line-no">004</span><span id="line-4"> * distributed with this work for additional information</span> |
| <span class="source-line-no">005</span><span id="line-5"> * regarding copyright ownership. The ASF licenses this file</span> |
| <span class="source-line-no">006</span><span id="line-6"> * to you under the Apache License, Version 2.0 (the</span> |
| <span class="source-line-no">007</span><span id="line-7"> * "License"); you may not use this file except in compliance</span> |
| <span class="source-line-no">008</span><span id="line-8"> * with the License. You may obtain a copy of the License at</span> |
| <span class="source-line-no">009</span><span id="line-9"> *</span> |
| <span class="source-line-no">010</span><span id="line-10"> * http://www.apache.org/licenses/LICENSE-2.0</span> |
| <span class="source-line-no">011</span><span id="line-11"> *</span> |
| <span class="source-line-no">012</span><span id="line-12"> * Unless required by applicable law or agreed to in writing, software</span> |
| <span class="source-line-no">013</span><span id="line-13"> * distributed under the License is distributed on an "AS IS" BASIS,</span> |
| <span class="source-line-no">014</span><span id="line-14"> * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.</span> |
| <span class="source-line-no">015</span><span id="line-15"> * See the License for the specific language governing permissions and</span> |
| <span class="source-line-no">016</span><span id="line-16"> * limitations under the License.</span> |
| <span class="source-line-no">017</span><span id="line-17"> */</span> |
| <span class="source-line-no">018</span><span id="line-18">package org.apache.hadoop.hbase.wal;</span> |
| <span class="source-line-no">019</span><span id="line-19"></span> |
| <span class="source-line-no">020</span><span id="line-20">import java.io.EOFException;</span> |
| <span class="source-line-no">021</span><span id="line-21">import java.io.FileNotFoundException;</span> |
| <span class="source-line-no">022</span><span id="line-22">import java.io.IOException;</span> |
| <span class="source-line-no">023</span><span id="line-23">import java.io.InterruptedIOException;</span> |
| <span class="source-line-no">024</span><span id="line-24">import java.text.ParseException;</span> |
| <span class="source-line-no">025</span><span id="line-25">import java.util.ArrayList;</span> |
| <span class="source-line-no">026</span><span id="line-26">import java.util.Collections;</span> |
| <span class="source-line-no">027</span><span id="line-27">import java.util.List;</span> |
| <span class="source-line-no">028</span><span id="line-28">import java.util.Map;</span> |
| <span class="source-line-no">029</span><span id="line-29">import java.util.TreeMap;</span> |
| <span class="source-line-no">030</span><span id="line-30">import java.util.concurrent.ConcurrentHashMap;</span> |
| <span class="source-line-no">031</span><span id="line-31">import java.util.concurrent.atomic.AtomicReference;</span> |
| <span class="source-line-no">032</span><span id="line-32">import org.apache.hadoop.conf.Configuration;</span> |
| <span class="source-line-no">033</span><span id="line-33">import org.apache.hadoop.fs.FileStatus;</span> |
| <span class="source-line-no">034</span><span id="line-34">import org.apache.hadoop.fs.FileSystem;</span> |
| <span class="source-line-no">035</span><span id="line-35">import org.apache.hadoop.fs.Path;</span> |
| <span class="source-line-no">036</span><span id="line-36">import org.apache.hadoop.hbase.HBaseConfiguration;</span> |
| <span class="source-line-no">037</span><span id="line-37">import org.apache.hadoop.hbase.HConstants;</span> |
| <span class="source-line-no">038</span><span id="line-38">import org.apache.hadoop.hbase.TableName;</span> |
| <span class="source-line-no">039</span><span id="line-39">import org.apache.hadoop.hbase.coordination.SplitLogWorkerCoordination;</span> |
| <span class="source-line-no">040</span><span id="line-40">import org.apache.hadoop.hbase.master.SplitLogManager;</span> |
| <span class="source-line-no">041</span><span id="line-41">import org.apache.hadoop.hbase.monitoring.MonitoredTask;</span> |
| <span class="source-line-no">042</span><span id="line-42">import org.apache.hadoop.hbase.monitoring.TaskMonitor;</span> |
| <span class="source-line-no">043</span><span id="line-43">import org.apache.hadoop.hbase.procedure2.util.StringUtils;</span> |
| <span class="source-line-no">044</span><span id="line-44">import org.apache.hadoop.hbase.regionserver.LastSequenceId;</span> |
| <span class="source-line-no">045</span><span id="line-45">import org.apache.hadoop.hbase.regionserver.RegionServerServices;</span> |
| <span class="source-line-no">046</span><span id="line-46">import org.apache.hadoop.hbase.regionserver.wal.WALCellCodec;</span> |
| <span class="source-line-no">047</span><span id="line-47">import org.apache.hadoop.hbase.util.Bytes;</span> |
| <span class="source-line-no">048</span><span id="line-48">import org.apache.hadoop.hbase.util.CancelableProgressable;</span> |
| <span class="source-line-no">049</span><span id="line-49">import org.apache.hadoop.hbase.util.CommonFSUtils;</span> |
| <span class="source-line-no">050</span><span id="line-50">import org.apache.hadoop.hbase.util.EnvironmentEdgeManager;</span> |
| <span class="source-line-no">051</span><span id="line-51">import org.apache.hadoop.hbase.util.RecoverLeaseFSUtils;</span> |
| <span class="source-line-no">052</span><span id="line-52">import org.apache.hadoop.hbase.wal.WAL.Entry;</span> |
| <span class="source-line-no">053</span><span id="line-53">import org.apache.hadoop.ipc.RemoteException;</span> |
| <span class="source-line-no">054</span><span id="line-54">import org.apache.yetus.audience.InterfaceAudience;</span> |
| <span class="source-line-no">055</span><span id="line-55">import org.slf4j.Logger;</span> |
| <span class="source-line-no">056</span><span id="line-56">import org.slf4j.LoggerFactory;</span> |
| <span class="source-line-no">057</span><span id="line-57"></span> |
| <span class="source-line-no">058</span><span id="line-58">import org.apache.hbase.thirdparty.com.google.common.base.Preconditions;</span> |
| <span class="source-line-no">059</span><span id="line-59">import org.apache.hbase.thirdparty.com.google.protobuf.TextFormat;</span> |
| <span class="source-line-no">060</span><span id="line-60"></span> |
| <span class="source-line-no">061</span><span id="line-61">import org.apache.hadoop.hbase.shaded.protobuf.generated.ClusterStatusProtos.RegionStoreSequenceIds;</span> |
| <span class="source-line-no">062</span><span id="line-62">import org.apache.hadoop.hbase.shaded.protobuf.generated.ClusterStatusProtos.StoreSequenceId;</span> |
| <span class="source-line-no">063</span><span id="line-63"></span> |
| <span class="source-line-no">064</span><span id="line-64">/**</span> |
| <span class="source-line-no">065</span><span id="line-65"> * Split RegionServer WAL files. Splits the WAL into new files, one per region, to be picked up on</span> |
| <span class="source-line-no">066</span><span id="line-66"> * Region reopen. Deletes the split WAL when finished. Create an instance and call</span> |
| <span class="source-line-no">067</span><span id="line-67"> * {@link #splitWAL(FileStatus, CancelableProgressable)} per file or use static helper methods.</span> |
| <span class="source-line-no">068</span><span id="line-68"> */</span> |
| <span class="source-line-no">069</span><span id="line-69">@InterfaceAudience.Private</span> |
| <span class="source-line-no">070</span><span id="line-70">public class WALSplitter {</span> |
| <span class="source-line-no">071</span><span id="line-71"> private static final Logger LOG = LoggerFactory.getLogger(WALSplitter.class);</span> |
| <span class="source-line-no">072</span><span id="line-72"> public static final String SPLIT_SKIP_ERRORS_KEY = "hbase.hlog.split.skip.errors";</span> |
| <span class="source-line-no">073</span><span id="line-73"></span> |
| <span class="source-line-no">074</span><span id="line-74"> /**</span> |
| <span class="source-line-no">075</span><span id="line-75"> * By default we retry errors in splitting, rather than skipping.</span> |
| <span class="source-line-no">076</span><span id="line-76"> */</span> |
| <span class="source-line-no">077</span><span id="line-77"> public static final boolean SPLIT_SKIP_ERRORS_DEFAULT = false;</span> |
| <span class="source-line-no">078</span><span id="line-78"></span> |
| <span class="source-line-no">079</span><span id="line-79"> // Parameters for split process</span> |
| <span class="source-line-no">080</span><span id="line-80"> protected final Path walRootDir;</span> |
| <span class="source-line-no">081</span><span id="line-81"> protected final FileSystem walFS;</span> |
| <span class="source-line-no">082</span><span id="line-82"> protected final Configuration conf;</span> |
| <span class="source-line-no">083</span><span id="line-83"> final Path rootDir;</span> |
| <span class="source-line-no">084</span><span id="line-84"> final FileSystem rootFS;</span> |
| <span class="source-line-no">085</span><span id="line-85"> final RegionServerServices rsServices;</span> |
| <span class="source-line-no">086</span><span id="line-86"></span> |
| <span class="source-line-no">087</span><span id="line-87"> // Major subcomponents of the split process.</span> |
| <span class="source-line-no">088</span><span id="line-88"> // These are separated into inner classes to make testing easier.</span> |
| <span class="source-line-no">089</span><span id="line-89"> OutputSink outputSink;</span> |
| <span class="source-line-no">090</span><span id="line-90"> private EntryBuffers entryBuffers;</span> |
| <span class="source-line-no">091</span><span id="line-91"></span> |
| <span class="source-line-no">092</span><span id="line-92"> /**</span> |
| <span class="source-line-no">093</span><span id="line-93"> * Coordinator for split log. Used by the zk-based log splitter. Not used by the procedure</span> |
| <span class="source-line-no">094</span><span id="line-94"> * v2-based log splitter.</span> |
| <span class="source-line-no">095</span><span id="line-95"> */</span> |
| <span class="source-line-no">096</span><span id="line-96"> private SplitLogWorkerCoordination splitLogWorkerCoordination;</span> |
| <span class="source-line-no">097</span><span id="line-97"></span> |
| <span class="source-line-no">098</span><span id="line-98"> private final WALFactory walFactory;</span> |
| <span class="source-line-no">099</span><span id="line-99"></span> |
| <span class="source-line-no">100</span><span id="line-100"> // For checking the latest flushed sequence id</span> |
| <span class="source-line-no">101</span><span id="line-101"> protected final LastSequenceId sequenceIdChecker;</span> |
| <span class="source-line-no">102</span><span id="line-102"></span> |
| <span class="source-line-no">103</span><span id="line-103"> // Map encodedRegionName -> lastFlushedSequenceId</span> |
| <span class="source-line-no">104</span><span id="line-104"> protected Map<String, Long> lastFlushedSequenceIds = new ConcurrentHashMap<>();</span> |
| <span class="source-line-no">105</span><span id="line-105"></span> |
| <span class="source-line-no">106</span><span id="line-106"> // Map encodedRegionName -> maxSeqIdInStores</span> |
| <span class="source-line-no">107</span><span id="line-107"> protected Map<String, Map<byte[], Long>> regionMaxSeqIdInStores = new ConcurrentHashMap<>();</span> |
| <span class="source-line-no">108</span><span id="line-108"></span> |
| <span class="source-line-no">109</span><span id="line-109"> // the file being split currently</span> |
| <span class="source-line-no">110</span><span id="line-110"> private FileStatus fileBeingSplit;</span> |
| <span class="source-line-no">111</span><span id="line-111"></span> |
| <span class="source-line-no">112</span><span id="line-112"> private final String tmpDirName;</span> |
| <span class="source-line-no">113</span><span id="line-113"></span> |
| <span class="source-line-no">114</span><span id="line-114"> /**</span> |
| <span class="source-line-no">115</span><span id="line-115"> * Split WAL directly to hfiles instead of into intermediary 'recovered.edits' files.</span> |
| <span class="source-line-no">116</span><span id="line-116"> */</span> |
| <span class="source-line-no">117</span><span id="line-117"> public static final String WAL_SPLIT_TO_HFILE = "hbase.wal.split.to.hfile";</span> |
| <span class="source-line-no">118</span><span id="line-118"> public static final boolean DEFAULT_WAL_SPLIT_TO_HFILE = false;</span> |
| <span class="source-line-no">119</span><span id="line-119"></span> |
| <span class="source-line-no">120</span><span id="line-120"> /**</span> |
| <span class="source-line-no">121</span><span id="line-121"> * True if we are to run with a bounded number of writers rather than let the count blossom. Default</span> |
| <span class="source-line-no">122</span><span id="line-122"> * is 'false'. Does not apply if you have set 'hbase.wal.split.to.hfile' as that is always</span> |
| <span class="source-line-no">123</span><span id="line-123"> * bounded. Only applies when you are doing recovery to 'recovered.edits' files (the old default).</span> |
| <span class="source-line-no">124</span><span id="line-124"> * Bounded writing tends to have higher throughput.</span> |
| <span class="source-line-no">125</span><span id="line-125"> */</span> |
| <span class="source-line-no">126</span><span id="line-126"> public final static String SPLIT_WRITER_CREATION_BOUNDED = "hbase.split.writer.creation.bounded";</span> |
| <span class="source-line-no">127</span><span id="line-127"></span> |
| <span class="source-line-no">128</span><span id="line-128"> public final static String SPLIT_WAL_BUFFER_SIZE = "hbase.regionserver.hlog.splitlog.buffersize";</span> |
| <span class="source-line-no">129</span><span id="line-129"> public final static String SPLIT_WAL_WRITER_THREADS =</span> |
| <span class="source-line-no">130</span><span id="line-130"> "hbase.regionserver.hlog.splitlog.writer.threads";</span> |
| <span class="source-line-no">131</span><span id="line-131"></span> |
| <span class="source-line-no">132</span><span id="line-132"> private final int numWriterThreads;</span> |
| <span class="source-line-no">133</span><span id="line-133"> private final long bufferSize;</span> |
| <span class="source-line-no">134</span><span id="line-134"> private final boolean splitWriterCreationBounded;</span> |
| <span class="source-line-no">135</span><span id="line-135"> private final boolean hfile;</span> |
| <span class="source-line-no">136</span><span id="line-136"> private final boolean skipErrors;</span> |
| <span class="source-line-no">137</span><span id="line-137"></span> |
| <span class="source-line-no">138</span><span id="line-138"> WALSplitter(final WALFactory factory, Configuration conf, Path walRootDir, FileSystem walFS,</span> |
| <span class="source-line-no">139</span><span id="line-139"> Path rootDir, FileSystem rootFS) {</span> |
| <span class="source-line-no">140</span><span id="line-140"> this(factory, conf, walRootDir, walFS, rootDir, rootFS, null, null, null);</span> |
| <span class="source-line-no">141</span><span id="line-141"> }</span> |
| <span class="source-line-no">142</span><span id="line-142"></span> |
| <span class="source-line-no">143</span><span id="line-143"> WALSplitter(final WALFactory factory, Configuration conf, Path walRootDir, FileSystem walFS,</span> |
| <span class="source-line-no">144</span><span id="line-144"> Path rootDir, FileSystem rootFS, LastSequenceId idChecker,</span> |
| <span class="source-line-no">145</span><span id="line-145"> SplitLogWorkerCoordination splitLogWorkerCoordination, RegionServerServices rsServices) {</span> |
| <span class="source-line-no">146</span><span id="line-146"> this.conf = HBaseConfiguration.create(conf);</span> |
| <span class="source-line-no">147</span><span id="line-147"> String codecClassName =</span> |
| <span class="source-line-no">148</span><span id="line-148"> conf.get(WALCellCodec.WAL_CELL_CODEC_CLASS_KEY, WALCellCodec.class.getName());</span> |
| <span class="source-line-no">149</span><span id="line-149"> this.conf.set(HConstants.RPC_CODEC_CONF_KEY, codecClassName);</span> |
| <span class="source-line-no">150</span><span id="line-150"> this.walRootDir = walRootDir;</span> |
| <span class="source-line-no">151</span><span id="line-151"> this.walFS = walFS;</span> |
| <span class="source-line-no">152</span><span id="line-152"> this.rootDir = rootDir;</span> |
| <span class="source-line-no">153</span><span id="line-153"> this.rootFS = rootFS;</span> |
| <span class="source-line-no">154</span><span id="line-154"> this.sequenceIdChecker = idChecker;</span> |
| <span class="source-line-no">155</span><span id="line-155"> this.splitLogWorkerCoordination = splitLogWorkerCoordination;</span> |
| <span class="source-line-no">156</span><span id="line-156"> this.rsServices = rsServices;</span> |
| <span class="source-line-no">157</span><span id="line-157"> this.walFactory = factory;</span> |
| <span class="source-line-no">158</span><span id="line-158"> this.tmpDirName =</span> |
| <span class="source-line-no">159</span><span id="line-159"> conf.get(HConstants.TEMPORARY_FS_DIRECTORY_KEY, HConstants.DEFAULT_TEMPORARY_HDFS_DIRECTORY);</span> |
| <span class="source-line-no">160</span><span id="line-160"> // if we limit the number of writers opened for sinking recovered edits</span> |
| <span class="source-line-no">161</span><span id="line-161"> this.splitWriterCreationBounded = conf.getBoolean(SPLIT_WRITER_CREATION_BOUNDED, false);</span> |
| <span class="source-line-no">162</span><span id="line-162"> this.bufferSize = this.conf.getLong(SPLIT_WAL_BUFFER_SIZE, 128 * 1024 * 1024);</span> |
| <span class="source-line-no">163</span><span id="line-163"> this.numWriterThreads = this.conf.getInt(SPLIT_WAL_WRITER_THREADS, 3);</span> |
| <span class="source-line-no">164</span><span id="line-164"> this.hfile = conf.getBoolean(WAL_SPLIT_TO_HFILE, DEFAULT_WAL_SPLIT_TO_HFILE);</span> |
| <span class="source-line-no">165</span><span id="line-165"> this.skipErrors = conf.getBoolean(SPLIT_SKIP_ERRORS_KEY, SPLIT_SKIP_ERRORS_DEFAULT);</span> |
| <span class="source-line-no">166</span><span id="line-166"> }</span> |
| <span class="source-line-no">167</span><span id="line-167"></span> |
| <span class="source-line-no">168</span><span id="line-168"> WALFactory getWalFactory() {</span> |
| <span class="source-line-no">169</span><span id="line-169"> return this.walFactory;</span> |
| <span class="source-line-no">170</span><span id="line-170"> }</span> |
| <span class="source-line-no">171</span><span id="line-171"></span> |
| <span class="source-line-no">172</span><span id="line-172"> FileStatus getFileBeingSplit() {</span> |
| <span class="source-line-no">173</span><span id="line-173"> return fileBeingSplit;</span> |
| <span class="source-line-no">174</span><span id="line-174"> }</span> |
| <span class="source-line-no">175</span><span id="line-175"></span> |
| <span class="source-line-no">176</span><span id="line-176"> String getTmpDirName() {</span> |
| <span class="source-line-no">177</span><span id="line-177"> return this.tmpDirName;</span> |
| <span class="source-line-no">178</span><span id="line-178"> }</span> |
| <span class="source-line-no">179</span><span id="line-179"></span> |
| <span class="source-line-no">180</span><span id="line-180"> Map<String, Map<byte[], Long>> getRegionMaxSeqIdInStores() {</span> |
| <span class="source-line-no">181</span><span id="line-181"> return regionMaxSeqIdInStores;</span> |
| <span class="source-line-no">182</span><span id="line-182"> }</span> |
| <span class="source-line-no">183</span><span id="line-183"></span> |
| <span class="source-line-no">184</span><span id="line-184"> /**</span> |
| <span class="source-line-no">185</span><span id="line-185"> * Splits a WAL file. Used by old {@link org.apache.hadoop.hbase.regionserver.SplitLogWorker} and</span> |
| <span class="source-line-no">186</span><span id="line-186"> * tests. Not used by new procedure-based WAL splitter.</span> |
| <span class="source-line-no">187</span><span id="line-187"> * @return false if it is interrupted by the progress-able.</span> |
| <span class="source-line-no">188</span><span id="line-188"> */</span> |
| <span class="source-line-no">189</span><span id="line-189"> public static boolean splitLogFile(Path walDir, FileStatus logfile, FileSystem walFS,</span> |
| <span class="source-line-no">190</span><span id="line-190"> Configuration conf, CancelableProgressable reporter, LastSequenceId idChecker,</span> |
| <span class="source-line-no">191</span><span id="line-191"> SplitLogWorkerCoordination splitLogWorkerCoordination, WALFactory factory,</span> |
| <span class="source-line-no">192</span><span id="line-192"> RegionServerServices rsServices) throws IOException {</span> |
| <span class="source-line-no">193</span><span id="line-193"> Path rootDir = CommonFSUtils.getRootDir(conf);</span> |
| <span class="source-line-no">194</span><span id="line-194"> FileSystem rootFS = rootDir.getFileSystem(conf);</span> |
| <span class="source-line-no">195</span><span id="line-195"> WALSplitter splitter = new WALSplitter(factory, conf, walDir, walFS, rootDir, rootFS, idChecker,</span> |
| <span class="source-line-no">196</span><span id="line-196"> splitLogWorkerCoordination, rsServices);</span> |
| <span class="source-line-no">197</span><span id="line-197"> // splitWAL returns a data structure with whether split is finished and if the file is corrupt.</span> |
| <span class="source-line-no">198</span><span id="line-198"> // We don't need to propagate corruption flag here because it is propagated by the</span> |
| <span class="source-line-no">199</span><span id="line-199"> // SplitLogWorkerCoordination.</span> |
| <span class="source-line-no">200</span><span id="line-200"> return splitter.splitWAL(logfile, reporter).isFinished();</span> |
| <span class="source-line-no">201</span><span id="line-201"> }</span> |
| <span class="source-line-no">202</span><span id="line-202"></span> |
| <span class="source-line-no">203</span><span id="line-203"> /**</span> |
| <span class="source-line-no">204</span><span id="line-204"> * Split a folder of WAL files. Delete the directory when done. Used by tools and unit tests. It</span> |
| <span class="source-line-no">205</span><span id="line-205"> * should be package private. It is public only because TestWALObserver is in a different package,</span> |
| <span class="source-line-no">206</span><span id="line-206"> * which uses this method to do log splitting.</span> |
| <span class="source-line-no">207</span><span id="line-207"> * @return List of output files created by the split.</span> |
| <span class="source-line-no">208</span><span id="line-208"> */</span> |
| <span class="source-line-no">209</span><span id="line-209"> public static List<Path> split(Path walRootDir, Path walsDir, Path archiveDir, FileSystem walFS,</span> |
| <span class="source-line-no">210</span><span id="line-210"> Configuration conf, final WALFactory factory) throws IOException {</span> |
| <span class="source-line-no">211</span><span id="line-211"> Path rootDir = CommonFSUtils.getRootDir(conf);</span> |
| <span class="source-line-no">212</span><span id="line-212"> FileSystem rootFS = rootDir.getFileSystem(conf);</span> |
| <span class="source-line-no">213</span><span id="line-213"> WALSplitter splitter = new WALSplitter(factory, conf, walRootDir, walFS, rootDir, rootFS);</span> |
| <span class="source-line-no">214</span><span id="line-214"> final List<FileStatus> wals =</span> |
| <span class="source-line-no">215</span><span id="line-215"> SplitLogManager.getFileList(conf, Collections.singletonList(walsDir), null);</span> |
| <span class="source-line-no">216</span><span id="line-216"> List<Path> splits = new ArrayList<>();</span> |
| <span class="source-line-no">217</span><span id="line-217"> if (!wals.isEmpty()) {</span> |
| <span class="source-line-no">218</span><span id="line-218"> for (FileStatus wal : wals) {</span> |
| <span class="source-line-no">219</span><span id="line-219"> SplitWALResult splitWALResult = splitter.splitWAL(wal, null);</span> |
| <span class="source-line-no">220</span><span id="line-220"> if (splitWALResult.isFinished()) {</span> |
| <span class="source-line-no">221</span><span id="line-221"> WALSplitUtil.archive(wal.getPath(), splitWALResult.isCorrupt(), archiveDir, walFS, conf);</span> |
| <span class="source-line-no">222</span><span id="line-222"> // splitter.outputSink.splits is marked as final, so no null check is needed</span> |
| <span class="source-line-no">223</span><span id="line-223"> splits.addAll(splitter.outputSink.splits);</span> |
| <span class="source-line-no">224</span><span id="line-224"> }</span> |
| <span class="source-line-no">225</span><span id="line-225"> }</span> |
| <span class="source-line-no">226</span><span id="line-226"> }</span> |
| <span class="source-line-no">227</span><span id="line-227"> if (!walFS.delete(walsDir, true)) {</span> |
| <span class="source-line-no">228</span><span id="line-228"> throw new IOException("Unable to delete src dir " + walsDir);</span> |
| <span class="source-line-no">229</span><span id="line-229"> }</span> |
| <span class="source-line-no">230</span><span id="line-230"> return splits;</span> |
| <span class="source-line-no">231</span><span id="line-231"> }</span> |
| <span class="source-line-no">232</span><span id="line-232"></span> |
| <span class="source-line-no">233</span><span id="line-233"> /**</span> |
| <span class="source-line-no">234</span><span id="line-234"> * Data structure returned by {@link WALSplitter#splitWAL(FileStatus, CancelableProgressable)}.</span> |
| <span class="source-line-no">235</span><span id="line-235"> * Test {@link #isFinished()} to see if we are done with the WAL and {@link #isCorrupt()} to see</span> |
| <span class="source-line-no">236</span><span id="line-236"> * if the WAL is corrupt.</span> |
| <span class="source-line-no">237</span><span id="line-237"> */</span> |
| <span class="source-line-no">238</span><span id="line-238"> static final class SplitWALResult {</span> |
| <span class="source-line-no">239</span><span id="line-239"> private final boolean finished;</span> |
| <span class="source-line-no">240</span><span id="line-240"> private final boolean corrupt;</span> |
| <span class="source-line-no">241</span><span id="line-241"></span> |
| <span class="source-line-no">242</span><span id="line-242"> private SplitWALResult(boolean finished, boolean corrupt) {</span> |
| <span class="source-line-no">243</span><span id="line-243"> this.finished = finished;</span> |
| <span class="source-line-no">244</span><span id="line-244"> this.corrupt = corrupt;</span> |
| <span class="source-line-no">245</span><span id="line-245"> }</span> |
| <span class="source-line-no">246</span><span id="line-246"></span> |
| <span class="source-line-no">247</span><span id="line-247"> public boolean isFinished() {</span> |
| <span class="source-line-no">248</span><span id="line-248"> return finished;</span> |
| <span class="source-line-no">249</span><span id="line-249"> }</span> |
| <span class="source-line-no">250</span><span id="line-250"></span> |
| <span class="source-line-no">251</span><span id="line-251"> public boolean isCorrupt() {</span> |
| <span class="source-line-no">252</span><span id="line-252"> return corrupt;</span> |
| <span class="source-line-no">253</span><span id="line-253"> }</span> |
| <span class="source-line-no">254</span><span id="line-254"> }</span> |
| <span class="source-line-no">255</span><span id="line-255"></span> |
| <span class="source-line-no">256</span><span id="line-256"> /**</span> |
| <span class="source-line-no">257</span><span id="line-257"> * Setup the output sinks and entry buffers ahead of splitting WAL.</span> |
| <span class="source-line-no">258</span><span id="line-258"> */</span> |
| <span class="source-line-no">259</span><span id="line-259"> private void createOutputSinkAndEntryBuffers() {</span> |
| <span class="source-line-no">260</span><span id="line-260"> PipelineController controller = new PipelineController();</span> |
| <span class="source-line-no">261</span><span id="line-261"> if (this.hfile) {</span> |
| <span class="source-line-no">262</span><span id="line-262"> this.entryBuffers = new BoundedEntryBuffers(controller, this.bufferSize);</span> |
| <span class="source-line-no">263</span><span id="line-263"> this.outputSink = new BoundedRecoveredHFilesOutputSink(this, controller, this.entryBuffers,</span> |
| <span class="source-line-no">264</span><span id="line-264"> this.numWriterThreads);</span> |
| <span class="source-line-no">265</span><span id="line-265"> } else if (this.splitWriterCreationBounded) {</span> |
| <span class="source-line-no">266</span><span id="line-266"> this.entryBuffers = new BoundedEntryBuffers(controller, this.bufferSize);</span> |
| <span class="source-line-no">267</span><span id="line-267"> this.outputSink = new BoundedRecoveredEditsOutputSink(this, controller, this.entryBuffers,</span> |
| <span class="source-line-no">268</span><span id="line-268"> this.numWriterThreads);</span> |
| <span class="source-line-no">269</span><span id="line-269"> } else {</span> |
| <span class="source-line-no">270</span><span id="line-270"> this.entryBuffers = new EntryBuffers(controller, this.bufferSize);</span> |
| <span class="source-line-no">271</span><span id="line-271"> this.outputSink =</span> |
| <span class="source-line-no">272</span><span id="line-272"> new RecoveredEditsOutputSink(this, controller, this.entryBuffers, this.numWriterThreads);</span> |
| <span class="source-line-no">273</span><span id="line-273"> }</span> |
| <span class="source-line-no">274</span><span id="line-274"> }</span> |
| <span class="source-line-no">275</span><span id="line-275"></span> |
| <span class="source-line-no">276</span><span id="line-276"> /**</span> |
| <span class="source-line-no">277</span><span id="line-277"> * WAL splitting implementation, splits one WAL file.</span> |
| <span class="source-line-no">278</span><span id="line-278"> * @param walStatus should be for an actual WAL file.</span> |
| <span class="source-line-no">279</span><span id="line-279"> */</span> |
| <span class="source-line-no">280</span><span id="line-280"> SplitWALResult splitWAL(FileStatus walStatus, CancelableProgressable cancel) throws IOException {</span> |
| <span class="source-line-no">281</span><span id="line-281"> Path wal = walStatus.getPath();</span> |
| <span class="source-line-no">282</span><span id="line-282"> Preconditions.checkArgument(walStatus.isFile(), "Not a regular file " + wal.toString());</span> |
| <span class="source-line-no">283</span><span id="line-283"> boolean corrupt = false;</span> |
| <span class="source-line-no">284</span><span id="line-284"> int interval = conf.getInt("hbase.splitlog.report.interval.loglines", 1024);</span> |
| <span class="source-line-no">285</span><span id="line-285"> boolean outputSinkStarted = false;</span> |
| <span class="source-line-no">286</span><span id="line-286"> boolean cancelled = false;</span> |
| <span class="source-line-no">287</span><span id="line-287"> int editsCount = 0;</span> |
| <span class="source-line-no">288</span><span id="line-288"> int editsSkipped = 0;</span> |
| <span class="source-line-no">289</span><span id="line-289"> MonitoredTask status = TaskMonitor.get()</span> |
| <span class="source-line-no">290</span><span id="line-290"> .createStatus("Splitting " + wal + " to temporary staging area.", false, true);</span> |
| <span class="source-line-no">291</span><span id="line-291"> WALStreamReader walReader = null;</span> |
| <span class="source-line-no">292</span><span id="line-292"> this.fileBeingSplit = walStatus;</span> |
| <span class="source-line-no">293</span><span id="line-293"> long startTS = EnvironmentEdgeManager.currentTime();</span> |
| <span class="source-line-no">294</span><span id="line-294"> long length = walStatus.getLen();</span> |
| <span class="source-line-no">295</span><span id="line-295"> String lengthStr = StringUtils.humanSize(length);</span> |
| <span class="source-line-no">296</span><span id="line-296"> createOutputSinkAndEntryBuffers();</span> |
| <span class="source-line-no">297</span><span id="line-297"> try {</span> |
| <span class="source-line-no">298</span><span id="line-298"> String logStr = "Splitting " + wal + ", size=" + lengthStr + " (" + length + "bytes)";</span> |
| <span class="source-line-no">299</span><span id="line-299"> LOG.info(logStr);</span> |
| <span class="source-line-no">300</span><span id="line-300"> status.setStatus(logStr);</span> |
| <span class="source-line-no">301</span><span id="line-301"> if (cancel != null &amp;&amp; !cancel.progress()) {</span> |
| <span class="source-line-no">302</span><span id="line-302"> cancelled = true;</span> |
| <span class="source-line-no">303</span><span id="line-303"> return new SplitWALResult(false, corrupt);</span> |
| <span class="source-line-no">304</span><span id="line-304"> }</span> |
| <span class="source-line-no">305</span><span id="line-305"> walReader = getReader(walStatus, this.skipErrors, cancel);</span> |
| <span class="source-line-no">306</span><span id="line-306"> if (walReader == null) {</span> |
| <span class="source-line-no">307</span><span id="line-307"> LOG.warn("Nothing in {}; empty?", wal);</span> |
| <span class="source-line-no">308</span><span id="line-308"> return new SplitWALResult(true, corrupt);</span> |
| <span class="source-line-no">309</span><span id="line-309"> }</span> |
| <span class="source-line-no">310</span><span id="line-310"> LOG.info("Open {} took {}ms", wal, EnvironmentEdgeManager.currentTime() - startTS);</span> |
| <span class="source-line-no">311</span><span id="line-311"> int numOpenedFilesBeforeReporting = conf.getInt("hbase.splitlog.report.openedfiles", 3);</span> |
| <span class="source-line-no">312</span><span id="line-312"> int numOpenedFilesLastCheck = 0;</span> |
| <span class="source-line-no">313</span><span id="line-313"> outputSink.setReporter(cancel);</span> |
| <span class="source-line-no">314</span><span id="line-314"> outputSink.setStatus(status);</span> |
| <span class="source-line-no">315</span><span id="line-315"> outputSink.startWriterThreads();</span> |
| <span class="source-line-no">316</span><span id="line-316"> outputSinkStarted = true;</span> |
| <span class="source-line-no">317</span><span id="line-317"> Entry entry;</span> |
| <span class="source-line-no">318</span><span id="line-318"> startTS = EnvironmentEdgeManager.currentTime();</span> |
| <span class="source-line-no">319</span><span id="line-319"> while ((entry = getNextLogLine(walReader, wal, this.skipErrors)) != null) {</span> |
| <span class="source-line-no">320</span><span id="line-320"> if (WALEdit.isReplicationMarkerEdit(entry.getEdit())) {</span> |
| <span class="source-line-no">321</span><span id="line-321"> // Skip processing the replication marker edits.</span> |
| <span class="source-line-no">322</span><span id="line-322"> if (LOG.isDebugEnabled()) {</span> |
| <span class="source-line-no">323</span><span id="line-323"> LOG.debug("Ignoring Replication marker edits.");</span> |
| <span class="source-line-no">324</span><span id="line-324"> }</span> |
| <span class="source-line-no">325</span><span id="line-325"> continue;</span> |
| <span class="source-line-no">326</span><span id="line-326"> }</span> |
| <span class="source-line-no">327</span><span id="line-327"> byte[] region = entry.getKey().getEncodedRegionName();</span> |
| <span class="source-line-no">328</span><span id="line-328"> String encodedRegionNameAsStr = Bytes.toString(region);</span> |
| <span class="source-line-no">329</span><span id="line-329"> Long lastFlushedSequenceId = lastFlushedSequenceIds.get(encodedRegionNameAsStr);</span> |
| <span class="source-line-no">330</span><span id="line-330"> if (lastFlushedSequenceId == null) {</span> |
| <span class="source-line-no">331</span><span id="line-331"> if (</span> |
| <span class="source-line-no">332</span><span id="line-332"> !(isRegionDirPresentUnderRoot(entry.getKey().getTableName(), encodedRegionNameAsStr))</span> |
| <span class="source-line-no">333</span><span id="line-333"> ) {</span> |
| <span class="source-line-no">334</span><span id="line-334"> // The region directory itself is not present in the FS. This indicates that</span> |
| <span class="source-line-no">335</span><span id="line-335"> // the region/table is already removed. We can just skip all the edits for this</span> |
| <span class="source-line-no">336</span><span id="line-336"> // region. Setting lastFlushedSequenceId as Long.MAX_VALUE so that all edits</span> |
| <span class="source-line-no">337</span><span id="line-337"> // will get skipped by the seqId check below.</span> |
| <span class="source-line-no">338</span><span id="line-338"> // See more details at https://issues.apache.org/jira/browse/HBASE-24189</span> |
| <span class="source-line-no">339</span><span id="line-339"> LOG.info("{} no longer in filesystem; skipping all edits.", encodedRegionNameAsStr);</span> |
| <span class="source-line-no">340</span><span id="line-340"> lastFlushedSequenceId = Long.MAX_VALUE;</span> |
| <span class="source-line-no">341</span><span id="line-341"> } else {</span> |
| <span class="source-line-no">342</span><span id="line-342"> if (sequenceIdChecker != null) {</span> |
| <span class="source-line-no">343</span><span id="line-343"> RegionStoreSequenceIds ids = sequenceIdChecker.getLastSequenceId(region);</span> |
| <span class="source-line-no">344</span><span id="line-344"> Map&lt;byte[], Long&gt; maxSeqIdInStores = new TreeMap&lt;&gt;(Bytes.BYTES_COMPARATOR);</span> |
| <span class="source-line-no">345</span><span id="line-345"> for (StoreSequenceId storeSeqId : ids.getStoreSequenceIdList()) {</span> |
| <span class="source-line-no">346</span><span id="line-346"> maxSeqIdInStores.put(storeSeqId.getFamilyName().toByteArray(),</span> |
| <span class="source-line-no">347</span><span id="line-347"> storeSeqId.getSequenceId());</span> |
| <span class="source-line-no">348</span><span id="line-348"> }</span> |
| <span class="source-line-no">349</span><span id="line-349"> regionMaxSeqIdInStores.put(encodedRegionNameAsStr, maxSeqIdInStores);</span> |
| <span class="source-line-no">350</span><span id="line-350"> lastFlushedSequenceId = ids.getLastFlushedSequenceId();</span> |
| <span class="source-line-no">351</span><span id="line-351"> if (LOG.isDebugEnabled()) {</span> |
| <span class="source-line-no">352</span><span id="line-352"> LOG.debug("Last flushed sequenceid for " + encodedRegionNameAsStr + ": "</span> |
| <span class="source-line-no">353</span><span id="line-353"> + TextFormat.shortDebugString(ids));</span> |
| <span class="source-line-no">354</span><span id="line-354"> }</span> |
| <span class="source-line-no">355</span><span id="line-355"> }</span> |
| <span class="source-line-no">356</span><span id="line-356"> if (lastFlushedSequenceId == null) {</span> |
| <span class="source-line-no">357</span><span id="line-357"> lastFlushedSequenceId = -1L;</span> |
| <span class="source-line-no">358</span><span id="line-358"> }</span> |
| <span class="source-line-no">359</span><span id="line-359"> }</span> |
| <span class="source-line-no">360</span><span id="line-360"> lastFlushedSequenceIds.put(encodedRegionNameAsStr, lastFlushedSequenceId);</span> |
| <span class="source-line-no">361</span><span id="line-361"> }</span> |
| <span class="source-line-no">362</span><span id="line-362"> editsCount++;</span> |
| <span class="source-line-no">363</span><span id="line-363"> if (lastFlushedSequenceId >= entry.getKey().getSequenceId()) {</span> |
| <span class="source-line-no">364</span><span id="line-364"> editsSkipped++;</span> |
| <span class="source-line-no">365</span><span id="line-365"> continue;</span> |
| <span class="source-line-no">366</span><span id="line-366"> }</span> |
| <span class="source-line-no">367</span><span id="line-367"> // Don't send Compaction/Close/Open region events to recovered edit type sinks.</span> |
| <span class="source-line-no">368</span><span id="line-368"> if (entry.getEdit().isMetaEdit() &amp;&amp; !outputSink.keepRegionEvent(entry)) {</span> |
| <span class="source-line-no">369</span><span id="line-369"> editsSkipped++;</span> |
| <span class="source-line-no">370</span><span id="line-370"> continue;</span> |
| <span class="source-line-no">371</span><span id="line-371"> }</span> |
| <span class="source-line-no">372</span><span id="line-372"> entryBuffers.appendEntry(entry);</span> |
| <span class="source-line-no">373</span><span id="line-373"> int moreWritersFromLastCheck = this.getNumOpenWriters() - numOpenedFilesLastCheck;</span> |
| <span class="source-line-no">374</span><span id="line-374"> // If sufficient edits have passed, check if we should report progress.</span> |
| <span class="source-line-no">375</span><span id="line-375"> if (</span> |
| <span class="source-line-no">376</span><span id="line-376"> editsCount % interval == 0 || moreWritersFromLastCheck > numOpenedFilesBeforeReporting</span> |
| <span class="source-line-no">377</span><span id="line-377"> ) {</span> |
| <span class="source-line-no">378</span><span id="line-378"> numOpenedFilesLastCheck = this.getNumOpenWriters();</span> |
| <span class="source-line-no">379</span><span id="line-379"> String countsStr = (editsCount - (editsSkipped + outputSink.getTotalSkippedEdits()))</span> |
| <span class="source-line-no">380</span><span id="line-380"> + " edits, skipped " + editsSkipped + " edits.";</span> |
| <span class="source-line-no">381</span><span id="line-381"> status.setStatus("Split " + countsStr);</span> |
| <span class="source-line-no">382</span><span id="line-382"> if (cancel != null &amp;&amp; !cancel.progress()) {</span> |
| <span class="source-line-no">383</span><span id="line-383"> cancelled = true;</span> |
| <span class="source-line-no">384</span><span id="line-384"> return new SplitWALResult(false, corrupt);</span> |
| <span class="source-line-no">385</span><span id="line-385"> }</span> |
| <span class="source-line-no">386</span><span id="line-386"> }</span> |
| <span class="source-line-no">387</span><span id="line-387"> }</span> |
| <span class="source-line-no">388</span><span id="line-388"> } catch (InterruptedException ie) {</span> |
| <span class="source-line-no">389</span><span id="line-389"> IOException iie = new InterruptedIOException();</span> |
| <span class="source-line-no">390</span><span id="line-390"> iie.initCause(ie);</span> |
| <span class="source-line-no">391</span><span id="line-391"> throw iie;</span> |
| <span class="source-line-no">392</span><span id="line-392"> } catch (CorruptedLogFileException e) {</span> |
| <span class="source-line-no">393</span><span id="line-393"> LOG.warn("Could not parse, corrupt WAL={}", wal, e);</span> |
| <span class="source-line-no">394</span><span id="line-394"> // If splitLogWorkerCoordination, then it's old-school zk-coordinated splitting so update</span> |
| <span class="source-line-no">395</span><span id="line-395"> // zk. Otherwise, it is the newer procedure-based WAL split which has no zk component.</span> |
| <span class="source-line-no">396</span><span id="line-396"> if (this.splitLogWorkerCoordination != null) {</span> |
| <span class="source-line-no">397</span><span id="line-397"> // Some tests pass in a csm of null.</span> |
| <span class="source-line-no">398</span><span id="line-398"> splitLogWorkerCoordination.markCorrupted(walRootDir, wal.getName(), walFS);</span> |
| <span class="source-line-no">399</span><span id="line-399"> }</span> |
| <span class="source-line-no">400</span><span id="line-400"> corrupt = true;</span> |
| <span class="source-line-no">401</span><span id="line-401"> } catch (IOException e) {</span> |
| <span class="source-line-no">402</span><span id="line-402"> e = e instanceof RemoteException ? ((RemoteException) e).unwrapRemoteException() : e;</span> |
| <span class="source-line-no">403</span><span id="line-403"> throw e;</span> |
| <span class="source-line-no">404</span><span id="line-404"> } finally {</span> |
| <span class="source-line-no">405</span><span id="line-405"> final String log = "Finishing writing output for " + wal + " so closing down";</span> |
| <span class="source-line-no">406</span><span id="line-406"> LOG.debug(log);</span> |
| <span class="source-line-no">407</span><span id="line-407"> status.setStatus(log);</span> |
| <span class="source-line-no">408</span><span id="line-408"> if (null != walReader) {</span> |
| <span class="source-line-no">409</span><span id="line-409"> walReader.close();</span> |
| <span class="source-line-no">410</span><span id="line-410"> }</span> |
| <span class="source-line-no">411</span><span id="line-411"> try {</span> |
| <span class="source-line-no">412</span><span id="line-412"> if (outputSinkStarted) {</span> |
| <span class="source-line-no">413</span><span id="line-413"> // Set cancelled to true as the immediate following statement will reset its value.</span> |
| <span class="source-line-no">414</span><span id="line-414"> // If close() throws an exception, cancelled will have the right value</span> |
| <span class="source-line-no">415</span><span id="line-415"> cancelled = true;</span> |
| <span class="source-line-no">416</span><span id="line-416"> cancelled = outputSink.close() == null;</span> |
| <span class="source-line-no">417</span><span id="line-417"> }</span> |
| <span class="source-line-no">418</span><span id="line-418"> } finally {</span> |
| <span class="source-line-no">419</span><span id="line-419"> long processCost = EnvironmentEdgeManager.currentTime() - startTS;</span> |
| <span class="source-line-no">420</span><span id="line-420"> // See if length got updated post lease recovery</span> |
| <span class="source-line-no">421</span><span id="line-421"> String msg = "Processed " + editsCount + " edits across "</span> |
| <span class="source-line-no">422</span><span id="line-422"> + outputSink.getNumberOfRecoveredRegions() + " Regions in " + processCost</span> |
| <span class="source-line-no">423</span><span id="line-423"> + " ms; skipped=" + editsSkipped + "; WAL=" + wal + ", size=" + lengthStr + ", length="</span> |
| <span class="source-line-no">424</span><span id="line-424"> + length + ", corrupted=" + corrupt + ", cancelled=" + cancelled;</span> |
| <span class="source-line-no">425</span><span id="line-425"> LOG.info(msg);</span> |
| <span class="source-line-no">426</span><span id="line-426"> status.markComplete(msg);</span> |
| <span class="source-line-no">427</span><span id="line-427"> if (LOG.isDebugEnabled()) {</span> |
| <span class="source-line-no">428</span><span id="line-428"> LOG.debug("Completed split of {}, journal: {}", wal, status.prettyPrintJournal());</span> |
| <span class="source-line-no">429</span><span id="line-429"> }</span> |
| <span class="source-line-no">430</span><span id="line-430"> }</span> |
| <span class="source-line-no">431</span><span id="line-431"> }</span> |
| <span class="source-line-no">432</span><span id="line-432"> return new SplitWALResult(!cancelled, corrupt);</span> |
| <span class="source-line-no">433</span><span id="line-433"> }</span> |
| <span class="source-line-no">434</span><span id="line-434"></span> |
| <span class="source-line-no">435</span><span id="line-435"> private boolean isRegionDirPresentUnderRoot(TableName tn, String region) throws IOException {</span> |
| <span class="source-line-no">436</span><span id="line-436"> return this.rootFS.exists(CommonFSUtils.getRegionDir(this.rootDir, tn, region));</span> |
| <span class="source-line-no">437</span><span id="line-437"> }</span> |
| <span class="source-line-no">438</span><span id="line-438"></span> |
| <span class="source-line-no">439</span><span id="line-439"> /**</span> |
| <span class="source-line-no">440</span><span id="line-440"> * Create a new {@link WALStreamReader} for reading logs to split.</span> |
| <span class="source-line-no">441</span><span id="line-441"> * @return Returns null if file has length zero or file can't be found.</span> |
| <span class="source-line-no">442</span><span id="line-442"> */</span> |
| <span class="source-line-no">443</span><span id="line-443"> protected WALStreamReader getReader(FileStatus walStatus, boolean skipErrors,</span> |
| <span class="source-line-no">444</span><span id="line-444"> CancelableProgressable cancel) throws IOException, CorruptedLogFileException {</span> |
| <span class="source-line-no">445</span><span id="line-445"> Path path = walStatus.getPath();</span> |
| <span class="source-line-no">446</span><span id="line-446"> long length = walStatus.getLen();</span> |
| <span class="source-line-no">447</span><span id="line-447"> WALStreamReader in;</span> |
| <span class="source-line-no">448</span><span id="line-448"></span> |
| <span class="source-line-no">449</span><span id="line-449"> // Check for possibly empty file. With appends, currently Hadoop reports a</span> |
| <span class="source-line-no">450</span><span id="line-450"> // zero length even if the file has been sync'd. Revisit if HDFS-376 or</span> |
| <span class="source-line-no">451</span><span id="line-451"> // HDFS-878 is committed.</span> |
| <span class="source-line-no">452</span><span id="line-452"> if (length &lt;= 0) {</span> |
| <span class="source-line-no">453</span><span id="line-453"> LOG.warn("File {} might be still open, length is 0", path);</span> |
| <span class="source-line-no">454</span><span id="line-454"> }</span> |
| <span class="source-line-no">455</span><span id="line-455"></span> |
| <span class="source-line-no">456</span><span id="line-456"> try {</span> |
| <span class="source-line-no">457</span><span id="line-457"> RecoverLeaseFSUtils.recoverFileLease(walFS, path, conf, cancel);</span> |
| <span class="source-line-no">458</span><span id="line-458"> try {</span> |
| <span class="source-line-no">459</span><span id="line-459"> in = getReader(path, cancel);</span> |
| <span class="source-line-no">460</span><span id="line-460"> } catch (EOFException e) {</span> |
| <span class="source-line-no">461</span><span id="line-461"> if (length &lt;= 0) {</span> |
| <span class="source-line-no">462</span><span id="line-462"> // TODO should we ignore an empty, not-last log file if skip.errors</span> |
| <span class="source-line-no">463</span><span id="line-463"> // is false? Either way, the caller should decide what to do. E.g.</span> |
| <span class="source-line-no">464</span><span id="line-464"> // ignore if this is the last log in sequence.</span> |
| <span class="source-line-no">465</span><span id="line-465"> // TODO is this scenario still possible if the log has been</span> |
| <span class="source-line-no">466</span><span id="line-466"> // recovered (i.e. closed)</span> |
| <span class="source-line-no">467</span><span id="line-467"> LOG.warn("Could not open {} for reading. File is empty", path, e);</span> |
| <span class="source-line-no">468</span><span id="line-468"> }</span> |
| <span class="source-line-no">469</span><span id="line-469"> // EOFException being ignored</span> |
| <span class="source-line-no">470</span><span id="line-470"> return null;</span> |
| <span class="source-line-no">471</span><span id="line-471"> }</span> |
| <span class="source-line-no">472</span><span id="line-472"> } catch (IOException e) {</span> |
| <span class="source-line-no">473</span><span id="line-473"> if (e instanceof FileNotFoundException) {</span> |
| <span class="source-line-no">474</span><span id="line-474"> // A wal file may not exist anymore. Nothing can be recovered so move on</span> |
| <span class="source-line-no">475</span><span id="line-475"> LOG.warn("File {} does not exist anymore", path, e);</span> |
| <span class="source-line-no">476</span><span id="line-476"> return null;</span> |
| <span class="source-line-no">477</span><span id="line-477"> }</span> |
| <span class="source-line-no">478</span><span id="line-478"> if (!skipErrors || e instanceof InterruptedIOException) {</span> |
| <span class="source-line-no">479</span><span id="line-479"> throw e; // Don't mark the file corrupted if interrupted, or not skipErrors</span> |
| <span class="source-line-no">480</span><span id="line-480"> }</span> |
| <span class="source-line-no">481</span><span id="line-481"> throw new CorruptedLogFileException("skipErrors=true; could not open " + path + ", skipping",</span> |
| <span class="source-line-no">482</span><span id="line-482"> e);</span> |
| <span class="source-line-no">483</span><span id="line-483"> }</span> |
| <span class="source-line-no">484</span><span id="line-484"> return in;</span> |
| <span class="source-line-no">485</span><span id="line-485"> }</span> |
| <span class="source-line-no">486</span><span id="line-486"></span> |
| <span class="source-line-no">487</span><span id="line-487"> private Entry getNextLogLine(WALStreamReader in, Path path, boolean skipErrors)</span> |
| <span class="source-line-no">488</span><span id="line-488"> throws CorruptedLogFileException, IOException {</span> |
| <span class="source-line-no">489</span><span id="line-489"> try {</span> |
| <span class="source-line-no">490</span><span id="line-490"> return in.next();</span> |
| <span class="source-line-no">491</span><span id="line-491"> } catch (EOFException eof) {</span> |
| <span class="source-line-no">492</span><span id="line-492"> // truncated files are expected if a RS crashes (see HBASE-2643)</span> |
| <span class="source-line-no">493</span><span id="line-493"> LOG.info("EOF from {}; continuing.", path);</span> |
| <span class="source-line-no">494</span><span id="line-494"> return null;</span> |
| <span class="source-line-no">495</span><span id="line-495"> } catch (IOException e) {</span> |
| <span class="source-line-no">496</span><span id="line-496"> // If the IOE resulted from bad file format,</span> |
| <span class="source-line-no">497</span><span id="line-497"> // then this problem is idempotent and retrying won't help</span> |
| <span class="source-line-no">498</span><span id="line-498"> if (</span> |
| <span class="source-line-no">499</span><span id="line-499"> e.getCause() != null &amp;&amp; (e.getCause() instanceof ParseException</span> |
| <span class="source-line-no">500</span><span id="line-500"> || e.getCause() instanceof org.apache.hadoop.fs.ChecksumException)</span> |
| <span class="source-line-no">501</span><span id="line-501"> ) {</span> |
| <span class="source-line-no">502</span><span id="line-502"> LOG.warn("Parse exception from {}; continuing", path, e);</span> |
| <span class="source-line-no">503</span><span id="line-503"> return null;</span> |
| <span class="source-line-no">504</span><span id="line-504"> }</span> |
| <span class="source-line-no">505</span><span id="line-505"> if (!skipErrors) {</span> |
| <span class="source-line-no">506</span><span id="line-506"> throw e;</span> |
| <span class="source-line-no">507</span><span id="line-507"> }</span> |
| <span class="source-line-no">508</span><span id="line-508"> throw new CorruptedLogFileException("skipErrors=true Ignoring exception"</span> |
| <span class="source-line-no">509</span><span id="line-509"> + " while parsing wal " + path + ". Marking as corrupted", e);</span> |
| <span class="source-line-no">510</span><span id="line-510"> }</span> |
| <span class="source-line-no">511</span><span id="line-511"> }</span> |
| <span class="source-line-no">512</span><span id="line-512"></span> |
| <span class="source-line-no">513</span><span id="line-513"> /**</span> |
| <span class="source-line-no">514</span><span id="line-514"> * Create a new {@link WALProvider.Writer} for writing log splits.</span> |
| <span class="source-line-no">515</span><span id="line-515"> * @return a new Writer instance, caller should close</span> |
| <span class="source-line-no">516</span><span id="line-516"> */</span> |
| <span class="source-line-no">517</span><span id="line-517"> protected WALProvider.Writer createWriter(Path logfile) throws IOException {</span> |
| <span class="source-line-no">518</span><span id="line-518"> return walFactory.createRecoveredEditsWriter(walFS, logfile);</span> |
| <span class="source-line-no">519</span><span id="line-519"> }</span> |
| <span class="source-line-no">520</span><span id="line-520"></span> |
| <span class="source-line-no">521</span><span id="line-521"> /**</span> |
| <span class="source-line-no">522</span><span id="line-522"> * Create a new {@link WALStreamReader} for reading logs to split.</span> |
| <span class="source-line-no">523</span><span id="line-523"> * @return new Reader instance, caller should close</span> |
| <span class="source-line-no">524</span><span id="line-524"> */</span> |
| <span class="source-line-no">525</span><span id="line-525"> private WALStreamReader getReader(Path curLogFile, CancelableProgressable reporter)</span> |
| <span class="source-line-no">526</span><span id="line-526"> throws IOException {</span> |
| <span class="source-line-no">527</span><span id="line-527"> return walFactory.createStreamReader(walFS, curLogFile, reporter);</span> |
| <span class="source-line-no">528</span><span id="line-528"> }</span> |
| <span class="source-line-no">529</span><span id="line-529"></span> |
| <span class="source-line-no">530</span><span id="line-530"> /**</span> |
| <span class="source-line-no">531</span><span id="line-531"> * Get current open writers</span> |
| <span class="source-line-no">532</span><span id="line-532"> */</span> |
| <span class="source-line-no">533</span><span id="line-533"> private int getNumOpenWriters() {</span> |
| <span class="source-line-no">534</span><span id="line-534"> int result = 0;</span> |
| <span class="source-line-no">535</span><span id="line-535"> if (this.outputSink != null) {</span> |
| <span class="source-line-no">536</span><span id="line-536"> result += this.outputSink.getNumOpenWriters();</span> |
| <span class="source-line-no">537</span><span id="line-537"> }</span> |
| <span class="source-line-no">538</span><span id="line-538"> return result;</span> |
| <span class="source-line-no">539</span><span id="line-539"> }</span> |
| <span class="source-line-no">540</span><span id="line-540"></span> |
| <span class="source-line-no">541</span><span id="line-541"> /**</span> |
| <span class="source-line-no">542</span><span id="line-542"> * Contains some methods to control WAL-entries producer / consumer interactions</span> |
| <span class="source-line-no">543</span><span id="line-543"> */</span> |
| <span class="source-line-no">544</span><span id="line-544"> public static class PipelineController {</span> |
| <span class="source-line-no">545</span><span id="line-545"> // If an exception is thrown by one of the other threads, it will be</span> |
| <span class="source-line-no">546</span><span id="line-546"> // stored here.</span> |
| <span class="source-line-no">547</span><span id="line-547"> AtomicReference&lt;Throwable&gt; thrown = new AtomicReference&lt;&gt;();</span> |
| <span class="source-line-no">548</span><span id="line-548"></span> |
| <span class="source-line-no">549</span><span id="line-549"> // Wait/notify for when data has been produced by the writer thread,</span> |
| <span class="source-line-no">550</span><span id="line-550"> // consumed by the reader thread, or an exception occurred</span> |
| <span class="source-line-no">551</span><span id="line-551"> final Object dataAvailable = new Object();</span> |
| <span class="source-line-no">552</span><span id="line-552"></span> |
| <span class="source-line-no">553</span><span id="line-553"> void writerThreadError(Throwable t) {</span> |
| <span class="source-line-no">554</span><span id="line-554"> thrown.compareAndSet(null, t);</span> |
| <span class="source-line-no">555</span><span id="line-555"> }</span> |
| <span class="source-line-no">556</span><span id="line-556"></span> |
| <span class="source-line-no">557</span><span id="line-557"> /**</span> |
| <span class="source-line-no">558</span><span id="line-558"> * Check for errors in the writer threads. If any is found, rethrow it.</span> |
| <span class="source-line-no">559</span><span id="line-559"> */</span> |
| <span class="source-line-no">560</span><span id="line-560"> void checkForErrors() throws IOException {</span> |
| <span class="source-line-no">561</span><span id="line-561"> Throwable thrown = this.thrown.get();</span> |
| <span class="source-line-no">562</span><span id="line-562"> if (thrown == null) {</span> |
| <span class="source-line-no">563</span><span id="line-563"> return;</span> |
| <span class="source-line-no">564</span><span id="line-564"> }</span> |
| <span class="source-line-no">565</span><span id="line-565"> if (thrown instanceof IOException) {</span> |
| <span class="source-line-no">566</span><span id="line-566"> throw new IOException(thrown);</span> |
| <span class="source-line-no">567</span><span id="line-567"> } else {</span> |
| <span class="source-line-no">568</span><span id="line-568"> throw new RuntimeException(thrown);</span> |
| <span class="source-line-no">569</span><span id="line-569"> }</span> |
| <span class="source-line-no">570</span><span id="line-570"> }</span> |
| <span class="source-line-no">571</span><span id="line-571"> }</span> |
| <span class="source-line-no">572</span><span id="line-572"></span> |
| <span class="source-line-no">573</span><span id="line-573"> static class CorruptedLogFileException extends Exception {</span> |
| <span class="source-line-no">574</span><span id="line-574"> private static final long serialVersionUID = 1L;</span> |
| <span class="source-line-no">575</span><span id="line-575"></span> |
| <span class="source-line-no">576</span><span id="line-576"> CorruptedLogFileException(String s) {</span> |
| <span class="source-line-no">577</span><span id="line-577"> super(s);</span> |
| <span class="source-line-no">578</span><span id="line-578"> }</span> |
| <span class="source-line-no">579</span><span id="line-579"></span> |
| <span class="source-line-no">580</span><span id="line-580"> /**</span> |
| <span class="source-line-no">581</span><span id="line-581"> * CorruptedLogFileException with cause</span> |
| <span class="source-line-no">582</span><span id="line-582"> * @param message the message for this exception</span> |
| <span class="source-line-no">583</span><span id="line-583"> * @param cause the cause for this exception</span> |
| <span class="source-line-no">584</span><span id="line-584"> */</span> |
| <span class="source-line-no">585</span><span id="line-585"> CorruptedLogFileException(String message, Throwable cause) {</span> |
| <span class="source-line-no">586</span><span id="line-586"> super(message, cause);</span> |
| <span class="source-line-no">587</span><span id="line-587"> }</span> |
| <span class="source-line-no">588</span><span id="line-588"> }</span> |
| <span class="source-line-no">589</span><span id="line-589">}</span> |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| </pre> |
| </div> |
| </main> |
| </body> |
| </html> |