| <!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd"> |
| <html lang="en"> |
| <head> |
| <title>Source code</title> |
| <link rel="stylesheet" type="text/css" href="../../../../../../stylesheet.css" title="Style"> |
| </head> |
| <body> |
| <div class="sourceContainer"> |
| <pre><span class="sourceLineNo">001</span>/*<a name="line.1"></a> |
| <span class="sourceLineNo">002</span> * Licensed to the Apache Software Foundation (ASF) under one<a name="line.2"></a> |
| <span class="sourceLineNo">003</span> * or more contributor license agreements. See the NOTICE file<a name="line.3"></a> |
| <span class="sourceLineNo">004</span> * distributed with this work for additional information<a name="line.4"></a> |
| <span class="sourceLineNo">005</span> * regarding copyright ownership. The ASF licenses this file<a name="line.5"></a> |
| <span class="sourceLineNo">006</span> * to you under the Apache License, Version 2.0 (the<a name="line.6"></a> |
| <span class="sourceLineNo">007</span> * "License"); you may not use this file except in compliance<a name="line.7"></a> |
| <span class="sourceLineNo">008</span> * with the License. You may obtain a copy of the License at<a name="line.8"></a> |
| <span class="sourceLineNo">009</span> *<a name="line.9"></a> |
| <span class="sourceLineNo">010</span> * http://www.apache.org/licenses/LICENSE-2.0<a name="line.10"></a> |
| <span class="sourceLineNo">011</span> *<a name="line.11"></a> |
| <span class="sourceLineNo">012</span> * Unless required by applicable law or agreed to in writing, software<a name="line.12"></a> |
| <span class="sourceLineNo">013</span> * distributed under the License is distributed on an "AS IS" BASIS,<a name="line.13"></a> |
| <span class="sourceLineNo">014</span> * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.<a name="line.14"></a> |
| <span class="sourceLineNo">015</span> * See the License for the specific language governing permissions and<a name="line.15"></a> |
| <span class="sourceLineNo">016</span> * limitations under the License.<a name="line.16"></a> |
| <span class="sourceLineNo">017</span> */<a name="line.17"></a> |
| <span class="sourceLineNo">018</span>package org.apache.hadoop.hbase.util;<a name="line.18"></a> |
| <span class="sourceLineNo">019</span><a name="line.19"></a> |
| <span class="sourceLineNo">020</span>import static org.apache.hadoop.hbase.util.Order.ASCENDING;<a name="line.20"></a> |
| <span class="sourceLineNo">021</span>import static org.apache.hadoop.hbase.util.Order.DESCENDING;<a name="line.21"></a> |
| <span class="sourceLineNo">022</span><a name="line.22"></a> |
| <span class="sourceLineNo">023</span>import java.math.BigDecimal;<a name="line.23"></a> |
| <span class="sourceLineNo">024</span>import java.math.MathContext;<a name="line.24"></a> |
| <span class="sourceLineNo">025</span>import java.math.RoundingMode;<a name="line.25"></a> |
| <span class="sourceLineNo">026</span>import java.nio.charset.Charset;<a name="line.26"></a> |
| <span class="sourceLineNo">027</span>import org.apache.yetus.audience.InterfaceAudience;<a name="line.27"></a> |
| <span class="sourceLineNo">028</span><a name="line.28"></a> |
| <span class="sourceLineNo">029</span>/**<a name="line.29"></a> |
| <span class="sourceLineNo">030</span> * Utility class that handles ordered byte arrays. That is, unlike {@link Bytes}, these methods<a name="line.30"></a> |
| <span class="sourceLineNo">031</span> * produce byte arrays which maintain the sort order of the original values.<a name="line.31"></a> |
| <span class="sourceLineNo">032</span> * <h3>Encoding Format summary</h3><a name="line.32"></a> |
| <span class="sourceLineNo">033</span> * <p><a name="line.33"></a> |
| <span class="sourceLineNo">034</span> * Each value is encoded as one or more bytes. The first byte of the encoding, its meaning, and a<a name="line.34"></a> |
| <span class="sourceLineNo">035</span> * terse description of the bytes that follow is given by the following table:<a name="line.35"></a> |
| <span class="sourceLineNo">036</span> * </p><a name="line.36"></a> |
| <span class="sourceLineNo">037</span> * <table summary="Encodings"><a name="line.37"></a> |
| <span class="sourceLineNo">038</span> * <tr><a name="line.38"></a> |
| <span class="sourceLineNo">039</span> * <th>Content Type</th><a name="line.39"></a> |
| <span class="sourceLineNo">040</span> * <th>Encoding</th><a name="line.40"></a> |
| <span class="sourceLineNo">041</span> * </tr><a name="line.41"></a> |
| <span class="sourceLineNo">042</span> * <tr><a name="line.42"></a> |
| <span class="sourceLineNo">043</span> * <td>NULL</td><a name="line.43"></a> |
| <span class="sourceLineNo">044</span> * <td>0x05</td><a name="line.44"></a> |
| <span class="sourceLineNo">045</span> * </tr><a name="line.45"></a> |
| <span class="sourceLineNo">046</span> * <tr><a name="line.46"></a> |
| <span class="sourceLineNo">047</span> * <td>negative infinity</td><a name="line.47"></a> |
| <span class="sourceLineNo">048</span> * <td>0x07</td><a name="line.48"></a> |
| <span class="sourceLineNo">049</span> * </tr><a name="line.49"></a> |
| <span class="sourceLineNo">050</span> * <tr><a name="line.50"></a> |
| <span class="sourceLineNo">051</span> * <td>negative large</td><a name="line.51"></a> |
| <span class="sourceLineNo">052</span> * <td>0x08, ~E, ~M</td><a name="line.52"></a> |
| <span class="sourceLineNo">053</span> * </tr><a name="line.53"></a> |
| <span class="sourceLineNo">054</span> * <tr><a name="line.54"></a> |
| <span class="sourceLineNo">055</span> * <td>negative medium</td><a name="line.55"></a> |
| <span class="sourceLineNo">056</span> * <td>0x13-E, ~M</td><a name="line.56"></a> |
| <span class="sourceLineNo">057</span> * </tr><a name="line.57"></a> |
| <span class="sourceLineNo">058</span> * <tr><a name="line.58"></a> |
| <span class="sourceLineNo">059</span> * <td>negative small</td><a name="line.59"></a> |
| <span class="sourceLineNo">060</span> * <td>0x14, -E, ~M</td><a name="line.60"></a> |
| <span class="sourceLineNo">061</span> * </tr><a name="line.61"></a> |
| <span class="sourceLineNo">062</span> * <tr><a name="line.62"></a> |
| <span class="sourceLineNo">063</span> * <td>zero</td><a name="line.63"></a> |
| <span class="sourceLineNo">064</span> * <td>0x15</td><a name="line.64"></a> |
| <span class="sourceLineNo">065</span> * </tr><a name="line.65"></a> |
| <span class="sourceLineNo">066</span> * <tr><a name="line.66"></a> |
| <span class="sourceLineNo">067</span> * <td>positive small</td><a name="line.67"></a> |
| <span class="sourceLineNo">068</span> * <td>0x16, ~-E, M</td><a name="line.68"></a> |
| <span class="sourceLineNo">069</span> * </tr><a name="line.69"></a> |
| <span class="sourceLineNo">070</span> * <tr><a name="line.70"></a> |
| <span class="sourceLineNo">071</span> * <td>positive medium</td><a name="line.71"></a> |
| <span class="sourceLineNo">072</span> * <td>0x17+E, M</td><a name="line.72"></a> |
| <span class="sourceLineNo">073</span> * </tr><a name="line.73"></a> |
| <span class="sourceLineNo">074</span> * <tr><a name="line.74"></a> |
| <span class="sourceLineNo">075</span> * <td>positive large</td><a name="line.75"></a> |
| <span class="sourceLineNo">076</span> * <td>0x22, E, M</td><a name="line.76"></a> |
| <span class="sourceLineNo">077</span> * </tr><a name="line.77"></a> |
| <span class="sourceLineNo">078</span> * <tr><a name="line.78"></a> |
| <span class="sourceLineNo">079</span> * <td>positive infinity</td><a name="line.79"></a> |
| <span class="sourceLineNo">080</span> * <td>0x23</td><a name="line.80"></a> |
| <span class="sourceLineNo">081</span> * </tr><a name="line.81"></a> |
| <span class="sourceLineNo">082</span> * <tr><a name="line.82"></a> |
| <span class="sourceLineNo">083</span> * <td>NaN</td><a name="line.83"></a> |
| <span class="sourceLineNo">084</span> * <td>0x25</td><a name="line.84"></a> |
| <span class="sourceLineNo">085</span> * </tr><a name="line.85"></a> |
| <span class="sourceLineNo">086</span> * <tr><a name="line.86"></a> |
| <span class="sourceLineNo">087</span> * <td>fixed-length 32-bit integer</td><a name="line.87"></a> |
| <span class="sourceLineNo">088</span> * <td>0x27, I</td><a name="line.88"></a> |
| <span class="sourceLineNo">089</span> * </tr><a name="line.89"></a> |
| <span class="sourceLineNo">090</span> * <tr><a name="line.90"></a> |
| <span class="sourceLineNo">091</span> * <td>fixed-length 64-bit integer</td><a name="line.91"></a> |
| <span class="sourceLineNo">092</span> * <td>0x28, I</td><a name="line.92"></a> |
| <span class="sourceLineNo">093</span> * </tr><a name="line.93"></a> |
| <span class="sourceLineNo">094</span> * <tr><a name="line.94"></a> |
| <span class="sourceLineNo">095</span> * <td>fixed-length 8-bit integer</td><a name="line.95"></a> |
| <span class="sourceLineNo">096</span> * <td>0x29</td><a name="line.96"></a> |
| <span class="sourceLineNo">097</span> * </tr><a name="line.97"></a> |
| <span class="sourceLineNo">098</span> * <tr><a name="line.98"></a> |
| <span class="sourceLineNo">099</span> * <td>fixed-length 16-bit integer</td><a name="line.99"></a> |
| <span class="sourceLineNo">100</span> * <td>0x2a</td><a name="line.100"></a> |
| <span class="sourceLineNo">101</span> * </tr><a name="line.101"></a> |
| <span class="sourceLineNo">102</span> * <tr><a name="line.102"></a> |
| <span class="sourceLineNo">103</span> * <td>fixed-length 32-bit float</td><a name="line.103"></a> |
| <span class="sourceLineNo">104</span> * <td>0x30, F</td><a name="line.104"></a> |
| <span class="sourceLineNo">105</span> * </tr><a name="line.105"></a> |
| <span class="sourceLineNo">106</span> * <tr><a name="line.106"></a> |
| <span class="sourceLineNo">107</span> * <td>fixed-length 64-bit float</td><a name="line.107"></a> |
| <span class="sourceLineNo">108</span> * <td>0x31, F</td><a name="line.108"></a> |
| <span class="sourceLineNo">109</span> * </tr><a name="line.109"></a> |
| <span class="sourceLineNo">110</span> * <tr><a name="line.110"></a> |
| <span class="sourceLineNo">111</span> * <td>TEXT</td><a name="line.111"></a> |
| <span class="sourceLineNo">112</span> * <td>0x33, T</td><a name="line.112"></a> |
| <span class="sourceLineNo">113</span> * </tr><a name="line.113"></a> |
| <span class="sourceLineNo">114</span> * <tr><a name="line.114"></a> |
| <span class="sourceLineNo">115</span> * <td>variable length BLOB</td><a name="line.115"></a> |
| <span class="sourceLineNo">116</span> * <td>0x37, B</td><a name="line.116"></a> |
| <span class="sourceLineNo">117</span> * </tr><a name="line.117"></a> |
| <span class="sourceLineNo">118</span> * <tr><a name="line.118"></a> |
| <span class="sourceLineNo">119</span> * <td>byte-for-byte BLOB</td><a name="line.119"></a> |
| <span class="sourceLineNo">120</span> * <td>0x38, X</td><a name="line.120"></a> |
| <span class="sourceLineNo">121</span> * </tr><a name="line.121"></a> |
| <span class="sourceLineNo">122</span> * </table><a name="line.122"></a> |
| <span class="sourceLineNo">123</span> * <h3>Null Encoding</h3><a name="line.123"></a> |
| <span class="sourceLineNo">124</span> * <p><a name="line.124"></a> |
| <span class="sourceLineNo">125</span> * Each value that is a NULL encodes as a single byte of 0x05. Since every other value encoding<a name="line.125"></a> |
| <span class="sourceLineNo">126</span> * begins with a byte greater than 0x05, this forces NULL values to sort first.<a name="line.126"></a> |
| <span class="sourceLineNo">127</span> * </p><a name="line.127"></a> |
| <span class="sourceLineNo">128</span> * <h3>Text Encoding</h3><a name="line.128"></a> |
| <span class="sourceLineNo">129</span> * <p><a name="line.129"></a> |
| <span class="sourceLineNo">130</span> * Each text value begins with a single byte of 0x33 and ends with a single byte of 0x00. There are<a name="line.130"></a> |
| <span class="sourceLineNo">131</span> * zero or more intervening bytes that encode the text value. The intervening bytes are chosen so<a name="line.131"></a> |
| <span class="sourceLineNo">132</span> * that the encoding will sort in the desired collating order. The intervening bytes may not contain<a name="line.132"></a> |
| <span class="sourceLineNo">133</span> * a 0x00 character; the only 0x00 byte allowed in a text encoding is the final byte.<a name="line.133"></a> |
| <span class="sourceLineNo">134</span> * </p><a name="line.134"></a> |
| <span class="sourceLineNo">135</span> * <p><a name="line.135"></a> |
| <span class="sourceLineNo">136</span> * The text encoding ends in 0x00 in order to ensure that when there are two strings where one is a<a name="line.136"></a> |
| <span class="sourceLineNo">137</span> * prefix of the other that the shorter string will sort first.<a name="line.137"></a> |
| <span class="sourceLineNo">138</span> * </p><a name="line.138"></a> |
| <span class="sourceLineNo">139</span> * <h3>Binary Encoding</h3><a name="line.139"></a> |
| <span class="sourceLineNo">140</span> * <p><a name="line.140"></a> |
| <span class="sourceLineNo">141</span> * There are two encoding strategies for binary fields, referred to as "BlobVar" and "BlobCopy".<a name="line.141"></a> |
| <span class="sourceLineNo">142</span> * BlobVar is less efficient in both space and encoding time. It has no limitations on the range of<a name="line.142"></a> |
| <span class="sourceLineNo">143</span> * encoded values. BlobCopy is a byte-for-byte copy of the input data followed by a termination<a name="line.143"></a> |
| <span class="sourceLineNo">144</span> * byte. It is extremely fast to encode and decode. It carries the restriction of not allowing a<a name="line.144"></a> |
| <span class="sourceLineNo">145</span> * 0x00 value in the input byte[] as this value is used as the termination byte.<a name="line.145"></a> |
| <span class="sourceLineNo">146</span> * </p><a name="line.146"></a> |
| <span class="sourceLineNo">147</span> * <h4>BlobVar</h4><a name="line.147"></a> |
| <span class="sourceLineNo">148</span> * <p><a name="line.148"></a> |
| <span class="sourceLineNo">149</span> * "BlobVar" encodes the input byte[] in a manner similar to a variable length integer encoding. As<a name="line.149"></a> |
| <span class="sourceLineNo">150</span> * with the other {@code OrderedBytes} encodings, the first encoded byte is used to indicate what<a name="line.150"></a> |
| <span class="sourceLineNo">151</span> * kind of value follows. This header byte is 0x37 for BlobVar encoded values. As with the<a name="line.151"></a> |
| <span class="sourceLineNo">152</span> * traditional varint encoding, the most significant bit of each subsequent encoded {@code byte} is<a name="line.152"></a> |
| <span class="sourceLineNo">153</span> * used as a continuation marker. The 7 remaining bits contain the 7 most significant bits of the<a name="line.153"></a> |
| <span class="sourceLineNo">154</span> * first unencoded byte. The next encoded byte starts with a continuation marker in the MSB. The<a name="line.154"></a> |
| <span class="sourceLineNo">155</span> * least significant bit from the first unencoded byte follows, and the remaining 6 bits contain the<a name="line.155"></a> |
| <span class="sourceLineNo">156</span> * 6 MSBs of the second unencoded byte. The encoding continues, encoding 7 bytes on to 8 encoded<a name="line.156"></a> |
| <span class="sourceLineNo">157</span> * bytes. The MSB of the final encoded byte contains a termination marker rather than a continuation<a name="line.157"></a> |
| <span class="sourceLineNo">158</span> * marker, and any remaining bits from the final input byte. Any trailing bits in the final encoded<a name="line.158"></a> |
| <span class="sourceLineNo">159</span> * byte are zeros.<a name="line.159"></a> |
| <span class="sourceLineNo">160</span> * </p><a name="line.160"></a> |
| <span class="sourceLineNo">161</span> * <h4>BlobCopy</h4><a name="line.161"></a> |
| <span class="sourceLineNo">162</span> * <p><a name="line.162"></a> |
| <span class="sourceLineNo">163</span> * "BlobCopy" is a simple byte-for-byte copy of the input data. It uses 0x38 as the header byte, and<a name="line.163"></a> |
| <span class="sourceLineNo">164</span> * is terminated by 0x00 in the DESCENDING case. This alternative encoding is faster and more<a name="line.164"></a> |
| <span class="sourceLineNo">165</span> * space-efficient, but it cannot accept values containing a 0x00 byte in DESCENDING order.<a name="line.165"></a> |
| <span class="sourceLineNo">166</span> * </p><a name="line.166"></a> |
| <span class="sourceLineNo">167</span> * <h3>Variable-length Numeric Encoding</h3><a name="line.167"></a> |
| <span class="sourceLineNo">168</span> * <p><a name="line.168"></a> |
| <span class="sourceLineNo">169</span> * Numeric values must be coded so as to sort in numeric order. We assume that numeric values can be<a name="line.169"></a> |
| <span class="sourceLineNo">170</span> * both integer and floating point values. Clients must be careful to use inspection methods for<a name="line.170"></a> |
| <span class="sourceLineNo">171</span> * encoded values (such as {@link #isNumericInfinite(PositionedByteRange)} and<a name="line.171"></a> |
| <span class="sourceLineNo">172</span> * {@link #isNumericNaN(PositionedByteRange)}) to protect against decoding values into objects which<a name="line.172"></a> |
| <span class="sourceLineNo">173</span> * do not support these numeric concepts (such as {@link Long} and {@link BigDecimal}).<a name="line.173"></a> |
| <span class="sourceLineNo">174</span> * </p><a name="line.174"></a> |
| <span class="sourceLineNo">175</span> * <p><a name="line.175"></a> |
| <span class="sourceLineNo">176</span> * Simplest cases first: If the numeric value is a NaN, then the encoding is a single byte of 0x25.<a name="line.176"></a> |
| <span class="sourceLineNo">177</span> * This causes NaN values to sort after every other numeric value.<a name="line.177"></a> |
| <span class="sourceLineNo">178</span> * </p><a name="line.178"></a> |
| <span class="sourceLineNo">179</span> * <p><a name="line.179"></a> |
| <span class="sourceLineNo">180</span> * If the numeric value is a negative infinity then the encoding is a single byte of 0x07. Since<a name="line.180"></a> |
| <span class="sourceLineNo">181</span> * every other numeric value, NaN included, has a larger initial byte, this encoding ensures that<a name="line.181"></a> |
| <span class="sourceLineNo">182</span> * negative infinity will sort prior to every other numeric value.<a name="line.182"></a> |
| <span class="sourceLineNo">183</span> * </p><a name="line.183"></a> |
| <span class="sourceLineNo">184</span> * <p><a name="line.184"></a> |
| <span class="sourceLineNo">185</span> * If the numeric value is a positive infinity then the encoding is a single byte of 0x23. Every<a name="line.185"></a> |
| <span class="sourceLineNo">186</span> * other numeric value encoding except NaN begins with a smaller byte, ensuring that positive infinity<a name="line.186"></a> |
| <span class="sourceLineNo">187</span> * sorts last among numeric values other than NaN. 0x23 is also smaller than 0x33, the initial byte of a text<a name="line.187"></a> |
| <span class="sourceLineNo">188</span> * value, ensuring that every numeric value sorts before every text value.<a name="line.188"></a> |
| <span class="sourceLineNo">189</span> * </p><a name="line.189"></a> |
| <span class="sourceLineNo">190</span> * <p><a name="line.190"></a> |
| <span class="sourceLineNo">191</span> * If the numeric value is exactly zero then it is encoded as a single byte of 0x15. Finite negative<a name="line.191"></a> |
| <span class="sourceLineNo">192</span> * values will have initial bytes of 0x08 through 0x14 and finite positive values will have initial<a name="line.192"></a> |
| <span class="sourceLineNo">193</span> * bytes of 0x16 through 0x22.<a name="line.193"></a> |
| <span class="sourceLineNo">194</span> * </p><a name="line.194"></a> |
| <span class="sourceLineNo">195</span> * <p><a name="line.195"></a> |
| <span class="sourceLineNo">196</span> * For all numeric values, we compute a mantissa M and an exponent E. The mantissa is a base-100<a name="line.196"></a> |
| <span class="sourceLineNo">197</span> * representation of the value. The exponent E determines where to put the decimal point.<a name="line.197"></a> |
| <span class="sourceLineNo">198</span> * </p><a name="line.198"></a> |
| <span class="sourceLineNo">199</span> * <p><a name="line.199"></a> |
| <span class="sourceLineNo">200</span> * Each centimal digit of the mantissa is stored in a byte. If the value of the centimal digit is X<a name="line.200"></a> |
| <span class="sourceLineNo">201</span> * (hence X&ge;0 and X&le;99) then the byte value will be 2*X+1 for every byte of the mantissa,<a name="line.201"></a> |
| <span class="sourceLineNo">202</span> * except for the last byte which will be 2*X+0. The mantissa must be the minimum number of bytes<a name="line.202"></a> |
| <span class="sourceLineNo">203</span> * necessary to represent the value; trailing X==0 digits are omitted. This means that the mantissa<a name="line.203"></a> |
| <span class="sourceLineNo">204</span> * will never contain a byte with the value 0x00.<a name="line.204"></a> |
| <span class="sourceLineNo">205</span> * </p><a name="line.205"></a> |
| <span class="sourceLineNo">206</span> * <p><a name="line.206"></a> |
| <span class="sourceLineNo">207</span> * If we assume all digits of the mantissa occur to the right of the decimal point, then the<a name="line.207"></a> |
| <span class="sourceLineNo">208</span> * exponent E is the power of one hundred by which one must multiply the mantissa to recover the<a name="line.208"></a> |
| <span class="sourceLineNo">209</span> * original value.<a name="line.209"></a> |
| <span class="sourceLineNo">210</span> * </p><a name="line.210"></a> |
| <span class="sourceLineNo">211</span> * <p><a name="line.211"></a> |
| <span class="sourceLineNo">212</span> * Values are classified as large, medium, or small according to the value of E. If E is 11 or more,<a name="line.212"></a> |
| <span class="sourceLineNo">213</span> * the value is large. For E between 0 and 10, the value is medium. For E less than zero, the value<a name="line.213"></a> |
| <span class="sourceLineNo">214</span> * is small.<a name="line.214"></a> |
| <span class="sourceLineNo">215</span> * </p><a name="line.215"></a> |
| <span class="sourceLineNo">216</span> * <p><a name="line.216"></a> |
| <span class="sourceLineNo">217</span> * Large positive values are encoded as a single byte 0x22 followed by E as a varint and then M.<a name="line.217"></a> |
| <span class="sourceLineNo">218</span> * Medium positive values are a single byte of 0x17+E followed by M. Small positive values are<a name="line.218"></a> |
| <span class="sourceLineNo">219</span> * encoded as a single byte 0x16 followed by the ones-complement of the varint for -E followed by M.<a name="line.219"></a> |
| <span class="sourceLineNo">220</span> * </p><a name="line.220"></a> |
| <span class="sourceLineNo">221</span> * <p><a name="line.221"></a> |
| <span class="sourceLineNo">222</span> * Small negative values are encoded as a single byte 0x14 followed by -E as a varint and then the<a name="line.222"></a> |
| <span class="sourceLineNo">223</span> * ones-complement of M. Medium negative values are encoded as a byte 0x13-E followed by the<a name="line.223"></a> |
| <span class="sourceLineNo">224</span> * ones-complement of M. Large negative values consist of the single byte 0x08 followed by the<a name="line.224"></a> |
| <span class="sourceLineNo">225</span> * ones-complement of the varint encoding of E followed by the ones-complement of M.<a name="line.225"></a> |
| <span class="sourceLineNo">226</span> * </p><a name="line.226"></a> |
| <span class="sourceLineNo">227</span> * <h3>Fixed-length Integer Encoding</h3><a name="line.227"></a> |
| <span class="sourceLineNo">228</span> * <p><a name="line.228"></a> |
| <span class="sourceLineNo">229</span> * All 4-byte integers are serialized to a 5-byte, fixed-width, sortable byte format. All 8-byte<a name="line.229"></a> |
| <span class="sourceLineNo">230</span> * integers are serialized to the equivalent 9-byte format. Serialization is performed by writing a<a name="line.230"></a> |
| <span class="sourceLineNo">231</span> * header byte, inverting the integer sign bit and writing the resulting bytes to the byte array in<a name="line.231"></a> |
| <span class="sourceLineNo">232</span> * big endian order.<a name="line.232"></a> |
| <span class="sourceLineNo">233</span> * </p><a name="line.233"></a> |
| <span class="sourceLineNo">234</span> * <h3>Fixed-length Floating Point Encoding</h3><a name="line.234"></a> |
| <span class="sourceLineNo">235</span> * <p><a name="line.235"></a> |
| <span class="sourceLineNo">236</span> * 32-bit and 64-bit floating point numbers are encoded to a 5-byte and 9-byte encoding format,<a name="line.236"></a> |
| <span class="sourceLineNo">237</span> * respectively. The format is identical, save for the precision respected in each step of the<a name="line.237"></a> |
| <span class="sourceLineNo">238</span> * operation.<a name="line.238"></a> |
| <span class="sourceLineNo">239</span> * <p><a name="line.239"></a> |
| <span class="sourceLineNo">240</span> * This format ensures the following total ordering of floating point values:<a name="line.240"></a> |
| <span class="sourceLineNo">241</span> * Float.NEGATIVE_INFINITY &lt; -Float.MAX_VALUE &lt; ... &lt; -Float.MIN_VALUE &lt; -0.0 &lt; +0.0<a name="line.241"></a> |
| <span class="sourceLineNo">242</span> * &lt; Float.MIN_VALUE &lt; ... &lt; Float.MAX_VALUE &lt; Float.POSITIVE_INFINITY &lt; Float.NaN<a name="line.242"></a> |
| <span class="sourceLineNo">243</span> * </p><a name="line.243"></a> |
| <span class="sourceLineNo">244</span> * <p><a name="line.244"></a> |
| <span class="sourceLineNo">245</span> * Floating point numbers are encoded as specified in IEEE 754. A 32-bit single precision float<a name="line.245"></a> |
| <span class="sourceLineNo">246</span> * consists of a sign bit, 8-bit unsigned exponent encoded in offset-127 notation, and a 23-bit<a name="line.246"></a> |
| <span class="sourceLineNo">247</span> * significand. The format is described further in the<a name="line.247"></a> |
| <span class="sourceLineNo">248</span> * <a href="http://en.wikipedia.org/wiki/Single_precision"> Single Precision Floating Point<a name="line.248"></a> |
| <span class="sourceLineNo">249</span> * Wikipedia page</a><a name="line.249"></a> |
| <span class="sourceLineNo">250</span> * </p><a name="line.250"></a> |
| <span class="sourceLineNo">251</span> * <p><a name="line.251"></a> |
| <span class="sourceLineNo">252</span> * The value of a normal float is -1 <sup>sign bit</sup> &times; 2<sup>exponent - 127</sup> &times;<a name="line.252"></a> |
| <span class="sourceLineNo">253</span> * 1.significand<a name="line.253"></a> |
| <span class="sourceLineNo">254</span> * </p><a name="line.254"></a> |
| <span class="sourceLineNo">255</span> * <p><a name="line.255"></a> |
| <span class="sourceLineNo">256</span> * The IEEE 754 floating point format already preserves sort ordering for positive floating point<a name="line.256"></a> |
| <span class="sourceLineNo">257</span> * numbers when the raw bytes are compared in most significant byte order. This is discussed further<a name="line.257"></a> |
| <span class="sourceLineNo">258</span> * at <a href= "http://www.cygnus-software.com/papers/comparingfloats/comparingfloats.htm"><a name="line.258"></a> |
| <span class="sourceLineNo">259</span> * http://www.cygnus-software.com/papers/comparingfloats/comparingfloats.htm</a><a name="line.259"></a> |
| <span class="sourceLineNo">260</span> * </p><a name="line.260"></a> |
| <span class="sourceLineNo">261</span> * <p><a name="line.261"></a> |
| <span class="sourceLineNo">262</span> * Thus, we need only ensure that negative numbers sort in the exact opposite order as positive<a name="line.262"></a> |
| <span class="sourceLineNo">263</span> * numbers (so that say, negative infinity is less than negative 1), and that all negative numbers<a name="line.263"></a> |
| <span class="sourceLineNo">264</span> * compare less than any positive number. To accomplish this, we invert the sign bit of all floating<a name="line.264"></a> |
| <span class="sourceLineNo">265</span> * point numbers, and we also invert the exponent and significand bits if the floating point number<a name="line.265"></a> |
| <span class="sourceLineNo">266</span> * was negative.<a name="line.266"></a> |
| <span class="sourceLineNo">267</span> * </p><a name="line.267"></a> |
| <span class="sourceLineNo">268</span> * <p><a name="line.268"></a> |
| <span class="sourceLineNo">269</span> * More specifically, we first store the floating point bits into a 32-bit int {@code j} using<a name="line.269"></a> |
| <span class="sourceLineNo">270</span> * {@link Float#floatToIntBits}. This method collapses all NaNs into a single, canonical NaN value<a name="line.270"></a> |
| <span class="sourceLineNo">271</span> * but otherwise leaves the bits unchanged. We then compute<a name="line.271"></a> |
| <span class="sourceLineNo">272</span> * </p><a name="line.272"></a> |
| <span class="sourceLineNo">273</span> *<a name="line.273"></a> |
| <span class="sourceLineNo">274</span> * <pre><a name="line.274"></a> |
| <span class="sourceLineNo">275</span> * j ^= (j &gt;&gt; (Integer.SIZE - 1)) | Integer.MIN_VALUE<a name="line.275"></a> |
| <span class="sourceLineNo">276</span> * </pre><a name="line.276"></a> |
| <span class="sourceLineNo">277</span> * <p><a name="line.277"></a> |
| <span class="sourceLineNo">278</span> * which inverts the sign bit and XOR's all other bits with the sign bit itself. Comparing the raw<a name="line.278"></a> |
| <span class="sourceLineNo">279</span> * bytes of {@code j} in most significant byte order is equivalent to performing a single precision<a name="line.279"></a> |
| <span class="sourceLineNo">280</span> * floating point comparison on the underlying bits (ignoring NaN comparisons, as NaNs don't compare<a name="line.280"></a> |
| <span class="sourceLineNo">281</span> * equal to anything when performing floating point comparisons).<a name="line.281"></a> |
| <span class="sourceLineNo">282</span> * </p><a name="line.282"></a> |
| <span class="sourceLineNo">283</span> * <p><a name="line.283"></a> |
| <span class="sourceLineNo">284</span> * The resulting integer is then converted into a byte array by serializing the integer one byte at<a name="line.284"></a> |
| <span class="sourceLineNo">285</span> * a time in most significant byte order. The serialized integer is prefixed by a single header<a name="line.285"></a> |
| <span class="sourceLineNo">286</span> * byte. All serialized values are 5 bytes in length.<a name="line.286"></a> |
| <span class="sourceLineNo">287</span> * </p><a name="line.287"></a> |
| <span class="sourceLineNo">288</span> * <p><a name="line.288"></a> |
| <span class="sourceLineNo">289</span> * {@code OrderedBytes} encodings are heavily influenced by the<a name="line.289"></a> |
| <span class="sourceLineNo">290</span> * <a href="http://sqlite.org/src4/doc/trunk/www/key_encoding.wiki">SQLite4 Key Encoding</a>. Slight<a name="line.290"></a> |
| <span class="sourceLineNo">291</span> * deviations are made in the interest of order correctness and user extensibility. Fixed-width<a name="line.291"></a> |
| <span class="sourceLineNo">292</span> * {@code Long} and {@link Double} encodings are based on implementations from the now defunct<a name="line.292"></a> |
| <span class="sourceLineNo">293</span> * Orderly library.<a name="line.293"></a> |
| <span class="sourceLineNo">294</span> * </p><a name="line.294"></a> |
| <span class="sourceLineNo">295</span> */<a name="line.295"></a> |
| <span class="sourceLineNo">296</span>@InterfaceAudience.Public<a name="line.296"></a> |
| <span class="sourceLineNo">297</span>public class OrderedBytes {<a name="line.297"></a> |
| <span class="sourceLineNo">298</span><a name="line.298"></a> |
| <span class="sourceLineNo">299</span> /*<a name="line.299"></a> |
| <span class="sourceLineNo">300</span> * These constants define header bytes used to identify encoded values. Note that the values here<a name="line.300"></a> |
| <span class="sourceLineNo">301</span> * are not exhaustive as the Numeric format encodes portions of its value within the header byte.<a name="line.301"></a> |
| <span class="sourceLineNo">302</span> * The values listed here are directly applied to persisted data -- DO NOT modify the values<a name="line.302"></a> |
| <span class="sourceLineNo">303</span> * specified here. Instead, gaps are placed intentionally between values so that new<a name="line.303"></a> |
| <span class="sourceLineNo">304</span> * implementations can be inserted into the total ordering enforced here.<a name="line.304"></a> |
| <span class="sourceLineNo">305</span> */<a name="line.305"></a> |
| <span class="sourceLineNo">306</span> private static final byte NULL = 0x05;<a name="line.306"></a> |
| <span class="sourceLineNo">307</span> // room for 1 expansion type<a name="line.307"></a> |
| <span class="sourceLineNo">308</span> private static final byte NEG_INF = 0x07;<a name="line.308"></a> |
| <span class="sourceLineNo">309</span> private static final byte NEG_LARGE = 0x08;<a name="line.309"></a> |
| <span class="sourceLineNo">310</span> private static final byte NEG_MED_MIN = 0x09;<a name="line.310"></a> |
| <span class="sourceLineNo">311</span> private static final byte NEG_MED_MAX = 0x13;<a name="line.311"></a> |
| <span class="sourceLineNo">312</span> private static final byte NEG_SMALL = 0x14;<a name="line.312"></a> |
| <span class="sourceLineNo">313</span> private static final byte ZERO = 0x15;<a name="line.313"></a> |
| <span class="sourceLineNo">314</span> private static final byte POS_SMALL = 0x16;<a name="line.314"></a> |
| <span class="sourceLineNo">315</span> private static final byte POS_MED_MIN = 0x17;<a name="line.315"></a> |
| <span class="sourceLineNo">316</span> private static final byte POS_MED_MAX = 0x21;<a name="line.316"></a> |
| <span class="sourceLineNo">317</span> private static final byte POS_LARGE = 0x22;<a name="line.317"></a> |
| <span class="sourceLineNo">318</span> private static final byte POS_INF = 0x23;<a name="line.318"></a> |
| <span class="sourceLineNo">319</span> // room for 2 expansion types<a name="line.319"></a> |
| <span class="sourceLineNo">320</span> private static final byte NAN = 0x26;<a name="line.320"></a> |
| <span class="sourceLineNo">321</span> // room for 2 expansion types<a name="line.321"></a> |
| <span class="sourceLineNo">322</span> private static final byte FIXED_INT8 = 0x29;<a name="line.322"></a> |
| <span class="sourceLineNo">323</span> private static final byte FIXED_INT16 = 0x2a;<a name="line.323"></a> |
| <span class="sourceLineNo">324</span> private static final byte FIXED_INT32 = 0x2b;<a name="line.324"></a> |
| <span class="sourceLineNo">325</span> private static final byte FIXED_INT64 = 0x2c;<a name="line.325"></a> |
| <span class="sourceLineNo">326</span> // room for 3 expansion types<a name="line.326"></a> |
| <span class="sourceLineNo">327</span> private static final byte FIXED_FLOAT32 = 0x30;<a name="line.327"></a> |
| <span class="sourceLineNo">328</span> private static final byte FIXED_FLOAT64 = 0x31;<a name="line.328"></a> |
| <span class="sourceLineNo">329</span> // room for 2 expansion types<a name="line.329"></a> |
| <span class="sourceLineNo">330</span> private static final byte TEXT = 0x34;<a name="line.330"></a> |
| <span class="sourceLineNo">331</span> // room for 2 expansion types<a name="line.331"></a> |
| <span class="sourceLineNo">332</span> private static final byte BLOB_VAR = 0x37;<a name="line.332"></a> |
| <span class="sourceLineNo">333</span> private static final byte BLOB_COPY = 0x38;<a name="line.333"></a> |
| <span class="sourceLineNo">334</span><a name="line.334"></a> |
| <span class="sourceLineNo">335</span> /*<a name="line.335"></a> |
| <span class="sourceLineNo">336</span> * The following constant values are used by encoding implementations<a name="line.336"></a> |
| <span class="sourceLineNo">337</span> */<a name="line.337"></a> |
| <span class="sourceLineNo">338</span><a name="line.338"></a> |
| <span class="sourceLineNo">339</span> public static final Charset UTF8 = Charset.forName("UTF-8");<a name="line.339"></a> |
| <span class="sourceLineNo">340</span> private static final byte TERM = 0x00;<a name="line.340"></a> |
| <span class="sourceLineNo">341</span><a name="line.341"></a> |
| <span class="sourceLineNo">342</span> /**<a name="line.342"></a> |
| <span class="sourceLineNo">343</span> * Max precision (significant decimal digits) kept when normalizing {@link BigDecimal} values.<a name="line.343"></a> |
| <span class="sourceLineNo">344</span> */<a name="line.344"></a> |
| <span class="sourceLineNo">345</span> public static final int MAX_PRECISION = 31;<a name="line.345"></a> |
| <span class="sourceLineNo">346</span><a name="line.346"></a> |
| <span class="sourceLineNo">347</span> /**<a name="line.347"></a> |
| <span class="sourceLineNo">348</span> * The context used to normalize {@link BigDecimal} values.<a name="line.348"></a> |
| <span class="sourceLineNo">349</span> */<a name="line.349"></a> |
| <span class="sourceLineNo">350</span> public static final MathContext DEFAULT_MATH_CONTEXT =<a name="line.350"></a> |
| <span class="sourceLineNo">351</span> new MathContext(MAX_PRECISION, RoundingMode.HALF_UP);<a name="line.351"></a> |
| <span class="sourceLineNo">352</span><a name="line.352"></a> |
| <span class="sourceLineNo">353</span> /**<a name="line.353"></a> |
| <span class="sourceLineNo">354</span> * Creates the standard exception when the encoded header byte is unexpected for the decoding<a name="line.354"></a> |
| <span class="sourceLineNo">355</span> * context.<a name="line.355"></a> |
| <span class="sourceLineNo">356</span> * @param header value used in error message.<a name="line.356"></a> |
| <span class="sourceLineNo">357</span> */<a name="line.357"></a> |
| <span class="sourceLineNo">358</span> private static IllegalArgumentException unexpectedHeader(byte header) {<a name="line.358"></a> |
| <span class="sourceLineNo">359</span> throw new IllegalArgumentException(<a name="line.359"></a> |
| <span class="sourceLineNo">360</span> "unexpected value in first byte: 0x" + Long.toHexString(header));<a name="line.360"></a> |
| <span class="sourceLineNo">361</span> }<a name="line.361"></a> |
| <span class="sourceLineNo">362</span><a name="line.362"></a> |
| <span class="sourceLineNo">363</span> /**<a name="line.363"></a> |
| <span class="sourceLineNo">364</span> * Perform unsigned comparison between two long values. Conforms to the same interface as<a name="line.364"></a> |
| <span class="sourceLineNo">365</span> * {@link org.apache.hadoop.hbase.CellComparator}.<a name="line.365"></a> |
| <span class="sourceLineNo">366</span> */<a name="line.366"></a> |
| <span class="sourceLineNo">367</span> private static int unsignedCmp(long x1, long x2) {<a name="line.367"></a> |
| <span class="sourceLineNo">368</span> int cmp;<a name="line.368"></a> |
| <span class="sourceLineNo">369</span> if ((cmp = (x1 < x2 ? -1 : (x1 == x2 ? 0 : 1))) == 0) return 0;<a name="line.369"></a> |
| <span class="sourceLineNo">370</span> // invert the result when exactly one of the values is negative<a name="line.370"></a> |
| <span class="sourceLineNo">371</span> if ((x1 < 0) != (x2 < 0)) return -cmp;<a name="line.371"></a> |
| <span class="sourceLineNo">372</span> return cmp;<a name="line.372"></a> |
| <span class="sourceLineNo">373</span> }<a name="line.373"></a> |
| <span class="sourceLineNo">374</span><a name="line.374"></a> |
| <span class="sourceLineNo">375</span> /**<a name="line.375"></a> |
| <span class="sourceLineNo">376</span> * Write a 32-bit unsigned integer to {@code dst} as 4 big-endian bytes.<a name="line.376"></a> |
| <span class="sourceLineNo">377</span> * @return number of bytes written.<a name="line.377"></a> |
| <span class="sourceLineNo">378</span> */<a name="line.378"></a> |
| <span class="sourceLineNo">379</span> private static int putUint32(PositionedByteRange dst, int val) {<a name="line.379"></a> |
| <span class="sourceLineNo">380</span> dst.put((byte) (val >>> 24)).put((byte) (val >>> 16)).put((byte) (val >>> 8)).put((byte) val);<a name="line.380"></a> |
| <span class="sourceLineNo">381</span> return 4;<a name="line.381"></a> |
| <span class="sourceLineNo">382</span> }<a name="line.382"></a> |
| <span class="sourceLineNo">383</span><a name="line.383"></a> |
| <span class="sourceLineNo">384</span> /**<a name="line.384"></a> |
| <span class="sourceLineNo">385</span> * Encode an unsigned 64-bit integer {@code val} into {@code dst}.<a name="line.385"></a> |
| <span class="sourceLineNo">386</span> * @param dst The destination to which encoded bytes are written.<a name="line.386"></a> |
| <span class="sourceLineNo">387</span> * @param val The value to write.<a name="line.387"></a> |
| <span class="sourceLineNo">388</span> * @param comp Complement the encoded value when {@code comp} is true.<a name="line.388"></a> |
| <span class="sourceLineNo">389</span> * @return number of bytes written.<a name="line.389"></a> |
| <span class="sourceLineNo">390</span> */<a name="line.390"></a> |
| <span class="sourceLineNo">391</span> static int putVaruint64(PositionedByteRange dst, long val, boolean comp) {<a name="line.391"></a> |
| <span class="sourceLineNo">392</span> int w, y, len = 0;<a name="line.392"></a> |
| <span class="sourceLineNo">393</span> final int offset = dst.getOffset(), start = dst.getPosition();<a name="line.393"></a> |
| <span class="sourceLineNo">394</span> byte[] a = dst.getBytes();<a name="line.394"></a> |
| <span class="sourceLineNo">395</span> Order ord = comp ? DESCENDING : ASCENDING;<a name="line.395"></a> |
| <span class="sourceLineNo">396</span> if (-1 == unsignedCmp(val, 241L)) {<a name="line.396"></a> |
| <span class="sourceLineNo">397</span> dst.put((byte) val);<a name="line.397"></a> |
| <span class="sourceLineNo">398</span> len = dst.getPosition() - start;<a name="line.398"></a> |
| <span class="sourceLineNo">399</span> ord.apply(a, offset + start, len);<a name="line.399"></a> |
| <span class="sourceLineNo">400</span> return len;<a name="line.400"></a> |
| <span class="sourceLineNo">401</span> }<a name="line.401"></a> |
| <span class="sourceLineNo">402</span> if (-1 == unsignedCmp(val, 2288L)) {<a name="line.402"></a> |
| <span class="sourceLineNo">403</span> y = (int) (val - 240);<a name="line.403"></a> |
| <span class="sourceLineNo">404</span> dst.put((byte) (y / 256 + 241)).put((byte) (y % 256));<a name="line.404"></a> |
| <span class="sourceLineNo">405</span> len = dst.getPosition() - start;<a name="line.405"></a> |
| <span class="sourceLineNo">406</span> ord.apply(a, offset + start, len);<a name="line.406"></a> |
| <span class="sourceLineNo">407</span> return len;<a name="line.407"></a> |
| <span class="sourceLineNo">408</span> }<a name="line.408"></a> |
| <span class="sourceLineNo">409</span> if (-1 == unsignedCmp(val, 67824L)) {<a name="line.409"></a> |
| <span class="sourceLineNo">410</span> y = (int) (val - 2288);<a name="line.410"></a> |
| <span class="sourceLineNo">411</span> dst.put((byte) 249).put((byte) (y / 256)).put((byte) (y % 256));<a name="line.411"></a> |
| <span class="sourceLineNo">412</span> len = dst.getPosition() - start;<a name="line.412"></a> |
| <span class="sourceLineNo">413</span> ord.apply(a, offset + start, len);<a name="line.413"></a> |
| <span class="sourceLineNo">414</span> return len;<a name="line.414"></a> |
| <span class="sourceLineNo">415</span> }<a name="line.415"></a> |
| <span class="sourceLineNo">416</span> y = (int) val;<a name="line.416"></a> |
| <span class="sourceLineNo">417</span> w = (int) (val >>> 32);<a name="line.417"></a> |
| <span class="sourceLineNo">418</span> if (w == 0) {<a name="line.418"></a> |
| <span class="sourceLineNo">419</span> if (-1 == unsignedCmp(y, 16777216L)) {<a name="line.419"></a> |
| <span class="sourceLineNo">420</span> dst.put((byte) 250).put((byte) (y >>> 16)).put((byte) (y >>> 8)).put((byte) y);<a name="line.420"></a> |
| <span class="sourceLineNo">421</span> len = dst.getPosition() - start;<a name="line.421"></a> |
| <span class="sourceLineNo">422</span> ord.apply(a, offset + start, len);<a name="line.422"></a> |
| <span class="sourceLineNo">423</span> return len;<a name="line.423"></a> |
| <span class="sourceLineNo">424</span> }<a name="line.424"></a> |
| <span class="sourceLineNo">425</span> dst.put((byte) 251);<a name="line.425"></a> |
| <span class="sourceLineNo">426</span> putUint32(dst, y);<a name="line.426"></a> |
| <span class="sourceLineNo">427</span> len = dst.getPosition() - start;<a name="line.427"></a> |
| <span class="sourceLineNo">428</span> ord.apply(a, offset + start, len);<a name="line.428"></a> |
| <span class="sourceLineNo">429</span> return len;<a name="line.429"></a> |
| <span class="sourceLineNo">430</span> }<a name="line.430"></a> |
| <span class="sourceLineNo">431</span> if (-1 == unsignedCmp(w, 256L)) {<a name="line.431"></a> |
| <span class="sourceLineNo">432</span> dst.put((byte) 252).put((byte) w);<a name="line.432"></a> |
| <span class="sourceLineNo">433</span> putUint32(dst, y);<a name="line.433"></a> |
| <span class="sourceLineNo">434</span> len = dst.getPosition() - start;<a name="line.434"></a> |
| <span class="sourceLineNo">435</span> ord.apply(a, offset + start, len);<a name="line.435"></a> |
| <span class="sourceLineNo">436</span> return len;<a name="line.436"></a> |
| <span class="sourceLineNo">437</span> }<a name="line.437"></a> |
| <span class="sourceLineNo">438</span> if (-1 == unsignedCmp(w, 65536L)) {<a name="line.438"></a> |
| <span class="sourceLineNo">439</span> dst.put((byte) 253).put((byte) (w >>> 8)).put((byte) w);<a name="line.439"></a> |
| <span class="sourceLineNo">440</span> putUint32(dst, y);<a name="line.440"></a> |
| <span class="sourceLineNo">441</span> len = dst.getPosition() - start;<a name="line.441"></a> |
| <span class="sourceLineNo">442</span> ord.apply(a, offset + start, len);<a name="line.442"></a> |
| <span class="sourceLineNo">443</span> return len;<a name="line.443"></a> |
| <span class="sourceLineNo">444</span> }<a name="line.444"></a> |
| <span class="sourceLineNo">445</span> if (-1 == unsignedCmp(w, 16777216L)) {<a name="line.445"></a> |
| <span class="sourceLineNo">446</span> dst.put((byte) 254).put((byte) (w >>> 16)).put((byte) (w >>> 8)).put((byte) w);<a name="line.446"></a> |
| <span class="sourceLineNo">447</span> putUint32(dst, y);<a name="line.447"></a> |
| <span class="sourceLineNo">448</span> len = dst.getPosition() - start;<a name="line.448"></a> |
| <span class="sourceLineNo">449</span> ord.apply(a, offset + start, len);<a name="line.449"></a> |
| <span class="sourceLineNo">450</span> return len;<a name="line.450"></a> |
| <span class="sourceLineNo">451</span> }<a name="line.451"></a> |
| <span class="sourceLineNo">452</span> dst.put((byte) 255);<a name="line.452"></a> |
| <span class="sourceLineNo">453</span> putUint32(dst, w);<a name="line.453"></a> |
| <span class="sourceLineNo">454</span> putUint32(dst, y);<a name="line.454"></a> |
| <span class="sourceLineNo">455</span> len = dst.getPosition() - start;<a name="line.455"></a> |
| <span class="sourceLineNo">456</span> ord.apply(a, offset + start, len);<a name="line.456"></a> |
| <span class="sourceLineNo">457</span> return len;<a name="line.457"></a> |
| <span class="sourceLineNo">458</span> }<a name="line.458"></a> |
| <span class="sourceLineNo">459</span><a name="line.459"></a> |
| <span class="sourceLineNo">460</span> /**<a name="line.460"></a> |
| <span class="sourceLineNo">461</span> * Determine the length in bytes of the varuint64 encoded in {@code src}. Preserves the state of<a name="line.461"></a> |
| <span class="sourceLineNo">462</span> * {@code src}.<a name="line.462"></a> |
| <span class="sourceLineNo">463</span> * @param src source buffer<a name="line.463"></a> |
| <span class="sourceLineNo">464</span> * @param comp if true, parse the complement of the value.<a name="line.464"></a> |
| <span class="sourceLineNo">465</span> * @return the number of bytes consumed by this value.<a name="line.465"></a> |
| <span class="sourceLineNo">466</span> */<a name="line.466"></a> |
| <span class="sourceLineNo">467</span> static int lengthVaruint64(PositionedByteRange src, boolean comp) {<a name="line.467"></a> |
| <span class="sourceLineNo">468</span> int a0 = (comp ? DESCENDING : ASCENDING).apply(src.peek()) & 0xff;<a name="line.468"></a> |
| <span class="sourceLineNo">469</span> if (a0 <= 240) return 1;<a name="line.469"></a> |
| <span class="sourceLineNo">470</span> if (a0 <= 248) return 2;<a name="line.470"></a> |
| <span class="sourceLineNo">471</span> if (a0 == 249) return 3;<a name="line.471"></a> |
| <span class="sourceLineNo">472</span> if (a0 == 250) return 4;<a name="line.472"></a> |
| <span class="sourceLineNo">473</span> if (a0 == 251) return 5;<a name="line.473"></a> |
| <span class="sourceLineNo">474</span> if (a0 == 252) return 6;<a name="line.474"></a> |
| <span class="sourceLineNo">475</span> if (a0 == 253) return 7;<a name="line.475"></a> |
| <span class="sourceLineNo">476</span> if (a0 == 254) return 8;<a name="line.476"></a> |
| <span class="sourceLineNo">477</span> if (a0 == 255) return 9;<a name="line.477"></a> |
| <span class="sourceLineNo">478</span> throw unexpectedHeader(src.peek());<a name="line.478"></a> |
| <span class="sourceLineNo">479</span> }<a name="line.479"></a> |
| <span class="sourceLineNo">480</span><a name="line.480"></a> |
| <span class="sourceLineNo">481</span> /**<a name="line.481"></a> |
| <span class="sourceLineNo">482</span> * Skip {@code src} over the encoded varuint64.<a name="line.482"></a> |
| <span class="sourceLineNo">483</span> * @param src source buffer<a name="line.483"></a> |
| <span class="sourceLineNo">484</span> * @param cmp if true, parse the complement of the value.<a name="line.484"></a> |
| <span class="sourceLineNo">485</span> * @return the number of bytes skipped.<a name="line.485"></a> |
| <span class="sourceLineNo">486</span> */<a name="line.486"></a> |
| <span class="sourceLineNo">487</span> static int skipVaruint64(PositionedByteRange src, boolean cmp) {<a name="line.487"></a> |
| <span class="sourceLineNo">488</span> final int len = lengthVaruint64(src, cmp);<a name="line.488"></a> |
| <span class="sourceLineNo">489</span> src.setPosition(src.getPosition() + len);<a name="line.489"></a> |
| <span class="sourceLineNo">490</span> return len;<a name="line.490"></a> |
| <span class="sourceLineNo">491</span> }<a name="line.491"></a> |
| <span class="sourceLineNo">492</span><a name="line.492"></a> |
| <span class="sourceLineNo">493</span> /**<a name="line.493"></a> |
| <span class="sourceLineNo">494</span> * Decode a sequence of bytes in {@code src} as a varuint64. Complement the encoded value when<a name="line.494"></a> |
| <span class="sourceLineNo">495</span> * {@code comp} is true.<a name="line.495"></a> |
| <span class="sourceLineNo">496</span> * @return the decoded value.<a name="line.496"></a> |
| <span class="sourceLineNo">497</span> */<a name="line.497"></a> |
| <span class="sourceLineNo">498</span> static long getVaruint64(PositionedByteRange src, boolean comp) {<a name="line.498"></a> |
| <span class="sourceLineNo">499</span> assert src.getRemaining() >= lengthVaruint64(src, comp);<a name="line.499"></a> |
| <span class="sourceLineNo">500</span> final long ret;<a name="line.500"></a> |
| <span class="sourceLineNo">501</span> Order ord = comp ? DESCENDING : ASCENDING;<a name="line.501"></a> |
| <span class="sourceLineNo">502</span> byte x = src.get();<a name="line.502"></a> |
| <span class="sourceLineNo">503</span> final int a0 = ord.apply(x) & 0xff, a1, a2, a3, a4, a5, a6, a7, a8;<a name="line.503"></a> |
| <span class="sourceLineNo">504</span> if (-1 == unsignedCmp(a0, 241)) {<a name="line.504"></a> |
| <span class="sourceLineNo">505</span> return a0;<a name="line.505"></a> |
| <span class="sourceLineNo">506</span> }<a name="line.506"></a> |
| <span class="sourceLineNo">507</span> x = src.get();<a name="line.507"></a> |
| <span class="sourceLineNo">508</span> a1 = ord.apply(x) & 0xff;<a name="line.508"></a> |
| <span class="sourceLineNo">509</span> if (-1 == unsignedCmp(a0, 249)) {<a name="line.509"></a> |
| <span class="sourceLineNo">510</span> return (a0 - 241L) * 256 + a1 + 240;<a name="line.510"></a> |
| <span class="sourceLineNo">511</span> }<a name="line.511"></a> |
| <span class="sourceLineNo">512</span> x = src.get();<a name="line.512"></a> |
| <span class="sourceLineNo">513</span> a2 = ord.apply(x) & 0xff;<a name="line.513"></a> |
| <span class="sourceLineNo">514</span> if (a0 == 249) {<a name="line.514"></a> |
| <span class="sourceLineNo">515</span> return 2288L + 256 * a1 + a2;<a name="line.515"></a> |
| <span class="sourceLineNo">516</span> }<a name="line.516"></a> |
| <span class="sourceLineNo">517</span> x = src.get();<a name="line.517"></a> |
| <span class="sourceLineNo">518</span> a3 = ord.apply(x) & 0xff;<a name="line.518"></a> |
| <span class="sourceLineNo">519</span> if (a0 == 250) {<a name="line.519"></a> |
| <span class="sourceLineNo">520</span> return ((long) a1 << 16L) | (a2 << 8) | a3;<a name="line.520"></a> |
| <span class="sourceLineNo">521</span> }<a name="line.521"></a> |
| <span class="sourceLineNo">522</span> x = src.get();<a name="line.522"></a> |
| <span class="sourceLineNo">523</span> a4 = ord.apply(x) & 0xff;<a name="line.523"></a> |
| <span class="sourceLineNo">524</span> ret = (((long) a1) << 24) | (a2 << 16) | (a3 << 8) | a4;<a name="line.524"></a> |
| <span class="sourceLineNo">525</span> if (a0 == 251) {<a name="line.525"></a> |
| <span class="sourceLineNo">526</span> return ret;<a name="line.526"></a> |
| <span class="sourceLineNo">527</span> }<a name="line.527"></a> |
| <span class="sourceLineNo">528</span> x = src.get();<a name="line.528"></a> |
| <span class="sourceLineNo">529</span> a5 = ord.apply(x) & 0xff;<a name="line.529"></a> |
| <span class="sourceLineNo">530</span> if (a0 == 252) {<a name="line.530"></a> |
| <span class="sourceLineNo">531</span> return (ret << 8) | a5;<a name="line.531"></a> |
| <span class="sourceLineNo">532</span> }<a name="line.532"></a> |
| <span class="sourceLineNo">533</span> x = src.get();<a name="line.533"></a> |
| <span class="sourceLineNo">534</span> a6 = ord.apply(x) & 0xff;<a name="line.534"></a> |
| <span class="sourceLineNo">535</span> if (a0 == 253) {<a name="line.535"></a> |
| <span class="sourceLineNo">536</span> return (ret << 16) | (a5 << 8) | a6;<a name="line.536"></a> |
| <span class="sourceLineNo">537</span> }<a name="line.537"></a> |
| <span class="sourceLineNo">538</span> x = src.get();<a name="line.538"></a> |
| <span class="sourceLineNo">539</span> a7 = ord.apply(x) & 0xff;<a name="line.539"></a> |
| <span class="sourceLineNo">540</span> if (a0 == 254) {<a name="line.540"></a> |
| <span class="sourceLineNo">541</span> return (ret << 24) | (a5 << 16) | (a6 << 8) | a7;<a name="line.541"></a> |
| <span class="sourceLineNo">542</span> }<a name="line.542"></a> |
| <span class="sourceLineNo">543</span> x = src.get();<a name="line.543"></a> |
| <span class="sourceLineNo">544</span> a8 = ord.apply(x) & 0xff;<a name="line.544"></a> |
| <span class="sourceLineNo">545</span> return (ret << 32) | (((long) a5) << 24) | (a6 << 16) | (a7 << 8) | a8;<a name="line.545"></a> |
| <span class="sourceLineNo">546</span> }<a name="line.546"></a> |
| <span class="sourceLineNo">547</span><a name="line.547"></a> |
| <span class="sourceLineNo">548</span> /**<a name="line.548"></a> |
| <span class="sourceLineNo">549</span> * Strip all trailing zeros to ensure that no digit will be zero and round using our default<a name="line.549"></a> |
| <span class="sourceLineNo">550</span> * context to ensure precision doesn't exceed max allowed. From Phoenix's {@code NumberUtil}.<a name="line.550"></a> |
| <span class="sourceLineNo">551</span> * @return new {@link BigDecimal} instance<a name="line.551"></a> |
| <span class="sourceLineNo">552</span> */<a name="line.552"></a> |
| <span class="sourceLineNo">553</span> static BigDecimal normalize(BigDecimal val) {<a name="line.553"></a> |
| <span class="sourceLineNo">554</span> return null == val ? null : val.stripTrailingZeros().round(DEFAULT_MATH_CONTEXT);<a name="line.554"></a> |
| <span class="sourceLineNo">555</span> }<a name="line.555"></a> |
| <span class="sourceLineNo">556</span><a name="line.556"></a> |
| <span class="sourceLineNo">557</span> /**<a name="line.557"></a> |
| <span class="sourceLineNo">558</span> * Read significand digits from {@code src} according to the magnitude of {@code e}.<a name="line.558"></a> |
| <span class="sourceLineNo">559</span> * @param src The source from which to read encoded digits.<a name="line.559"></a> |
| <span class="sourceLineNo">560</span> * @param e The magnitude of the first digit read.<a name="line.560"></a> |
| <span class="sourceLineNo">561</span> * @param comp Treat encoded bytes as complements when {@code comp} is true.<a name="line.561"></a> |
| <span class="sourceLineNo">562</span> * @return The decoded value.<a name="line.562"></a> |
| <span class="sourceLineNo">563</span> * @throws IllegalArgumentException when read exceeds the remaining length of {@code src}.<a name="line.563"></a> |
| <span class="sourceLineNo">564</span> */<a name="line.564"></a> |
| <span class="sourceLineNo">565</span> private static BigDecimal decodeSignificand(PositionedByteRange src, int e, boolean comp) {<a name="line.565"></a> |
| <span class="sourceLineNo">566</span> // TODO: can this be made faster?<a name="line.566"></a> |
| <span class="sourceLineNo">567</span> byte[] a = src.getBytes();<a name="line.567"></a> |
| <span class="sourceLineNo">568</span> final int start = src.getPosition(), offset = src.getOffset(), remaining = src.getRemaining();<a name="line.568"></a> |
| <span class="sourceLineNo">569</span> Order ord = comp ? DESCENDING : ASCENDING;<a name="line.569"></a> |
| <span class="sourceLineNo">570</span> BigDecimal m;<a name="line.570"></a> |
| <span class="sourceLineNo">571</span> StringBuilder sb = new StringBuilder();<a name="line.571"></a> |
| <span class="sourceLineNo">572</span> for (int i = 0;; i++) {<a name="line.572"></a> |
| <span class="sourceLineNo">573</span> if (i > remaining) {<a name="line.573"></a> |
| <span class="sourceLineNo">574</span> // we've exceeded this range's window<a name="line.574"></a> |
| <span class="sourceLineNo">575</span> src.setPosition(start);<a name="line.575"></a> |
| <span class="sourceLineNo">576</span> throw new IllegalArgumentException(<a name="line.576"></a> |
| <span class="sourceLineNo">577</span> "Read exceeds range before termination byte found. offset: " + offset + " position: "<a name="line.577"></a> |
| <span class="sourceLineNo">578</span> + (start + i));<a name="line.578"></a> |
| <span class="sourceLineNo">579</span> }<a name="line.579"></a> |
| <span class="sourceLineNo">580</span> // one byte -> 2 digits<a name="line.580"></a> |
| <span class="sourceLineNo">581</span> // base-100 digits are encoded as val * 2 + 1 except for the termination digit.<a name="line.581"></a> |
| <span class="sourceLineNo">582</span> int twoDigits = (ord.apply(a[offset + start + i]) & 0xff) / 2;<a name="line.582"></a> |
| <span class="sourceLineNo">583</span> sb.append(String.format("%02d", twoDigits));<a name="line.583"></a> |
| <span class="sourceLineNo">584</span> // detect termination digit<a name="line.584"></a> |
| <span class="sourceLineNo">585</span> // Also stop early: the result is normalized before it is returned,<a name="line.585"></a> |
| <span class="sourceLineNo">586</span> // so at most MAX_PRECISION + 2 digits need to be decoded here.<a name="line.586"></a> |
| <span class="sourceLineNo">587</span> if ((ord.apply(a[offset + start + i]) & 1) == 0 || sb.length() > MAX_PRECISION + 1) {<a name="line.587"></a> |
| <span class="sourceLineNo">588</span> src.setPosition(start + i + 1);<a name="line.588"></a> |
| <span class="sourceLineNo">589</span> break;<a name="line.589"></a> |
| <span class="sourceLineNo">590</span> }<a name="line.590"></a> |
| <span class="sourceLineNo">591</span> }<a name="line.591"></a> |
| <span class="sourceLineNo">592</span> m = new BigDecimal(sb.toString());<a name="line.592"></a> |
| <span class="sourceLineNo">593</span> int stepsMoveLeft = sb.charAt(0) != '0' ? m.precision() : m.precision() + 1;<a name="line.593"></a> |
| <span class="sourceLineNo">594</span> stepsMoveLeft -= e * 2;<a name="line.594"></a> |
| <span class="sourceLineNo">595</span><a name="line.595"></a> |
| <span class="sourceLineNo">596</span> return normalize(m.movePointLeft(stepsMoveLeft));<a name="line.596"></a> |
| <span class="sourceLineNo">597</span> }<a name="line.597"></a> |
| <span class="sourceLineNo">598</span><a name="line.598"></a> |
| <span class="sourceLineNo">599</span> /**<a name="line.599"></a> |
| <span class="sourceLineNo">600</span> * Skip {@code src} over the significand bytes.<a name="line.600"></a> |
| <span class="sourceLineNo">601</span> * @param src The source from which to read encoded digits.<a name="line.601"></a> |
| <span class="sourceLineNo">602</span> * @param comp Treat encoded bytes as complements when {@code comp} is true.<a name="line.602"></a> |
| <span class="sourceLineNo">603</span> * @return the number of bytes skipped.<a name="line.603"></a> |
| <span class="sourceLineNo">604</span> */<a name="line.604"></a> |
| <span class="sourceLineNo">605</span> private static int skipSignificand(PositionedByteRange src, boolean comp) {<a name="line.605"></a> |
| <span class="sourceLineNo">606</span> byte[] a = src.getBytes();<a name="line.606"></a> |
| <span class="sourceLineNo">607</span> final int offset = src.getOffset(), start = src.getPosition();<a name="line.607"></a> |
| <span class="sourceLineNo">608</span> int i = src.getPosition();<a name="line.608"></a> |
| <span class="sourceLineNo">609</span> while (((comp ? DESCENDING : ASCENDING).apply(a[offset + i++]) & 1) != 0)<a name="line.609"></a> |
| <span class="sourceLineNo">610</span> ;<a name="line.610"></a> |
| <span class="sourceLineNo">611</span> src.setPosition(i);<a name="line.611"></a> |
| <span class="sourceLineNo">612</span> return i - start;<a name="line.612"></a> |
| <span class="sourceLineNo">613</span> }<a name="line.613"></a> |
| <span class="sourceLineNo">614</span><a name="line.614"></a> |
| <span class="sourceLineNo">615</span> /**<a name="line.615"></a> |
| <span class="sourceLineNo">616</span> * Write a non-zero value whose magnitude is below one using the key encoding. The caller<a name="line.616"></a> |
| <span class="sourceLineNo">617</span> * guarantees that {@code 1.0 > abs(val) > 0.0}.<a name="line.617"></a> |
| <span class="sourceLineNo">618</span> * <p><a name="line.618"></a> |
| <span class="sourceLineNo">619</span> * The value is treated as a mantissa {@code M} scaled by a power of one hundred, so that the<a name="line.619"></a> |
| <span class="sourceLineNo">620</span> * original value equals {@code (M * 100^E)}, with {@code E} the smallest exponent that keeps<a name="line.620"></a> |
| <span class="sourceLineNo">621</span> * {@code M} below 1.0. Since the input is less than one, {@code E} is never positive and this<a name="line.621"></a> |
| <span class="sourceLineNo">622</span> * routine stores {@code -E} as an unsigned varint.<a name="line.622"></a> |
| <span class="sourceLineNo">623</span> * </p><a name="line.623"></a> |
| <span class="sourceLineNo">624</span> * <p><a name="line.624"></a> |
| <span class="sourceLineNo">625</span> * The output is a header byte, the exponent, then the mantissa written by<a name="line.625"></a> |
| <span class="sourceLineNo">626</span> * {@link OrderedBytes#encodeToCentimal(PositionedByteRange, BigDecimal)} with the low bit of<a name="line.626"></a> |
| <span class="sourceLineNo">627</span> * its final byte cleared. The sign decides which part is stored as its ones-complement:<a name="line.627"></a> |
| <span class="sourceLineNo">628</span> * </p><a name="line.628"></a> |
| <span class="sourceLineNo">629</span> *<a name="line.629"></a> |
| <span class="sourceLineNo">630</span> * <pre><a name="line.630"></a> |
| <span class="sourceLineNo">631</span> * positive: POS_SMALL ~-E M<a name="line.631"></a> |
| <span class="sourceLineNo">632</span> * negative: NEG_SMALL -E ~M<a name="line.632"></a> |
| <span class="sourceLineNo">633</span> * </pre><a name="line.633"></a> |
| <span class="sourceLineNo">634</span> * @param dst The destination to which encoded digits are written.<a name="line.634"></a> |
| <span class="sourceLineNo">635</span> * @param val The value to encode.<a name="line.635"></a> |
| <span class="sourceLineNo">636</span> * @return the number of bytes written.<a name="line.636"></a> |
| <span class="sourceLineNo">637</span> */<a name="line.637"></a> |
| <span class="sourceLineNo">638</span> private static int encodeNumericSmall(PositionedByteRange dst, BigDecimal val) {<a name="line.638"></a> |
| <span class="sourceLineNo">639</span> // TODO: this can be done faster?<a name="line.639"></a> |
| <span class="sourceLineNo">640</span> final boolean negative = val.signum() < 0;<a name="line.640"></a> |
| <span class="sourceLineNo">641</span> BigDecimal magnitude = val.abs();<a name="line.641"></a> |
| <span class="sourceLineNo">642</span> assert BigDecimal.ZERO.compareTo(magnitude) < 0 && BigDecimal.ONE.compareTo(magnitude) > 0;<a name="line.642"></a> |
| <span class="sourceLineNo">643</span> final byte[] buf = dst.getBytes();<a name="line.643"></a> |
| <span class="sourceLineNo">644</span> final int base = dst.getOffset();<a name="line.644"></a> |
| <span class="sourceLineNo">645</span> final int begin = dst.getPosition();<a name="line.645"></a> |
| <span class="sourceLineNo">646</span><a name="line.646"></a> |
| <span class="sourceLineNo">647</span> // Header byte. Small negative number: 0x14, -E, ~M<a name="line.647"></a> |
| <span class="sourceLineNo">648</span> // Small positive number: 0x16, ~-E, M<a name="line.648"></a> |
| <span class="sourceLineNo">649</span> dst.put(negative ? NEG_SMALL : POS_SMALL);<a name="line.649"></a> |
| <span class="sourceLineNo">650</span><a name="line.650"></a> |
| <span class="sourceLineNo">651</span> // Shift the decimal point right by an even number of places, skipping leading fractional<a name="line.651"></a> |
| <span class="sourceLineNo">652</span> // zeros in pairs; half of that shift is the magnitude of the (non-positive) exponent E.<a name="line.652"></a> |
| <span class="sourceLineNo">653</span> final int leadingZeros = magnitude.scale() - magnitude.precision();<a name="line.653"></a> |
| <span class="sourceLineNo">654</span> final int shift = leadingZeros - (leadingZeros % 2 == 0 ? 0 : 1);<a name="line.654"></a> |
| <span class="sourceLineNo">655</span> final int negatedExp = shift / 2;<a name="line.655"></a> |
| <span class="sourceLineNo">656</span> magnitude = magnitude.movePointRight(shift);<a name="line.656"></a> |
| <span class="sourceLineNo">657</span><a name="line.657"></a> |
| <span class="sourceLineNo">658</span> // encode appropriate E value; it is complemented for positive values only.<a name="line.658"></a> |
| <span class="sourceLineNo">659</span> putVaruint64(dst, negatedExp, !negative);<a name="line.659"></a> |
| <span class="sourceLineNo">660</span><a name="line.660"></a> |
| <span class="sourceLineNo">661</span> // Emit M one centimal digit per byte, each digit x encoded as 2x+1 ...<a name="line.661"></a> |
| <span class="sourceLineNo">662</span> final int mantissaStart = dst.getPosition();<a name="line.662"></a> |
| <span class="sourceLineNo">663</span> encodeToCentimal(dst, magnitude);<a name="line.663"></a> |
| <span class="sourceLineNo">664</span> // ... except the terminal digit, whose low bit is cleared so that it reads as 2x.<a name="line.664"></a> |
| <span class="sourceLineNo">665</span> final int last = base + dst.getPosition() - 1;<a name="line.665"></a> |
| <span class="sourceLineNo">666</span> buf[last] = (byte) (buf[last] & 0xfe);<a name="line.666"></a> |
| <span class="sourceLineNo">667</span> if (negative) {<a name="line.667"></a> |
| <span class="sourceLineNo">668</span> // negative values store the mantissa as ~M<a name="line.668"></a> |
| <span class="sourceLineNo">669</span> DESCENDING.apply(buf, base + mantissaStart, dst.getPosition() - mantissaStart);<a name="line.669"></a> |
| <span class="sourceLineNo">670</span> }<a name="line.670"></a> |
| <span class="sourceLineNo">671</span> return dst.getPosition() - begin;<a name="line.671"></a> |
| <span class="sourceLineNo">672</span> }<a name="line.672"></a> |
| <span class="sourceLineNo">673</span><a name="line.673"></a> |
| <span class="sourceLineNo">674</span> /**<a name="line.674"></a> |
| <span class="sourceLineNo">675</span> * Write a finite value whose magnitude is one or greater using the key encoding. The caller<a name="line.675"></a> |
| <span class="sourceLineNo">676</span> * guarantees that {@code val} will be finite and {@code abs(val) >= 1.0}.<a name="line.676"></a> |
| <span class="sourceLineNo">677</span> * <p><a name="line.677"></a> |
| <span class="sourceLineNo">678</span> * The value is treated as a mantissa {@code M} scaled by a power of one hundred, so that the<a name="line.678"></a> |
| <span class="sourceLineNo">679</span> * original value equals {@code (M * 100^E)}, with {@code E} the smallest exponent that keeps<a name="line.679"></a> |
| <span class="sourceLineNo">680</span> * {@code M} below 1.0.<a name="line.680"></a> |
| <span class="sourceLineNo">681</span> * </p><a name="line.681"></a> |
| <span class="sourceLineNo">682</span> * <p><a name="line.682"></a> |
| <span class="sourceLineNo">683</span> * Each centimal digit of the mantissa is stored in a byte. If the value of the centimal digit is<a name="line.683"></a> |
| <span class="sourceLineNo">684</span> * {@code X} (hence {@code X>=0} and {@code X<=99}) then the byte value is {@code 2*X+1} for<a name="line.684"></a> |
| <span class="sourceLineNo">685</span> * every byte of the mantissa, except for the last byte, which is {@code 2*X+0}. The mantissa<a name="line.685"></a> |
| <span class="sourceLineNo">686</span> * uses the minimum number of bytes necessary to represent the value; trailing {@code X==0}<a name="line.686"></a> |
| <span class="sourceLineNo">687</span> * digits are omitted, which means that the mantissa never contains a byte with the value<a name="line.687"></a> |
| <span class="sourceLineNo">688</span> * {@code 0x00}.<a name="line.688"></a> |
| <span class="sourceLineNo">689</span> * </p><a name="line.689"></a> |
| <span class="sourceLineNo">690</span> * <p><a name="line.690"></a> |
| <span class="sourceLineNo">691</span> * If {@code E > 10}, this routine writes the large-number header, then {@code E} as a varint,<a name="line.691"></a> |
| <span class="sourceLineNo">692</span> * then the mantissa. Otherwise, if {@code E <= 10}, the header byte itself is rewritten to<a name="line.692"></a> |
| <span class="sourceLineNo">693</span> * carry {@code E} and only the mantissa follows. For negative values the varint exponent (when<a name="line.693"></a> |
| <span class="sourceLineNo">694</span> * present) and the mantissa are stored as their ones-complement.<a name="line.694"></a> |
| <span class="sourceLineNo">695</span> * </p><a name="line.695"></a> |
| <span class="sourceLineNo">696</span> *<a name="line.696"></a> |
| <span class="sourceLineNo">697</span> * <pre><a name="line.697"></a> |
| <span class="sourceLineNo">698</span> * Encoding: header(E) M (if E&lt;=10)<a name="line.698"></a> |
| <span class="sourceLineNo">699</span> * header E M (if E&gt;10)<a name="line.699"></a> |
| <span class="sourceLineNo">700</span> * </pre><a name="line.700"></a> |
| <span class="sourceLineNo">701</span> * @param dst The destination to which encoded digits are written.<a name="line.701"></a> |
| <span class="sourceLineNo">702</span> * @param val The value to encode.<a name="line.702"></a> |
| <span class="sourceLineNo">703</span> * @return the number of bytes written.<a name="line.703"></a> |
| <span class="sourceLineNo">704</span> */<a name="line.704"></a> |
| <span class="sourceLineNo">705</span> private static int encodeNumericLarge(PositionedByteRange dst, BigDecimal val) {<a name="line.705"></a> |
| <span class="sourceLineNo">706</span> // TODO: this can be done faster<a name="line.706"></a> |
| <span class="sourceLineNo">707</span> final boolean negative = val.signum() < 0;<a name="line.707"></a> |
| <span class="sourceLineNo">708</span> BigDecimal magnitude = val.abs();<a name="line.708"></a> |
| <span class="sourceLineNo">709</span> final byte[] buf = dst.getBytes();<a name="line.709"></a> |
| <span class="sourceLineNo">710</span> final int base = dst.getOffset();<a name="line.710"></a> |
| <span class="sourceLineNo">711</span> final int begin = dst.getPosition();<a name="line.711"></a> |
| <span class="sourceLineNo">712</span><a name="line.712"></a> |
| <span class="sourceLineNo">713</span> // Write the "large" header first; it is replaced below when E fits in the header byte.<a name="line.713"></a> |
| <span class="sourceLineNo">714</span> // Large negative number: 0x08, ~E, ~M. Large positive number: 0x22, E, M.<a name="line.714"></a> |
| <span class="sourceLineNo">715</span> dst.put(negative ? NEG_LARGE : POS_LARGE);<a name="line.715"></a> |
| <span class="sourceLineNo">716</span><a name="line.716"></a> |
| <span class="sourceLineNo">717</span> // Shift left by an even digit count covering all integer digits; E is half that shift.<a name="line.717"></a> |
| <span class="sourceLineNo">718</span> final int integerDigits = magnitude.precision() - magnitude.scale();<a name="line.718"></a> |
| <span class="sourceLineNo">719</span> final int shift = integerDigits + (integerDigits % 2 == 0 ? 0 : 1);<a name="line.719"></a> |
| <span class="sourceLineNo">720</span> final int exp = shift / 2;<a name="line.720"></a> |
| <span class="sourceLineNo">721</span> magnitude = magnitude.movePointLeft(shift);<a name="line.721"></a> |
| <span class="sourceLineNo">722</span><a name="line.722"></a> |
| <span class="sourceLineNo">723</span> if (exp > 10) {<a name="line.723"></a> |
| <span class="sourceLineNo">724</span> // large number, write out {~,}E after the header<a name="line.724"></a> |
| <span class="sourceLineNo">725</span> putVaruint64(dst, exp, negative);<a name="line.725"></a> |
| <span class="sourceLineNo">726</span> } else if (negative) {<a name="line.726"></a> |
| <span class="sourceLineNo">727</span> // Medium negative number: 0x13-E, ~M<a name="line.727"></a> |
| <span class="sourceLineNo">728</span> dst.put(begin, (byte) (NEG_MED_MAX - exp));<a name="line.728"></a> |
| <span class="sourceLineNo">729</span> } else {<a name="line.729"></a> |
| <span class="sourceLineNo">730</span> // Medium positive number: 0x17+E, M<a name="line.730"></a> |
| <span class="sourceLineNo">731</span> dst.put(begin, (byte) (POS_MED_MIN + exp));<a name="line.731"></a> |
| <span class="sourceLineNo">732</span> }<a name="line.732"></a> |
| <span class="sourceLineNo">733</span><a name="line.733"></a> |
| <span class="sourceLineNo">734</span> // Emit M one centimal digit per byte, each digit x encoded as 2x+1 ...<a name="line.734"></a> |
| <span class="sourceLineNo">735</span> final int mantissaStart = dst.getPosition();<a name="line.735"></a> |
| <span class="sourceLineNo">736</span> encodeToCentimal(dst, magnitude);<a name="line.736"></a> |
| <span class="sourceLineNo">737</span> // ... except the terminal digit, whose low bit is cleared so that it reads as 2x.<a name="line.737"></a> |
| <span class="sourceLineNo">738</span> final int last = base + dst.getPosition() - 1;<a name="line.738"></a> |
| <span class="sourceLineNo">739</span> buf[last] = (byte) (buf[last] & 0xfe);<a name="line.739"></a> |
| <span class="sourceLineNo">740</span> if (negative) {<a name="line.740"></a> |
| <span class="sourceLineNo">741</span> // negative values store the mantissa as ~M<a name="line.741"></a> |
| <span class="sourceLineNo">742</span> DESCENDING.apply(buf, base + mantissaStart, dst.getPosition() - mantissaStart);<a name="line.742"></a> |
| <span class="sourceLineNo">743</span> }<a name="line.743"></a> |
| <span class="sourceLineNo">744</span> return dst.getPosition() - begin;<a name="line.744"></a> |
| <span class="sourceLineNo">745</span> }<a name="line.745"></a> |
| <span class="sourceLineNo">746</span><a name="line.746"></a> |
| <span class="sourceLineNo">747</span> /**<a name="line.747"></a> |
| <span class="sourceLineNo">748</span> * Encode a value val in [0.01, 1.0) into Centimals. Util function for<a name="line.748"></a> |
| <span class="sourceLineNo">749</span> * {@link OrderedBytes#encodeNumericLarge(PositionedByteRange, BigDecimal)} and<a name="line.749"></a> |
| <span class="sourceLineNo">750</span> * {@link OrderedBytes#encodeNumericSmall(PositionedByteRange, BigDecimal)}<a name="line.750"></a> |
| <span class="sourceLineNo">751</span> * @param dst The destination to which encoded digits are written.<a name="line.751"></a> |
| <span class="sourceLineNo">752</span> * @param val A BigDecimal after the normalization. The value must be in [0.01, 1.0).<a name="line.752"></a> |
| <span class="sourceLineNo">753</span> */<a name="line.753"></a> |
| <span class="sourceLineNo">754</span> private static void encodeToCentimal(PositionedByteRange dst, BigDecimal val) {<a name="line.754"></a> |
| <span class="sourceLineNo">755</span> // The input value val must be in [0.01, 1.0)<a name="line.755"></a> |
| <span class="sourceLineNo">756</span> String stringOfAbs = val.stripTrailingZeros().toPlainString();<a name="line.756"></a> |
| <span class="sourceLineNo">757</span> String value = stringOfAbs.substring(stringOfAbs.indexOf('.') + 1);<a name="line.757"></a> |
| <span class="sourceLineNo">758</span> int d;<a name="line.758"></a> |
| <span class="sourceLineNo">759</span><a name="line.759"></a> |
| <span class="sourceLineNo">760</span> // If the first float digit is 0, we will encode one digit more than MAX_PRECISION<a name="line.760"></a> |
| <span class="sourceLineNo">761</span> // We encode at most MAX_PRECISION significant digits into centimals,<a name="line.761"></a> |
| <span class="sourceLineNo">762</span> // because the input value, has been already normalized.<a name="line.762"></a> |
| <span class="sourceLineNo">763</span> int maxPrecision = value.charAt(0) == '0' ? MAX_PRECISION + 1 : MAX_PRECISION;<a name="line.763"></a> |
| <span class="sourceLineNo">764</span> maxPrecision = Math.min(maxPrecision, value.length());<a name="line.764"></a> |
| <span class="sourceLineNo">765</span> for (int i = 0; i < maxPrecision; i += 2) {<a name="line.765"></a> |
| <span class="sourceLineNo">766</span> d = (value.charAt(i) - '0') * 10;<a name="line.766"></a> |
| <span class="sourceLineNo">767</span> if (i + 1 < maxPrecision) {<a name="line.767"></a> |
| <span class="sourceLineNo">768</span> d += (value.charAt(i + 1) - '0');<a name="line.768"></a> |
| <span class="sourceLineNo">769</span> }<a name="line.769"></a> |
| <span class="sourceLineNo">770</span> dst.put((byte) (2 * d + 1));<a name="line.770"></a> |
| <span class="sourceLineNo">771</span> }<a name="line.771"></a> |
| <span class="sourceLineNo">772</span> }<a name="line.772"></a> |
| <span class="sourceLineNo">773</span><a name="line.773"></a> |
| <span class="sourceLineNo">774</span> /**<a name="line.774"></a> |
| <span class="sourceLineNo">775</span> * Encode a {@code long} using the variable-length encoding, via the {@link BigDecimal} overload.<a name="line.775"></a> |
| <span class="sourceLineNo">776</span> * @param dst The destination to which encoded digits are written.<a name="line.776"></a> |
| <span class="sourceLineNo">777</span> * @param val The value to encode; it is converted with {@link BigDecimal#valueOf(long)}.<a name="line.777"></a> |
| <span class="sourceLineNo">778</span> * @param ord The {@link Order} to respect while encoding {@code val}.<a name="line.778"></a> |
| <span class="sourceLineNo">779</span> * @return the number of bytes written.<a name="line.779"></a> |
| <span class="sourceLineNo">780</span> */<a name="line.780"></a> |
| <span class="sourceLineNo">781</span> public static int encodeNumeric(PositionedByteRange dst, long val, Order ord) {<a name="line.781"></a> |
| <span class="sourceLineNo">782</span> return encodeNumeric(dst, BigDecimal.valueOf(val), ord);<a name="line.782"></a> |
| <span class="sourceLineNo">783</span> }<a name="line.783"></a> |
| <span class="sourceLineNo">784</span><a name="line.784"></a> |
| <span class="sourceLineNo">785</span> /**<a name="line.785"></a> |
| <span class="sourceLineNo">786</span> * Encode a {@code double} in the variable-length encoding; zero, NaN and infinities use one byte.<a name="line.786"></a> |
| <span class="sourceLineNo">787</span> * @param dst The destination to which encoded digits are written.<a name="line.787"></a> |
| <span class="sourceLineNo">788</span> * @param val The value to encode.<a name="line.788"></a> |
| <span class="sourceLineNo">789</span> * @param ord The {@link Order} to respect while encoding {@code val}.<a name="line.789"></a> |
| <span class="sourceLineNo">790</span> * @return the number of bytes written.<a name="line.790"></a> |
| <span class="sourceLineNo">791</span> */<a name="line.791"></a> |
| <span class="sourceLineNo">792</span> public static int encodeNumeric(PositionedByteRange dst, double val, Order ord) {<a name="line.792"></a> |
| <span class="sourceLineNo">793</span> // Zero, NaN and the infinities are each written as a single, order-adjusted header byte.<a name="line.793"></a> |
| <span class="sourceLineNo">794</span> final byte special;<a name="line.794"></a> |
| <span class="sourceLineNo">795</span> if (Double.isNaN(val)) {<a name="line.795"></a> |
| <span class="sourceLineNo">796</span> special = NAN;<a name="line.796"></a> |
| <span class="sourceLineNo">797</span> } else if (val == 0.0) {<a name="line.797"></a> |
| <span class="sourceLineNo">798</span> special = ZERO;<a name="line.798"></a> |
| <span class="sourceLineNo">799</span> } else if (val == Double.NEGATIVE_INFINITY) {<a name="line.799"></a> |
| <span class="sourceLineNo">800</span> special = NEG_INF;<a name="line.800"></a> |
| <span class="sourceLineNo">801</span> } else if (val == Double.POSITIVE_INFINITY) {<a name="line.801"></a> |
| <span class="sourceLineNo">802</span> special = POS_INF;<a name="line.802"></a> |
| <span class="sourceLineNo">803</span> } else {<a name="line.803"></a> |
| <span class="sourceLineNo">804</span> // Finite and non-zero: delegate to the BigDecimal overload.<a name="line.804"></a> |
| <span class="sourceLineNo">805</span> return encodeNumeric(dst, BigDecimal.valueOf(val), ord);<a name="line.805"></a> |
| <span class="sourceLineNo">806</span> }<a name="line.806"></a> |
| <span class="sourceLineNo">807</span><a name="line.807"></a> |
| <span class="sourceLineNo">808</span> dst.put(ord.apply(special));<a name="line.808"></a> |
| <span class="sourceLineNo">809</span> return 1;<a name="line.809"></a> |
| <span class="sourceLineNo">810</span> }<a name="line.810"></a> |
| <span class="sourceLineNo">811</span><a name="line.811"></a> |
| <span class="sourceLineNo">812</span> /**<a name="line.812"></a> |
| <span class="sourceLineNo">813</span> * Encode a numerical value using the variable-length encoding. If the number of significant<a name="line.813"></a> |
| <span class="sourceLineNo">814</span> * digits of the value exceeds the {@link OrderedBytes#MAX_PRECISION}, the exceeding part will be<a name="line.814"></a> |
| <span class="sourceLineNo">815</span> * lost. The large/small encoder is chosen from the normalized value, not from the raw input.<a name="line.815"></a> |
| <span class="sourceLineNo">816</span> * @param dst The destination to which encoded digits are written.<a name="line.816"></a> |
| <span class="sourceLineNo">817</span> * @param val The value to encode; {@code null} is written as an encoded null.<a name="line.817"></a> |
| <span class="sourceLineNo">818</span> * @param ord The {@link Order} to respect while encoding {@code val}.<a name="line.818"></a> |
| <span class="sourceLineNo">819</span> * @return the number of bytes written.<a name="line.819"></a> |
| <span class="sourceLineNo">820</span> */<a name="line.820"></a> |
| <span class="sourceLineNo">821</span> public static int encodeNumeric(PositionedByteRange dst, BigDecimal val, Order ord) {<a name="line.821"></a> |
| <span class="sourceLineNo">822</span> final int len, offset = dst.getOffset(), start = dst.getPosition();<a name="line.822"></a> |
| <span class="sourceLineNo">823</span> if (null == val) {<a name="line.823"></a> |
| <span class="sourceLineNo">824</span> return encodeNull(dst, ord);<a name="line.824"></a> |
| <span class="sourceLineNo">825</span> } else if (BigDecimal.ZERO.compareTo(val) == 0) {<a name="line.825"></a> |
| <span class="sourceLineNo">826</span> dst.put(ord.apply(ZERO));<a name="line.826"></a> |
| <span class="sourceLineNo">827</span> return 1;<a name="line.827"></a> |
| <span class="sourceLineNo">828</span> }<a name="line.828"></a> |
| <span class="sourceLineNo">829</span> final BigDecimal norm = normalize(val); // classify the value that is actually written<a name="line.829"></a> |
| <span class="sourceLineNo">830</span> if (BigDecimal.ONE.compareTo(norm.abs()) <= 0) { // abs(v) >= 1.0<a name="line.830"></a> |
| <span class="sourceLineNo">831</span> len = encodeNumericLarge(dst, norm);<a name="line.831"></a> |
| <span class="sourceLineNo">832</span> } else { // 1.0 > abs(v) > 0.0; NOTE(review): assumes normalize() never yields zero - confirm<a name="line.832"></a> |
| <span class="sourceLineNo">833</span> len = encodeNumericSmall(dst, norm);<a name="line.833"></a> |
| <span class="sourceLineNo">834</span> }<a name="line.834"></a> |
| <span class="sourceLineNo">835</span> ord.apply(dst.getBytes(), offset + start, len);<a name="line.835"></a> |
| <span class="sourceLineNo">836</span> return len;<a name="line.836"></a> |
| <span class="sourceLineNo">837</span> }<a name="line.837"></a> |
| <span class="sourceLineNo">838</span><a name="line.838"></a> |
| <span class="sourceLineNo">839</span> /**<a name="line.839"></a> |
| <span class="sourceLineNo">840</span> * Decode a {@link BigDecimal} from {@code src}. Assumes {@code src} encodes a value in Numeric<a name="line.840"></a> |
| <span class="sourceLineNo">841</span> * encoding and is within the valid range of {@link BigDecimal} values. {@link BigDecimal} does<a name="line.841"></a> |
| <span class="sourceLineNo">842</span> * not support {@code NaN} or {@code Infinite} values. Returns {@code null} for an encoded NULL.<a name="line.842"></a> |
| <span class="sourceLineNo">843</span> * @see #decodeNumericAsDouble(PositionedByteRange)<a name="line.843"></a> |
| <span class="sourceLineNo">844</span> */<a name="line.844"></a> |
| <span class="sourceLineNo">845</span> private static BigDecimal decodeNumericValue(PositionedByteRange src) {<a name="line.845"></a> |
| <span class="sourceLineNo">846</span> final int e;<a name="line.846"></a> |
| <span class="sourceLineNo">847</span> byte header = src.get();<a name="line.847"></a> |
| <span class="sourceLineNo">848</span> boolean dsc = -1 == Integer.signum(header);<a name="line.848"></a> |
| <span class="sourceLineNo">849</span> header = dsc ? DESCENDING.apply(header) : header;<a name="line.849"></a> |
| <span class="sourceLineNo">850</span><a name="line.850"></a> |
| <span class="sourceLineNo">851</span> if (header == NULL) return null;<a name="line.851"></a> |
| <span class="sourceLineNo">852</span> if (header == NEG_LARGE) { /* Large negative number: 0x08, ~E, ~M */<a name="line.852"></a> |
| <span class="sourceLineNo">853</span> e = (int) getVaruint64(src, !dsc);<a name="line.853"></a> |
| <span class="sourceLineNo">854</span> return decodeSignificand(src, e, !dsc).negate();<a name="line.854"></a> |
| <span class="sourceLineNo">855</span> }<a name="line.855"></a> |
| <span class="sourceLineNo">856</span> if (header >= NEG_MED_MIN && header <= NEG_MED_MAX) {<a name="line.856"></a> |
| <span class="sourceLineNo">857</span> /* Medium negative number: 0x13-E, ~M (E is carried by the header byte itself) */<a name="line.857"></a> |
| <span class="sourceLineNo">858</span> e = NEG_MED_MAX - header;<a name="line.858"></a> |
| <span class="sourceLineNo">859</span> return decodeSignificand(src, e, !dsc).negate();<a name="line.859"></a> |
| <span class="sourceLineNo">860</span> }<a name="line.860"></a> |
| <span class="sourceLineNo">861</span> if (header == NEG_SMALL) { /* Small negative number: 0x14, -E, ~M */<a name="line.861"></a> |
| <span class="sourceLineNo">862</span> e = (int) -getVaruint64(src, dsc);<a name="line.862"></a> |
| <span class="sourceLineNo">863</span> return decodeSignificand(src, e, !dsc).negate();<a name="line.863"></a> |
| <span class="sourceLineNo">864</span> }<a name="line.864"></a> |
| <span class="sourceLineNo">865</span> if (header == ZERO) {<a name="line.865"></a> |
| <span class="sourceLineNo">866</span> return BigDecimal.ZERO;<a name="line.866"></a> |
| <span class="sourceLineNo">867</span> }<a name="line.867"></a> |
| <span class="sourceLineNo">868</span> if (header == POS_SMALL) { /* Small positive number: 0x16, ~-E, M */<a name="line.868"></a> |
| <span class="sourceLineNo">869</span> e = (int) -getVaruint64(src, !dsc);<a name="line.869"></a> |
| <span class="sourceLineNo">870</span> return decodeSignificand(src, e, dsc);<a name="line.870"></a> |
| <span class="sourceLineNo">871</span> }<a name="line.871"></a> |
| <span class="sourceLineNo">872</span> if (header >= POS_MED_MIN && header <= POS_MED_MAX) {<a name="line.872"></a> |
| <span class="sourceLineNo">873</span> /* Medium positive number: 0x17+E, M (E is carried by the header byte itself) */<a name="line.873"></a> |
| <span class="sourceLineNo">874</span> e = header - POS_MED_MIN;<a name="line.874"></a> |
| <span class="sourceLineNo">875</span> return decodeSignificand(src, e, dsc);<a name="line.875"></a> |
| <span class="sourceLineNo">876</span> }<a name="line.876"></a> |
| <span class="sourceLineNo">877</span> if (header == POS_LARGE) { /* Large positive number: 0x22, E, M */<a name="line.877"></a> |
| <span class="sourceLineNo">878</span> e = (int) getVaruint64(src, dsc);<a name="line.878"></a> |
| <span class="sourceLineNo">879</span> return decodeSignificand(src, e, dsc);<a name="line.879"></a> |
| <span class="sourceLineNo">880</span> }<a name="line.880"></a> |
| <span class="sourceLineNo">881</span> throw unexpectedHeader(header);<a name="line.881"></a> |
| <span class="sourceLineNo">882</span> }<a name="line.882"></a> |
| <span class="sourceLineNo">883</span><a name="line.883"></a> |
| <span class="sourceLineNo">884</span> /**<a name="line.884"></a> |
| <span class="sourceLineNo">885</span> * Decode a primitive {@code double} value from the Numeric encoding. Numeric encoding is based on<a name="line.885"></a> |
| <span class="sourceLineNo">886</span> * {@link BigDecimal}; in the event the encoded value is larger than can be represented in a<a name="line.886"></a> |
| <span class="sourceLineNo">887</span> * {@code double}, this method performs an implicit narrowing conversion as described in<a name="line.887"></a> |
| <span class="sourceLineNo">888</span> * {@link BigDecimal#doubleValue()}. NaN, zero and the infinities are decoded from their headers.<a name="line.888"></a> |
| <span class="sourceLineNo">889</span> * @throws NullPointerException when the encoded value is {@code NULL}.<a name="line.889"></a> |
| <span class="sourceLineNo">890</span> * @throws IllegalArgumentException when the encoded value is not a Numeric.<a name="line.890"></a> |
| <span class="sourceLineNo">891</span> * @see #encodeNumeric(PositionedByteRange, double, Order)<a name="line.891"></a> |
| <span class="sourceLineNo">892</span> * @see BigDecimal#doubleValue()<a name="line.892"></a> |
| <span class="sourceLineNo">893</span> */<a name="line.893"></a> |
| <span class="sourceLineNo">894</span> public static double decodeNumericAsDouble(PositionedByteRange src) {<a name="line.894"></a> |
| <span class="sourceLineNo">895</span> // TODO: should an encoded NULL value throw unexpectedHeader() instead?<a name="line.895"></a> |
| <span class="sourceLineNo">896</span> if (isNull(src)) {<a name="line.896"></a> |
| <span class="sourceLineNo">897</span> throw new NullPointerException("A null value cannot be decoded to a double.");<a name="line.897"></a> |
| <span class="sourceLineNo">898</span> }<a name="line.898"></a> |
| <span class="sourceLineNo">899</span> if (isNumericNaN(src)) {<a name="line.899"></a> |
| <span class="sourceLineNo">900</span> src.get();<a name="line.900"></a> |
| <span class="sourceLineNo">901</span> return Double.NaN;<a name="line.901"></a> |
| <span class="sourceLineNo">902</span> }<a name="line.902"></a> |
| <span class="sourceLineNo">903</span> if (isNumericZero(src)) {<a name="line.903"></a> |
| <span class="sourceLineNo">904</span> src.get();<a name="line.904"></a> |
| <span class="sourceLineNo">905</span> return 0.0; // primitive literal; no boxing round-trip needed<a name="line.905"></a> |
| <span class="sourceLineNo">906</span> }<a name="line.906"></a> |
| <span class="sourceLineNo">907</span> // Undo the descending-order complement (negative header byte) before comparing constants.<a name="line.907"></a> |
| <span class="sourceLineNo">908</span> final byte raw = src.peek();<a name="line.908"></a> |
| <span class="sourceLineNo">909</span> final byte header = raw < 0 ? DESCENDING.apply(raw) : raw;<a name="line.909"></a> |
| <span class="sourceLineNo">910</span> if (header == NEG_INF) {<a name="line.910"></a> |
| <span class="sourceLineNo">911</span> src.get();<a name="line.911"></a> |
| <span class="sourceLineNo">912</span> return Double.NEGATIVE_INFINITY;<a name="line.912"></a> |
| <span class="sourceLineNo">913</span> } else if (header == POS_INF) {<a name="line.913"></a> |
| <span class="sourceLineNo">914</span> src.get();<a name="line.914"></a> |
| <span class="sourceLineNo">915</span> return Double.POSITIVE_INFINITY;<a name="line.915"></a> |
| <span class="sourceLineNo">916</span> } else {<a name="line.916"></a> |
| <span class="sourceLineNo">917</span> return decodeNumericValue(src).doubleValue();<a name="line.917"></a> |
| <span class="sourceLineNo">918</span> }<a name="line.918"></a> |
| <span class="sourceLineNo">919</span> }<a name="line.919"></a> |
| <span class="sourceLineNo">920</span><a name="line.920"></a> |
| <span class="sourceLineNo">921</span> /**<a name="line.921"></a> |
| <span class="sourceLineNo">922</span> * Decode a primitive {@code long} value from the Numeric encoding. Numeric encoding is based on<a name="line.922"></a> |
| <span class="sourceLineNo">923</span> * {@link BigDecimal}; in the event the encoded value is larger than can be represented in a<a name="line.923"></a> |
| <span class="sourceLineNo">924</span> * {@code long}, this method performs an implicit narrowing conversion as described in<a name="line.924"></a> |
| <span class="sourceLineNo">925</span> * {@link BigDecimal#longValue()}.<a name="line.925"></a> |
| <span class="sourceLineNo">926</span> * @throws NullPointerException when the encoded value is {@code NULL}.<a name="line.926"></a> |
| <span class="sourceLineNo">927</span> * @throws IllegalArgumentException when the encoded value is not a Numeric, or is NaN or infinite.<a name="line.927"></a> |
| <span class="sourceLineNo">928</span> * @see #encodeNumeric(PositionedByteRange, long, Order)<a name="line.928"></a> |
| <span class="sourceLineNo">929</span> * @see BigDecimal#longValue()<a name="line.929"></a> |
| <span class="sourceLineNo">930</span> */<a name="line.930"></a> |
| <span class="sourceLineNo">931</span> public static long decodeNumericAsLong(PositionedByteRange src) {<a name="line.931"></a> |
| <span class="sourceLineNo">932</span> // TODO: should an encoded NULL value throw unexpectedHeader() instead?<a name="line.932"></a> |
| <span class="sourceLineNo">933</span> if (isNull(src)) throw new NullPointerException("A null value cannot be decoded to a long.");<a name="line.933"></a> |
| <span class="sourceLineNo">934</span> if (!isNumeric(src)) throw unexpectedHeader(src.peek());<a name="line.934"></a> |
| <span class="sourceLineNo">935</span> if (isNumericNaN(src)) throw unexpectedHeader(src.peek());<a name="line.935"></a> |
| <span class="sourceLineNo">936</span> if (isNumericInfinite(src)) throw unexpectedHeader(src.peek());<a name="line.936"></a> |
| <span class="sourceLineNo">937</span><a name="line.937"></a> |
| <span class="sourceLineNo">938</span> if (isNumericZero(src)) {<a name="line.938"></a> |
| <span class="sourceLineNo">939</span> src.get(); // consume the single header byte that encodes zero<a name="line.939"></a> |
| <span class="sourceLineNo">940</span> return 0L;<a name="line.940"></a> |
| <span class="sourceLineNo">941</span> }<a name="line.941"></a> |
| <span class="sourceLineNo">942</span> return decodeNumericValue(src).longValue();<a name="line.942"></a> |
| <span class="sourceLineNo">943</span> }<a name="line.943"></a> |
| <span class="sourceLineNo">944</span><a name="line.944"></a> |
| <span class="sourceLineNo">945</span> /**<a name="line.945"></a> |
| <span class="sourceLineNo">946</span> * Read a Numeric as a {@link BigDecimal}; an encoded {@code NULL} is consumed and yields null.<a name="line.946"></a> |
| <span class="sourceLineNo">947</span> * @throws IllegalArgumentException when the encoded value is not a Numeric, is NaN or infinite.<a name="line.947"></a> |
| <span class="sourceLineNo">948</span> * @see #encodeNumeric(PositionedByteRange, BigDecimal, Order)<a name="line.948"></a> |
| <span class="sourceLineNo">949</span> */<a name="line.949"></a> |
| <span class="sourceLineNo">950</span> public static BigDecimal decodeNumericAsBigDecimal(PositionedByteRange src) {<a name="line.950"></a> |
| <span class="sourceLineNo">951</span> if (!isNull(src)) {<a name="line.951"></a> |
| <span class="sourceLineNo">952</span> if (!isNumeric(src) || isNumericNaN(src) || isNumericInfinite(src)) {<a name="line.952"></a> |
| <span class="sourceLineNo">953</span> throw unexpectedHeader(src.peek());<a name="line.953"></a> |
| <span class="sourceLineNo">954</span> }<a name="line.954"></a> |
| <span class="sourceLineNo">955</span> return decodeNumericValue(src);<a name="line.955"></a> |
| <span class="sourceLineNo">956</span> }<a name="line.956"></a> |
| <span class="sourceLineNo">957</span> src.get(); // step over the NULL marker<a name="line.957"></a> |
| <span class="sourceLineNo">958</span> return null;<a name="line.958"></a> |
| <span class="sourceLineNo">959</span> }<a name="line.959"></a> |
| <span class="sourceLineNo">960</span><a name="line.960"></a> |
| <span class="sourceLineNo">961</span> /**<a name="line.961"></a> |
| <span class="sourceLineNo">962</span> * Write {@code val} as a {@code TEXT} header, its encoded bytes and a terminator. The encoding<a name="line.962"></a> |
| <span class="sourceLineNo">963</span> * is 0x00-terminated, so {@code \u0000} codepoints in the value are not supported.<a name="line.963"></a> |
| <span class="sourceLineNo">964</span> * @param dst The destination to which the encoded value is written.<a name="line.964"></a> |
| <span class="sourceLineNo">965</span> * @param val The value to encode; {@code null} is written via {@code encodeNull}.<a name="line.965"></a> |
| <span class="sourceLineNo">966</span> * @param ord The {@link Order} to respect while encoding {@code val}.<a name="line.966"></a> |
| <span class="sourceLineNo">967</span> * @return the number of bytes written.<a name="line.967"></a> |
| <span class="sourceLineNo">968</span> * @throws IllegalArgumentException when {@code val} contains a {@code \u0000}.<a name="line.968"></a> |
| <span class="sourceLineNo">969</span> */<a name="line.969"></a> |
| <span class="sourceLineNo">970</span> public static int encodeString(PositionedByteRange dst, String val, Order ord) {<a name="line.970"></a> |
| <span class="sourceLineNo">971</span> if (val == null) return encodeNull(dst, ord);<a name="line.971"></a> |
| <span class="sourceLineNo">972</span> if (val.indexOf('\u0000') >= 0) {<a name="line.972"></a> |
| <span class="sourceLineNo">973</span> throw new IllegalArgumentException("Cannot encode String values containing '\\u0000'");<a name="line.973"></a> |
| <span class="sourceLineNo">974</span> }<a name="line.974"></a> |
| <span class="sourceLineNo">975</span> final int rangeOffset = dst.getOffset(), begin = dst.getPosition();<a name="line.975"></a> |
| <span class="sourceLineNo">976</span> dst.put(TEXT);<a name="line.976"></a> |
| <span class="sourceLineNo">977</span> // TODO: is there no way to decode into dst directly?<a name="line.977"></a> |
| <span class="sourceLineNo">978</span> dst.put(val.getBytes(UTF8));<a name="line.978"></a> |
| <span class="sourceLineNo">979</span> dst.put(TERM);<a name="line.979"></a> |
| <span class="sourceLineNo">980</span> final int written = dst.getPosition() - begin;<a name="line.980"></a> |
| <span class="sourceLineNo">981</span> ord.apply(dst.getBytes(), rangeOffset + begin, written); // order-adjust what was just written<a name="line.981"></a> |
| <span class="sourceLineNo">982</span> return written;<a name="line.982"></a> |
| <span class="sourceLineNo">983</span> }<a name="line.983"></a> |
| <span class="sourceLineNo">984</span><a name="line.984"></a> |
| <span class="sourceLineNo">985</span> /**<a name="line.985"></a> |
| <span class="sourceLineNo">986</span> * Decode a String value; a header byte marking an encoded NULL yields {@code null}.<a name="line.986"></a> |
| <span class="sourceLineNo">987</span> */<a name="line.987"></a> |
| <span class="sourceLineNo">988</span> public static String decodeString(PositionedByteRange src) {<a name="line.988"></a> |
| <span class="sourceLineNo">989</span> final byte header = src.get();<a name="line.989"></a> |
| <span class="sourceLineNo">990</span> if (header == NULL || header == DESCENDING.apply(NULL)) return null;<a name="line.990"></a> |
| <span class="sourceLineNo">991</span> assert header == TEXT || header == DESCENDING.apply(TEXT);<a name="line.991"></a> |
| <span class="sourceLineNo">992</span> final Order ord = header == TEXT ? ASCENDING : DESCENDING;<a name="line.992"></a> |
| <span class="sourceLineNo">993</span> // Locate the text inside the backing array: raw indices [textBegin, textEnd).<a name="line.993"></a> |
| <span class="sourceLineNo">994</span> final byte[] raw = src.getBytes();<a name="line.994"></a> |
| <span class="sourceLineNo">995</span> final int base = src.getOffset();<a name="line.995"></a> |
| <span class="sourceLineNo">996</span> final int textBegin = base + src.getPosition();<a name="line.996"></a> |
| <span class="sourceLineNo">997</span> final byte terminator = ord.apply(TERM);<a name="line.997"></a> |
| <span class="sourceLineNo">998</span> int textEnd = textBegin;<a name="line.998"></a> |
| <span class="sourceLineNo">999</span> while (raw[textEnd] != terminator) textEnd++; // scan to the order-adjusted terminator<a name="line.999"></a> |
| <span class="sourceLineNo">1000</span> // positions are relative to the range offset, hence the subtraction of base<a name="line.1000"></a> |
| <span class="sourceLineNo">1001</span> src.setPosition(textEnd - base + 1); // advance position to TERM + 1<a name="line.1001"></a> |
| <span class="sourceLineNo">1002</span> final int textLen = textEnd - textBegin;<a name="line.1002"></a> |
| <span class="sourceLineNo">1003</span> if (ASCENDING == ord) return new String(raw, textBegin, textLen, UTF8);<a name="line.1003"></a> |
| <span class="sourceLineNo">1004</span> // DESCENDING: make a copy so that we don't disturb the encoded value with ord.<a name="line.1004"></a> |
| <span class="sourceLineNo">1005</span> final byte[] copy = new byte[textLen];<a name="line.1005"></a> |
| <span class="sourceLineNo">1006</span> System.arraycopy(raw, textBegin, copy, 0, textLen);<a name="line.1006"></a> |
| <span class="sourceLineNo">1007</span> ord.apply(copy);<a name="line.1007"></a> |
| <span class="sourceLineNo">1008</span> return new String(copy, UTF8);<a name="line.1008"></a> |
| <span class="sourceLineNo">1009</span> }<a name="line.1009"></a> |
| <span class="sourceLineNo">1010</span><a name="line.1010"></a> |
| <span class="sourceLineNo">1011</span> /**<a name="line.1011"></a> |
| <span class="sourceLineNo">1012</span> * Calculate the expected BlobVar encoded length based on unencoded length.<a name="line.1012"></a> |
| <span class="sourceLineNo">1013</span> */<a name="line.1013"></a> |
| <span class="sourceLineNo">1014</span> public static int blobVarEncodedLength(int len) {<a name="line.1014"></a> |
| <span class="sourceLineNo">1015</span> if (0 == len) return 2; // 1-byte header + 1-byte terminator<a name="line.1015"></a> |
| <span class="sourceLineNo">1016</span> else return (int) Math.ceil((len * 8) // 8-bits per input byte<a name="line.1016"></a> |
| <span class="sourceLineNo">1017</span> / 7.0) // 7-bits of input data per encoded byte, rounded up<a name="line.1017"></a> |
| <span class="sourceLineNo">1018</span> + 1; // + 1-byte header<a name="line.1018"></a> |
| <span class="sourceLineNo">1019</span> }<a name="line.1019"></a> |
| <span class="sourceLineNo">1020</span><a name="line.1020"></a> |
| <span class="sourceLineNo">1021</span> /**<a name="line.1021"></a> |
| <span class="sourceLineNo">1022</span> * Calculate the expected BlobVar decoded length based on encoded length.<a name="line.1022"></a> |
| <span class="sourceLineNo">1023</span> */<a name="line.1023"></a> |
| <span class="sourceLineNo">1024</span> static int blobVarDecodedLength(int len) {<a name="line.1024"></a> |
| <span class="sourceLineNo">1025</span> return ((len - 1) // 1-byte header<a name="line.1025"></a> |
| <span class="sourceLineNo">1026</span> * 7) // 7-bits of payload per encoded byte<a name="line.1026"></a> |
| <span class="sourceLineNo">1027</span> / 8; // 8-bits per byte<a name="line.1027"></a> |
| <span class="sourceLineNo">1028</span> }<a name="line.1028"></a> |
| <span class="sourceLineNo">1029</span><a name="line.1029"></a> |
| <span class="sourceLineNo">1030</span> /**<a name="line.1030"></a> |
| <span class="sourceLineNo">1031</span> * Encode a Blob value using a modified varint scheme that imposes no limits on the input value.<a name="line.1031"></a> |
| <span class="sourceLineNo">1032</span> * <p><a name="line.1032"></a> |
| <span class="sourceLineNo">1033</span> * The first byte is the {@link #BLOB_VAR} header. Each encoded byte thereafter is a header bit<a name="line.1033"></a> |
| <span class="sourceLineNo">1034</span> * ('1' = continuation, '0' = last of the payload) followed by 7 bits of payload. An empty input<a name="line.1034"></a> |
| <span class="sourceLineNo">1035</span> * is the header byte followed by a termination byte {@code 0x00}; this is not ambiguous with the<a name="line.1035"></a> |
| <span class="sourceLineNo">1036</span> * encoded value of {@code [0x00]}, whose payload bytes are {@code [0x80, 0x00]}.<a name="line.1036"></a> |
| <span class="sourceLineNo">1037</span> * </p><a name="line.1037"></a> |
| <span class="sourceLineNo">1038</span> * @param val the bytes to encode; {@code null} is written via {@code encodeNull}.<a name="line.1038"></a> |
| <span class="sourceLineNo">1039</span> * @param voff index in {@code val} of the first byte to encode.<a name="line.1039"></a> |
| <span class="sourceLineNo">1040</span> * @param vlen number of bytes to encode, starting at {@code voff}.<a name="line.1040"></a> |
| <span class="sourceLineNo">1041</span> * @return the number of bytes written.<a name="line.1041"></a> |
| <span class="sourceLineNo">1042</span> */<a name="line.1042"></a> |
| <span class="sourceLineNo">1043</span> public static int encodeBlobVar(PositionedByteRange dst, byte[] val, int voff, int vlen,<a name="line.1043"></a> |
| <span class="sourceLineNo">1044</span> Order ord) {<a name="line.1044"></a> |
| <span class="sourceLineNo">1045</span> if (null == val) {<a name="line.1045"></a> |
| <span class="sourceLineNo">1046</span> return encodeNull(dst, ord);<a name="line.1046"></a> |
| <span class="sourceLineNo">1047</span> }<a name="line.1047"></a> |
| <span class="sourceLineNo">1048</span> // Empty value is null-terminated. All other values are encoded as 7-bits per byte.<a name="line.1048"></a> |
| <span class="sourceLineNo">1049</span> assert dst.getRemaining() >= blobVarEncodedLength(vlen) : "buffer overflow expected.";<a name="line.1049"></a> |
| <span class="sourceLineNo">1050</span> final int offset = dst.getOffset(), start = dst.getPosition();<a name="line.1050"></a> |
| <span class="sourceLineNo">1051</span> dst.put(BLOB_VAR);<a name="line.1051"></a> |
| <span class="sourceLineNo">1052</span> if (0 == vlen) {<a name="line.1052"></a> |
| <span class="sourceLineNo">1053</span> dst.put(TERM);<a name="line.1053"></a> |
| <span class="sourceLineNo">1054</span> } else {<a name="line.1054"></a> |
| <span class="sourceLineNo">1055</span> byte s = 1, t = 0; // s: right-shift for the next input byte; t: bits left over from the previous one<a name="line.1055"></a> |
| <span class="sourceLineNo">1056</span> for (int i = voff, end = voff + vlen; i < end; i++) { // [voff, voff + vlen), not [voff, vlen)<a name="line.1056"></a> |
| <span class="sourceLineNo">1057</span> dst.put((byte) (0x80 | t | ((val[i] & 0xff) >>> s)));<a name="line.1057"></a> |
| <span class="sourceLineNo">1058</span> if (s < 7) {<a name="line.1058"></a> |
| <span class="sourceLineNo">1059</span> t = (byte) (val[i] << (7 - s));<a name="line.1059"></a> |
| <span class="sourceLineNo">1060</span> s++;<a name="line.1060"></a> |
| <span class="sourceLineNo">1061</span> } else {<a name="line.1061"></a> |
| <span class="sourceLineNo">1062</span> dst.put((byte) (0x80 | val[i])); // the remaining low 7 bits fill a whole output byte<a name="line.1062"></a> |
| <span class="sourceLineNo">1063</span> s = 1;<a name="line.1063"></a> |
| <span class="sourceLineNo">1064</span> t = 0;<a name="line.1064"></a> |
| <span class="sourceLineNo">1065</span> }<a name="line.1065"></a> |
| <span class="sourceLineNo">1066</span> }<a name="line.1066"></a> |
| <span class="sourceLineNo">1067</span> if (s > 1) { // leftover bits remain: emit them in a final byte whose header bit is clear<a name="line.1067"></a> |
| <span class="sourceLineNo">1068</span> dst.put((byte) (0x7f & t));<a name="line.1068"></a> |
| <span class="sourceLineNo">1069</span> } else { // nothing left over: clear the header bit of the byte written last instead<a name="line.1069"></a> |
| <span class="sourceLineNo">1070</span> dst.getBytes()[offset + dst.getPosition() - 1] =<a name="line.1070"></a> |
| <span class="sourceLineNo">1071</span> (byte) (dst.getBytes()[offset + dst.getPosition() - 1] & 0x7f);<a name="line.1071"></a> |
| <span class="sourceLineNo">1072</span> }<a name="line.1072"></a> |
| <span class="sourceLineNo">1073</span> }<a name="line.1073"></a> |
| <span class="sourceLineNo">1074</span> ord.apply(dst.getBytes(), offset + start, dst.getPosition() - start);<a name="line.1074"></a> |
| <span class="sourceLineNo">1075</span> return dst.getPosition() - start;<a name="line.1075"></a> |
| <span class="sourceLineNo">1076</span> }<a name="line.1076"></a> |
| <span class="sourceLineNo">1077</span><a name="line.1077"></a> |
| <span class="sourceLineNo">1078</span> /**<a name="line.1078"></a> |
| <span class="sourceLineNo">1079</span> * Encode the whole of {@code val} as a blob value using a modified varint encoding scheme.<a name="line.1079"></a> |
| <span class="sourceLineNo">1080</span> * @return the number of bytes written.<a name="line.1080"></a> |
| <span class="sourceLineNo">1081</span> * @see #encodeBlobVar(PositionedByteRange, byte[], int, int, Order)<a name="line.1081"></a> |
| <span class="sourceLineNo">1082</span> */<a name="line.1082"></a> |
| <span class="sourceLineNo">1083</span> public static int encodeBlobVar(PositionedByteRange dst, byte[] val, Order ord) {<a name="line.1083"></a> |
| <span class="sourceLineNo">1084</span> return encodeBlobVar(dst, val, 0, val == null ? 0 : val.length, ord);<a name="line.1084"></a> |
| <span class="sourceLineNo">1085</span> }<a name="line.1085"></a> |
| <span class="sourceLineNo">1086</span><a name="line.1086"></a> |
| <span class="sourceLineNo">1087</span> /**<a name="line.1087"></a> |
| <span class="sourceLineNo">1088</span> * Decode a blob value that was encoded using BlobVar encoding.<a name="line.1088"></a> |
| <span class="sourceLineNo">1089</span> */<a name="line.1089"></a> |
| <span class="sourceLineNo">1090</span> public static byte[] decodeBlobVar(PositionedByteRange src) {<a name="line.1090"></a> |
| <span class="sourceLineNo">1091</span> final byte header = src.get();<a name="line.1091"></a> |
| <span class="sourceLineNo">1092</span> if (header == NULL || header == DESCENDING.apply(NULL)) {<a name="line.1092"></a> |
| <span class="sourceLineNo">1093</span> return null;<a name="line.1093"></a> |
| <span class="sourceLineNo">1094</span> }<a name="line.1094"></a> |
| <span class="sourceLineNo">1095</span> assert header == BLOB_VAR || header == DESCENDING.apply(BLOB_VAR);<a name="line.1095"></a> |
| <span class="sourceLineNo">1096</span> Order ord = BLOB_VAR == header ? ASCENDING : DESCENDING;<a name="line.1096"></a> |
| <span class="sourceLineNo">1097</span> if (src.peek() == ord.apply(TERM)) {<a name="line.1097"></a> |
| <span class="sourceLineNo">1098</span> // skip empty input buffer.<a name="line.1098"></a> |
| <span class="sourceLineNo">1099</span> src.get();<a name="line.1099"></a> |
| <span class="sourceLineNo">1100</span> return new byte[0];<a name="line.1100"></a> |
| <span class="sourceLineNo">1101</span> }<a name="line.1101"></a> |
| <span class="sourceLineNo">1102</span> final int offset = src.getOffset(), start = src.getPosition();<a name="line.1102"></a> |
| <span class="sourceLineNo">1103</span> int end;<a name="line.1103"></a> |
| <span class="sourceLineNo">1104</span> byte[] a = src.getBytes();<a name="line.1104"></a> |
| <span class="sourceLineNo">1105</span> for (end = start; (byte) (ord.apply(a[offset + end]) & 0x80) != TERM; end++)<a name="line.1105"></a> |
| <span class="sourceLineNo">1106</span> ;<a name="line.1106"></a> |
| <span class="sourceLineNo">1107</span> end++; // increment end to 1-past last byte<a name="line.1107"></a> |
| <span class="sourceLineNo">1108</span> // create ret buffer using length of encoded data + 1 (header byte)<a name="line.1108"></a> |
| <span class="sourceLineNo">1109</span> PositionedByteRange ret =<a name="line.1109"></a> |
| <span class="sourceLineNo">1110</span> new SimplePositionedMutableByteRange(blobVarDecodedLength(end - start + 1));<a name="line.1110"></a> |
| <span class="sourceLineNo">1111</span> int s = 6;<a name="line.1111"></a> |
| <span class="sourceLineNo">1112</span> byte t = (byte) ((ord.apply(a[offset + start]) << 1) & 0xff);<a name="line.1112"></a> |
| <span class="sourceLineNo">1113</span> for (int i = start + 1; i < end; i++) {<a name="line.1113"></a> |
| <span class="sourceLineNo">1114</span> if (s == 7) {<a name="line.1114"></a> |
| <span class="sourceLineNo">1115</span> ret.put((byte) (t | (ord.apply(a[offset + i]) & 0x7f)));<a name="line.1115"></a> |
| <span class="sourceLineNo">1116</span> i++;<a name="line.1116"></a> |
| <span class="sourceLineNo">1117</span> // explicitly reset t -- clean up overflow buffer after decoding<a name="line.1117"></a> |
| <span class="sourceLineNo">1118</span> // a full cycle and retain assertion condition below. This happens<a name="line.1118"></a> |
| <span class="sourceLineNo">1119</span> t = 0; // when the LSB in the last encoded byte is 1. (HBASE-9893)<a name="line.1119"></a> |
| <span class="sourceLineNo">1120</span> } else {<a name="line.1120"></a> |
| <span class="sourceLineNo">1121</span> ret.put((byte) (t | ((ord.apply(a[offset + i]) & 0x7f) >>> s)));<a name="line.1121"></a> |
| <span class="sourceLineNo">1122</span> }<a name="line.1122"></a> |
| <span class="sourceLineNo">1123</span> if (i == end) break;<a name="line.1123"></a> |
| <span class="sourceLineNo">1124</span> t = (byte) ((ord.apply(a[offset + i]) << (8 - s)) & 0xff);<a name="line.1124"></a> |
| <span class="sourceLineNo">1125</span> s = s == 1 ? 7 : s - 1;<a name="line.1125"></a> |
| <span class="sourceLineNo">1126</span> }<a name="line.1126"></a> |
| <span class="sourceLineNo">1127</span> src.setPosition(end);<a name="line.1127"></a> |
| <span class="sourceLineNo">1128</span> assert t == 0 : "Unexpected bits remaining after decoding blob.";<a name="line.1128"></a> |
| <span class="sourceLineNo">1129</span> assert ret.getPosition() == ret.getLength() : "Allocated unnecessarily large return buffer.";<a name="line.1129"></a> |
| <span class="sourceLineNo">1130</span> return ret.getBytes();<a name="line.1130"></a> |
| <span class="sourceLineNo">1131</span> }<a name="line.1131"></a> |
| <span class="sourceLineNo">1132</span><a name="line.1132"></a> |
| <span class="sourceLineNo">1133</span> /**<a name="line.1133"></a> |
| <span class="sourceLineNo">1134</span> * Encode a Blob value as a byte-for-byte copy of {@code vlen} bytes of {@code val} starting at<a name="line.1134"></a> |
| <span class="sourceLineNo">1135</span> * {@code voff}. In DESCENDING order the encoding is terminated so as to preserve proper sorting<a name="line.1135"></a> |
| <span class="sourceLineNo">1136</span> * of {@code []}, and therefore it does not support {@code 0x00} in the value.<a name="line.1136"></a> |
| <span class="sourceLineNo">1137</span> * @return the number of bytes written.<a name="line.1137"></a> |
| <span class="sourceLineNo">1138</span> * @throws IllegalArgumentException when {@code ord} is DESCENDING and {@code val} contains a<a name="line.1138"></a> |
| <span class="sourceLineNo">1139</span> * {@code 0x00} byte.<a name="line.1139"></a> |
| <span class="sourceLineNo">1140</span> */<a name="line.1140"></a> |
| <span class="sourceLineNo">1141</span> public static int encodeBlobCopy(PositionedByteRange dst, byte[] val, int voff, int vlen,<a name="line.1141"></a> |
| <span class="sourceLineNo">1142</span> Order ord) {<a name="line.1142"></a> |
| <span class="sourceLineNo">1143</span> if (val == null) {<a name="line.1143"></a> |
| <span class="sourceLineNo">1144</span> encodeNull(dst, ord);<a name="line.1144"></a> |
| <span class="sourceLineNo">1145</span> if (ASCENDING == ord) return 1;<a name="line.1145"></a> |
| <span class="sourceLineNo">1146</span> // DESCENDING ordered BlobCopy requires a termination byte to preserve<a name="line.1146"></a> |
| <span class="sourceLineNo">1147</span> // sort-order semantics of null values.<a name="line.1147"></a> |
| <span class="sourceLineNo">1148</span> dst.put(ord.apply(TERM));<a name="line.1148"></a> |
| <span class="sourceLineNo">1149</span> return 2;<a name="line.1149"></a> |
| <span class="sourceLineNo">1150</span> }<a name="line.1150"></a> |
| <span class="sourceLineNo">1151</span> // Blobs as final entry in a compound key are written unencoded.<a name="line.1151"></a> |
| <span class="sourceLineNo">1152</span> assert dst.getRemaining() >= vlen + (ASCENDING == ord ? 1 : 2);<a name="line.1152"></a> |
| <span class="sourceLineNo">1153</span> final boolean descending = DESCENDING == ord;<a name="line.1153"></a> |
| <span class="sourceLineNo">1154</span> if (descending) {<a name="line.1154"></a> |
| <span class="sourceLineNo">1155</span> // the terminator value may not appear inside the payload itself<a name="line.1155"></a> |
| <span class="sourceLineNo">1156</span> for (int i = 0; i < vlen; i++) {<a name="line.1156"></a> |
| <span class="sourceLineNo">1157</span> if (val[voff + i] == TERM) {<a name="line.1157"></a> |
| <span class="sourceLineNo">1158</span> throw new IllegalArgumentException("0x00 bytes not permitted in value.");<a name="line.1158"></a> |
| <span class="sourceLineNo">1159</span> }<a name="line.1159"></a> |
| <span class="sourceLineNo">1160</span> }<a name="line.1160"></a> |
| <span class="sourceLineNo">1161</span> }<a name="line.1161"></a> |
| <span class="sourceLineNo">1162</span> final int rangeOffset = dst.getOffset(), begin = dst.getPosition();<a name="line.1162"></a> |
| <span class="sourceLineNo">1163</span> dst.put(BLOB_COPY);<a name="line.1163"></a> |
| <span class="sourceLineNo">1164</span> dst.put(val, voff, vlen);<a name="line.1164"></a> |
| <span class="sourceLineNo">1165</span> // DESCENDING ordered BlobCopy is terminated to preserve sort-order semantics of null values.<a name="line.1165"></a> |
| <span class="sourceLineNo">1166</span> if (descending) dst.put(TERM);<a name="line.1166"></a> |
| <span class="sourceLineNo">1167</span> final int written = dst.getPosition() - begin;<a name="line.1167"></a> |
| <span class="sourceLineNo">1168</span> ord.apply(dst.getBytes(), rangeOffset + begin, written);<a name="line.1168"></a> |
| <span class="sourceLineNo">1169</span> return written;<a name="line.1169"></a> |
| <span class="sourceLineNo">1170</span> }<a name="line.1170"></a> |
| <span class="sourceLineNo">1171</span><a name="line.1171"></a> |
| <span class="sourceLineNo">1172</span> /**<a name="line.1172"></a> |
| <span class="sourceLineNo">1173</span> * Encode the whole of {@code val} as a byte-for-byte copy. BlobCopy encoding in DESCENDING<a name="line.1173"></a> |
| <span class="sourceLineNo">1174</span> * order is terminated so as to preserve proper sorting of {@code []}, and therefore it does<a name="line.1174"></a> |
| <span class="sourceLineNo">1175</span> * not support {@code 0x00} in the value.<a name="line.1175"></a> |
| <span class="sourceLineNo">1176</span> * @return the number of bytes written.<a name="line.1176"></a> |
| <span class="sourceLineNo">1177</span> * @throws IllegalArgumentException when {@code ord} is DESCENDING and {@code val} contains a<a name="line.1177"></a> |
| <span class="sourceLineNo">1178</span> * {@code 0x00} byte.<a name="line.1178"></a> |
| <span class="sourceLineNo">1179</span> * @see #encodeBlobCopy(PositionedByteRange, byte[], int, int, Order)<a name="line.1179"></a> |
| <span class="sourceLineNo">1180</span> */<a name="line.1180"></a> |
| <span class="sourceLineNo">1181</span> public static int encodeBlobCopy(PositionedByteRange dst, byte[] val, Order ord) {<a name="line.1181"></a> |
| <span class="sourceLineNo">1182</span> return encodeBlobCopy(dst, val, 0, val == null ? 0 : val.length, ord);<a name="line.1182"></a> |
| <span class="sourceLineNo">1183</span> }<a name="line.1183"></a> |
| <span class="sourceLineNo">1184</span><a name="line.1184"></a> |
| <span class="sourceLineNo">1185</span> /**<a name="line.1185"></a> |
| <span class="sourceLineNo">1186</span> * Decode a Blob value stored as a byte-for-byte copy; an encoded NULL header yields null.<a name="line.1186"></a> |
| <span class="sourceLineNo">1187</span> * @see #encodeBlobCopy(PositionedByteRange, byte[], int, int, Order)<a name="line.1187"></a> |
| <span class="sourceLineNo">1188</span> */<a name="line.1188"></a> |
| <span class="sourceLineNo">1189</span> public static byte[] decodeBlobCopy(PositionedByteRange src) {<a name="line.1189"></a> |
| <span class="sourceLineNo">1190</span> final byte header = src.get();<a name="line.1190"></a> |
| <span class="sourceLineNo">1191</span> if (header == NULL || header == DESCENDING.apply(NULL)) return null;<a name="line.1191"></a> |
| <span class="sourceLineNo">1192</span> assert header == BLOB_COPY || header == DESCENDING.apply(BLOB_COPY);<a name="line.1192"></a> |
| <span class="sourceLineNo">1193</span> // The header doubles as the order marker: an unmodified BLOB_COPY byte means ASCENDING.<a name="line.1193"></a> |
| <span class="sourceLineNo">1194</span> final boolean ascending = header == BLOB_COPY;<a name="line.1194"></a> |
| <span class="sourceLineNo">1195</span> final Order ord = ascending ? ASCENDING : DESCENDING;<a name="line.1195"></a> |
| <span class="sourceLineNo">1196</span> // Everything left in src is payload, except for the trailing termination byte that<a name="line.1196"></a> |
| <span class="sourceLineNo">1197</span> // DESCENDING ordered BlobCopy carries to preserve sort-order semantics of null values.<a name="line.1197"></a> |
| <span class="sourceLineNo">1198</span> final int payloadLen = src.getRemaining() - (ascending ? 0 : 1);<a name="line.1198"></a> |
| <span class="sourceLineNo">1199</span> final byte[] payload = new byte[payloadLen];<a name="line.1199"></a> |
| <span class="sourceLineNo">1200</span> src.get(payload);<a name="line.1200"></a> |
| <span class="sourceLineNo">1201</span> ord.apply(payload, 0, payloadLen);<a name="line.1201"></a> |
| <span class="sourceLineNo">1202</span> if (!ascending) src.get(); // consume the terminator<a name="line.1202"></a> |
| <span class="sourceLineNo">1203</span> return payload;<a name="line.1203"></a> |
| <span class="sourceLineNo">1204</span> }<a name="line.1204"></a> |
| <span class="sourceLineNo">1205</span><a name="line.1205"></a> |
| <span class="sourceLineNo">1206</span> /**<a name="line.1206"></a> |
| <span class="sourceLineNo">1207</span> * Encode a null value as a single order-adjusted {@code NULL} marker byte.<a name="line.1207"></a> |
| <span class="sourceLineNo">1208</span> * @param dst The destination to which the encoded marker is written.<a name="line.1208"></a> |
| <span class="sourceLineNo">1209</span> * @param ord The {@link Order} to respect while encoding the marker.<a name="line.1209"></a> |
| <span class="sourceLineNo">1210</span> * @return the number of bytes written, which is always 1.<a name="line.1210"></a> |
| <span class="sourceLineNo">1211</span> */<a name="line.1211"></a> |
| <span class="sourceLineNo">1212</span> public static int encodeNull(PositionedByteRange dst, Order ord) {<a name="line.1212"></a> |
| <span class="sourceLineNo">1213</span> dst.put(ord.apply(NULL));<a name="line.1213"></a> |
| <span class="sourceLineNo">1214</span> return 1;<a name="line.1214"></a> |
| <span class="sourceLineNo">1215</span> }<a name="line.1215"></a> |
| <span class="sourceLineNo">1216</span><a name="line.1216"></a> |
| <span class="sourceLineNo">1217</span> /**<a name="line.1217"></a> |
| <span class="sourceLineNo">1218</span> * Encode an {@code int8} value using the fixed-length encoding: a header and one value byte.<a name="line.1218"></a> |
| <span class="sourceLineNo">1219</span> * @return the number of bytes written.<a name="line.1219"></a> |
| <span class="sourceLineNo">1220</span> * @see #encodeInt64(PositionedByteRange, long, Order)<a name="line.1220"></a> |
| <span class="sourceLineNo">1221</span> * @see #decodeInt8(PositionedByteRange)<a name="line.1221"></a> |
| <span class="sourceLineNo">1222</span> */<a name="line.1222"></a> |
| <span class="sourceLineNo">1223</span> public static int encodeInt8(PositionedByteRange dst, byte val, Order ord) {<a name="line.1223"></a> |
| <span class="sourceLineNo">1224</span> final int rangeOffset = dst.getOffset(), begin = dst.getPosition();<a name="line.1224"></a> |
| <span class="sourceLineNo">1225</span> dst.put(FIXED_INT8).put((byte) (val ^ 0x80)); // header, then the value with its sign bit flipped<a name="line.1225"></a> |
| <span class="sourceLineNo">1226</span> ord.apply(dst.getBytes(), rangeOffset + begin, 2);<a name="line.1226"></a> |
| <span class="sourceLineNo">1227</span> return 2;<a name="line.1227"></a> |
| <span class="sourceLineNo">1228</span> }<a name="line.1228"></a> |
| <span class="sourceLineNo">1229</span><a name="line.1229"></a> |
| <span class="sourceLineNo">1230</span> /**<a name="line.1230"></a> |
| <span class="sourceLineNo">1231</span> * Decode an {@code int8} value, taking the sort order from the header byte.<a name="line.1231"></a> |
| <span class="sourceLineNo">1232</span> * @see #encodeInt8(PositionedByteRange, byte, Order)<a name="line.1232"></a> |
| <span class="sourceLineNo">1233</span> */<a name="line.1233"></a> |
| <span class="sourceLineNo">1234</span> public static byte decodeInt8(PositionedByteRange src) {<a name="line.1234"></a> |
| <span class="sourceLineNo">1235</span> final byte header = src.get();<a name="line.1235"></a> |
| <span class="sourceLineNo">1236</span> assert header == FIXED_INT8 || header == DESCENDING.apply(FIXED_INT8);<a name="line.1236"></a> |
| <span class="sourceLineNo">1237</span> final byte stored = (header == FIXED_INT8 ? ASCENDING : DESCENDING).apply(src.get());<a name="line.1237"></a> |
| <span class="sourceLineNo">1238</span> return (byte) ((stored ^ 0x80) & 0xff); // undo the sign-bit flip applied by encodeInt8<a name="line.1238"></a> |
| <span class="sourceLineNo">1239</span> }<a name="line.1239"></a> |
| <span class="sourceLineNo">1240</span><a name="line.1240"></a> |
| <span class="sourceLineNo">1241</span> /**<a name="line.1241"></a> |
| <span class="sourceLineNo">1242</span> * Encode an {@code int16} value using the fixed-length encoding: a header and two value bytes.<a name="line.1242"></a> |
| <span class="sourceLineNo">1243</span> * @return the number of bytes written.<a name="line.1243"></a> |
| <span class="sourceLineNo">1244</span> * @see #encodeInt64(PositionedByteRange, long, Order)<a name="line.1244"></a> |
| <span class="sourceLineNo">1245</span> * @see #decodeInt16(PositionedByteRange)<a name="line.1245"></a> |
| <span class="sourceLineNo">1246</span> */<a name="line.1246"></a> |
| <span class="sourceLineNo">1247</span> public static int encodeInt16(PositionedByteRange dst, short val, Order ord) {<a name="line.1247"></a> |
| <span class="sourceLineNo">1248</span> final int rangeOffset = dst.getOffset(), begin = dst.getPosition();<a name="line.1248"></a> |
| <span class="sourceLineNo">1249</span> dst.put(FIXED_INT16).put((byte) ((val >> 8) ^ 0x80)).put((byte) val); // high byte first, sign flipped<a name="line.1249"></a> |
| <span class="sourceLineNo">1250</span> ord.apply(dst.getBytes(), rangeOffset + begin, 3);<a name="line.1250"></a> |
| <span class="sourceLineNo">1251</span> return 3;<a name="line.1251"></a> |
| <span class="sourceLineNo">1252</span> }<a name="line.1252"></a> |
| <span class="sourceLineNo">1253</span><a name="line.1253"></a> |
| <span class="sourceLineNo">1254</span> /**<a name="line.1254"></a> |
| <span class="sourceLineNo">1255</span> * Decode an {@code int16} value, taking the sort order from the header byte.<a name="line.1255"></a> |
| <span class="sourceLineNo">1256</span> * @see #encodeInt16(PositionedByteRange, short, Order)<a name="line.1256"></a> |
| <span class="sourceLineNo">1257</span> */<a name="line.1257"></a> |
| <span class="sourceLineNo">1258</span> public static short decodeInt16(PositionedByteRange src) {<a name="line.1258"></a> |
| <span class="sourceLineNo">1259</span> final byte header = src.get();<a name="line.1259"></a> |
| <span class="sourceLineNo">1260</span> assert header == FIXED_INT16 || header == DESCENDING.apply(FIXED_INT16);<a name="line.1260"></a> |
| <span class="sourceLineNo">1261</span> final Order ord = header == FIXED_INT16 ? ASCENDING : DESCENDING;<a name="line.1261"></a> |
| <span class="sourceLineNo">1262</span> final int high = (ord.apply(src.get()) ^ 0x80) & 0xff; // sign-bit flip undone<a name="line.1262"></a> |
| <span class="sourceLineNo">1263</span> final int low = ord.apply(src.get()) & 0xff;<a name="line.1263"></a> |
| <span class="sourceLineNo">1264</span> return (short) ((high << 8) + low);<a name="line.1264"></a> |
| <span class="sourceLineNo">1265</span> }<a name="line.1265"></a> |
| <span class="sourceLineNo">1266</span><a name="line.1266"></a> |
| <span class="sourceLineNo">1267</span> /**<a name="line.1267"></a> |
| <span class="sourceLineNo">1268</span> * Encode an {@code int32} value using the fixed-length encoding.<a name="line.1268"></a> |
| <span class="sourceLineNo">1269</span> * @return the number of bytes written.<a name="line.1269"></a> |
| <span class="sourceLineNo">1270</span> * @see #encodeInt64(PositionedByteRange, long, Order)<a name="line.1270"></a> |
| <span class="sourceLineNo">1271</span> * @see #decodeInt32(PositionedByteRange)<a name="line.1271"></a> |
| <span class="sourceLineNo">1272</span> */<a name="line.1272"></a> |
| <span class="sourceLineNo">1273</span> public static int encodeInt32(PositionedByteRange dst, int val, Order ord) {<a name="line.1273"></a> |
| <span class="sourceLineNo">1274</span> final int offset = dst.getOffset(), start = dst.getPosition();<a name="line.1274"></a> |
| <span class="sourceLineNo">1275</span> dst.put(FIXED_INT32).put((byte) ((val >> 24) ^ 0x80)).put((byte) (val >> 16))<a name="line.1275"></a> |
| <span class="sourceLineNo">1276</span> .put((byte) (val >> 8)).put((byte) val);<a name="line.1276"></a> |
| <span class="sourceLineNo">1277</span> ord.apply(dst.getBytes(), offset + start, 5);<a name="line.1277"></a> |
| <span class="sourceLineNo">1278</span> return 5;<a name="line.1278"></a> |
| <span class="sourceLineNo">1279</span> }<a name="line.1279"></a> |
| <span class="sourceLineNo">1280</span><a name="line.1280"></a> |
| <span class="sourceLineNo">1281</span> /**<a name="line.1281"></a> |
| <span class="sourceLineNo">1282</span> * Decode an {@code int32} value.<a name="line.1282"></a> |
| <span class="sourceLineNo">1283</span> * @see #encodeInt32(PositionedByteRange, int, Order)<a name="line.1283"></a> |
| <span class="sourceLineNo">1284</span> */<a name="line.1284"></a> |
| <span class="sourceLineNo">1285</span> public static int decodeInt32(PositionedByteRange src) {<a name="line.1285"></a> |
| <span class="sourceLineNo">1286</span> final byte header = src.get();<a name="line.1286"></a> |
| <span class="sourceLineNo">1287</span> assert header == FIXED_INT32 || header == DESCENDING.apply(FIXED_INT32);<a name="line.1287"></a> |
| <span class="sourceLineNo">1288</span> Order ord = header == FIXED_INT32 ? ASCENDING : DESCENDING;<a name="line.1288"></a> |
| <span class="sourceLineNo">1289</span> int val = (ord.apply(src.get()) ^ 0x80) & 0xff;<a name="line.1289"></a> |
| <span class="sourceLineNo">1290</span> for (int i = 1; i < 4; i++) {<a name="line.1290"></a> |
| <span class="sourceLineNo">1291</span> val = (val << 8) + (ord.apply(src.get()) & 0xff);<a name="line.1291"></a> |
| <span class="sourceLineNo">1292</span> }<a name="line.1292"></a> |
| <span class="sourceLineNo">1293</span> return val;<a name="line.1293"></a> |
| <span class="sourceLineNo">1294</span> }<a name="line.1294"></a> |
| <span class="sourceLineNo">1295</span><a name="line.1295"></a> |
| <span class="sourceLineNo">1296</span> /**<a name="line.1296"></a> |
| <span class="sourceLineNo">1297</span> * Encode an {@code int64} value using the fixed-length encoding.<a name="line.1297"></a> |
| <span class="sourceLineNo">1298</span> * <p><a name="line.1298"></a> |
| <span class="sourceLineNo">1299</span> * This format ensures that all longs sort in their natural order, as they would sort when using<a name="line.1299"></a> |
| <span class="sourceLineNo">1300</span> * signed long comparison.<a name="line.1300"></a> |
| <span class="sourceLineNo">1301</span> * </p><a name="line.1301"></a> |
| <span class="sourceLineNo">1302</span> * <p><a name="line.1302"></a> |
| <span class="sourceLineNo">1303</span> * All Longs are serialized to an 8-byte, fixed-width sortable byte format. Serialization is<a name="line.1303"></a> |
| <span class="sourceLineNo">1304</span> * performed by inverting the integer sign bit and writing the resulting bytes to the byte array<a name="line.1304"></a> |
| <span class="sourceLineNo">1305</span> * in big endian order. The encoded value is prefixed by the {@link #FIXED_INT64} header byte.<a name="line.1305"></a> |
| <span class="sourceLineNo">1306</span> * This encoding is designed to handle java language primitives and so Null values are NOT<a name="line.1306"></a> |
| <span class="sourceLineNo">1307</span> * supported by this implementation.<a name="line.1307"></a> |
| <span class="sourceLineNo">1308</span> * </p><a name="line.1308"></a> |
| <span class="sourceLineNo">1309</span> * <p><a name="line.1309"></a> |
| <span class="sourceLineNo">1310</span> * For example:<a name="line.1310"></a> |
| <span class="sourceLineNo">1311</span> * </p><a name="line.1311"></a> |
| <span class="sourceLineNo">1312</span> *<a name="line.1312"></a> |
| <span class="sourceLineNo">1313</span> * <pre><a name="line.1313"></a> |
| <span class="sourceLineNo">1314</span> * Input: 0x0000000000000005 (5)<a name="line.1314"></a> |
| <span class="sourceLineNo">1315</span> * Result: 0x288000000000000005<a name="line.1315"></a> |
| <span class="sourceLineNo">1316</span> *<a name="line.1316"></a> |
| <span class="sourceLineNo">1317</span> * Input: 0xfffffffffffffffb (-5)<a name="line.1317"></a> |
| <span class="sourceLineNo">1318</span> * Result: 0x287ffffffffffffffb<a name="line.1318"></a> |
| <span class="sourceLineNo">1319</span> *<a name="line.1319"></a> |
| <span class="sourceLineNo">1320</span> * Input: 0x7fffffffffffffff (Long.MAX_VALUE)<a name="line.1320"></a> |
| <span class="sourceLineNo">1321</span> * Result: 0x28ffffffffffffffff<a name="line.1321"></a> |
| <span class="sourceLineNo">1322</span> *<a name="line.1322"></a> |
| <span class="sourceLineNo">1323</span> * Input: 0x8000000000000000 (Long.MIN_VALUE)<a name="line.1323"></a> |
| <span class="sourceLineNo">1324</span> * Result: 0x280000000000000000<a name="line.1324"></a> |
| <span class="sourceLineNo">1325</span> * </pre><a name="line.1325"></a> |
| <span class="sourceLineNo">1326</span> * <p><a name="line.1326"></a> |
| <span class="sourceLineNo">1327</span> * This encoding format, and much of this documentation string, is based on Orderly's<a name="line.1327"></a> |
| <span class="sourceLineNo">1328</span> * {@code FixedIntWritableRowKey}.<a name="line.1328"></a> |
| <span class="sourceLineNo">1329</span> * </p><a name="line.1329"></a> |
| <span class="sourceLineNo">1330</span> * @return the number of bytes written.<a name="line.1330"></a> |
| <span class="sourceLineNo">1331</span> * @see #decodeInt64(PositionedByteRange)<a name="line.1331"></a> |
| <span class="sourceLineNo">1332</span> */<a name="line.1332"></a> |
| <span class="sourceLineNo">1333</span> public static int encodeInt64(PositionedByteRange dst, long val, Order ord) {<a name="line.1333"></a> |
| <span class="sourceLineNo">1334</span> final int offset = dst.getOffset(), start = dst.getPosition();<a name="line.1334"></a> |
| <span class="sourceLineNo">1335</span> dst.put(FIXED_INT64).put((byte) ((val >> 56) ^ 0x80)).put((byte) (val >> 48))<a name="line.1335"></a> |
| <span class="sourceLineNo">1336</span> .put((byte) (val >> 40)).put((byte) (val >> 32)).put((byte) (val >> 24))<a name="line.1336"></a> |
| <span class="sourceLineNo">1337</span> .put((byte) (val >> 16)).put((byte) (val >> 8)).put((byte) val);<a name="line.1337"></a> |
| <span class="sourceLineNo">1338</span> ord.apply(dst.getBytes(), offset + start, 9);<a name="line.1338"></a> |
| <span class="sourceLineNo">1339</span> return 9;<a name="line.1339"></a> |
| <span class="sourceLineNo">1340</span> }<a name="line.1340"></a> |
| <span class="sourceLineNo">1341</span><a name="line.1341"></a> |
| <span class="sourceLineNo">1342</span> /**<a name="line.1342"></a> |
| <span class="sourceLineNo">1343</span> * Decode an {@code int64} value.<a name="line.1343"></a> |
| <span class="sourceLineNo">1344</span> * @see #encodeInt64(PositionedByteRange, long, Order)<a name="line.1344"></a> |
| <span class="sourceLineNo">1345</span> */<a name="line.1345"></a> |
| <span class="sourceLineNo">1346</span> public static long decodeInt64(PositionedByteRange src) {<a name="line.1346"></a> |
| <span class="sourceLineNo">1347</span> final byte header = src.get();<a name="line.1347"></a> |
| <span class="sourceLineNo">1348</span> assert header == FIXED_INT64 || header == DESCENDING.apply(FIXED_INT64);<a name="line.1348"></a> |
| <span class="sourceLineNo">1349</span> Order ord = header == FIXED_INT64 ? ASCENDING : DESCENDING;<a name="line.1349"></a> |
| <span class="sourceLineNo">1350</span> long val = (ord.apply(src.get()) ^ 0x80) & 0xff;<a name="line.1350"></a> |
| <span class="sourceLineNo">1351</span> for (int i = 1; i < 8; i++) {<a name="line.1351"></a> |
| <span class="sourceLineNo">1352</span> val = (val << 8) + (ord.apply(src.get()) & 0xff);<a name="line.1352"></a> |
| <span class="sourceLineNo">1353</span> }<a name="line.1353"></a> |
| <span class="sourceLineNo">1354</span> return val;<a name="line.1354"></a> |
| <span class="sourceLineNo">1355</span> }<a name="line.1355"></a> |
| <span class="sourceLineNo">1356</span><a name="line.1356"></a> |
| <span class="sourceLineNo">1357</span> /**<a name="line.1357"></a> |
| <span class="sourceLineNo">1358</span> * Encode a 32-bit floating point value using the fixed-length encoding. Encoding format is<a name="line.1358"></a> |
| <span class="sourceLineNo">1359</span> * described at length in {@link #encodeFloat64(PositionedByteRange, double, Order)}.<a name="line.1359"></a> |
| <span class="sourceLineNo">1360</span> * @return the number of bytes written.<a name="line.1360"></a> |
| <span class="sourceLineNo">1361</span> * @see #decodeFloat32(PositionedByteRange)<a name="line.1361"></a> |
| <span class="sourceLineNo">1362</span> * @see #encodeFloat64(PositionedByteRange, double, Order)<a name="line.1362"></a> |
| <span class="sourceLineNo">1363</span> */<a name="line.1363"></a> |
| <span class="sourceLineNo">1364</span> public static int encodeFloat32(PositionedByteRange dst, float val, Order ord) {<a name="line.1364"></a> |
| <span class="sourceLineNo">1365</span> final int offset = dst.getOffset(), start = dst.getPosition();<a name="line.1365"></a> |
| <span class="sourceLineNo">1366</span> int i = Float.floatToIntBits(val);<a name="line.1366"></a> |
| <span class="sourceLineNo">1367</span> i ^= ((i >> (Integer.SIZE - 1)) | Integer.MIN_VALUE);<a name="line.1367"></a> |
| <span class="sourceLineNo">1368</span> dst.put(FIXED_FLOAT32).put((byte) (i >> 24)).put((byte) (i >> 16)).put((byte) (i >> 8))<a name="line.1368"></a> |
| <span class="sourceLineNo">1369</span> .put((byte) i);<a name="line.1369"></a> |
| <span class="sourceLineNo">1370</span> ord.apply(dst.getBytes(), offset + start, 5);<a name="line.1370"></a> |
| <span class="sourceLineNo">1371</span> return 5;<a name="line.1371"></a> |
| <span class="sourceLineNo">1372</span> }<a name="line.1372"></a> |
| <span class="sourceLineNo">1373</span><a name="line.1373"></a> |
| <span class="sourceLineNo">1374</span> /**<a name="line.1374"></a> |
| <span class="sourceLineNo">1375</span> * Decode a 32-bit floating point value using the fixed-length encoding.<a name="line.1375"></a> |
| <span class="sourceLineNo">1376</span> * @see #encodeFloat32(PositionedByteRange, float, Order)<a name="line.1376"></a> |
| <span class="sourceLineNo">1377</span> */<a name="line.1377"></a> |
| <span class="sourceLineNo">1378</span> public static float decodeFloat32(PositionedByteRange src) {<a name="line.1378"></a> |
| <span class="sourceLineNo">1379</span> final byte header = src.get();<a name="line.1379"></a> |
| <span class="sourceLineNo">1380</span> assert header == FIXED_FLOAT32 || header == DESCENDING.apply(FIXED_FLOAT32);<a name="line.1380"></a> |
| <span class="sourceLineNo">1381</span> Order ord = header == FIXED_FLOAT32 ? ASCENDING : DESCENDING;<a name="line.1381"></a> |
| <span class="sourceLineNo">1382</span> int val = ord.apply(src.get()) & 0xff;<a name="line.1382"></a> |
| <span class="sourceLineNo">1383</span> for (int i = 1; i < 4; i++) {<a name="line.1383"></a> |
| <span class="sourceLineNo">1384</span> val = (val << 8) + (ord.apply(src.get()) & 0xff);<a name="line.1384"></a> |
| <span class="sourceLineNo">1385</span> }<a name="line.1385"></a> |
| <span class="sourceLineNo">1386</span> val ^= (~val >> (Integer.SIZE - 1)) | Integer.MIN_VALUE;<a name="line.1386"></a> |
| <span class="sourceLineNo">1387</span> return Float.intBitsToFloat(val);<a name="line.1387"></a> |
| <span class="sourceLineNo">1388</span> }<a name="line.1388"></a> |
| <span class="sourceLineNo">1389</span><a name="line.1389"></a> |
| <span class="sourceLineNo">1390</span> /**<a name="line.1390"></a> |
| <span class="sourceLineNo">1391</span> * Encode a 64-bit floating point value using the fixed-length encoding.<a name="line.1391"></a> |
| <span class="sourceLineNo">1392</span> * <p><a name="line.1392"></a> |
| <span class="sourceLineNo">1393</span> * This format ensures the following total ordering of floating point values:<a name="line.1393"></a> |
| <span class="sourceLineNo">1394</span> * Double.NEGATIVE_INFINITY &lt; -Double.MAX_VALUE &lt; ... &lt; -Double.MIN_VALUE &lt; -0.0 &lt;<a name="line.1394"></a> |
| <span class="sourceLineNo">1395</span> * +0.0 &lt; Double.MIN_VALUE &lt; ... &lt; Double.MAX_VALUE &lt; Double.POSITIVE_INFINITY &lt;<a name="line.1395"></a> |
| <span class="sourceLineNo">1396</span> * Double.NaN<a name="line.1396"></a> |
| <span class="sourceLineNo">1397</span> * </p><a name="line.1397"></a> |
| <span class="sourceLineNo">1398</span> * <p><a name="line.1398"></a> |
| <span class="sourceLineNo">1399</span> * Floating point numbers are encoded as specified in IEEE 754. A 64-bit double precision float<a name="line.1399"></a> |
| <span class="sourceLineNo">1400</span> * consists of a sign bit, 11-bit unsigned exponent encoded in offset-1023 notation, and a 52-bit<a name="line.1400"></a> |
| <span class="sourceLineNo">1401</span> * significand. The format is described further in the<a name="line.1401"></a> |
| <span class="sourceLineNo">1402</span> * <a href="http://en.wikipedia.org/wiki/Double_precision"> Double Precision Floating Point<a name="line.1402"></a> |
| <span class="sourceLineNo">1403</span> * Wikipedia page</a><a name="line.1403"></a> |
| <span class="sourceLineNo">1404</span> * </p><a name="line.1404"></a> |
| <span class="sourceLineNo">1405</span> * <p><a name="line.1405"></a> |
| <span class="sourceLineNo">1406</span> * The value of a normal float is -1 <sup>sign bit</sup> &times; 2<sup>exponent - 1023</sup><a name="line.1406"></a> |
| <span class="sourceLineNo">1407</span> * &times; 1.significand<a name="line.1407"></a> |
| <span class="sourceLineNo">1408</span> * </p><a name="line.1408"></a> |
| <span class="sourceLineNo">1409</span> * <p><a name="line.1409"></a> |
| <span class="sourceLineNo">1410</span> * The IEEE 754 floating point format already preserves sort ordering for positive floating point<a name="line.1410"></a> |
| <span class="sourceLineNo">1411</span> * numbers when the raw bytes are compared in most significant byte order. This is discussed<a name="line.1411"></a> |
| <span class="sourceLineNo">1412</span> * further at<a name="line.1412"></a> |
| <span class="sourceLineNo">1413</span> * <a href="http://www.cygnus-software.com/papers/comparingfloats/comparingfloats.htm"><a name="line.1413"></a> |
| <span class="sourceLineNo">1414</span> * http://www.cygnus-software.com/papers/comparingfloats/comparingfloats.htm</a><a name="line.1414"></a> |
| <span class="sourceLineNo">1415</span> * </p><a name="line.1415"></a> |
| <span class="sourceLineNo">1416</span> * <p><a name="line.1416"></a> |
| <span class="sourceLineNo">1417</span> * Thus, we need only ensure that negative numbers sort in the exact opposite order as<a name="line.1417"></a> |
| <span class="sourceLineNo">1418</span> * positive numbers (so that say, negative infinity is less than negative 1), and that all<a name="line.1418"></a> |
| <span class="sourceLineNo">1419</span> * negative numbers compare less than any positive number. To accomplish this, we invert the sign<a name="line.1419"></a> |
| <span class="sourceLineNo">1420</span> * bit of all floating point numbers, and we also invert the exponent and significand bits if the<a name="line.1420"></a> |
| <span class="sourceLineNo">1421</span> * floating point number was negative.<a name="line.1421"></a> |
| <span class="sourceLineNo">1422</span> * </p><a name="line.1422"></a> |
| <span class="sourceLineNo">1423</span> * <p><a name="line.1423"></a> |
| <span class="sourceLineNo">1424</span> * More specifically, we first store the floating point bits into a 64-bit long {@code l} using<a name="line.1424"></a> |
| <span class="sourceLineNo">1425</span> * {@link Double#doubleToLongBits}. This method collapses all NaNs into a single, canonical NaN<a name="line.1425"></a> |
| <span class="sourceLineNo">1426</span> * value but otherwise leaves the bits unchanged. We then compute<a name="line.1426"></a> |
| <span class="sourceLineNo">1427</span> * </p><a name="line.1427"></a> |
| <span class="sourceLineNo">1428</span> *<a name="line.1428"></a> |
| <span class="sourceLineNo">1429</span> * <pre><a name="line.1429"></a> |
| <span class="sourceLineNo">1430</span> * l ^= (l &gt;&gt; (Long.SIZE - 1)) | Long.MIN_VALUE<a name="line.1430"></a> |
| <span class="sourceLineNo">1431</span> * </pre><a name="line.1431"></a> |
| <span class="sourceLineNo">1432</span> * <p><a name="line.1432"></a> |
| <span class="sourceLineNo">1433</span> * which inverts the sign bit and XORs all other bits with the sign bit itself. Comparing the raw<a name="line.1433"></a> |
| <span class="sourceLineNo">1434</span> * bytes of {@code l} in most significant byte order is equivalent to performing a double<a name="line.1434"></a> |
| <span class="sourceLineNo">1435</span> * precision floating point comparison on the underlying bits (ignoring NaN comparisons, as NaNs<a name="line.1435"></a> |
| <span class="sourceLineNo">1436</span> * don't compare equal to anything when performing floating point comparisons).<a name="line.1436"></a> |
| <span class="sourceLineNo">1437</span> * </p><a name="line.1437"></a> |
| <span class="sourceLineNo">1438</span> * <p><a name="line.1438"></a> |
| <span class="sourceLineNo">1439</span> * The resulting long integer is then converted into a byte array by serializing the long one byte<a name="line.1439"></a> |
| <span class="sourceLineNo">1440</span> * at a time in most significant byte order. The serialized integer is prefixed by a single header<a name="line.1440"></a> |
| <span class="sourceLineNo">1441</span> * byte. All serialized values are 9 bytes in length.<a name="line.1441"></a> |
| <span class="sourceLineNo">1442</span> * </p><a name="line.1442"></a> |
| <span class="sourceLineNo">1443</span> * <p><a name="line.1443"></a> |
| <span class="sourceLineNo">1444</span> * This encoding format, and much of this highly detailed documentation string, is based on<a name="line.1444"></a> |
| <span class="sourceLineNo">1445</span> * Orderly's {@code DoubleWritableRowKey}.<a name="line.1445"></a> |
| <span class="sourceLineNo">1446</span> * </p><a name="line.1446"></a> |
| <span class="sourceLineNo">1447</span> * @return the number of bytes written.<a name="line.1447"></a> |
| <span class="sourceLineNo">1448</span> * @see #decodeFloat64(PositionedByteRange)<a name="line.1448"></a> |
| <span class="sourceLineNo">1449</span> */<a name="line.1449"></a> |
| <span class="sourceLineNo">1450</span> public static int encodeFloat64(PositionedByteRange dst, double val, Order ord) {<a name="line.1450"></a> |
| <span class="sourceLineNo">1451</span> final int offset = dst.getOffset(), start = dst.getPosition();<a name="line.1451"></a> |
| <span class="sourceLineNo">1452</span> long lng = Double.doubleToLongBits(val);<a name="line.1452"></a> |
| <span class="sourceLineNo">1453</span> lng ^= ((lng >> (Long.SIZE - 1)) | Long.MIN_VALUE);<a name="line.1453"></a> |
| <span class="sourceLineNo">1454</span> dst.put(FIXED_FLOAT64).put((byte) (lng >> 56)).put((byte) (lng >> 48)).put((byte) (lng >> 40))<a name="line.1454"></a> |
| <span class="sourceLineNo">1455</span> .put((byte) (lng >> 32)).put((byte) (lng >> 24)).put((byte) (lng >> 16))<a name="line.1455"></a> |
| <span class="sourceLineNo">1456</span> .put((byte) (lng >> 8)).put((byte) lng);<a name="line.1456"></a> |
| <span class="sourceLineNo">1457</span> ord.apply(dst.getBytes(), offset + start, 9);<a name="line.1457"></a> |
| <span class="sourceLineNo">1458</span> return 9;<a name="line.1458"></a> |
| <span class="sourceLineNo">1459</span> }<a name="line.1459"></a> |
| <span class="sourceLineNo">1460</span><a name="line.1460"></a> |
| <span class="sourceLineNo">1461</span> /**<a name="line.1461"></a> |
| <span class="sourceLineNo">1462</span> * Decode a 64-bit floating point value using the fixed-length encoding.<a name="line.1462"></a> |
| <span class="sourceLineNo">1463</span> * @see #encodeFloat64(PositionedByteRange, double, Order)<a name="line.1463"></a> |
| <span class="sourceLineNo">1464</span> */<a name="line.1464"></a> |
| <span class="sourceLineNo">1465</span> public static double decodeFloat64(PositionedByteRange src) {<a name="line.1465"></a> |
| <span class="sourceLineNo">1466</span> final byte header = src.get();<a name="line.1466"></a> |
| <span class="sourceLineNo">1467</span> assert header == FIXED_FLOAT64 || header == DESCENDING.apply(FIXED_FLOAT64);<a name="line.1467"></a> |
| <span class="sourceLineNo">1468</span> Order ord = header == FIXED_FLOAT64 ? ASCENDING : DESCENDING;<a name="line.1468"></a> |
| <span class="sourceLineNo">1469</span> long val = ord.apply(src.get()) & 0xff;<a name="line.1469"></a> |
| <span class="sourceLineNo">1470</span> for (int i = 1; i < 8; i++) {<a name="line.1470"></a> |
| <span class="sourceLineNo">1471</span> val = (val << 8) + (ord.apply(src.get()) & 0xff);<a name="line.1471"></a> |
| <span class="sourceLineNo">1472</span> }<a name="line.1472"></a> |
| <span class="sourceLineNo">1473</span> val ^= (~val >> (Long.SIZE - 1)) | Long.MIN_VALUE;<a name="line.1473"></a> |
| <span class="sourceLineNo">1474</span> return Double.longBitsToDouble(val);<a name="line.1474"></a> |
| <span class="sourceLineNo">1475</span> }<a name="line.1475"></a> |
| <span class="sourceLineNo">1476</span><a name="line.1476"></a> |
| <span class="sourceLineNo">1477</span> /**<a name="line.1477"></a> |
| <span class="sourceLineNo">1478</span> * Returns true when {@code src} appears to be positioned at an encoded value, false otherwise.<a name="line.1478"></a> |
| <span class="sourceLineNo">1479</span> */<a name="line.1479"></a> |
| <span class="sourceLineNo">1480</span> public static boolean isEncodedValue(PositionedByteRange src) {<a name="line.1480"></a> |
| <span class="sourceLineNo">1481</span> return isNull(src) || isNumeric(src) || isFixedInt8(src) || isFixedInt16(src)<a name="line.1481"></a> |
| <span class="sourceLineNo">1482</span> || isFixedInt32(src) || isFixedInt64(src) || isFixedFloat32(src) || isFixedFloat64(src)<a name="line.1482"></a> |
| <span class="sourceLineNo">1483</span> || isText(src) || isBlobCopy(src) || isBlobVar(src);<a name="line.1483"></a> |
| <span class="sourceLineNo">1484</span> }<a name="line.1484"></a> |
| <span class="sourceLineNo">1485</span><a name="line.1485"></a> |
| <span class="sourceLineNo">1486</span> /**<a name="line.1486"></a> |
| <span class="sourceLineNo">1487</span> * Return true when the next encoded value in {@code src} is null, false otherwise.<a name="line.1487"></a> |
| <span class="sourceLineNo">1488</span> */<a name="line.1488"></a> |
| <span class="sourceLineNo">1489</span> public static boolean isNull(PositionedByteRange src) {<a name="line.1489"></a> |
| <span class="sourceLineNo">1490</span> return NULL == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1490"></a> |
| <span class="sourceLineNo">1491</span> }<a name="line.1491"></a> |
| <span class="sourceLineNo">1492</span><a name="line.1492"></a> |
| <span class="sourceLineNo">1493</span> /**<a name="line.1493"></a> |
| <span class="sourceLineNo">1494</span> * Return true when the next encoded value in {@code src} uses Numeric encoding, false otherwise.<a name="line.1494"></a> |
| <span class="sourceLineNo">1495</span> * {@code NaN}, {@code +/-Inf} are valid Numeric values.<a name="line.1495"></a> |
| <span class="sourceLineNo">1496</span> */<a name="line.1496"></a> |
| <span class="sourceLineNo">1497</span> public static boolean isNumeric(PositionedByteRange src) {<a name="line.1497"></a> |
| <span class="sourceLineNo">1498</span> byte x = (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1498"></a> |
| <span class="sourceLineNo">1499</span> return x >= NEG_INF && x <= NAN;<a name="line.1499"></a> |
| <span class="sourceLineNo">1500</span> }<a name="line.1500"></a> |
| <span class="sourceLineNo">1501</span><a name="line.1501"></a> |
| <span class="sourceLineNo">1502</span> /**<a name="line.1502"></a> |
| <span class="sourceLineNo">1503</span> * Return true when the next encoded value in {@code src} uses Numeric encoding and is<a name="line.1503"></a> |
| <span class="sourceLineNo">1504</span> * {@code Infinite}, false otherwise.<a name="line.1504"></a> |
| <span class="sourceLineNo">1505</span> */<a name="line.1505"></a> |
| <span class="sourceLineNo">1506</span> public static boolean isNumericInfinite(PositionedByteRange src) {<a name="line.1506"></a> |
| <span class="sourceLineNo">1507</span> byte x = (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1507"></a> |
| <span class="sourceLineNo">1508</span> return NEG_INF == x || POS_INF == x;<a name="line.1508"></a> |
| <span class="sourceLineNo">1509</span> }<a name="line.1509"></a> |
| <span class="sourceLineNo">1510</span><a name="line.1510"></a> |
| <span class="sourceLineNo">1511</span> /**<a name="line.1511"></a> |
| <span class="sourceLineNo">1512</span> * Return true when the next encoded value in {@code src} uses Numeric encoding and is<a name="line.1512"></a> |
| <span class="sourceLineNo">1513</span> * {@code NaN}, false otherwise.<a name="line.1513"></a> |
| <span class="sourceLineNo">1514</span> */<a name="line.1514"></a> |
| <span class="sourceLineNo">1515</span> public static boolean isNumericNaN(PositionedByteRange src) {<a name="line.1515"></a> |
| <span class="sourceLineNo">1516</span> return NAN == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1516"></a> |
| <span class="sourceLineNo">1517</span> }<a name="line.1517"></a> |
| <span class="sourceLineNo">1518</span><a name="line.1518"></a> |
| <span class="sourceLineNo">1519</span> /**<a name="line.1519"></a> |
| <span class="sourceLineNo">1520</span> * Return true when the next encoded value in {@code src} uses Numeric encoding and is {@code 0},<a name="line.1520"></a> |
| <span class="sourceLineNo">1521</span> * false otherwise.<a name="line.1521"></a> |
| <span class="sourceLineNo">1522</span> */<a name="line.1522"></a> |
| <span class="sourceLineNo">1523</span> public static boolean isNumericZero(PositionedByteRange src) {<a name="line.1523"></a> |
| <span class="sourceLineNo">1524</span> return ZERO == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1524"></a> |
| <span class="sourceLineNo">1525</span> }<a name="line.1525"></a> |
| <span class="sourceLineNo">1526</span><a name="line.1526"></a> |
| <span class="sourceLineNo">1527</span> /**<a name="line.1527"></a> |
| <span class="sourceLineNo">1528</span> * Return true when the next encoded value in {@code src} uses fixed-width Int8 encoding, false<a name="line.1528"></a> |
| <span class="sourceLineNo">1529</span> * otherwise.<a name="line.1529"></a> |
| <span class="sourceLineNo">1530</span> */<a name="line.1530"></a> |
| <span class="sourceLineNo">1531</span> public static boolean isFixedInt8(PositionedByteRange src) {<a name="line.1531"></a> |
| <span class="sourceLineNo">1532</span> return FIXED_INT8<a name="line.1532"></a> |
| <span class="sourceLineNo">1533</span> == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1533"></a> |
| <span class="sourceLineNo">1534</span> }<a name="line.1534"></a> |
| <span class="sourceLineNo">1535</span><a name="line.1535"></a> |
| <span class="sourceLineNo">1536</span> /**<a name="line.1536"></a> |
| <span class="sourceLineNo">1537</span> * Return true when the next encoded value in {@code src} uses fixed-width Int16 encoding, false<a name="line.1537"></a> |
| <span class="sourceLineNo">1538</span> * otherwise.<a name="line.1538"></a> |
| <span class="sourceLineNo">1539</span> */<a name="line.1539"></a> |
| <span class="sourceLineNo">1540</span> public static boolean isFixedInt16(PositionedByteRange src) {<a name="line.1540"></a> |
| <span class="sourceLineNo">1541</span> return FIXED_INT16<a name="line.1541"></a> |
| <span class="sourceLineNo">1542</span> == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1542"></a> |
| <span class="sourceLineNo">1543</span> }<a name="line.1543"></a> |
| <span class="sourceLineNo">1544</span><a name="line.1544"></a> |
| <span class="sourceLineNo">1545</span> /**<a name="line.1545"></a> |
| <span class="sourceLineNo">1546</span> * Return true when the next encoded value in {@code src} uses fixed-width Int32 encoding, false<a name="line.1546"></a> |
| <span class="sourceLineNo">1547</span> * otherwise.<a name="line.1547"></a> |
| <span class="sourceLineNo">1548</span> */<a name="line.1548"></a> |
| <span class="sourceLineNo">1549</span> public static boolean isFixedInt32(PositionedByteRange src) {<a name="line.1549"></a> |
| <span class="sourceLineNo">1550</span> return FIXED_INT32<a name="line.1550"></a> |
| <span class="sourceLineNo">1551</span> == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1551"></a> |
| <span class="sourceLineNo">1552</span> }<a name="line.1552"></a> |
| <span class="sourceLineNo">1553</span><a name="line.1553"></a> |
| <span class="sourceLineNo">1554</span> /**<a name="line.1554"></a> |
| <span class="sourceLineNo">1555</span> * Return true when the next encoded value in {@code src} uses fixed-width Int64 encoding, false<a name="line.1555"></a> |
| <span class="sourceLineNo">1556</span> * otherwise.<a name="line.1556"></a> |
| <span class="sourceLineNo">1557</span> */<a name="line.1557"></a> |
| <span class="sourceLineNo">1558</span> public static boolean isFixedInt64(PositionedByteRange src) {<a name="line.1558"></a> |
| <span class="sourceLineNo">1559</span> return FIXED_INT64<a name="line.1559"></a> |
| <span class="sourceLineNo">1560</span> == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1560"></a> |
| <span class="sourceLineNo">1561</span> }<a name="line.1561"></a> |
| <span class="sourceLineNo">1562</span><a name="line.1562"></a> |
| <span class="sourceLineNo">1563</span> /**<a name="line.1563"></a> |
| <span class="sourceLineNo">1564</span> * Return true when the next encoded value in {@code src} uses fixed-width Float32 encoding, false<a name="line.1564"></a> |
| <span class="sourceLineNo">1565</span> * otherwise. The {@code src.peek()} header goes through DESCENDING.apply if negative, else ASCENDING.apply.<a name="line.1565"></a> |
| <span class="sourceLineNo">1566</span> */<a name="line.1566"></a> |
| <span class="sourceLineNo">1567</span> public static boolean isFixedFloat32(PositionedByteRange src) {<a name="line.1567"></a> |
| <span class="sourceLineNo">1568</span> return FIXED_FLOAT32<a name="line.1568"></a> |
| <span class="sourceLineNo">1569</span> == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1569"></a> |
| <span class="sourceLineNo">1570</span> }<a name="line.1570"></a> |
| <span class="sourceLineNo">1571</span><a name="line.1571"></a> |
| <span class="sourceLineNo">1572</span> /**<a name="line.1572"></a> |
| <span class="sourceLineNo">1573</span> * Return true when the next encoded value in {@code src} uses fixed-width Float64 encoding, false<a name="line.1573"></a> |
| <span class="sourceLineNo">1574</span> * otherwise. The {@code src.peek()} header goes through DESCENDING.apply if negative, else ASCENDING.apply.<a name="line.1574"></a> |
| <span class="sourceLineNo">1575</span> */<a name="line.1575"></a> |
| <span class="sourceLineNo">1576</span> public static boolean isFixedFloat64(PositionedByteRange src) {<a name="line.1576"></a> |
| <span class="sourceLineNo">1577</span> return FIXED_FLOAT64<a name="line.1577"></a> |
| <span class="sourceLineNo">1578</span> == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1578"></a> |
| <span class="sourceLineNo">1579</span> }<a name="line.1579"></a> |
| <span class="sourceLineNo">1580</span><a name="line.1580"></a> |
| <span class="sourceLineNo">1581</span> /**<a name="line.1581"></a> |
| <span class="sourceLineNo">1582</span> * Return true when the next encoded value in {@code src} uses Text encoding, false otherwise. Decided from the {@code src.peek()} header byte.<a name="line.1582"></a> |
| <span class="sourceLineNo">1583</span> */<a name="line.1583"></a> |
| <span class="sourceLineNo">1584</span> public static boolean isText(PositionedByteRange src) {<a name="line.1584"></a> |
| <span class="sourceLineNo">1585</span> return TEXT == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1585"></a> |
| <span class="sourceLineNo">1586</span> }<a name="line.1586"></a> |
| <span class="sourceLineNo">1587</span><a name="line.1587"></a> |
| <span class="sourceLineNo">1588</span> /**<a name="line.1588"></a> |
| <span class="sourceLineNo">1589</span> * Return true when the next encoded value in {@code src} uses BlobVar encoding, false otherwise. Decided from the {@code src.peek()} header byte.<a name="line.1589"></a> |
| <span class="sourceLineNo">1590</span> */<a name="line.1590"></a> |
| <span class="sourceLineNo">1591</span> public static boolean isBlobVar(PositionedByteRange src) {<a name="line.1591"></a> |
| <span class="sourceLineNo">1592</span> return BLOB_VAR<a name="line.1592"></a> |
| <span class="sourceLineNo">1593</span> == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1593"></a> |
| <span class="sourceLineNo">1594</span> }<a name="line.1594"></a> |
| <span class="sourceLineNo">1595</span><a name="line.1595"></a> |
| <span class="sourceLineNo">1596</span> /**<a name="line.1596"></a> |
| <span class="sourceLineNo">1597</span> * Return true when the next encoded value in {@code src} uses BlobCopy encoding, false otherwise. Decided from the {@code src.peek()} header byte.<a name="line.1597"></a> |
| <span class="sourceLineNo">1598</span> */<a name="line.1598"></a> |
| <span class="sourceLineNo">1599</span> public static boolean isBlobCopy(PositionedByteRange src) {<a name="line.1599"></a> |
| <span class="sourceLineNo">1600</span> return BLOB_COPY<a name="line.1600"></a> |
| <span class="sourceLineNo">1601</span> == (-1 == Integer.signum(src.peek()) ? DESCENDING : ASCENDING).apply(src.peek());<a name="line.1601"></a> |
| <span class="sourceLineNo">1602</span> }<a name="line.1602"></a> |
| <span class="sourceLineNo">1603</span><a name="line.1603"></a> |
| <span class="sourceLineNo">1604</span> /**<a name="line.1604"></a> |
| <span class="sourceLineNo">1605</span> * Skip {@code src}'s position forward over one encoded value; an unrecognized header byte throws.<a name="line.1605"></a> |
| <span class="sourceLineNo">1606</span> * @return number of bytes skipped, counted from the header byte onward.<a name="line.1606"></a> |
| <span class="sourceLineNo">1607</span> */<a name="line.1607"></a> |
| <span class="sourceLineNo">1608</span> public static int skip(PositionedByteRange src) {<a name="line.1608"></a> |
| <span class="sourceLineNo">1609</span> final int start = src.getPosition();<a name="line.1609"></a> |
| <span class="sourceLineNo">1610</span> byte header = src.get();<a name="line.1610"></a> |
| <span class="sourceLineNo">1611</span> Order ord = (-1 == Integer.signum(header)) ? DESCENDING : ASCENDING;<a name="line.1611"></a> |
| <span class="sourceLineNo">1612</span> header = ord.apply(header);<a name="line.1612"></a> |
| <span class="sourceLineNo">1613</span><a name="line.1613"></a> |
| <span class="sourceLineNo">1614</span> switch (header) {<a name="line.1614"></a> |
| <span class="sourceLineNo">1615</span> case NULL:<a name="line.1615"></a> |
| <span class="sourceLineNo">1616</span> case NEG_INF:<a name="line.1616"></a> |
| <span class="sourceLineNo">1617</span> return 1;<a name="line.1617"></a> |
| <span class="sourceLineNo">1618</span> case NEG_LARGE: /* Large negative number: 0x08, ~E, ~M */<a name="line.1618"></a> |
| <span class="sourceLineNo">1619</span> skipVaruint64(src, DESCENDING != ord);<a name="line.1619"></a> |
| <span class="sourceLineNo">1620</span> skipSignificand(src, DESCENDING != ord);<a name="line.1620"></a> |
| <span class="sourceLineNo">1621</span> return src.getPosition() - start;<a name="line.1621"></a> |
| <span class="sourceLineNo">1622</span> case NEG_MED_MIN: /* Medium negative number: 0x13-E, ~M */<a name="line.1622"></a> |
| <span class="sourceLineNo">1623</span> case NEG_MED_MIN + 0x01:<a name="line.1623"></a> |
| <span class="sourceLineNo">1624</span> case NEG_MED_MIN + 0x02:<a name="line.1624"></a> |
| <span class="sourceLineNo">1625</span> case NEG_MED_MIN + 0x03:<a name="line.1625"></a> |
| <span class="sourceLineNo">1626</span> case NEG_MED_MIN + 0x04:<a name="line.1626"></a> |
| <span class="sourceLineNo">1627</span> case NEG_MED_MIN + 0x05:<a name="line.1627"></a> |
| <span class="sourceLineNo">1628</span> case NEG_MED_MIN + 0x06:<a name="line.1628"></a> |
| <span class="sourceLineNo">1629</span> case NEG_MED_MIN + 0x07:<a name="line.1629"></a> |
| <span class="sourceLineNo">1630</span> case NEG_MED_MIN + 0x08:<a name="line.1630"></a> |
| <span class="sourceLineNo">1631</span> case NEG_MED_MIN + 0x09:<a name="line.1631"></a> |
| <span class="sourceLineNo">1632</span> case NEG_MED_MAX:<a name="line.1632"></a> |
| <span class="sourceLineNo">1633</span> skipSignificand(src, DESCENDING != ord);<a name="line.1633"></a> |
| <span class="sourceLineNo">1634</span> return src.getPosition() - start;<a name="line.1634"></a> |
| <span class="sourceLineNo">1635</span> case NEG_SMALL: /* Small negative number: 0x14, -E, ~M */<a name="line.1635"></a> |
| <span class="sourceLineNo">1636</span> skipVaruint64(src, DESCENDING == ord);<a name="line.1636"></a> |
| <span class="sourceLineNo">1637</span> skipSignificand(src, DESCENDING != ord);<a name="line.1637"></a> |
| <span class="sourceLineNo">1638</span> return src.getPosition() - start;<a name="line.1638"></a> |
| <span class="sourceLineNo">1639</span> case ZERO:<a name="line.1639"></a> |
| <span class="sourceLineNo">1640</span> return 1;<a name="line.1640"></a> |
| <span class="sourceLineNo">1641</span> case POS_SMALL: /* Small positive number: 0x16, ~-E, M */<a name="line.1641"></a> |
| <span class="sourceLineNo">1642</span> skipVaruint64(src, DESCENDING != ord);<a name="line.1642"></a> |
| <span class="sourceLineNo">1643</span> skipSignificand(src, DESCENDING == ord);<a name="line.1643"></a> |
| <span class="sourceLineNo">1644</span> return src.getPosition() - start;<a name="line.1644"></a> |
| <span class="sourceLineNo">1645</span> case POS_MED_MIN: /* Medium positive number: 0x17+E, M */<a name="line.1645"></a> |
| <span class="sourceLineNo">1646</span> case POS_MED_MIN + 0x01:<a name="line.1646"></a> |
| <span class="sourceLineNo">1647</span> case POS_MED_MIN + 0x02:<a name="line.1647"></a> |
| <span class="sourceLineNo">1648</span> case POS_MED_MIN + 0x03:<a name="line.1648"></a> |
| <span class="sourceLineNo">1649</span> case POS_MED_MIN + 0x04:<a name="line.1649"></a> |
| <span class="sourceLineNo">1650</span> case POS_MED_MIN + 0x05:<a name="line.1650"></a> |
| <span class="sourceLineNo">1651</span> case POS_MED_MIN + 0x06:<a name="line.1651"></a> |
| <span class="sourceLineNo">1652</span> case POS_MED_MIN + 0x07:<a name="line.1652"></a> |
| <span class="sourceLineNo">1653</span> case POS_MED_MIN + 0x08:<a name="line.1653"></a> |
| <span class="sourceLineNo">1654</span> case POS_MED_MIN + 0x09:<a name="line.1654"></a> |
| <span class="sourceLineNo">1655</span> case POS_MED_MAX:<a name="line.1655"></a> |
| <span class="sourceLineNo">1656</span> skipSignificand(src, DESCENDING == ord);<a name="line.1656"></a> |
| <span class="sourceLineNo">1657</span> return src.getPosition() - start;<a name="line.1657"></a> |
| <span class="sourceLineNo">1658</span> case POS_LARGE: /* Large positive number: 0x22, E, M */<a name="line.1658"></a> |
| <span class="sourceLineNo">1659</span> skipVaruint64(src, DESCENDING == ord);<a name="line.1659"></a> |
| <span class="sourceLineNo">1660</span> skipSignificand(src, DESCENDING == ord);<a name="line.1660"></a> |
| <span class="sourceLineNo">1661</span> return src.getPosition() - start;<a name="line.1661"></a> |
| <span class="sourceLineNo">1662</span> case POS_INF:<a name="line.1662"></a> |
| <span class="sourceLineNo">1663</span> return 1;<a name="line.1663"></a> |
| <span class="sourceLineNo">1664</span> case NAN:<a name="line.1664"></a> |
| <span class="sourceLineNo">1665</span> return 1;<a name="line.1665"></a> |
| <span class="sourceLineNo">1666</span> case FIXED_INT8:<a name="line.1666"></a> |
| <span class="sourceLineNo">1667</span> src.setPosition(src.getPosition() + 1);<a name="line.1667"></a> |
| <span class="sourceLineNo">1668</span> return src.getPosition() - start;<a name="line.1668"></a> |
| <span class="sourceLineNo">1669</span> case FIXED_INT16:<a name="line.1669"></a> |
| <span class="sourceLineNo">1670</span> src.setPosition(src.getPosition() + 2);<a name="line.1670"></a> |
| <span class="sourceLineNo">1671</span> return src.getPosition() - start;<a name="line.1671"></a> |
| <span class="sourceLineNo">1672</span> case FIXED_INT32:<a name="line.1672"></a> |
| <span class="sourceLineNo">1673</span> src.setPosition(src.getPosition() + 4);<a name="line.1673"></a> |
| <span class="sourceLineNo">1674</span> return src.getPosition() - start;<a name="line.1674"></a> |
| <span class="sourceLineNo">1675</span> case FIXED_INT64:<a name="line.1675"></a> |
| <span class="sourceLineNo">1676</span> src.setPosition(src.getPosition() + 8);<a name="line.1676"></a> |
| <span class="sourceLineNo">1677</span> return src.getPosition() - start;<a name="line.1677"></a> |
| <span class="sourceLineNo">1678</span> case FIXED_FLOAT32:<a name="line.1678"></a> |
| <span class="sourceLineNo">1679</span> src.setPosition(src.getPosition() + 4);<a name="line.1679"></a> |
| <span class="sourceLineNo">1680</span> return src.getPosition() - start;<a name="line.1680"></a> |
| <span class="sourceLineNo">1681</span> case FIXED_FLOAT64:<a name="line.1681"></a> |
| <span class="sourceLineNo">1682</span> src.setPosition(src.getPosition() + 8);<a name="line.1682"></a> |
| <span class="sourceLineNo">1683</span> return src.getPosition() - start;<a name="line.1683"></a> |
| <span class="sourceLineNo">1684</span> case TEXT:<a name="line.1684"></a> |
| <span class="sourceLineNo">1685</span> // null-terminated: consume bytes up to and including TERM (compared after ord.apply).<a name="line.1685"></a> |
| <span class="sourceLineNo">1686</span> do {<a name="line.1686"></a> |
| <span class="sourceLineNo">1687</span> header = ord.apply(src.get());<a name="line.1687"></a> |
| <span class="sourceLineNo">1688</span> } while (header != TERM);<a name="line.1688"></a> |
| <span class="sourceLineNo">1689</span> return src.getPosition() - start;<a name="line.1689"></a> |
| <span class="sourceLineNo">1690</span> case BLOB_VAR:<a name="line.1690"></a> |
| <span class="sourceLineNo">1691</span> // read until we find a 0 in the MSB; that final byte is consumed as well.<a name="line.1691"></a> |
| <span class="sourceLineNo">1692</span> do {<a name="line.1692"></a> |
| <span class="sourceLineNo">1693</span> header = ord.apply(src.get());<a name="line.1693"></a> |
| <span class="sourceLineNo">1694</span> } while ((byte) (header & 0x80) != TERM);<a name="line.1694"></a> |
| <span class="sourceLineNo">1695</span> return src.getPosition() - start;<a name="line.1695"></a> |
| <span class="sourceLineNo">1696</span> case BLOB_COPY:<a name="line.1696"></a> |
| <span class="sourceLineNo">1697</span> if (Order.DESCENDING == ord) {<a name="line.1697"></a> |
| <span class="sourceLineNo">1698</span> // if descending, read through the termination byte.<a name="line.1698"></a> |
| <span class="sourceLineNo">1699</span> do {<a name="line.1699"></a> |
| <span class="sourceLineNo">1700</span> header = ord.apply(src.get());<a name="line.1700"></a> |
| <span class="sourceLineNo">1701</span> } while (header != TERM);<a name="line.1701"></a> |
| <span class="sourceLineNo">1702</span> return src.getPosition() - start;<a name="line.1702"></a> |
| <span class="sourceLineNo">1703</span> } else {<a name="line.1703"></a> |
| <span class="sourceLineNo">1704</span> // otherwise, just skip to the end of the range (src.getLength()).<a name="line.1704"></a> |
| <span class="sourceLineNo">1705</span> src.setPosition(src.getLength());<a name="line.1705"></a> |
| <span class="sourceLineNo">1706</span> return src.getPosition() - start;<a name="line.1706"></a> |
| <span class="sourceLineNo">1707</span> }<a name="line.1707"></a> |
| <span class="sourceLineNo">1708</span> default:<a name="line.1708"></a> |
| <span class="sourceLineNo">1709</span> throw unexpectedHeader(header);<a name="line.1709"></a> |
| <span class="sourceLineNo">1710</span> }<a name="line.1710"></a> |
| <span class="sourceLineNo">1711</span> }<a name="line.1711"></a> |
| <span class="sourceLineNo">1712</span><a name="line.1712"></a> |
| <span class="sourceLineNo">1713</span> /**<a name="line.1713"></a> |
| <span class="sourceLineNo">1714</span> * Return the number of encoded entries remaining in {@code buff}. The state of {@code buff} is<a name="line.1714"></a> |
| <span class="sourceLineNo">1715</span> * not modified through use of this method: counting walks a separate range over the same bytes.<a name="line.1715"></a> |
| <span class="sourceLineNo">1716</span> */<a name="line.1716"></a> |
| <span class="sourceLineNo">1717</span> public static int length(PositionedByteRange buff) {<a name="line.1717"></a> |
| <span class="sourceLineNo">1718</span> PositionedByteRange b =<a name="line.1718"></a> |
| <span class="sourceLineNo">1719</span> new SimplePositionedMutableByteRange(buff.getBytes(), buff.getOffset(), buff.getLength());<a name="line.1719"></a> |
| <span class="sourceLineNo">1720</span> b.setPosition(buff.getPosition());<a name="line.1720"></a> |
| <span class="sourceLineNo">1721</span> int cnt = 0;<a name="line.1721"></a> |
| <span class="sourceLineNo">1722</span> for (; isEncodedValue(b); skip(b), cnt++)<a name="line.1722"></a> |
| <span class="sourceLineNo">1723</span> ;<a name="line.1723"></a> |
| <span class="sourceLineNo">1724</span> return cnt;<a name="line.1724"></a> |
| <span class="sourceLineNo">1725</span> }<a name="line.1725"></a> |
| <span class="sourceLineNo">1726</span>}<a name="line.1726"></a> |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| </pre> |
| </div> |
| </body> |
| </html> |