sgx_tstd/src/sys_common/memchr.rs - incubator-teaclave-sgx-sdk - Git at Google

 // Licensed to the Apache Software Foundation (ASF) under one
 // or more contributor license agreements.  See the NOTICE file
 // distributed with this work for additional information
 // regarding copyright ownership.  The ASF licenses this file
 // to you under the Apache License, Version 2.0 (the
 // "License"); you may not use this file except in compliance
 // with the License.  You may obtain a copy of the License at
 //
 //   http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing,
 // software distributed under the License is distributed on an
 // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, either express or implied.  See the License for the
 // specific language governing permissions and limitations
 // under the License.

 #[allow(dead_code)]
 pub mod fallback {
     use core::cmp;
     use core::mem;

     // 64-bit words with the lowest bit (0x01) / the highest bit (0x80) of
     // every byte set.
     const LO_U64: u64 = 0x0101010101010101;
     const HI_U64: u64 = 0x8080808080808080;

     // Native-width versions of the masks above; the `as` cast truncates when
     // `usize` is narrower than 64 bits, which keeps the per-byte pattern.
     const LO_USIZE: usize = LO_U64 as usize;
     const HI_USIZE: usize = HI_U64 as usize;

     /// Returns `true` if any of the bytes making up `x` is zero.
     ///
     /// Word-at-a-time test taken from *Matters Computational* (J. Arndt):
     /// one is subtracted from every byte, and the word is then checked for a
     /// high bit that was produced by the borrow rather than being set in `x`.
     #[inline]
     fn contains_zero_byte(x: usize) -> bool {
         let borrowed = x.wrapping_sub(LO_USIZE);
         let high_bits_clear_in_x = !x & HI_USIZE;
         (borrowed & high_bits_clear_in_x) != 0
     }

     /// Builds a 32-bit `usize` whose four bytes are all equal to `b`.
     #[cfg(target_pointer_width = "32")]
     #[inline]
     fn repeat_byte(b: u8) -> usize {
         let one = b as usize;
         let two = one << 8 | one;
         two << 16 | two
     }

     /// Builds a 64-bit `usize` whose eight bytes are all equal to `b`.
     #[cfg(target_pointer_width = "64")]
     #[inline]
     fn repeat_byte(b: u8) -> usize {
         let one = b as usize;
         let two = one << 8 | one;
         let four = two << 16 | two;
         four << 32 | four
     }

     /// Returns the index of the first byte in `text` equal to `x`, or `None`
     /// when `text` does not contain `x`.
     ///
     /// The slice is processed in three phases:
     /// 1. the bytes in front of the first `usize`-aligned address are checked
     ///    one at a time;
     /// 2. aligned pairs of `usize` words are tested until a pair contains `x`
     ///    or fewer than two words remain;
     /// 3. everything from where phase 2 stopped is checked one byte at a time,
     ///    which pinpoints the match (if any).
     pub fn memchr(x: u8, text: &[u8]) -> Option<usize> {
         let word = mem::size_of::<usize>();
         let stride = 2 * word;
         let len = text.len();
         let base = text.as_ptr();

         // Phase 1. Clamping to `len` also covers slices that end before the
         // boundary and an `align_offset` result that is larger than the slice.
         let mut pos = cmp::min(base.align_offset(word), len);
         if let Some(hit) = text[..pos].iter().position(|&byte| byte == x) {
             return Some(hit);
         }

         // Phase 2. XOR-ing with `pattern` zeroes exactly the bytes equal to `x`.
         let pattern = repeat_byte(x);
         if len >= stride {
             let last_pair = len - stride;
             while pos <= last_pair {
                 // SAFETY: `pos + stride <= len`, so both words lie inside
                 // `text`. The loop can only be entered with `pos < len`, i.e.
                 // with `pos` equal to the aligned offset found in phase 1 plus
                 // a multiple of `stride`, so both reads are `usize`-aligned.
                 let (first, second) = unsafe {
                     (
                         *(base.add(pos) as *const usize),
                         *(base.add(pos + word) as *const usize),
                     )
                 };
                 if contains_zero_byte(first ^ pattern) || contains_zero_byte(second ^ pattern) {
                     break;
                 }
                 pos += stride;
             }
         }

         // Phase 3.
         let rel = text[pos..].iter().position(|&byte| byte == x)?;
         Some(pos + rel)
     }

     /// Returns the index of the last byte in `text` equal to `x`, or `None`
     /// when `text` does not contain `x`.
     ///
     /// Mirror image of [`memchr`], working from the end of the slice:
     /// 1. the bytes after the last `usize`-aligned address are checked one at
     ///    a time;
     /// 2. aligned pairs of `usize` words are tested, moving towards the front,
     ///    until a pair contains `x` or fewer than two words remain;
     /// 3. everything in front of where phase 2 stopped is checked one byte at
     ///    a time, which pinpoints the match (if any).
     pub fn memrchr(x: u8, text: &[u8]) -> Option<usize> {
         let word = mem::size_of::<usize>();
         let stride = 2 * word;
         let len = text.len();
         let base = text.as_ptr();

         // Phase 1. `overhang` is how many bytes the end of the slice sits past
         // a word boundary; a slice shorter than that is scanned in full
         // (`pos == 0`), and an aligned end leaves an empty tail (`pos == len`).
         let overhang = (base as usize + len) & (word - 1);
         let mut pos = len.saturating_sub(overhang);
         if let Some(hit) = text[pos..].iter().rposition(|&byte| byte == x) {
             return Some(pos + hit);
         }

         // Phase 2. XOR-ing with `pattern` zeroes exactly the bytes equal to `x`.
         let pattern = repeat_byte(x);
         while pos >= stride {
             // SAFETY: `stride <= pos <= len`, so both words lie inside `text`.
             // `pos` is non-zero here, hence it is `len - overhang` minus a
             // multiple of `stride`, which makes `base + pos` (and the two
             // words just below it) `usize`-aligned.
             let (lower, upper) = unsafe {
                 (
                     *(base.add(pos - stride) as *const usize),
                     *(base.add(pos - word) as *const usize),
                 )
             };
             if contains_zero_byte(lower ^ pattern) || contains_zero_byte(upper ^ pattern) {
                 break;
             }
             pos -= stride;
         }

         // Phase 3.
         text[..pos].iter().rposition(|&byte| byte == x)
     }
 }
	// Licensed to the Apache Software Foundation (ASF) under one
	// or more contributor license agreements. See the NOTICE file
	// distributed with this work for additional information
	// regarding copyright ownership. The ASF licenses this file
	// to you under the Apache License, Version 2.0 (the
	// "License"); you may not use this file except in compliance
	// with the License. You may obtain a copy of the License at
	//
	// http://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing,
	// software distributed under the License is distributed on an
	// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
	// KIND, either express or implied. See the License for the
	// specific language governing permissions and limitations
	// under the License.

	#[allow(dead_code)]
	pub mod fallback {
	    use core::cmp;
	    use core::mem;

	    // 64-bit words with the lowest bit (0x01) / the highest bit (0x80) of
	    // every byte set.
	    const LO_U64: u64 = 0x0101010101010101;
	    const HI_U64: u64 = 0x8080808080808080;

	    // use truncation
	    const LO_USIZE: usize = LO_U64 as usize;
	    const HI_USIZE: usize = HI_U64 as usize;

	    /// Return `true` if `x` contains any zero byte.
	    ///
	    /// From *Matters Computational*, J. Arndt
	    ///
	    /// "The idea is to subtract one from each of the bytes and then look for
	    /// bytes where the borrow propagated all the way to the most significant
	    /// bit."
	    #[inline]
	    fn contains_zero_byte(x: usize) -> bool {
	        x.wrapping_sub(LO_USIZE) & !x & HI_USIZE != 0
	    }

	    /// Return a `usize` in which every byte equals `b` (32-bit targets).
	    #[cfg(target_pointer_width = "32")]
	    #[inline]
	    fn repeat_byte(b: u8) -> usize {
	        let mut rep = (b as usize) << 8 | b as usize;
	        rep = rep << 16 | rep;
	        rep
	    }

	    /// Return a `usize` in which every byte equals `b` (64-bit targets).
	    #[cfg(target_pointer_width = "64")]
	    #[inline]
	    fn repeat_byte(b: u8) -> usize {
	        let mut rep = (b as usize) << 8 | b as usize;
	        rep = rep << 16 | rep;
	        rep = rep << 32 | rep;
	        rep
	    }

	    /// Return the first index matching the byte `x` in `text`, or `None` if
	    /// `text` does not contain `x`.
	    pub fn memchr(x: u8, text: &[u8]) -> Option<usize> {
	        // Scan for a single byte value by reading two `usize` words at a time.
	        //
	        // Split `text` in three parts
	        // - unaligned initial part, before the first word aligned address in text
	        // - body, scan by 2 words at a time
	        // - the last remaining part, < 2 word size
	        let len = text.len();
	        let ptr = text.as_ptr();
	        let usize_bytes = mem::size_of::<usize>();

	        // search up to an aligned boundary
	        let mut offset = ptr.align_offset(usize_bytes);
	        if offset > 0 {
	            // Clamp so that a slice ending before the boundary is scanned in
	            // full and never indexed out of range.
	            offset = cmp::min(offset, len);
	            if let Some(index) = text[..offset].iter().position(|elt| *elt == x) {
	                return Some(index);
	            }
	        }

	        // search the body of the text
	        let repeated_x = repeat_byte(x);

	        if len >= 2 * usize_bytes {
	            while offset <= len - 2 * usize_bytes {
	                // SAFETY: `offset + 2 * usize_bytes <= len`, so both words lie
	                // inside `text`. The loop is only entered with `offset < len`,
	                // i.e. with `offset` at the aligned boundary found above plus
	                // a multiple of two words, so both reads are aligned.
	                unsafe {
	                    let u = *(ptr.offset(offset as isize) as *const usize);
	                    let v = *(ptr.offset((offset + usize_bytes) as isize) as *const usize);

	                    // break if there is a matching byte: XOR-ing with
	                    // `repeated_x` zeroes exactly the bytes equal to `x`
	                    let zu = contains_zero_byte(u ^ repeated_x);
	                    let zv = contains_zero_byte(v ^ repeated_x);
	                    if zu || zv {
	                        break;
	                    }
	                }
	                offset += usize_bytes * 2;
	            }
	        }

	        // find the byte after the point the body loop stopped
	        text[offset..].iter().position(|elt| *elt == x).map(|i| offset + i)
	    }

	    /// Return the last index matching the byte `x` in `text`, or `None` if
	    /// `text` does not contain `x`.
	    pub fn memrchr(x: u8, text: &[u8]) -> Option<usize> {
	        // Scan for a single byte value by reading two `usize` words at a time.
	        //
	        // Split `text` in three parts
	        // - unaligned tail, after the last word aligned address in text
	        // - body, scan by 2 words at a time
	        // - the first remaining bytes, < 2 word size
	        let len = text.len();
	        let ptr = text.as_ptr();
	        let usize_bytes = mem::size_of::<usize>();

	        // search to an aligned boundary
	        // `end_align` is the number of bytes by which the end of the slice
	        // sits past a word boundary.
	        let end_align = (ptr as usize + len) & (usize_bytes - 1);
	        let mut offset;
	        if end_align > 0 {
	            // A slice shorter than the unaligned tail is scanned in full.
	            offset = if end_align >= len { 0 } else { len - end_align };
	            if let Some(index) = text[offset..].iter().rposition(|elt| *elt == x) {
	                return Some(offset + index);
	            }
	        } else {
	            offset = len;
	        }

	        // search the body of the text
	        let repeated_x = repeat_byte(x);

	        while offset >= 2 * usize_bytes {
	            // SAFETY: `2 * usize_bytes <= offset <= len`, so both words lie
	            // inside `text`. `offset` is non-zero here, hence it is
	            // `len - end_align` minus a multiple of two words, which makes
	            // `ptr + offset` (and the two words just below it) aligned.
	            unsafe {
	                let u = *(ptr.offset(offset as isize - 2 * usize_bytes as isize) as *const usize);
	                let v = *(ptr.offset(offset as isize - usize_bytes as isize) as *const usize);

	                // break if there is a matching byte
	                let zu = contains_zero_byte(u ^ repeated_x);
	                let zv = contains_zero_byte(v ^ repeated_x);
	                if zu || zv {
	                    break;
	                }
	            }
	            offset -= 2 * usize_bytes;
	        }

	        // find the byte before the point the body loop stopped
	        text[..offset].iter().rposition(|elt| *elt == x)
	    }
	}