Optimize large array creation in const-eval #120069

Merged · 1 commit · Jan 19, 2024
31 changes: 19 additions & 12 deletions compiler/rustc_const_eval/src/interpret/memory.rs
@@ -1209,21 +1209,28 @@ impl<'mir, 'tcx: 'mir, M: Machine<'mir, 'tcx>> InterpCx<'mir, 'tcx, M> {
                     throw_ub_custom!(fluent::const_eval_copy_nonoverlapping_overlapping);
                 }
             }
         }

-        for i in 0..num_copies {
-            ptr::copy(
-                src_bytes,
-                dest_bytes.add((size * i).bytes_usize()), // `Size` multiplication
-                size.bytes_usize(),
-            );
+        let size_in_bytes = size.bytes_usize();
+        // For particularly large arrays (where this is perf-sensitive) it's common that
+        // we're writing a single byte repeatedly. So, optimize that case to a memset.
+        if size_in_bytes == 1 && num_copies >= 1 {
saethlin (Member) commented on Jan 17, 2024:

Can you generalize this to handle arrays of other types by extending this `size_in_bytes == 1` to any value where all bytes are equal? It would be nice if large arrays of usize or u32, or even an enum, could also benefit.
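
A minimal sketch of that generalization, as a hypothetical standalone helper (editorial illustration, not code from this PR; it deliberately ignores the init-mask and padding questions raised below):

/// Hypothetical helper (not in this PR): if every byte of the source element
/// is identical, the whole repeat can be lowered to a single memset.
///
/// SAFETY (assumed contract): `dest` is valid for `src.len() * num_copies`
/// bytes of writes and does not overlap `src`.
unsafe fn repeat_via_memset(src: &[u8], dest: *mut u8, num_copies: usize) -> bool {
    // `size_in_bytes == 1` is the degenerate case: a single byte is
    // trivially "all bytes equal".
    let Some((&first, rest)) = src.split_first() else { return false };
    if !rest.iter().all(|&b| b == first) {
        return false; // bytes differ; the caller falls back to the copy loop
    }
    unsafe { dest.write_bytes(first, src.len() * num_copies) };
    true
}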

Member Author commented:

Most data-less enums would already benefit (since they are 1 byte in size)... and if they have data, it seems super unlikely the bytes are all the same.

For the cases where this could work (e.g., 0u32), I'm wary of #120069 (comment) -- not sure if there's a good, cheap way to check "is there padding in there?"

It might also be worth noting that anything significantly fancier here probably merits replicating the algorithm in slice::repeat -- this was pointed out in earlier optimization work on this code, but not implemented at the time. For larger types I think that generalizes much better than trying to detect whether a memset is possible...
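
For reference, a sketch of the doubling strategy `slice::repeat` uses, adapted to raw pointers (editorial illustration, not code from the PR; it assumes `src` and `dest` do not overlap, so it would only fit the `copy_nonoverlapping` branch):

use std::ptr;

/// Doubling repeat à la `slice::repeat`: O(log num_copies) memcpys instead of
/// one per element. Seed one element, then keep copying the already-filled
/// prefix after itself.
///
/// SAFETY (assumed contract): `src` is valid for `elem_size` bytes of reads,
/// `dest` for `elem_size * num_copies` bytes of writes, and they don't overlap.
unsafe fn repeat_by_doubling(src: *const u8, dest: *mut u8, elem_size: usize, num_copies: usize) {
    if elem_size == 0 || num_copies == 0 {
        return;
    }
    unsafe {
        // Seed the destination with one copy of the element.
        ptr::copy_nonoverlapping(src, dest, elem_size);
        let total = elem_size * num_copies;
        let mut filled = elem_size;
        while filled < total {
            // Source [0, n) and target [filled, filled + n) are disjoint
            // because n <= filled, so copy_nonoverlapping is fine.
            let n = filled.min(total - filled);
            ptr::copy_nonoverlapping(dest, dest.add(filled), n);
            filled += n;
        }
    }
}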

Member commented:

> not sure if there's a good, cheap way to check "is there padding in there?"

🤷 That probably deserves a comment noting that we've checked in a way that only works because the value is a single byte. If I'm reading the logic right, as written it's "are any bytes init", not "are all bytes init". I wouldn't argue against doing that specifically because this is one byte, but it's subtle.

InitMask::is_range_initialized seems like the better function here, but the API has a gnarly error path... that only one caller uses. It might be worth splitting the function in two, so that the one error path that wants to know where the uninit bytes are can call a new function.
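
A self-contained sketch of that proposed split, using a toy one-flag-per-byte mask rather than rustc's block-based `InitMask` (only the API shape is the point):

/// Toy stand-in for rustc's `InitMask`, for illustration only.
struct ToyInitMask {
    initialized: Vec<bool>, // one flag per byte
}

impl ToyInitMask {
    /// Hot path: a plain boolean query, with no error payload to construct.
    fn is_range_initialized(&self, start: usize, end: usize) -> bool {
        self.initialized[start..end].iter().all(|&init| init)
    }

    /// Cold path, for the one diagnostic caller: locate the first
    /// uninitialized subrange so the error can point at it.
    fn find_uninit_range(&self, start: usize, end: usize) -> Option<(usize, usize)> {
        let first = (start..end).find(|&i| !self.initialized[i])?;
        let run_end = (first..end).find(|&i| self.initialized[i]).unwrap_or(end);
        Some((first, run_end))
    }
}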

Member Author commented:

Yeah, a comment seems like a good idea. I've added one.

> it's "are any bytes init" not "are all bytes init"

Yes, but if there's only one byte, those are the same thing, right?

> InitMask::is_range_initialized seems like the better function here, but the API has a gnarly error path... that only one caller uses. It might be worth it to split the function into two, so that the one error path that wants to know where there are uninit bytes can call some new function.

Yeah, that seems like the way to go for a more complex change here. I'm still worried that adding extra checks will lead to regressions -- or at least more code to ship for little value. But 🤷, I could see it being a win. This PR already makes every case a very tight loop around a memcpy/memmove call per value, which is probably quite fast for anything not excessively large -- and those are almost always byte-like, I suspect.

RalfJung marked this conversation as resolved.
+            // SAFETY: `src_bytes` would be read from anyway by copies below (num_copies >= 1).
+            // Since size_in_bytes = 1, then the `init.no_bytes_init()` check above guarantees
+            // that this read at type `u8` is OK -- it must be an initialized byte.
RalfJung (Member) commented on Jan 22, 2024:

This comment seems confused. SAFETY comments are about the safety of the interpreter itself. The bytes in question are always initialized in that sense. The check above is about whether they are initialized in the emulated interpreter state, i.e., whether the interpreted program initialized them.

Member Author commented:

Happy to edit it! I didn't find any obvious guarantee that the interpreter always initializes backing allocations before passing them around (at minimum, profiling suggests that isn't happening for the destination buffer, so wouldn't it be bad to read it at type u8 here?).

I would have expected that the emulated interpreter state having the bytes initialized implies the interpreter's own state also has them initialized.

Member commented:

The u8 buffer backing interpreter allocations is always initialized. It has type u8 rather than MaybeUninit<u8>, so documenting that seems redundant.
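
To illustrate the type-level point being made (editorial example, not from the thread): a `[u8]` buffer is initialized by construction, and only a `[MaybeUninit<u8>]` buffer can legally hold uninitialized bytes:

use std::mem::MaybeUninit;

fn initialized_by_type() {
    // `Box<[u8]>` can only be built from initialized bytes; reading from it
    // never requires `unsafe`.
    let zeroed: Box<[u8]> = vec![0u8; 16].into_boxed_slice();
    let _first: u8 = zeroed[0];

    // `Box<[MaybeUninit<u8>]>` is where genuinely uninitialized memory lives;
    // every read must go through an explicit `assume_init` promise, and doing
    // so before anything was written would be UB.
    let raw: Box<[MaybeUninit<u8>]> = Box::new_uninit_slice(16);
    let _ = raw;
}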

Member commented:

Profiling seems to be misleading then. I think we are calling calloc (via try_new_zeroed_slice), which might do the zero-init via efficient copy-on-write tricks or the like.

Member Author commented:

Perhaps! I'm 99% sure we're not touching every byte until we hit this code. I'll look into changing some things here, then.

Member commented:

New allocations get created here:

    fn uninit_inner<R>(size: Size, align: Align, fail: impl FnOnce() -> R) -> Result<Self, R> {
        // We raise an error if we cannot create the allocation on the host.
        // This results in an error that can happen non-deterministically, since the memory
        // available to the compiler can change between runs. Normally queries are always
        // deterministic. However, we can be non-deterministic here because all uses of const
        // evaluation (including ConstProp!) will make compilation fail (via hard error
        // or ICE) upon encountering a `MemoryExhausted` error.
        let bytes = Bytes::zeroed(size, align).ok_or_else(fail)?;

        Ok(Allocation {
            bytes,
            provenance: ProvenanceMap::new(),
            init_mask: InitMask::new(size, false),
            align,
            mutability: Mutability::Mut,
            extra: (),
        })
    }

    /// Try to create an Allocation of `size` bytes, failing if there is not enough memory
    /// available to the compiler to do so.
    pub fn try_uninit<'tcx>(size: Size, align: Align) -> InterpResult<'tcx, Self> {
        Self::uninit_inner(size, align, || {
            ty::tls::with(|tcx| tcx.dcx().delayed_bug("exhausted memory during interpretation"));
            InterpError::ResourceExhaustion(ResourceExhaustionInfo::MemoryExhausted).into()
        })
    }

    /// Try to create an Allocation of `size` bytes, panics if there is not enough memory
    /// available to the compiler to do so.
    ///
    /// Example use case: To obtain an Allocation filled with specific data,
    /// first call this function and then call write_scalar to fill in the right data.
    pub fn uninit(size: Size, align: Align) -> Self {
        match Self::uninit_inner(size, align, || {
            panic!("Allocation::uninit called with panic_on_fail had allocation failure");
        }) {
            Ok(x) => x,
            Err(x) => x,
        }
    }

That ends up calling this:

    fn zeroed(size: Size, _align: Align) -> Option<Self> {
        let bytes = Box::<[u8]>::try_new_zeroed_slice(size.bytes_usize()).ok()?;
        // SAFETY: the box was zero-allocated, which is a valid initial value for Box<[u8]>
        let bytes = unsafe { bytes.assume_init() };
        Some(bytes)
    }

I am 100% sure that all these u8 are initialized.

+            let value = *src_bytes;
Member Author commented:

I think this is OK. We've checked above that the bytes are initialized (`if !init.no_bytes_init() {`), so reading the byte should be safe.

+            dest_bytes.write_bytes(value, (size * num_copies).bytes_usize());
+        } else if src_alloc_id == dest_alloc_id {
+            let mut dest_ptr = dest_bytes;
+            for _ in 0..num_copies {
+                ptr::copy(src_bytes, dest_ptr, size_in_bytes);
+                dest_ptr = dest_ptr.add(size_in_bytes);
+            }
         } else {
-            for i in 0..num_copies {
-                ptr::copy_nonoverlapping(
-                    src_bytes,
-                    dest_bytes.add((size * i).bytes_usize()), // `Size` multiplication
-                    size.bytes_usize(),
-                );
+            let mut dest_ptr = dest_bytes;
+            for _ in 0..num_copies {
+                ptr::copy_nonoverlapping(src_bytes, dest_ptr, size_in_bytes);
+                dest_ptr = dest_ptr.add(size_in_bytes);
             }
         }
     }
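
To make the effect concrete, an editorial example of the workloads this PR targets (illustrative only; no specific numbers are claimed): const evaluation of large array-repeat expressions, where a 1-byte element now becomes a single memset while multi-byte elements take the tightened per-element copy loop.

// One initialized byte, repeated: eligible for the new memset fast path.
const FILLED: [u8; 1 << 20] = [0x2A; 1 << 20];

// Multi-byte element: still one memcpy per element, but now a tight loop
// with the element size and destination pointer hoisted out.
const WORDS: [u32; 1 << 20] = [0xDEAD_BEEF; 1 << 20];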