1// Copyright 2023 The Fuchsia Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
45use std::fs::File;
6use std::io::{self, ErrorKind, Read as _, Seek as _, SeekFrom};
7use std::path::Path;
8use tempfile::{NamedTempFile, PersistError};
910const CHUNK_SIZE: usize = 8192;
1112pub trait NamedTempFileExt {
13/// Atomically overwrite the target path if the contents are different.
14 ///
15 /// This is conceptually similar to [tempfile::NamedTempFile::persist], but
16 /// will only overwrite the target path if:
17 ///
18 /// * The target path does not exist.
19 /// * The target path has different contents than `self`.
20 ///
21 /// It will not overwrite the target path if it already exists and has the
22 /// same content.
23 ///
24 /// Either way, it will return an opened `File` for the target path.
25fn persist_if_changed<P: AsRef<Path>>(self, path: P) -> Result<File, PersistError>;
26}
2728impl NamedTempFileExt for NamedTempFile {
29fn persist_if_changed<P: AsRef<Path>>(mut self, path: P) -> Result<File, PersistError> {
30let path = path.as_ref();
3132// Open up the file and see if the contents are the same. If so, return
33 // the old file, otherwise overwrite it with the new contents.
34if let Ok(mut old_file) = File::open(&path) {
35if let Err(err) = self.seek(SeekFrom::Start(0)) {
36return Err(PersistError { error: err, file: self });
37 }
3839match files_have_same_content(self.as_file_mut(), &mut old_file) {
40Ok(true) => {
41// Since the two files have the same contents, we'll return
42 // the old one. We read from it, so reset back to the start.
43if let Err(err) = old_file.seek(SeekFrom::Start(0)) {
44return Err(PersistError { error: err, file: self });
45 }
4647return Ok(old_file);
48 }
49Ok(false) => {}
50Err(err) => {
51return Err(PersistError { error: err, file: self });
52 }
53 }
54 }
5556self.persist(path)
57 }
58}
5960/// Checks if the two files have the same contents. Returns `true` if so,
61/// otherwise `false`.
62fn files_have_same_content(lhs: &mut File, rhs: &mut File) -> io::Result<bool> {
63let lhs_metadata = lhs.metadata()?;
64let rhs_metadata = rhs.metadata()?;
6566// The files cannot have the same content if they have different lengths.
67if lhs_metadata.len() != rhs_metadata.len() {
68return Ok(false);
69 }
7071 files_after_checking_length_have_same_content(lhs, rhs)
72}
7374/// Check the contents of two files have the same contents, after we have
75/// checked they have the same length. Returns `true` if they have the same
76/// contents, `false` if not.
77///
78/// This will return `false` if the files changed length while checking.
79fn files_after_checking_length_have_same_content(
80 lhs: &mut File,
81 rhs: &mut File,
82) -> io::Result<bool> {
83let mut lhs_bytes = [0; CHUNK_SIZE];
84let mut rhs_bytes = [0; CHUNK_SIZE];
8586loop {
87// Read the next chunk.
88let lhs_len = lhs.read(&mut lhs_bytes)?;
89let lhs_bytes = &lhs_bytes[0..lhs_len];
9091if lhs_bytes.is_empty() {
92// We hit the end of `lhs`, so we'll need to check if `rhs` is also
93 // at the end of the file. We can't use `read_exact` to check for
94 // this, since it's not guaranteed to read from the file if we pass
95 // it a zero-sized slice.
96if rhs.read(&mut rhs_bytes)? == 0 {
97return Ok(true);
98 } else {
99return Ok(false);
100 }
101 }
102103// Otherwise, read the same length from the other file.
104let rhs_bytes = &mut rhs_bytes[0..lhs_len];
105match rhs.read_exact(rhs_bytes) {
106Ok(()) => {}
107Err(err) if err.kind() == ErrorKind::UnexpectedEof => {
108// The file was truncated while we were reading from it, so
109 // return that the two files are different.
110return Ok(false);
111 }
112Err(err) => {
113return Err(err);
114 }
115 }
116117// Return false if the two chunks are not the same.
118if lhs_bytes != rhs_bytes {
119return Ok(false);
120 }
121 }
122}
123124#[cfg(test)]
125mod tests {
126use super::*;
127use std::io::Write as _;
128use std::os::unix::fs::MetadataExt as _;
129use tempfile::TempDir;
130131#[test]
132fn test_persist_if_changed() {
133for size in [1, 20, CHUNK_SIZE - 1, CHUNK_SIZE, CHUNK_SIZE + 1, CHUNK_SIZE * 10] {
134let dir = TempDir::new().unwrap();
135let path = dir.path().join("file");
136137let mut body = (0..std::u8::MAX).cycle().take(size).collect::<Vec<_>>();
138139// We should persist the file if it doesn't already exist.
140let mut tmp1 = NamedTempFile::new_in(dir.path()).unwrap();
141 tmp1.write_all(&body).unwrap();
142 tmp1.persist_if_changed(&path).unwrap();
143assert_eq!(std::fs::read(&path).unwrap(), body);
144145let metadata1 = std::fs::metadata(&path).unwrap();
146147// We should not persist if the contents didn't change.
148let mut tmp2 = NamedTempFile::new_in(dir.path()).unwrap();
149 tmp2.write_all(&body).unwrap();
150 tmp2.persist_if_changed(&path).unwrap();
151assert_eq!(std::fs::read(&path).unwrap(), body);
152153// inode shouldn't change if the content doesn't change.
154let metadata2 = std::fs::metadata(&path).unwrap();
155assert_eq!(metadata1.dev(), metadata2.dev());
156assert_eq!(metadata1.ino(), metadata2.ino());
157158// We should persist if the contents changed (even though the length
159 // did not).
160*body.last_mut().unwrap() = 1;
161162let mut tmp3 = NamedTempFile::new_in(dir.path()).unwrap();
163 tmp3.write_all(&body).unwrap();
164 tmp3.persist_if_changed(&path).unwrap();
165assert_eq!(std::fs::read(&path).unwrap(), body);
166167let metadata3 = std::fs::metadata(&path).unwrap();
168assert_eq!(metadata1.dev(), metadata3.dev());
169assert_ne!(metadata1.ino(), metadata3.ino());
170171// We should persist if the contents changed length.
172body.push(2);
173174let mut tmp4 = NamedTempFile::new_in(dir.path()).unwrap();
175 tmp4.write_all(&body).unwrap();
176 tmp4.persist_if_changed(&path).unwrap();
177assert_eq!(std::fs::read(&path).unwrap(), body);
178179let metadata4 = std::fs::metadata(&path).unwrap();
180assert_eq!(metadata3.dev(), metadata4.dev());
181assert_ne!(metadata3.ino(), metadata4.ino());
182 }
183 }
184185#[test]
186fn test_files_have_same_content_same_contents() {
187let dir = TempDir::new().unwrap();
188let path1 = dir.path().join("file1");
189let path2 = dir.path().join("file2");
190191 std::fs::write(&path1, b"hello world").unwrap();
192let mut file1 = File::open(&path1).unwrap();
193194 std::fs::write(&path2, b"hello world").unwrap();
195let mut file2 = File::open(&path2).unwrap();
196197assert!(files_have_same_content(&mut file1, &mut file2).unwrap());
198 }
199200#[test]
201fn test_files_have_same_content_different_contents() {
202let dir = TempDir::new().unwrap();
203let path1 = dir.path().join("file1");
204let path2 = dir.path().join("file2");
205206 std::fs::write(&path1, b"hello world").unwrap();
207let mut file1 = File::open(&path1).unwrap();
208209 std::fs::write(&path2, b"jello world").unwrap();
210let mut file2 = File::open(&path2).unwrap();
211212assert!(!files_have_same_content(&mut file1, &mut file2).unwrap());
213 }
214215#[test]
216fn test_files_have_same_content_truncated() {
217let dir = TempDir::new().unwrap();
218let path1 = dir.path().join("file1");
219let path2 = dir.path().join("file2");
220221 std::fs::write(&path1, b"hello world").unwrap();
222let mut file1 = File::open(&path1).unwrap();
223224 std::fs::write(&path2, b"jello").unwrap();
225let mut file2 = File::open(&path2).unwrap();
226227assert!(!files_after_checking_length_have_same_content(&mut file1, &mut file2).unwrap());
228 }
229230#[test]
231fn test_files_have_same_content_too_long() {
232let dir = TempDir::new().unwrap();
233let path1 = dir.path().join("file1");
234let path2 = dir.path().join("file2");
235236 std::fs::write(&path1, b"hello world").unwrap();
237let mut file1 = File::open(&path1).unwrap();
238239 std::fs::write(&path2, b"hello world jello").unwrap();
240let mut file2 = File::open(&path2).unwrap();
241242assert!(!files_after_checking_length_have_same_content(&mut file1, &mut file2).unwrap());
243 }
244}