/build/source/nativelink-util/src/fs.rs
Line | Count | Source |
1 | | // Copyright 2024 The NativeLink Authors. All rights reserved. |
2 | | // |
3 | | // Licensed under the Apache License, Version 2.0 (the "License"); |
4 | | // you may not use this file except in compliance with the License. |
5 | | // You may obtain a copy of the License at |
6 | | // |
7 | | // http://www.apache.org/licenses/LICENSE-2.0 |
8 | | // |
9 | | // Unless required by applicable law or agreed to in writing, software |
10 | | // distributed under the License is distributed on an "AS IS" BASIS, |
11 | | // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
12 | | // See the License for the specific language governing permissions and |
13 | | // limitations under the License. |
14 | | |
15 | | use std::fs::Metadata; |
16 | | use std::io::{IoSlice, Seek}; |
17 | | use std::path::{Path, PathBuf}; |
18 | | use std::pin::Pin; |
19 | | use std::sync::atomic::{AtomicUsize, Ordering}; |
20 | | use std::task::{Context, Poll}; |
21 | | |
22 | | use nativelink_error::{make_err, Code, Error, ResultExt}; |
23 | | use rlimit::increase_nofile_limit; |
24 | | /// We wrap all `tokio::fs` items in our own wrapper so we can limit the number of outstanding |
25 | | /// open files at any given time. This will greatly reduce the chance we'll hit open file limit |
26 | | /// issues. |
27 | | pub use tokio::fs::DirEntry; |
28 | | use tokio::io::{AsyncRead, AsyncReadExt, AsyncSeek, AsyncWrite, ReadBuf, SeekFrom, Take}; |
29 | | use tokio::sync::{Semaphore, SemaphorePermit}; |
30 | | use tracing::{event, Level}; |
31 | | |
32 | | use crate::spawn_blocking; |
33 | | |
/// Default size, in bytes, of the buffer used when reading to/from disk (16 KiB).
pub const DEFAULT_READ_BUFF_SIZE: usize = 16 * 1024;
36 | | |
37 | | #[derive(Debug)] |
38 | | pub struct FileSlot { |
39 | | // We hold the permit because once it is dropped it goes back into the queue. |
40 | | _permit: SemaphorePermit<'static>, |
41 | | inner: tokio::fs::File, |
42 | | } |
43 | | |
44 | | impl AsRef<tokio::fs::File> for FileSlot { |
45 | 112 | fn as_ref(&self) -> &tokio::fs::File { |
46 | 112 | &self.inner |
47 | 112 | } |
48 | | } |
49 | | |
50 | | impl AsMut<tokio::fs::File> for FileSlot { |
51 | 2 | fn as_mut(&mut self) -> &mut tokio::fs::File { |
52 | 2 | &mut self.inner |
53 | 2 | } |
54 | | } |
55 | | |
56 | | impl AsyncRead for FileSlot { |
57 | 2.52k | fn poll_read( |
58 | 2.52k | mut self: Pin<&mut Self>, |
59 | 2.52k | cx: &mut Context<'_>, |
60 | 2.52k | buf: &mut ReadBuf<'_>, |
61 | 2.52k | ) -> Poll<Result<(), tokio::io::Error>> { |
62 | 2.52k | Pin::new(&mut self.inner).poll_read(cx, buf) |
63 | 2.52k | } |
64 | | } |
65 | | |
66 | | impl AsyncSeek for FileSlot { |
67 | 23 | fn start_seek(mut self: Pin<&mut Self>, position: SeekFrom) -> Result<(), tokio::io::Error> { |
68 | 23 | Pin::new(&mut self.inner).start_seek(position) |
69 | 23 | } |
70 | | |
71 | 68 | fn poll_complete( |
72 | 68 | mut self: Pin<&mut Self>, |
73 | 68 | cx: &mut Context<'_>, |
74 | 68 | ) -> Poll<Result<u64, tokio::io::Error>> { |
75 | 68 | Pin::new(&mut self.inner).poll_complete(cx) |
76 | 68 | } |
77 | | } |
78 | | |
79 | | impl AsyncWrite for FileSlot { |
80 | 2 | fn poll_write( |
81 | 2 | mut self: Pin<&mut Self>, |
82 | 2 | cx: &mut Context<'_>, |
83 | 2 | buf: &[u8], |
84 | 2 | ) -> Poll<Result<usize, tokio::io::Error>> { |
85 | 2 | Pin::new(&mut self.inner).poll_write(cx, buf) |
86 | 2 | } |
87 | | |
88 | 0 | fn poll_flush( |
89 | 0 | mut self: Pin<&mut Self>, |
90 | 0 | cx: &mut Context<'_>, |
91 | 0 | ) -> Poll<Result<(), tokio::io::Error>> { |
92 | 0 | Pin::new(&mut self.inner).poll_flush(cx) |
93 | 0 | } |
94 | | |
95 | 0 | fn poll_shutdown( |
96 | 0 | mut self: Pin<&mut Self>, |
97 | 0 | cx: &mut Context<'_>, |
98 | 0 | ) -> Poll<Result<(), tokio::io::Error>> { |
99 | 0 | Pin::new(&mut self.inner).poll_shutdown(cx) |
100 | 0 | } |
101 | | |
102 | 75 | fn poll_write_vectored( |
103 | 75 | mut self: Pin<&mut Self>, |
104 | 75 | cx: &mut Context<'_>, |
105 | 75 | bufs: &[IoSlice<'_>], |
106 | 75 | ) -> Poll<Result<usize, tokio::io::Error>> { |
107 | 75 | Pin::new(&mut self.inner).poll_write_vectored(cx, bufs) |
108 | 75 | } |
109 | | |
110 | 75 | fn is_write_vectored(&self) -> bool { |
111 | 75 | self.inner.is_write_vectored() |
112 | 75 | } |
113 | | } |
114 | | |
115 | | // Note: If the default changes make sure you update the documentation in |
116 | | // `config/cas_server.rs`. |
117 | | pub const DEFAULT_OPEN_FILE_LIMIT: usize = 24 * 1024; // 24k. |
118 | | static OPEN_FILE_LIMIT: AtomicUsize = AtomicUsize::new(DEFAULT_OPEN_FILE_LIMIT); |
119 | | pub static OPEN_FILE_SEMAPHORE: Semaphore = Semaphore::const_new(DEFAULT_OPEN_FILE_LIMIT); |
120 | | |
121 | | /// Try to acquire a permit from the open file semaphore. |
122 | | #[inline] |
123 | 25.3k | pub async fn get_permit() -> Result<SemaphorePermit<'static>, Error> { |
124 | 25.3k | OPEN_FILE_SEMAPHORE |
125 | 25.3k | .acquire() |
126 | 25.3k | .await |
127 | 25.3k | .map_err(|e| make_err!(Code::Internal, "Open file semaphore closed {:?}", e)0 ) |
128 | 25.3k | } |
129 | | /// Acquire a permit from the open file semaphore and call a raw function. |
130 | | #[inline] |
131 | 736 | pub async fn call_with_permit<F, T>(f: F) -> Result<T, Error> |
132 | 736 | where |
133 | 736 | F: FnOnce(SemaphorePermit<'static>) -> Result<T, Error> + Send + 'static, |
134 | 736 | T: Send + 'static, |
135 | 736 | { |
136 | 736 | let permit = get_permit().await?0 ; |
137 | 736 | spawn_blocking!("fs_call_with_permit", move || f(permit)) |
138 | 736 | .await |
139 | 734 | .unwrap_or_else(|e| Err(make_err!(Code::Internal, "background task failed: {e:?}"))0 ) |
140 | 734 | } |
141 | | |
142 | | /// Sets the soft nofile limit to `desired_open_file_limit` and adjusts |
143 | | /// `OPEN_FILE_SEMAPHORE` accordingly. |
144 | | /// |
145 | | /// # Panics |
146 | | /// |
147 | | /// If any type conversion fails. This can't happen if `usize` is smaller than |
148 | | /// `u64`. |
149 | 0 | pub fn set_open_file_limit(desired_open_file_limit: usize) { |
150 | 0 | let new_open_file_limit = { |
151 | 0 | match increase_nofile_limit( |
152 | 0 | u64::try_from(desired_open_file_limit) |
153 | 0 | .expect("desired_open_file_limit is too large to convert to u64."), |
154 | 0 | ) { |
155 | 0 | Ok(open_file_limit) => { |
156 | 0 | event!( |
157 | 0 | Level::INFO, |
158 | 0 | "set_open_file_limit() assigns new open file limit {open_file_limit}.", |
159 | | ); |
160 | 0 | usize::try_from(open_file_limit) |
161 | 0 | .expect("open_file_limit is too large to convert to usize.") |
162 | | } |
163 | 0 | Err(e) => { |
164 | 0 | event!( |
165 | 0 | Level::ERROR, |
166 | 0 | "set_open_file_limit() failed to assign open file limit. Maybe system does not have ulimits, continuing anyway. - {e:?}", |
167 | | ); |
168 | 0 | DEFAULT_OPEN_FILE_LIMIT |
169 | | } |
170 | | } |
171 | | }; |
172 | | // TODO(jaroeichler): Can we give a better estimate? |
173 | 0 | if new_open_file_limit < DEFAULT_OPEN_FILE_LIMIT { Branch (173:8): [True: 0, False: 0]
Branch (173:8): [Folded - Ignored]
|
174 | 0 | event!( |
175 | 0 | Level::WARN, |
176 | 0 | "The new open file limit ({new_open_file_limit}) is below the recommended value of {DEFAULT_OPEN_FILE_LIMIT}. Consider raising max_open_files.", |
177 | | ); |
178 | 0 | } |
179 | | |
180 | | // Use only 80% of the open file limit for permits from OPEN_FILE_SEMAPHORE |
181 | | // to give extra room for other file descriptors like sockets, pipes, and |
182 | | // other things. |
183 | 0 | let reduced_open_file_limit = new_open_file_limit.saturating_sub(new_open_file_limit / 5); |
184 | 0 | let previous_open_file_limit = OPEN_FILE_LIMIT.load(Ordering::Acquire); |
185 | 0 | // No permit should be aquired yet, so this warning should not occur. |
186 | 0 | if (OPEN_FILE_SEMAPHORE.available_permits() + reduced_open_file_limit) Branch (186:8): [True: 0, False: 0]
Branch (186:8): [Folded - Ignored]
|
187 | 0 | < previous_open_file_limit |
188 | | { |
189 | 0 | event!( |
190 | 0 | Level::WARN, |
191 | 0 | "There are not enough available permits to remove {previous_open_file_limit} - {reduced_open_file_limit} permits.", |
192 | | ); |
193 | 0 | } |
194 | 0 | if previous_open_file_limit <= reduced_open_file_limit { Branch (194:8): [True: 0, False: 0]
Branch (194:8): [Folded - Ignored]
|
195 | 0 | OPEN_FILE_LIMIT.fetch_add( |
196 | 0 | reduced_open_file_limit - previous_open_file_limit, |
197 | 0 | Ordering::Release, |
198 | 0 | ); |
199 | 0 | OPEN_FILE_SEMAPHORE.add_permits(reduced_open_file_limit - previous_open_file_limit); |
200 | 0 | } else { |
201 | 0 | OPEN_FILE_LIMIT.fetch_sub( |
202 | 0 | previous_open_file_limit - reduced_open_file_limit, |
203 | 0 | Ordering::Release, |
204 | 0 | ); |
205 | 0 | OPEN_FILE_SEMAPHORE.forget_permits(previous_open_file_limit - reduced_open_file_limit); |
206 | 0 | } |
207 | 0 | } |
208 | | |
209 | 13 | pub fn get_open_files_for_test() -> usize { |
210 | 13 | OPEN_FILE_LIMIT.load(Ordering::Acquire) - OPEN_FILE_SEMAPHORE.available_permits() |
211 | 13 | } |
212 | | |
213 | 60 | pub async fn open_file( |
214 | 60 | path: impl AsRef<Path>, |
215 | 60 | start: u64, |
216 | 60 | limit: u64, |
217 | 60 | ) -> Result<Take<FileSlot>, Error> { |
218 | 60 | let path = path.as_ref().to_owned(); |
219 | 60 | let (permit, os_file58 ) = call_with_permit(move |permit| { |
220 | 58 | let mut os_file = |
221 | 60 | std::fs::File::open(&path).err_tip(|| format!("Could not open {path:?}")2 )?2 ; |
222 | 58 | if start > 0 { Branch (222:12): [True: 0, False: 0]
Branch (222:12): [Folded - Ignored]
Branch (222:12): [True: 0, False: 1]
Branch (222:12): [True: 0, False: 2]
Branch (222:12): [True: 0, False: 4]
Branch (222:12): [True: 0, False: 6]
Branch (222:12): [True: 0, False: 0]
Branch (222:12): [Folded - Ignored]
Branch (222:12): [True: 0, False: 0]
Branch (222:12): [True: 0, False: 38]
Branch (222:12): [True: 0, False: 3]
Branch (222:12): [True: 0, False: 4]
|
223 | 0 | os_file |
224 | 0 | .seek(std::io::SeekFrom::Start(start)) |
225 | 0 | .err_tip(|| format!("Could not seek to {start} in {path:?}"))?; |
226 | 58 | } |
227 | 58 | Ok((permit, os_file)) |
228 | 60 | }) |
229 | 60 | .await?2 ; |
230 | 58 | Ok(FileSlot { |
231 | 58 | _permit: permit, |
232 | 58 | inner: tokio::fs::File::from_std(os_file), |
233 | 58 | } |
234 | 58 | .take(limit)) |
235 | 60 | } |
236 | | |
237 | 112 | pub async fn create_file(path: impl AsRef<Path>) -> Result<FileSlot, Error> { |
238 | 112 | let path = path.as_ref().to_owned(); |
239 | 112 | let (permit, os_file) = call_with_permit(move |permit| { |
240 | 112 | Ok(( |
241 | 112 | permit, |
242 | 112 | std::fs::File::options() |
243 | 112 | .read(true) |
244 | 112 | .write(true) |
245 | 112 | .create(true) |
246 | 112 | .truncate(true) |
247 | 112 | .open(&path) |
248 | 112 | .err_tip(|| format!("Could not open {path:?}")0 )?0 , |
249 | | )) |
250 | 112 | }) |
251 | 112 | .await?0 ; |
252 | 112 | Ok(FileSlot { |
253 | 112 | _permit: permit, |
254 | 112 | inner: tokio::fs::File::from_std(os_file), |
255 | 112 | }) |
256 | 112 | } |
257 | | |
258 | 4 | pub async fn hard_link(src: impl AsRef<Path>, dst: impl AsRef<Path>) -> Result<(), Error> { |
259 | 4 | let src = src.as_ref().to_owned(); |
260 | 4 | let dst = dst.as_ref().to_owned(); |
261 | 4 | call_with_permit(move |_| std::fs::hard_link(src, dst).map_err(Into::<Error>::into)).await |
262 | 4 | } |
263 | | |
264 | 1 | pub async fn set_permissions( |
265 | 1 | src: impl AsRef<Path>, |
266 | 1 | perm: std::fs::Permissions, |
267 | 1 | ) -> Result<(), Error> { |
268 | 1 | let src = src.as_ref().to_owned(); |
269 | 1 | call_with_permit(move |_| std::fs::set_permissions(src, perm).map_err(Into::<Error>::into)) |
270 | 1 | .await |
271 | 1 | } |
272 | | |
273 | 38 | pub async fn create_dir(path: impl AsRef<Path>) -> Result<(), Error> { |
274 | 38 | let path = path.as_ref().to_owned(); |
275 | 38 | call_with_permit(move |_| std::fs::create_dir(path).map_err(Into::<Error>::into)).await |
276 | 38 | } |
277 | | |
278 | 197 | pub async fn create_dir_all(path: impl AsRef<Path>) -> Result<(), Error> { |
279 | 197 | let path = path.as_ref().to_owned(); |
280 | 197 | call_with_permit(move |_| std::fs::create_dir_all(path).map_err(Into::<Error>::into)).await |
281 | 197 | } |
282 | | |
283 | | #[cfg(target_family = "unix")] |
284 | 1 | pub async fn symlink(src: impl AsRef<Path>, dst: impl AsRef<Path>) -> Result<(), Error> { |
285 | 1 | let src = src.as_ref().to_owned(); |
286 | 1 | let dst = dst.as_ref().to_owned(); |
287 | 1 | call_with_permit(move |_| { |
288 | 1 | tokio::runtime::Handle::current() |
289 | 1 | .block_on(tokio::fs::symlink(src, dst)) |
290 | 1 | .map_err(Into::<Error>::into) |
291 | 1 | }) |
292 | 1 | .await |
293 | 1 | } |
294 | | |
295 | 2 | pub async fn read_link(path: impl AsRef<Path>) -> Result<std::path::PathBuf, Error> { |
296 | 2 | let path = path.as_ref().to_owned(); |
297 | 2 | call_with_permit(move |_| std::fs::read_link(path).map_err(Into::<Error>::into)).await |
298 | 2 | } |
299 | | |
300 | | pub struct ReadDir { |
301 | | // We hold the permit because once it is dropped it goes back into the queue. |
302 | | permit: SemaphorePermit<'static>, |
303 | | inner: tokio::fs::ReadDir, |
304 | | } |
305 | | |
306 | | impl ReadDir { |
307 | 220 | pub fn into_inner(self) -> (SemaphorePermit<'static>, tokio::fs::ReadDir) { |
308 | 220 | (self.permit, self.inner) |
309 | 220 | } |
310 | | } |
311 | | |
312 | | impl AsRef<tokio::fs::ReadDir> for ReadDir { |
313 | 0 | fn as_ref(&self) -> &tokio::fs::ReadDir { |
314 | 0 | &self.inner |
315 | 0 | } |
316 | | } |
317 | | |
318 | | impl AsMut<tokio::fs::ReadDir> for ReadDir { |
319 | 2 | fn as_mut(&mut self) -> &mut tokio::fs::ReadDir { |
320 | 2 | &mut self.inner |
321 | 2 | } |
322 | | } |
323 | | |
324 | 222 | pub async fn read_dir(path: impl AsRef<Path>) -> Result<ReadDir, Error> { |
325 | 222 | let path = path.as_ref().to_owned(); |
326 | 222 | let (permit, inner) = call_with_permit(move |permit| { |
327 | 222 | Ok(( |
328 | 222 | permit, |
329 | 222 | tokio::runtime::Handle::current() |
330 | 222 | .block_on(tokio::fs::read_dir(path)) |
331 | 222 | .map_err(Into::<Error>::into)?0 , |
332 | | )) |
333 | 222 | }) |
334 | 222 | .await?0 ; |
335 | 222 | Ok(ReadDir { permit, inner }) |
336 | 222 | } |
337 | | |
338 | 27 | pub async fn rename(from: impl AsRef<Path>, to: impl AsRef<Path>) -> Result<(), Error> { |
339 | 27 | let from = from.as_ref().to_owned(); |
340 | 27 | let to = to.as_ref().to_owned(); |
341 | 27 | call_with_permit(move |_| std::fs::rename(from, to).map_err(Into::<Error>::into)).await |
342 | 27 | } |
343 | | |
344 | 25 | pub async fn remove_file(path: impl AsRef<Path>) -> Result<(), Error> { |
345 | 25 | let path = path.as_ref().to_owned(); |
346 | 25 | call_with_permit(move |_| std::fs::remove_file(path).map_err(Into::<Error>::into)).await |
347 | 23 | } |
348 | | |
349 | 2 | pub async fn canonicalize(path: impl AsRef<Path>) -> Result<PathBuf, Error> { |
350 | 2 | let path = path.as_ref().to_owned(); |
351 | 2 | call_with_permit(move |_| std::fs::canonicalize(path).map_err(Into::<Error>::into)).await |
352 | 2 | } |
353 | | |
354 | 16 | pub async fn metadata(path: impl AsRef<Path>) -> Result<Metadata, Error> { |
355 | 16 | let path = path.as_ref().to_owned(); |
356 | 16 | call_with_permit(move |_| std::fs::metadata(path).map_err(Into::<Error>::into)).await |
357 | 16 | } |
358 | | |
359 | 4 | pub async fn read(path: impl AsRef<Path>) -> Result<Vec<u8>, Error> { |
360 | 4 | let path = path.as_ref().to_owned(); |
361 | 4 | call_with_permit(move |_| std::fs::read(path).map_err(Into::<Error>::into)).await |
362 | 4 | } |
363 | | |
364 | 8 | pub async fn symlink_metadata(path: impl AsRef<Path>) -> Result<Metadata, Error> { |
365 | 8 | let path = path.as_ref().to_owned(); |
366 | 8 | call_with_permit(move |_| std::fs::symlink_metadata(path).map_err(Into::<Error>::into)).await |
367 | 8 | } |
368 | | |
369 | 17 | pub async fn remove_dir_all(path: impl AsRef<Path>) -> Result<(), Error> { |
370 | 17 | let path = path.as_ref().to_owned(); |
371 | 17 | call_with_permit(move |_| std::fs::remove_dir_all(path).map_err(Into::<Error>::into)).await |
372 | 17 | } |