pict-rs/src/file.rs

458 lines
13 KiB
Rust
Raw Normal View History

2021-10-14 00:06:53 +00:00
use futures_util::stream::Stream;
use std::{
pin::Pin,
task::{Context, Poll},
};
2021-10-13 04:16:31 +00:00
#[cfg(feature = "io-uring")]
pub(crate) use io_uring::File;
#[cfg(not(feature = "io-uring"))]
2021-10-14 00:06:53 +00:00
pub(crate) use tokio_file::File;
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
/// Stream adapter that converts the error half of every item yielded by the
/// wrapped stream into `crate::error::Error`.
struct CrateError<S>(S);

impl<T, E, S> Stream for CrateError<S>
where
    S: Stream<Item = Result<T, E>> + Unpin,
    crate::error::Error: From<E>,
{
    type Item = Result<T, crate::error::Error>;

    /// Polls the wrapped stream and passes its state through unchanged, except
    /// that an `Err` item is converted with `Into`.
    fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Option<Self::Item>> {
        match Pin::new(&mut self.0).poll_next(cx) {
            Poll::Pending => Poll::Pending,
            Poll::Ready(None) => Poll::Ready(None),
            Poll::Ready(Some(Ok(item))) => Poll::Ready(Some(Ok(item))),
            Poll::Ready(Some(Err(source))) => Poll::Ready(Some(Err(source.into()))),
        }
    }
}
#[cfg(not(feature = "io-uring"))]
mod tokio_file {
use crate::Either;
use actix_web::web::{Bytes, BytesMut};
use futures_util::stream::Stream;
use std::{fs::Metadata, io::SeekFrom, path::Path};
use tokio::io::{AsyncRead, AsyncReadExt, AsyncSeekExt, AsyncWrite, AsyncWriteExt};
use tokio_util::codec::{BytesCodec, FramedRead};
/// File handle that wraps a `tokio::fs::File`.
///
/// The enclosing module is only compiled when the `io-uring` feature is
/// disabled.
pub(crate) struct File {
// The tokio file every method of this type delegates to.
inner: tokio::fs::File,
}
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
impl File {
/// Opens the file at `path` with `tokio::fs::File::open` and wraps the handle.
///
/// # Errors
/// Returns the `std::io::Error` reported by tokio when the open fails.
pub(crate) async fn open(path: impl AsRef<Path>) -> std::io::Result<Self> {
    let inner = tokio::fs::File::open(path).await?;

    Ok(File { inner })
}
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
/// Creates the file at `path` with `tokio::fs::File::create` and wraps the
/// handle.
///
/// # Errors
/// Returns the `std::io::Error` reported by tokio when the create fails.
pub(crate) async fn create(path: impl AsRef<Path>) -> std::io::Result<Self> {
    let inner = tokio::fs::File::create(path).await?;

    Ok(File { inner })
}
/// Returns the metadata of the wrapped file by delegating to
/// `tokio::fs::File::metadata` on the open handle.
///
/// # Errors
/// Returns the `std::io::Error` produced by that call.
pub(crate) async fn metadata(&self) -> std::io::Result<Metadata> {
self.inner.metadata().await
}
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
/// Writes every byte of `bytes` to the file and waits for the write to
/// complete.
///
/// # Errors
/// Returns the `std::io::Error` from the write itself or from the flush that
/// follows it.
pub(crate) async fn write_from_bytes<'a>(
    &'a mut self,
    mut bytes: Bytes,
) -> std::io::Result<()> {
    self.inner.write_all_buf(&mut bytes).await?;

    // `tokio::fs::File` hands writes to a background task, so a write can
    // return before the data has reached the file. Flushing waits for that
    // work to finish and surfaces its error instead of losing it when the
    // handle is dropped.
    self.inner.flush().await?;

    Ok(())
}
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
/// Copies everything `reader` produces into the file using `tokio::io::copy`.
///
/// The number of bytes copied is discarded.
///
/// # Errors
/// Returns the `std::io::Error` reported by the copy.
pub(crate) async fn write_from_async_read<'a, R>(
    &'a mut self,
    mut reader: R,
) -> std::io::Result<()>
where
    R: AsyncRead + Unpin,
{
    tokio::io::copy(&mut reader, &mut self.inner)
        .await
        .map(|_copied| ())
}
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
/// Copies the file's contents, from its current position, into `writer` using
/// `tokio::io::copy`.
///
/// The number of bytes copied is discarded.
///
/// # Errors
/// Returns the `std::io::Error` reported by the copy.
pub(crate) async fn read_to_async_write<'a, W>(
    &'a mut self,
    writer: &'a mut W,
) -> std::io::Result<()>
where
    W: AsyncWrite + Unpin,
{
    let _copied = tokio::io::copy(&mut self.inner, writer).await?;

    Ok(())
}
/// Consumes the file and turns it into a stream of `Bytes` chunks.
///
/// * `from_start` - when set, the file is first seeked to this absolute offset.
/// * `len` - when set, the stream is limited to at most this many bytes.
///
/// # Errors
/// Fails if the seek fails; read errors are reported as stream items.
pub(crate) async fn read_to_stream(
    mut self,
    from_start: Option<u64>,
    len: Option<u64>,
) -> Result<
    impl Stream<Item = Result<Bytes, crate::error::Error>> + Unpin,
    crate::error::Error,
> {
    // Position the handle first; the length limit is independent of the seek.
    if let Some(offset) = from_start {
        self.inner.seek(SeekFrom::Start(offset)).await?;
    }

    // Both arms need one concrete reader type, hence `Either`.
    let source = match len {
        Some(limit) => Either::Left(self.inner.take(limit)),
        None => Either::Right(self.inner),
    };

    let frames = FramedRead::new(source, BytesCodec::new());

    Ok(super::CrateError(BytesFreezer(frames)))
}
2021-10-13 04:16:31 +00:00
}
2021-10-14 00:06:53 +00:00
/// Stream adapter that turns every `BytesMut` chunk of the wrapped stream into
/// an immutable `Bytes` by freezing it.
struct BytesFreezer<S>(S);

impl<S, E> Stream for BytesFreezer<S>
where
    S: Stream<Item = Result<BytesMut, E>> + Unpin,
{
    type Item = Result<Bytes, E>;

    /// Polls the wrapped stream; `Ok` chunks are frozen, everything else is
    /// forwarded untouched.
    fn poll_next(
        mut self: std::pin::Pin<&mut Self>,
        cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Option<Self::Item>> {
        use std::task::Poll;

        match std::pin::Pin::new(&mut self.0).poll_next(cx) {
            Poll::Ready(Some(Ok(chunk))) => Poll::Ready(Some(Ok(chunk.freeze()))),
            Poll::Ready(Some(Err(err))) => Poll::Ready(Some(Err(err))),
            Poll::Ready(None) => Poll::Ready(None),
            Poll::Pending => Poll::Pending,
        }
    }
}
2021-10-14 00:06:53 +00:00
}
#[cfg(feature = "io-uring")]
mod io_uring {
use actix_web::web::Bytes;
use futures_util::stream::Stream;
use std::{
convert::TryInto,
fs::Metadata,
future::Future,
path::{Path, PathBuf},
pin::Pin,
task::{Context, Poll},
};
use tokio::io::{AsyncRead, AsyncReadExt, AsyncWrite, AsyncWriteExt};
use tokio_uring::{
2021-10-14 00:50:07 +00:00
buf::{IoBuf, IoBufMut},
2021-10-14 00:06:53 +00:00
BufResult,
};
2021-10-13 04:16:31 +00:00
pub(crate) struct File {
path: PathBuf,
2021-10-14 00:06:53 +00:00
inner: tokio_uring::fs::File,
2021-10-13 04:16:31 +00:00
}
impl File {
pub(crate) async fn open(path: impl AsRef<Path>) -> std::io::Result<Self> {
tracing::info!("Opening io-uring file");
Ok(File {
path: path.as_ref().to_owned(),
2021-10-14 00:06:53 +00:00
inner: tokio_uring::fs::File::open(path).await?,
2021-10-13 04:16:31 +00:00
})
}
pub(crate) async fn create(path: impl AsRef<Path>) -> std::io::Result<Self> {
tracing::info!("Creating io-uring file");
Ok(File {
path: path.as_ref().to_owned(),
2021-10-14 00:06:53 +00:00
inner: tokio_uring::fs::File::create(path).await?,
2021-10-13 04:16:31 +00:00
})
}
/// Returns metadata for the path this file was opened or created with.
///
/// The lookup goes through `tokio::fs::metadata` on the stored path rather
/// than through the open io-uring handle, so it describes whatever is at that
/// path at the time of the call.
///
/// # Errors
/// Returns the `std::io::Error` produced by that call.
pub(crate) async fn metadata(&self) -> std::io::Result<Metadata> {
tokio::fs::metadata(&self.path).await
}
2021-10-14 00:06:53 +00:00
/// Writes every byte of `bytes` to the file starting at offset 0, then syncs
/// the file.
///
/// The bytes are copied into a `Vec` because the buffer is handed to the
/// positional write and returned afterwards.
///
/// # Errors
/// Returns the write or sync error, or `UnexpectedEof` when a write reports
/// zero bytes written before everything has been written.
pub(crate) async fn write_from_bytes<'a>(
    &'a mut self,
    bytes: Bytes,
) -> std::io::Result<()> {
    let mut buf = bytes.to_vec();
    let total = buf.len();
    let mut written: usize = 0;

    // A single write may be partial, so keep writing the unwritten tail.
    while written < total {
        let offset: u64 = written.try_into().unwrap();

        let (res, slice) = self.inner.write_at(buf.slice(written..), offset).await;
        let n: usize = res?;

        if n == 0 {
            return Err(std::io::ErrorKind::UnexpectedEof.into());
        }

        // Take the buffer back out of the slice for the next round.
        buf = slice.into_inner();
        written += n;
    }

    self.inner.sync_all().await?;

    Ok(())
}
2021-10-14 00:06:53 +00:00
pub(crate) async fn write_from_async_read<'a, R>(
&'a mut self,
mut reader: R,
) -> std::io::Result<()>
where
R: AsyncRead + Unpin,
{
let mut cursor: u64 = 0;
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
loop {
2021-10-14 00:50:07 +00:00
let max_size = 65_536;
2021-10-14 00:06:53 +00:00
let mut buf = Vec::with_capacity(max_size.try_into().unwrap());
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
let n = (&mut reader).take(max_size).read_to_end(&mut buf).await?;
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
if n == 0 {
break;
2021-10-13 04:16:31 +00:00
}
2021-10-14 00:06:53 +00:00
let mut position = 0;
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
loop {
2021-10-14 00:50:07 +00:00
if position == n {
2021-10-14 00:06:53 +00:00
break;
2021-10-13 04:16:31 +00:00
}
2021-10-14 00:50:07 +00:00
let position_u64: u64 = position.try_into().unwrap();
let (res, slice) = self
.write_at(buf.slice(position..n), cursor + position_u64)
.await;
let n = res?;
if n == 0 {
return Err(std::io::ErrorKind::UnexpectedEof.into());
}
position += n;
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
buf = slice.into_inner();
2021-10-13 04:16:31 +00:00
}
2021-10-14 00:06:53 +00:00
let position: u64 = position.try_into().unwrap();
cursor += position;
2021-10-13 04:16:31 +00:00
}
2021-10-14 00:50:07 +00:00
self.inner.sync_all().await?;
2021-10-14 00:06:53 +00:00
Ok(())
2021-10-13 04:16:31 +00:00
}
2021-10-14 00:06:53 +00:00
pub(crate) async fn read_to_async_write<'a, W>(
&'a mut self,
writer: &mut W,
) -> std::io::Result<()>
where
W: AsyncWrite + Unpin,
{
let metadata = self.metadata().await?;
let size = metadata.len();
let mut cursor: u64 = 0;
loop {
if cursor == size {
break;
}
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
let max_size = (size - cursor).min(65_536);
let buf = Vec::with_capacity(max_size.try_into().unwrap());
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
let (res, mut buf): (_, Vec<u8>) = self.read_at(buf, cursor).await;
let n: usize = res?;
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
if n == 0 {
return Err(std::io::ErrorKind::UnexpectedEof.into());
2021-10-13 04:16:31 +00:00
}
2021-10-14 00:06:53 +00:00
writer.write_all(&mut buf[0..n]).await?;
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
let n: u64 = n.try_into().unwrap();
cursor += n;
}
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
Ok(())
2021-10-13 04:16:31 +00:00
}
2021-10-14 00:06:53 +00:00
/// Consumes the file and turns it into a stream of `Bytes` chunks.
///
/// * `from_start` - offset of the first byte to stream; defaults to 0.
/// * `len` - maximum number of bytes to stream; defaults to everything from
///   the start offset to the end of the file.
///
/// The requested range is clamped to the length reported by `metadata`. A
/// start offset at or past the end of the file therefore gives an empty
/// stream, and a `len` reaching past the end stops at the end of the file.
///
/// # Errors
/// Fails if the metadata lookup fails; read errors are reported as stream
/// items.
pub(crate) async fn read_to_stream(
    self,
    from_start: Option<u64>,
    len: Option<u64>,
) -> Result<
    impl Stream<Item = Result<Bytes, crate::error::Error>> + Unpin,
    crate::error::Error,
> {
    let file_size = self.metadata().await?.len();

    // Clamp the start so later arithmetic cannot underflow when the caller
    // asks for an offset beyond the end of the file.
    let cursor = from_start.unwrap_or(0).min(file_size);

    // Exclusive end offset. It never exceeds the file size, so the stream
    // cannot wait for bytes that do not exist, and `saturating_add` guards
    // against overflow on huge `len` values.
    let size = match len {
        Some(len) => cursor.saturating_add(len).min(file_size),
        None => file_size,
    };

    Ok(super::CrateError(BytesStream {
        file: Some(self),
        size,
        cursor,
        fut: None,
    }))
}
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
/// Reads into `buf` starting at file offset `pos` by delegating to the inner
/// io-uring file.
///
/// The buffer is returned together with the result, as the `BufResult` return
/// type shows.
async fn read_at<T: IoBufMut>(&self, buf: T, pos: u64) -> BufResult<usize, T> {
self.inner.read_at(buf, pos).await
}
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
/// Writes the contents of `buf` at file offset `pos` by delegating to the
/// inner io-uring file.
///
/// The buffer is returned together with the result, as the `BufResult` return
/// type shows.
async fn write_at<T: IoBuf>(&self, buf: T, pos: u64) -> BufResult<usize, T> {
    self.inner.write_at(buf, pos).await
}
}
2021-10-14 00:06:53 +00:00
struct BytesStream {
file: Option<File>,
size: u64,
cursor: u64,
fut: Option<Pin<Box<dyn Future<Output = (File, BufResult<usize, Vec<u8>>)>>>>,
2021-10-13 04:16:31 +00:00
}
2021-10-14 00:06:53 +00:00
impl Stream for BytesStream {
type Item = std::io::Result<Bytes>;
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Option<Self::Item>> {
let mut fut = if let Some(fut) = self.fut.take() {
fut
} else {
let file = self.file.take().unwrap();
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
if self.cursor == self.size {
return Poll::Ready(None);
2021-10-13 04:16:31 +00:00
}
2021-10-14 00:06:53 +00:00
let cursor = self.cursor;
let max_size = self.size - self.cursor;
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
Box::pin(async move {
let buf = Vec::with_capacity(max_size.try_into().unwrap());
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
let buf_res = file.read_at(buf, cursor).await;
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
(file, buf_res)
})
};
2021-10-13 04:16:31 +00:00
2021-10-14 00:06:53 +00:00
match Pin::new(&mut fut).poll(cx) {
Poll::Pending => {
self.fut = Some(fut);
Poll::Pending
2021-10-13 04:16:31 +00:00
}
2021-10-14 00:06:53 +00:00
Poll::Ready((file, (Ok(n), mut buf))) => {
self.file = Some(file);
let _ = buf.split_off(n);
let n: u64 = match n.try_into() {
Ok(n) => n,
Err(_) => return Poll::Ready(Some(Err(std::io::ErrorKind::Other.into()))),
};
self.cursor += n;
Poll::Ready(Some(Ok(Bytes::from(buf))))
}
Poll::Ready((_, (Err(e), _))) => Poll::Ready(Some(Err(e))),
2021-10-13 04:16:31 +00:00
}
}
}
2021-10-14 00:50:07 +00:00
#[cfg(test)]
mod tests {
    use std::io::Read;

    /// Runs `$fut` as a task spawned from a fresh `actix_rt::Arbiter` inside a
    /// new `actix_rt::System`, and evaluates to the task's output.
    macro_rules! test_on_arbiter {
        ($fut:expr) => {
            actix_rt::System::new().block_on(async move {
                let arbiter = actix_rt::Arbiter::new();
                let (tx, rx) = tokio::sync::oneshot::channel();

                arbiter.spawn(async move {
                    let handle = actix_rt::spawn($fut);
                    let _ = tx.send(handle.await.unwrap());
                });

                rx.await.unwrap()
            })
        };
    }

    /// Fixture copied by both tests.
    const EARTH_GIF: &str = "client-examples/earth.gif";

    /// Reads the fixture and the file at `tmp`, removes `tmp`, and then asserts
    /// that both have the same length and contents.
    fn assert_matches_fixture_and_remove(tmp: &str) {
        let mut source = std::fs::File::open(EARTH_GIF).unwrap();
        let mut dest = std::fs::File::open(tmp).unwrap();

        let mut source_vec = Vec::new();
        source.read_to_end(&mut source_vec).unwrap();

        let mut dest_vec = Vec::new();
        dest.read_to_end(&mut dest_vec).unwrap();

        // Close the handle before deleting the temporary file.
        drop(dest);
        std::fs::remove_file(tmp).unwrap();

        assert_eq!(source_vec.len(), dest_vec.len());
        assert_eq!(source_vec, dest_vec);
    }

    /// Copies the fixture out of a `super::File` into a tokio file.
    #[test]
    fn read() {
        let tmp = "/tmp/read-test";

        test_on_arbiter!(async move {
            let mut file = super::File::open(EARTH_GIF).await.unwrap();
            let mut tmp_file = tokio::fs::File::create(tmp).await.unwrap();

            file.read_to_async_write(&mut tmp_file).await.unwrap();
        });

        assert_matches_fixture_and_remove(tmp);
    }

    /// Copies the fixture from a tokio file into a `super::File`.
    #[test]
    fn write() {
        let tmp = "/tmp/write-test";

        test_on_arbiter!(async move {
            let mut file = tokio::fs::File::open(EARTH_GIF).await.unwrap();
            let mut tmp_file = super::File::create(tmp).await.unwrap();

            tmp_file.write_from_async_read(&mut file).await.unwrap();
        });

        assert_matches_fixture_and_remove(tmp);
    }
}
2021-10-13 04:16:31 +00:00
}