24#include <seastar/util/std-compat.hh>
25#include <seastar/core/coroutine.hh>
26#include <seastar/coroutine/generator.hh>
27#include <seastar/core/do_with.hh>
28#include <seastar/core/stream.hh>
29#include <seastar/core/sstring.hh>
30#include <seastar/core/shared_ptr.hh>
31#include <seastar/core/align.hh>
32#include <seastar/core/io_priority_class.hh>
33#include <seastar/core/file-types.hh>
34#include <seastar/core/circular_buffer.hh>
35#include <seastar/util/modules.hh>
37#include <sys/statvfs.h>
51SEASTAR_MODULE_EXPORT_BEGIN
61 std::optional<directory_entry_type>
type;
67 uint64_t inode_number;
70 uint64_t number_of_links;
76 uint64_t allocated_size;
78 std::chrono::system_clock::time_point time_accessed;
79 std::chrono::system_clock::time_point time_modified;
80 std::chrono::system_clock::time_point time_changed;
/// Upper bound for an extent allocation size hint: 2^31 (2 GiB if the hint is
/// in bytes — presumably it is; confirm against the code that applies it).
///
/// The shift is performed on a uint64_t operand on purpose. A plain `1 << 31`
/// is evaluated in `int`, produces INT_MIN, and sign-extends to
/// 0xFFFFFFFF80000000 when stored in this uint64_t, so the constant would no
/// longer act as a 2^31 limit.
static constexpr uint64_t max_extent_allocation_size_hint = uint64_t{1} << 31;
/// Alignment boundary for extent size hints: 128 << 10 == 131072
/// (128 KiB if the hint is in bytes).
static constexpr uint32_t min_extent_size_hint_alignment{128u << 10};
107class file_data_sink_impl;
108class file_data_source_impl;
115 virtual std::unique_ptr<file_handle_impl> clone()
const = 0;
// Per-implementation DMA limits. The `file` accessors visible in this listing
// return these fields through `_file_impl`.
// Alignment requirement for data buffers; defaults to 4096.
123 unsigned _memory_dma_alignment = 4096;
// Alignment requirement for file offsets on reads; defaults to 4096.
124 unsigned _disk_read_dma_alignment = 4096;
// Alignment requirement for file offsets on writes; defaults to 4096.
125 unsigned _disk_write_dma_alignment = 4096;
// Alignment reported for overwrites; defaults to 4096.
// NOTE(review): how an "overwrite" differs from a regular write is not visible here — confirm.
126 unsigned _disk_overwrite_dma_alignment = 4096;
// Presumably the largest length accepted for a single read; defaults to 1u << 30 (1073741824).
127 unsigned _read_max_length = 1u << 30;
// Presumably the largest length accepted for a single write; defaults to 1u << 30 (1073741824).
128 unsigned _write_max_length = 1u << 30;
132#if SEASTAR_API_LEVEL >= 7
// I/O entry points that take an io_priority_class. All four are pure virtual,
// so a concrete implementation has to provide them. The overloads declared
// next to them that additionally accept an io_intent* forward to these.
// NOTE(review): the future<size_t> result is presumably the number of bytes
// transferred — confirm against an implementation.

// Write overload taking a single buffer pointer plus a length.
139 virtual future<size_t> write_dma(uint64_t pos,
const void* buffer,
size_t len,
const io_priority_class& pc) = 0;
// Write overload taking a vector of iovec, passed by value.
140 virtual future<size_t> write_dma(uint64_t pos, std::vector<iovec> iov,
const io_priority_class& pc) = 0;
// Read overload taking a single (mutable) buffer pointer plus a length.
141 virtual future<size_t> read_dma(uint64_t pos,
void* buffer,
size_t len,
const io_priority_class& pc) = 0;
// Read overload taking a vector of iovec, passed by value.
142 virtual future<size_t> read_dma(uint64_t pos, std::vector<iovec> iov,
const io_priority_class& pc) = 0;
145 virtual future<size_t> write_dma(uint64_t pos,
const void* buffer,
size_t len,
const io_priority_class& pc,
io_intent*) {
146 return write_dma(pos, buffer, len, pc);
148 virtual future<size_t> write_dma(uint64_t pos, std::vector<iovec> iov,
const io_priority_class& pc,
io_intent*) {
149 return write_dma(pos, std::move(iov), pc);
151 virtual future<size_t> read_dma(uint64_t pos,
void* buffer,
size_t len,
const io_priority_class& pc,
io_intent*) {
152 return read_dma(pos, buffer, len, pc);
154 virtual future<size_t> read_dma(uint64_t pos, std::vector<iovec> iov,
const io_priority_class& pc,
io_intent*) {
155 return read_dma(pos, std::move(iov), pc);
158 return dma_read_bulk(offset, range_size, pc);
// Pure virtual. The matching `file::truncate` is described in this listing as
// "Truncates the file to a specified length."
164 virtual future<> truncate(uint64_t length) = 0;
// Pure virtual.
// NOTE(review): presumably discards the range starting at `offset` of size `length` — confirm.
165 virtual future<> discard(uint64_t offset, uint64_t length) = 0;
// ioctl/fcntl hooks. They are virtual but not pure and are only declared here,
// so their default definitions live outside this view. All four are noexcept
// and return future<int>.
// NOTE(review): what distinguishes the `_short` variants is not visible here — confirm.
166 virtual future<int> ioctl(uint64_t cmd,
void* argp)
noexcept;
167 virtual future<int> ioctl_short(uint64_t cmd,
void* argp)
noexcept;
168 virtual future<int> fcntl(
int op, uintptr_t arg)
noexcept;
169 virtual future<int> fcntl_short(
int op, uintptr_t arg)
noexcept;
// Pure virtual.
// NOTE(review): presumably reserves space for `length` starting at `position` — confirm.
170 virtual future<> allocate(uint64_t position, uint64_t length) = 0;
// Virtual, not pure; returns an owning pointer to a file_handle_impl.
// NOTE(review): presumably backs `file::dup()`, which this listing describes as
// creating a handle that can be transported across shards — confirm.
173 virtual std::unique_ptr<file_handle_impl> dup();
206 file() noexcept : _file_impl(
nullptr) {}
209 : _file_impl(std::move(
impl)) {}
218 explicit operator bool() const noexcept {
return bool(_file_impl); }
226 file(
file&& x) noexcept : _file_impl(std::move(x._file_impl)) {}
245 return _file_impl->_disk_read_dma_alignment;
250 return _file_impl->_disk_write_dma_alignment;
260 return _file_impl->_disk_overwrite_dma_alignment;
265 return _file_impl->_memory_dma_alignment;
273 return _file_impl->_read_max_length;
281 return _file_impl->_write_max_length;
284#if SEASTAR_API_LEVEL < 7
302 template <
typename CharType>
303 [[deprecated(
"Use scheduling_groups and API level >= 7")]]
305 dma_read(uint64_t aligned_pos, CharType* aligned_buffer,
size_t aligned_len,
const io_priority_class& pc,
io_intent* intent =
nullptr) noexcept {
306 return dma_read_impl(aligned_pos,
reinterpret_cast<uint8_t*
>(aligned_buffer), aligned_len, internal::maybe_priority_class_ref(pc), intent);
324 template <
typename CharType>
326 dma_read(uint64_t aligned_pos, CharType* aligned_buffer,
size_t aligned_len,
io_intent* intent =
nullptr) noexcept {
327 return dma_read_impl(aligned_pos,
reinterpret_cast<uint8_t*
>(aligned_buffer), aligned_len, internal::maybe_priority_class_ref(), intent);
330#if SEASTAR_API_LEVEL < 7
349 template <
typename CharType>
350 [[deprecated(
"Use scheduling_groups and API level >= 7")]]
373 template <
typename CharType>
384#if SEASTAR_API_LEVEL < 7
400 template <
typename CharType>
401 [[deprecated(
"Use scheduling_groups and API level >= 7")]]
404 return dma_read_exactly_impl(pos, len, internal::maybe_priority_class_ref(pc), intent).then([] (
temporary_buffer<uint8_t> t) {
422 template <
typename CharType>
423 future<temporary_buffer<CharType>>
425 return dma_read_exactly_impl(pos, len, internal::maybe_priority_class_ref(), intent).then([] (
temporary_buffer<uint8_t> t) {
430#if SEASTAR_API_LEVEL < 7
443 [[deprecated(
"Use scheduling_groups and API level >= 7")]]
445 return dma_read_impl(pos, std::move(iov), internal::maybe_priority_class_ref(pc), intent);
459 return dma_read_impl(pos, std::move(iov), internal::maybe_priority_class_ref(), intent);
462#if SEASTAR_API_LEVEL < 7
476 template <
typename CharType>
477 [[deprecated(
"Use scheduling_groups and API level >= 7")]]
479 return dma_write_impl(pos,
reinterpret_cast<const uint8_t*
>(buffer), len, internal::maybe_priority_class_ref(pc), intent);
493 template <
typename CharType>
495 return dma_write_impl(pos,
reinterpret_cast<const uint8_t*
>(buffer), len, internal::maybe_priority_class_ref(), intent);
498#if SEASTAR_API_LEVEL < 7
511 [[deprecated(
"Use scheduling_groups and API level >= 7")]]
513 return dma_write_impl(pos, std::move(iov), internal::maybe_priority_class_ref(pc), intent);
527 return dma_write_impl(pos, std::move(iov), internal::maybe_priority_class_ref(), intent);
631 [[deprecated("This API was removed from the kernel")]]
658 [[deprecated("This API was removed from the kernel")]]
697#if SEASTAR_API_LEVEL < 7
715 template <
typename CharType>
716 [[deprecated(
"Use scheduling_groups and API level >= 7")]]
718 dma_read_bulk(uint64_t offset,
size_t range_size,
const io_priority_class& pc,
io_intent* intent =
nullptr) noexcept {
719 return dma_read_bulk_impl(offset, range_size, internal::maybe_priority_class_ref(pc), intent).then([] (
temporary_buffer<uint8_t> t) {
739 template <
typename CharType>
742 return dma_read_bulk_impl(offset, range_size, internal::maybe_priority_class_ref(), intent).then([] (
temporary_buffer<uint8_t> t) {
758 dma_read_bulk_impl(uint64_t offset,
size_t range_size, internal::maybe_priority_class_ref pc,
io_intent* intent)
noexcept;
761 dma_write_impl(uint64_t pos,
const uint8_t* buffer,
size_t len, internal::maybe_priority_class_ref pc,
io_intent* intent)
noexcept;
764 dma_write_impl(uint64_t pos, std::vector<iovec> iov, internal::maybe_priority_class_ref pc,
io_intent* intent)
noexcept;
767 dma_read_impl(uint64_t pos,
size_t len, internal::maybe_priority_class_ref pc,
io_intent* intent)
noexcept;
770 dma_read_impl(uint64_t aligned_pos, uint8_t* aligned_buffer,
size_t aligned_len, internal::maybe_priority_class_ref pc,
io_intent* intent)
noexcept;
773 dma_read_impl(uint64_t pos, std::vector<iovec> iov, internal::maybe_priority_class_ref pc,
io_intent* intent)
noexcept;
776 dma_read_exactly_impl(uint64_t pos,
size_t len, internal::maybe_priority_class_ref pc,
io_intent* intent)
noexcept;
779 future<> set_lifetime_hint_impl(
int op, uint64_t hint)
noexcept;
782 friend class file_data_sink_impl;
783 friend class file_data_source_impl;
793template <std::invocable<file&> Func>
794requires std::is_nothrow_move_constructible_v<Func>
796 static_assert(std::is_nothrow_move_constructible_v<Func>,
"Func's move constructor must not throw");
797 return file_fut.then([func = std::move(func)] (
file f)
mutable {
798 return do_with(std::move(f), [func = std::move(func)] (
file& f)
mutable {
799 return futurize_invoke(func, f).finally([&f] {
820template <std::invocable<file&> Func>
821requires std::is_nothrow_move_constructible_v<Func>
823 static_assert(std::is_nothrow_move_constructible_v<Func>,
"Func's move constructor must not throw");
824 return file_fut.then([func = std::move(func)] (
file f)
mutable {
825 return do_with(std::move(f), [func = std::move(func)] (
file& f)
mutable {
826 return futurize_invoke(std::move(func), f).then_wrapped([&f] (
auto ret)
mutable {
830 return ret.finally([&f] {
851 std::unique_ptr<file_handle_impl> _impl;
876 virtual const char* what()
const noexcept {
881SEASTAR_MODULE_EXPORT_END
The exception that cancelled I/Os resolve their futures with (see io_intent)
Definition: file.hh:874
Definition: generator.hh:33
A shard-transportable handle to a file.
Definition: file.hh:850
file_handle(file_handle &&) noexcept
Moves a file handle object.
file_handle(const file_handle &)
Copies a file handle object.
file to_file() const &
Converts the file handle object to a file.
future< int > ioctl(uint64_t cmd, void *argp) noexcept
future< temporary_buffer< CharType > > dma_read(uint64_t pos, size_t len, io_intent *intent=nullptr) noexcept
Definition: file.hh:374
file & operator=(file &&x) noexcept=default
Move-assigns a file object.
future< temporary_buffer< CharType > > dma_read_bulk(uint64_t offset, size_t range_size, io_intent *intent=nullptr) noexcept
Definition: file.hh:741
subscription< directory_entry > list_directory(std::function< future<>(directory_entry de)> next)
Returns a directory listing, given that this file object is a directory.
file & operator=(const file &x) noexcept=default
future< size_t > dma_write(uint64_t pos, std::vector< iovec > iov, io_intent *intent=nullptr) noexcept
Definition: file.hh:526
future allocate(uint64_t position, uint64_t length) noexcept
future set_inode_lifetime_hint(uint64_t hint) noexcept
uint64_t memory_dma_alignment() const noexcept
Alignment requirement for data buffers.
Definition: file.hh:264
file(file_handle &&handle) noexcept
Constructs a file object from a file_handle obtained from another shard.
future< size_t > dma_write(uint64_t pos, const CharType *buffer, size_t len, io_intent *intent=nullptr) noexcept
Definition: file.hh:494
future< int > fcntl_short(int op, uintptr_t arg=0UL) noexcept
size_t disk_read_max_length() const noexcept
Definition: file.hh:272
future< size_t > dma_read(uint64_t pos, std::vector< iovec > iov, io_intent *intent=nullptr) noexcept
Definition: file.hh:458
future set_file_lifetime_hint(uint64_t hint) noexcept
file_handle dup()
Creates a handle that can be transported across shards.
future< uint64_t > get_inode_lifetime_hint() noexcept
file(file &&x) noexcept
Moves a file object.
Definition: file.hh:226
uint64_t disk_read_dma_alignment() const noexcept
Alignment requirement for file offsets (for reads)
Definition: file.hh:244
future< uint64_t > size() const noexcept
Gets the file size.
future discard(uint64_t offset, uint64_t length) noexcept
future< struct stat > stat() noexcept
Returns stat information about the file.
uint64_t disk_overwrite_dma_alignment() const noexcept
Definition: file.hh:259
future< size_t > dma_read(uint64_t aligned_pos, CharType *aligned_buffer, size_t aligned_len, io_intent *intent=nullptr) noexcept
Definition: file.hh:326
future truncate(uint64_t length) noexcept
Truncates the file to a specified length.
future< int > ioctl_short(uint64_t cmd, void *argp) noexcept
coroutine::experimental::generator< directory_entry > experimental_list_directory()
Returns a directory listing, given that this file object is a directory.
size_t disk_write_max_length() const noexcept
Definition: file.hh:280
uint64_t disk_write_dma_alignment() const noexcept
Alignment requirement for file offsets (for writes)
Definition: file.hh:249
future< int > fcntl(int op, uintptr_t arg=0UL) noexcept
future< uint64_t > get_file_lifetime_hint() noexcept
file() noexcept
Definition: file.hh:206
file(const file &x)=default
future< temporary_buffer< CharType > > dma_read_exactly(uint64_t pos, size_t len, io_intent *intent=nullptr) noexcept
Definition: file.hh:424
A representation of a possibly not-yet-computed value.
Definition: future.hh:1240
Definition: io_intent.hh:44
Definition: shared_ptr.hh:513
Definition: stream.hh:127
Definition: temporary_buffer.hh:67
deleter release() noexcept
Definition: temporary_buffer.hh:203
size_t size() const noexcept
Gets the buffer size.
Definition: temporary_buffer.hh:130
CharType * get_write() noexcept
Definition: temporary_buffer.hh:128
std::optional< directory_entry_type > type
Type of the directory entry, if known.
Definition: file.hh:61
sstring name
Name of the file in a directory entry. Will never be "." or "..". Only the last component is included...
Definition: file.hh:59
directory_entry_type
Definition: file-types.hh:70
auto with_file_close_on_failure(future< file > file_fut, Func func) noexcept
Helper for ensuring a file is closed if func fails.
Definition: file.hh:822
auto with_file(future< file > file_fut, Func func) noexcept
Helper for ensuring a file is closed after func is called.
Definition: file.hh:795
A directory entry being listed.
Definition: file.hh:57
Filesystem object stat information.
Definition: file.hh:65
auto do_with(T1 &&rv1, T2 &&rv2, More &&... more) noexcept
Definition: do_with.hh:135
holds the implementation parts of the metrics layer, do not use directly.
Seastar API namespace.
Definition: abort_on_ebadf.hh:26
bool sloppy_size
Allow the file size not to track the amount of data written until a flush.
Definition: file.hh:90
uint64_t sloppy_size_hint
Hint as to what the eventual file size will be.
Definition: file.hh:91
bool append_is_unlikely
Hint that user promises (or at least tries hard) not to write behind file size.
Definition: file.hh:93
file_permissions create_permissions
File permissions to use when creating a file.
Definition: file.hh:92
uint64_t extent_allocation_size_hint
Allocate this much disk space when extending the file.
Definition: file.hh:89