Commit 96b9c617 authored by Vladislav Vaintroub's avatar Vladislav Vaintroub

MDEV-13941 Fix high NTFS fragmentation on 10.2

Prior to this patch, creating or even opening any innodb file in 10.2
would set a sparse flag on file. The file extension was done by setting
end of file, without writing zeros. This technique is fine, however
due to sparsedness, it created a hole at the end of the file, which
lead to much higher fragmentation subsequently.

The fix is only to use sparse flag for compressed tables, where holes
are actually wanted, but not for normal tables.
parent 24d9664a
...@@ -1062,32 +1062,23 @@ fil_space_extend_must_retry( ...@@ -1062,32 +1062,23 @@ fil_space_extend_must_retry(
const ulint page_size = pageSize.physical(); const ulint page_size = pageSize.physical();
#ifdef _WIN32 #ifdef _WIN32
/* Logically or physically extend the file with zero bytes, os_offset_t new_file_size =
depending on whether it is sparse. */ std::max(
/* FIXME: Call DeviceIoControl(node->handle, FSCTL_SET_SPARSE, ...)
when opening a file when FSP_FLAGS_HAS_PAGE_COMPRESSION(). */
{
FILE_END_OF_FILE_INFO feof;
/* fil_read_first_page() expects UNIV_PAGE_SIZE bytes.
fil_node_open_file() expects at least 4 * UNIV_PAGE_SIZE bytes.
Do not shrink short ROW_FORMAT=COMPRESSED files. */
feof.EndOfFile.QuadPart = std::max(
os_offset_t(size - file_start_page_no) * page_size, os_offset_t(size - file_start_page_no) * page_size,
os_offset_t(FIL_IBD_FILE_INITIAL_SIZE os_offset_t(FIL_IBD_FILE_INITIAL_SIZE * UNIV_PAGE_SIZE));
* UNIV_PAGE_SIZE));
*success = SetFileInformationByHandle(node->handle, /* os_file_change_size_win32() handles both compressed(sparse)
FileEndOfFileInfo, and normal files correctly.
&feof, sizeof feof); It allocates physical storage for normal files and "virtual"
if (!*success) { storage for sparse ones.*/
ib::error() << "extending file '" << node->name *success = os_file_change_size_win32(node->name,
<< "' from " node->handle, new_file_size);
<< os_offset_t(node->size) * page_size
<< " to " << feof.EndOfFile.QuadPart if (*success) {
<< " bytes failed with " << GetLastError(); last_page_no = size;
} else { } else {
last_page_no = size; ib::error() << "extending file '" << node->name
} << " to size " << new_file_size << " failed";
} }
#else #else
/* We will logically extend the file with ftruncate() if /* We will logically extend the file with ftruncate() if
...@@ -3843,7 +3834,19 @@ fil_ibd_create( ...@@ -3843,7 +3834,19 @@ fil_ibd_create(
return(DB_ERROR); return(DB_ERROR);
} }
success= false; bool punch_hole = false;
#ifdef _WIN32
if (FSP_FLAGS_HAS_PAGE_COMPRESSION(flags)) {
punch_hole = os_file_set_sparse_win32(file);
}
success = os_file_change_size_win32(path, file, size * UNIV_PAGE_SIZE);
#else
success= false;
#ifdef HAVE_POSIX_FALLOCATE #ifdef HAVE_POSIX_FALLOCATE
/* /*
Extend the file using posix_fallocate(). This is required by Extend the file using posix_fallocate(). This is required by
...@@ -3882,7 +3885,7 @@ fil_ibd_create( ...@@ -3882,7 +3885,7 @@ fil_ibd_create(
be lost after this call, if it succeeds. In this case the file be lost after this call, if it succeeds. In this case the file
should be full of NULs. */ should be full of NULs. */
bool punch_hole = os_is_sparse_file_supported(path, file); punch_hole = os_is_sparse_file_supported(file);
if (punch_hole) { if (punch_hole) {
...@@ -3894,6 +3897,7 @@ fil_ibd_create( ...@@ -3894,6 +3897,7 @@ fil_ibd_create(
punch_hole = false; punch_hole = false;
} }
} }
#endif
ulint block_size = os_file_get_block_size(file, path); ulint block_size = os_file_get_block_size(file, path);
......
...@@ -1569,20 +1569,48 @@ innobase_mysql_tmpfile( ...@@ -1569,20 +1569,48 @@ innobase_mysql_tmpfile(
void void
os_file_set_umask(ulint umask); os_file_set_umask(ulint umask);
#ifdef _WIN32
/**
Make file sparse, on Windows.
@param[in] file file handle
@return true on success, false on error */
bool os_file_set_sparse_win32(os_file_t file);
/**
Changes file size on Windows
If file is extended, following happens the bytes between
old and new EOF are zeros.
If file is sparse, "virtual" block is added at the end of
allocated area.
If file is normal, file system allocates storage.
@param[in] pathname file path
@param[in] file file handle
@param[in] size size to preserve in bytes
@return true if success */
bool
os_file_change_size_win32(
const char* pathname,
os_file_t file,
os_offset_t size);
#endif /*_WIN32 */
/** Check if the file system supports sparse files. /** Check if the file system supports sparse files.
Warning: On POSIX systems we try and punch a hole from offset 0 to Warning: On POSIX systems we try and punch a hole from offset 0 to
the system configured page size. This should only be called on an empty the system configured page size. This should only be called on an empty
file. file.
Note: On Windows we use the name and on Unices we use the file handle.
@param[in] name File name
@param[in] fh File handle for the file - if opened @param[in] fh File handle for the file - if opened
@return true if the file system supports sparse files */ @return true if the file system supports sparse files */
bool bool
os_is_sparse_file_supported( os_is_sparse_file_supported(
const char* path,
os_file_t fh) os_file_t fh)
MY_ATTRIBUTE((warn_unused_result)); MY_ATTRIBUTE((warn_unused_result));
......
...@@ -858,7 +858,8 @@ os_file_get_block_size( ...@@ -858,7 +858,8 @@ os_file_get_block_size(
&tmp); &tmp);
if (!result) { if (!result) {
if (GetLastError() == ERROR_INVALID_FUNCTION) { DWORD err = GetLastError();
if (err == ERROR_INVALID_FUNCTION || err == ERROR_NOT_SUPPORTED) {
// Don't report error, it is driver's fault, not ours or users. // Don't report error, it is driver's fault, not ours or users.
// We handle this with fallback. Report wit info message, just once. // We handle this with fallback. Report wit info message, just once.
static bool write_info = true; static bool write_info = true;
...@@ -3779,6 +3780,7 @@ os_file_get_last_error_low( ...@@ -3779,6 +3780,7 @@ os_file_get_last_error_low(
return(OS_FILE_ERROR_MAX + err); return(OS_FILE_ERROR_MAX + err);
} }
/** NOTE! Use the corresponding macro os_file_create_simple(), not directly /** NOTE! Use the corresponding macro os_file_create_simple(), not directly
this function! this function!
A simple function to open or create a file. A simple function to open or create a file.
...@@ -3897,15 +3899,6 @@ os_file_create_simple_func( ...@@ -3897,15 +3899,6 @@ os_file_create_simple_func(
retry = false; retry = false;
*success = true; *success = true;
DWORD temp;
/* This is a best effort use case, if it fails then
we will find out when we try and punch the hole. */
os_win32_device_io_control(
file, FSCTL_SET_SPARSE, NULL, 0, NULL, 0,
&temp);
} }
} while (retry); } while (retry);
...@@ -4298,13 +4291,6 @@ os_file_create_func( ...@@ -4298,13 +4291,6 @@ os_file_create_func(
/* Bind the file handle to completion port */ /* Bind the file handle to completion port */
ut_a(CreateIoCompletionPort(file, completion_port, 0, 0)); ut_a(CreateIoCompletionPort(file, completion_port, 0, 0));
} }
DWORD temp;
/* This is a best effort use case, if it fails then
we will find out when we try and punch the hole. */
os_win32_device_io_control(
file, FSCTL_SET_SPARSE, NULL, 0, NULL, 0,
&temp);
} }
} while (retry); } while (retry);
...@@ -4752,16 +4738,36 @@ os_file_get_status_win32( ...@@ -4752,16 +4738,36 @@ os_file_get_status_win32(
return(DB_SUCCESS); return(DB_SUCCESS);
} }
/** Truncates a file to a specified size in bytes. /**
Do nothing if the size to preserve is greater or equal to the current Sets a sparse flag on Windows file.
size of the file. @param[in] file file handle
@return true on success, false on error
*/
bool os_file_set_sparse_win32(os_file_t file)
{
DWORD temp;
return os_win32_device_io_control(file, FSCTL_SET_SPARSE, 0, 0, 0, 0,&temp);
}
/**
Change file size on Windows.
If file is extended, the bytes between old and new EOF
are zeros.
If file is sparse, "virtual" block is added at the end of
allocated area.
If file is normal, file system allocates storage.
@param[in] pathname file path @param[in] pathname file path
@param[in] file file to be truncated @param[in] file file handle
@param[in] size size to preserve in bytes @param[in] size size to preserve in bytes
@return true if success */ @return true if success */
static
bool bool
os_file_truncate_win32( os_file_change_size_win32(
const char* pathname, const char* pathname,
os_file_t file, os_file_t file,
os_offset_t size) os_offset_t size)
...@@ -5327,6 +5333,9 @@ os_file_set_size( ...@@ -5327,6 +5333,9 @@ os_file_set_size(
os_offset_t size, os_offset_t size,
bool read_only) bool read_only)
{ {
#ifdef _WIN32
return os_file_change_size_win32(name, file, size);
#endif
/* Write up to 1 megabyte at a time. */ /* Write up to 1 megabyte at a time. */
ulint buf_size = ut_min( ulint buf_size = ut_min(
static_cast<ulint>(64), static_cast<ulint>(64),
...@@ -5416,7 +5425,7 @@ os_file_truncate( ...@@ -5416,7 +5425,7 @@ os_file_truncate(
} }
#ifdef _WIN32 #ifdef _WIN32
return(os_file_truncate_win32(pathname, file, size)); return(os_file_change_size_win32(pathname, file, size));
#else /* _WIN32 */ #else /* _WIN32 */
return(os_file_truncate_posix(pathname, file, size)); return(os_file_truncate_posix(pathname, file, size));
#endif /* _WIN32 */ #endif /* _WIN32 */
...@@ -5556,14 +5565,10 @@ IORequest::punch_hole(os_file_t fh, os_offset_t off, ulint len) ...@@ -5556,14 +5565,10 @@ IORequest::punch_hole(os_file_t fh, os_offset_t off, ulint len)
Warning: On POSIX systems we try and punch a hole from offset 0 to Warning: On POSIX systems we try and punch a hole from offset 0 to
the system configured page size. This should only be called on an empty the system configured page size. This should only be called on an empty
file. file.
Note: On Windows we use the name and on Unices we use the file handle.
@param[in] name File name
@param[in] fh File handle for the file - if opened @param[in] fh File handle for the file - if opened
@return true if the file system supports sparse files */ @return true if the file system supports sparse files */
bool bool
os_is_sparse_file_supported(const char* path, os_file_t fh) os_is_sparse_file_supported(os_file_t fh)
{ {
/* In this debugging mode, we act as if punch hole is supported, /* In this debugging mode, we act as if punch hole is supported,
then we skip any calls to actually punch a hole. In this way, then we skip any calls to actually punch a hole. In this way,
...@@ -5573,7 +5578,13 @@ os_is_sparse_file_supported(const char* path, os_file_t fh) ...@@ -5573,7 +5578,13 @@ os_is_sparse_file_supported(const char* path, os_file_t fh)
); );
#ifdef _WIN32 #ifdef _WIN32
return(os_is_sparse_file_supported_win32(path)); BY_HANDLE_FILE_INFORMATION info;
if (GetFileInformationByHandle(fh,&info)) {
if (info.dwFileAttributes != INVALID_FILE_ATTRIBUTES) {
return (info.dwFileAttributes & FILE_ATTRIBUTE_SPARSE_FILE) != 0;
}
}
return false;
#else #else
dberr_t err; dberr_t err;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment