Skip to content

Commit

Permalink
os/filestore/FileJournal: set block size via config option ceph#7628
Browse files Browse the repository at this point in the history
We were setting the block_size as the MAX of the min size (4096) and the
block size reported for the journal file/device.  In reality, file systems
report all kinds of crazy block sizes.  Usually it's the page size, but
sometimes it is larger (e.g., 128KB for ZFS), and that's not actually what
we want.  Using a size smaller than the file system's block size is not
optimal for performance, but it doesn't affect how the IO happens--as long
as it is larger than the hardware sector size, which is either 512 or
4096 bytes.  And our min was hard-coded at 4096.

So, instead, just set a config option to specify the block size, and
default that to 4096.

The other uses of this constant were about *alignment* of memory buffers
for the purposes of direct IO.  Rename the constant but do not change
the logic.  That means we continue to use 4k alignment for direct io even
if the device has 512 byte sectors, but that's fine--no reason to use
a smaller alignment.

Signed-off-by: Sage Weil <sage@redhat.com>
  • Loading branch information
wjwithagen committed Mar 2, 2016
1 parent 9b64380 commit f618815
Show file tree
Hide file tree
Showing 2 changed files with 13 additions and 12 deletions.
1 change: 1 addition & 0 deletions src/common/config_opts.h
Expand Up @@ -1051,6 +1051,7 @@ OPTION(filestore_debug_verify_split, OPT_BOOL, false)
OPTION(journal_dio, OPT_BOOL, true)
OPTION(journal_aio, OPT_BOOL, true)
OPTION(journal_force_aio, OPT_BOOL, false)
OPTION(journal_block_size, OPT_INT, 4096)

// max bytes to search ahead in journal searching for corruption
OPTION(journal_max_corrupt_search, OPT_U64, 10<<20)
Expand Down
24 changes: 12 additions & 12 deletions src/os/filestore/FileJournal.cc
Expand Up @@ -44,7 +44,7 @@
#define dout_prefix *_dout << "journal "

const static int64_t ONE_MEG(1 << 20);
const static int CEPH_MINIMUM_BLOCK_SIZE(4096);
const static int CEPH_DIRECTIO_ALIGNMENT(4096);

int FileJournal::_open(bool forwrite, bool create)
{
Expand Down Expand Up @@ -148,7 +148,7 @@ int FileJournal::_open_block_device()
<< dendl;
max_size = bdev_sz;

block_size = CEPH_MINIMUM_BLOCK_SIZE;
block_size = g_conf->journal_block_size;

if (g_conf->journal_discard) {
discard = block_device_support_discard(fn.c_str());
Expand Down Expand Up @@ -290,7 +290,7 @@ int FileJournal::_open_file(int64_t oldsize, blksize_t blksize,
else {
max_size = oldsize;
}
block_size = MAX(blksize, (blksize_t)CEPH_MINIMUM_BLOCK_SIZE);
block_size = g_conf->journal_block_size;

if (create && g_conf->journal_zero_on_create) {
derr << "FileJournal::_open_file : zeroing journal" << dendl;
Expand Down Expand Up @@ -505,9 +505,9 @@ int FileJournal::open(uint64_t fs_op_seq)
<< block_size << " (required for direct_io journal mode)" << dendl;
return -EINVAL;
}
if ((header.alignment % CEPH_MINIMUM_BLOCK_SIZE) && directio) {
if ((header.alignment % CEPH_DIRECTIO_ALIGNMENT) && directio) {
dout(0) << "open journal alignment " << header.alignment << " is not multiple of minimum block size "
<< CEPH_MINIMUM_BLOCK_SIZE << " (required for direct_io journal mode)" << dendl;
<< CEPH_DIRECTIO_ALIGNMENT << " (required for direct_io journal mode)" << dendl;
return -EINVAL;
}

Expand Down Expand Up @@ -1040,13 +1040,13 @@ void FileJournal::align_bl(off64_t pos, bufferlist& bl)
{
// make sure list segments are page aligned
if (directio && (!bl.is_aligned(block_size) ||
!bl.is_n_align_sized(CEPH_MINIMUM_BLOCK_SIZE))) {
assert(0 == "bl should be align");
if ((bl.length() & (CEPH_MINIMUM_BLOCK_SIZE - 1)) != 0 ||
(pos & (CEPH_MINIMUM_BLOCK_SIZE - 1)) != 0)
!bl.is_n_align_sized(CEPH_DIRECTIO_ALIGNMENT))) {
if ((bl.length() & (CEPH_DIRECTIO_ALIGNMENT - 1)) != 0 ||
(pos & (CEPH_DIRECTIO_ALIGNMENT - 1)) != 0)
dout(0) << "rebuild_page_aligned failed, " << bl << dendl;
assert((bl.length() & (CEPH_MINIMUM_BLOCK_SIZE - 1)) == 0);
assert((pos & (CEPH_MINIMUM_BLOCK_SIZE - 1)) == 0);
assert((bl.length() & (CEPH_DIRECTIO_ALIGNMENT - 1)) == 0);
assert((pos & (CEPH_DIRECTIO_ALIGNMENT - 1)) == 0);
assert(0 == "bl should be align");
}
}

Expand Down Expand Up @@ -1633,7 +1633,7 @@ int FileJournal::prepare_entry(vector<ObjectStore::Transaction>& tls, bufferlist
}
// footer
ebl.append((const char*)&h, sizeof(h));
ebl.rebuild_aligned(CEPH_MINIMUM_BLOCK_SIZE);
ebl.rebuild_aligned(CEPH_DIRECTIO_ALIGNMENT);
tbl->claim(ebl);
return h.len;
}
Expand Down

0 comments on commit f618815

Please sign in to comment.