polardbxengine/storage/innobase/include/buf0flu.h

341 lines
14 KiB
C++

/*****************************************************************************
Copyright (c) 1995, 2019, Oracle and/or its affiliates. All Rights Reserved.
This program is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License, version 2.0, as published by the
Free Software Foundation.
This program is also distributed with certain software (including but not
limited to OpenSSL) that is licensed under separate terms, as designated in a
particular file or component or in included license documentation. The authors
of MySQL hereby grant you an additional permission to link the program and
your derivative works with the separately licensed software that they have
included with MySQL.
This program is distributed in the hope that it will be useful, but WITHOUT
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
FOR A PARTICULAR PURPOSE. See the GNU General Public License, version 2.0,
for more details.
You should have received a copy of the GNU General Public License along with
this program; if not, write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
*****************************************************************************/
/** @file include/buf0flu.h
The database buffer pool flush algorithm
Created 11/5/1995 Heikki Tuuri
*******************************************************/
#ifndef buf0flu_h
#define buf0flu_h
#include "buf0types.h"
#include "log0log.h"
#include "univ.i"
#include "ut0byte.h"
#ifndef UNIV_HOTBACKUP
/** Checks if the page_cleaner is in active state. */
bool buf_flush_page_cleaner_is_active();
#ifdef UNIV_DEBUG
/** Value of MySQL global variable used to disable page cleaner. */
extern bool innodb_page_cleaner_disabled_debug;
#endif /* UNIV_DEBUG */
/** Event to synchronise with the flushing. */
extern os_event_t buf_flush_event;
class ut_stage_alter_t;
/** Remove a block from the flush list of modified blocks.
@param[in] bpage pointer to the block in question */
void buf_flush_remove(buf_page_t *bpage);
/** Relocates a buffer control block on the flush_list.
Note that it is assumed that the contents of bpage has already been
copied to dpage. */
void buf_flush_relocate_on_flush_list(
buf_page_t *bpage, /*!< in/out: control block being moved */
buf_page_t *dpage); /*!< in/out: destination block */
/** Updates the flush system data structures when a write is completed.
@param[in] bpage pointer to the block in question */
void buf_flush_write_complete(buf_page_t *bpage);
#endif /* !UNIV_HOTBACKUP */
/** Check if page type is uncompressed.
@param[in] page page frame
@return true if uncompressed page type. */
bool page_is_uncompressed_type(const byte *page);
/** Initialize a page for writing to the tablespace.
@param[in] block buffer block; NULL if bypassing the buffer pool
@param[in,out] page page frame
@param[in,out] page_zip_ compressed page, or NULL if uncompressed
@param[in] newest_lsn newest modification LSN to the page
@param[in] skip_checksum whether to disable the page checksum
@param[in] skip_lsn_check true to skip check for lsn (in DEBUG) */
void buf_flush_init_for_writing(const buf_block_t *block, byte *page,
void *page_zip_, lsn_t newest_lsn,
bool skip_checksum, bool skip_lsn_check);
#ifndef UNIV_HOTBACKUP
#if defined UNIV_DEBUG || defined UNIV_IBUF_DEBUG
/** Writes a flushable page asynchronously from the buffer pool to a file.
NOTE: block and LRU list mutexes must be held upon entering this function, and
they will be released by this function after flushing. This is loosely based on
buf_flush_batch() and buf_flush_page().
@param[in,out] buf_pool buffer pool instance
@param[in,out] block buffer control block
@return true if the page was flushed and the mutex released */
ibool buf_flush_page_try(buf_pool_t *buf_pool, buf_block_t *block)
MY_ATTRIBUTE((warn_unused_result));
#endif /* UNIV_DEBUG || UNIV_IBUF_DEBUG */
/** Do flushing batch of a given type.
NOTE: The calling thread is not allowed to own any latches on pages!
@param[in,out] buf_pool buffer pool instance
@param[in] type flush type
@param[in] min_n wished minimum mumber of blocks flushed
(it is not guaranteed that the actual number is that big, though)
@param[in] lsn_limit in the case BUF_FLUSH_LIST all blocks whose
oldest_modification is smaller than this should be flushed (if their number
does not exceed min_n), otherwise ignored
@param[out] n_processed the number of pages which were processed is
passed back to caller. Ignored if NULL
@retval true if a batch was queued successfully.
@retval false if another batch of same type was already running. */
bool buf_flush_do_batch(buf_pool_t *buf_pool, buf_flush_t type, ulint min_n,
lsn_t lsn_limit, ulint *n_processed);
/** This utility flushes dirty blocks from the end of the flush list of all
buffer pool instances.
NOTE: The calling thread is not allowed to own any latches on pages!
@param[in] min_n wished minimum mumber of blocks flushed (it is
not guaranteed that the actual number is that big, though)
@param[in] lsn_limit in the case BUF_FLUSH_LIST all blocks whose
oldest_modification is smaller than this should be flushed (if their number
does not exceed min_n), otherwise ignored
@param[out] n_processed the number of pages which were processed is
passed back to caller. Ignored if NULL.
@return true if a batch was queued successfully for each buffer pool
instance. false if another batch of same type was already running in
at least one of the buffer pool instance */
bool buf_flush_lists(ulint min_n, lsn_t lsn_limit, ulint *n_processed);
/** This function picks up a single page from the tail of the LRU
list, flushes it (if it is dirty), removes it from page_hash and LRU
list and puts it on the free list. It is called from user threads when
they are unable to find a replaceable page at the tail of the LRU
list i.e.: when the background LRU flushing in the page_cleaner thread
is not fast enough to keep pace with the workload.
@param[in,out] buf_pool buffer pool instance
@return true if success. */
bool buf_flush_single_page_from_LRU(buf_pool_t *buf_pool);
/** Waits until a flush batch of the given type ends */
void buf_flush_wait_batch_end(
buf_pool_t *buf_pool, /*!< in: buffer pool instance */
buf_flush_t type); /*!< in: BUF_FLUSH_LRU
or BUF_FLUSH_LIST */
/** Waits until a flush batch of the given type ends. This is called by a
thread that only wants to wait for a flush to end but doesn't do any flushing
itself.
@param[in] buf_pool buffer pool instance
@param[in] type BUF_FLUSH_LRU or BUF_FLUSH_LIST */
void buf_flush_wait_batch_end_wait_only(buf_pool_t *buf_pool, buf_flush_t type);
/** This function should be called at a mini-transaction commit, if a page was
modified in it. Puts the block to the list of modified blocks, if it not
already in it.
@param[in] block block which is modified
@param[in] start_lsn start lsn of the first mtr in a set of mtr's
@param[in] end_lsn end lsn of the last mtr in the set of mtr's
@param[in] observer flush observer */
UNIV_INLINE
void buf_flush_note_modification(buf_block_t *block, lsn_t start_lsn,
lsn_t end_lsn, FlushObserver *observer);
/** This function should be called when recovery has modified a buffer page.
@param[in] block block which is modified
@param[in] start_lsn start lsn of the first mtr in a set of mtr's
@param[in] end_lsn end lsn of the last mtr in the set of mtr's */
UNIV_INLINE
void buf_flush_recv_note_modification(buf_block_t *block, lsn_t start_lsn,
lsn_t end_lsn);
/** Returns TRUE if the file page block is immediately suitable for replacement,
i.e., the transition FILE_PAGE => NOT_USED allowed. The caller must hold the
LRU list and block mutexes.
@param[in] bpage buffer control block, must be buf_page_in_file() and
in the LRU list
@return true if can replace immediately */
ibool buf_flush_ready_for_replace(buf_page_t *bpage);
#ifdef UNIV_DEBUG
struct SYS_VAR;
/** Disables page cleaner threads (coordinator and workers).
It's used by: SET GLOBAL innodb_page_cleaner_disabled_debug = 1 (0).
@param[in] thd thread handle
@param[in] var pointer to system variable
@param[out] var_ptr where the formal string goes
@param[in] save immediate result from check function */
void buf_flush_page_cleaner_disabled_debug_update(THD *thd, SYS_VAR *var,
void *var_ptr,
const void *save);
#endif /* UNIV_DEBUG */
/** Initialize page_cleaner.
@param[in] n_page_cleaners Number of page cleaner threads to create */
void buf_flush_page_cleaner_init(size_t n_page_cleaners);
/** Wait for any possible LRU flushes that are in progress to end. */
void buf_flush_wait_LRU_batch_end();
#if defined UNIV_DEBUG || defined UNIV_BUF_DEBUG
/** Validates the flush list.
@return true if ok */
ibool buf_flush_validate(buf_pool_t *buf_pool);
#endif /* UNIV_DEBUG || UNIV_BUF_DEBUG */
/** Initialize the red-black tree to speed up insertions into the flush_list
during recovery process. Should be called at the start of recovery
process before any page has been read/written. */
void buf_flush_init_flush_rbt(void);
/** Frees up the red-black tree. */
void buf_flush_free_flush_rbt(void);
/** Writes a flushable page asynchronously from the buffer pool to a file.
NOTE: 1. in simulated aio we must call os_aio_simulated_wake_handler_threads
after we have posted a batch of writes! 2. buf_page_get_mutex(bpage) must be
held upon entering this function. The LRU list mutex must be held if flush_type
== BUF_FLUSH_SINGLE_PAGE. Both mutexes will be released by this function if it
returns true.
@param[in] buf_pool buffer pool instance
@param[in] bpage buffer control block
@param[in] flush_type type of flush
@param[in] sync true if sync IO request
@return true if page was flushed */
ibool buf_flush_page(buf_pool_t *buf_pool, buf_page_t *bpage,
buf_flush_t flush_type, bool sync);
/** Check if the block is modified and ready for flushing.
@param[in] bpage buffer control block, must be buf_page_in_file()
@param[in] flush_type type of flush
@return true if can flush immediately */
bool buf_flush_ready_for_flush(buf_page_t *bpage, buf_flush_t flush_type)
MY_ATTRIBUTE((warn_unused_result));
/** Check if there are any dirty pages that belong to a space id in the flush
list in a particular buffer pool.
@return number of dirty pages present in a single buffer pool */
ulint buf_pool_get_dirty_pages_count(
buf_pool_t *buf_pool, /*!< in: buffer pool */
space_id_t id, /*!< in: space id to check */
FlushObserver *observer); /*!< in: flush observer to check */
/** Synchronously flush dirty blocks from the end of the flush list of all
buffer pool instances. NOTE: The calling thread is not allowed to own any
latches on pages! */
void buf_flush_sync_all_buf_pools(void);
/** Request IO burst and wake page_cleaner up.
@param[in] lsn_limit upper limit of LSN to be flushed
@return true if we requested higher lsn than ever requested so far */
bool buf_flush_request_force(lsn_t lsn_limit);
/** Checks if all flush lists are empty. It is supposed to be used in
single thread, during startup or shutdown. Hence it does not acquire
lock and it is caller's responsibility to guarantee that flush lists
are not changed in background.
@return true if all flush lists were empty. */
bool buf_are_flush_lists_empty_validate();
/** We use FlushObserver to track flushing of non-redo logged pages in bulk
create index(BtrBulk.cc).Since we disable redo logging during a index build,
we need to make sure that all dirty pages modifed by the index build are
flushed to disk before any redo logged operations go to the index. */
class FlushObserver {
public:
/** Constructor
@param[in] space_id table space id
@param[in] trx trx instance
@param[in] stage performance schema accounting object,
used by ALTER TABLE. It is passed to log_preflush_pool_modified_pages()
for accounting. */
FlushObserver(space_id_t space_id, trx_t *trx, ut_stage_alter_t *stage);
/** Deconstructor */
~FlushObserver();
/** Check pages have been flushed and removed from the flush list
in a buffer pool instance.
@param[in] instance_no buffer pool instance no
@return true if the pages were removed from the flush list */
bool is_complete(ulint instance_no) {
os_rmb;
return (m_flushed->at(instance_no) == m_removed->at(instance_no) ||
m_interrupted);
}
/** Interrupt observer not to wait. */
void interrupted() { m_interrupted = true; }
/** Check whether trx is interrupted
@return true if trx is interrupted */
bool check_interrupted();
/** Flush dirty pages. */
void flush();
/** Notify observer of flushing a page
@param[in] buf_pool buffer pool instance
@param[in] bpage buffer page to flush */
void notify_flush(buf_pool_t *buf_pool, buf_page_t *bpage);
/** Notify observer of removing a page from flush list
@param[in] buf_pool buffer pool instance
@param[in] bpage buffer page flushed */
void notify_remove(buf_pool_t *buf_pool, buf_page_t *bpage);
private:
/** Table space id */
space_id_t m_space_id;
/** Trx instance */
trx_t *m_trx;
/** Performance schema accounting object, used by ALTER TABLE.
If not NULL, then stage->begin_phase_flush() will be called initially,
specifying the number of pages to be attempted to be flushed and
subsequently, stage->inc() will be called for each page we attempt to
flush. */
ut_stage_alter_t *m_stage;
/* Flush request sent */
std::vector<ulint> *m_flushed;
/* Flush request finished */
std::vector<ulint> *m_removed;
/* True if the operation was interrupted. */
bool m_interrupted;
};
#endif /* !UNIV_HOTBACKUP */
#include "buf0flu.ic"
#endif