/* -*- mode: C++; c-basic-offset: 4; indent-tabs-mode: nil -*- */ // vim: ft=cpp:expandtab:ts=8:sw=4:softtabstop=4: #ifndef FT_FLUSHER_H #define FT_FLUSHER_H #ident "$Id$" #ident "Copyright (c) 2007-2012 Tokutek Inc. All rights reserved." #ident "The technology is licensed by the Massachusetts Institute of Technology, Rutgers State University of New Jersey, and the Research Foundation of State University of New York at Stony Brook under United States of America Serial No. 11/760379 and to the patents and/or patent applications resulting from it." // This must be first to make the 64-bit file mode work right in Linux #include "fttypes.h" typedef enum { FT_FLUSHER_CLEANER_TOTAL_NODES = 0, // total number of nodes whose buffers are potentially flushed by cleaner thread FT_FLUSHER_CLEANER_H1_NODES, // number of nodes of height one whose message buffers are flushed by cleaner thread FT_FLUSHER_CLEANER_HGT1_NODES, // number of nodes of height > 1 whose message buffers are flushed by cleaner thread FT_FLUSHER_CLEANER_EMPTY_NODES, // number of nodes that are selected by cleaner, but whose buffers are empty FT_FLUSHER_CLEANER_NODES_DIRTIED, // number of nodes that are made dirty by the cleaner thread FT_FLUSHER_CLEANER_MAX_BUFFER_SIZE, // max number of bytes in message buffer flushed by cleaner thread FT_FLUSHER_CLEANER_MIN_BUFFER_SIZE, FT_FLUSHER_CLEANER_TOTAL_BUFFER_SIZE, FT_FLUSHER_CLEANER_MAX_BUFFER_WORKDONE, // max workdone value of any message buffer flushed by cleaner thread FT_FLUSHER_CLEANER_MIN_BUFFER_WORKDONE, FT_FLUSHER_CLEANER_TOTAL_BUFFER_WORKDONE, FT_FLUSHER_CLEANER_NUM_LEAF_MERGES_STARTED, // number of times cleaner thread tries to merge a leaf FT_FLUSHER_CLEANER_NUM_LEAF_MERGES_RUNNING, // number of cleaner thread leaf merges in progress FT_FLUSHER_CLEANER_NUM_LEAF_MERGES_COMPLETED, // number of times cleaner thread successfully merges a leaf FT_FLUSHER_CLEANER_NUM_DIRTIED_FOR_LEAF_MERGE, // nodes dirtied by the "flush from root" process to merge a leaf node FT_FLUSHER_FLUSH_TOTAL, // total number of flushes done by flusher threads or cleaner threads FT_FLUSHER_FLUSH_IN_MEMORY, // number of in memory flushes FT_FLUSHER_FLUSH_NEEDED_IO, // number of flushes that had to read a child (or part) off disk FT_FLUSHER_FLUSH_CASCADES, // number of flushes that triggered another flush in the child FT_FLUSHER_FLUSH_CASCADES_1, // number of flushes that triggered 1 cascading flush FT_FLUSHER_FLUSH_CASCADES_2, // number of flushes that triggered 2 cascading flushes FT_FLUSHER_FLUSH_CASCADES_3, // number of flushes that triggered 3 cascading flushes FT_FLUSHER_FLUSH_CASCADES_4, // number of flushes that triggered 4 cascading flushes FT_FLUSHER_FLUSH_CASCADES_5, // number of flushes that triggered 5 cascading flushes FT_FLUSHER_FLUSH_CASCADES_GT_5, // number of flushes that triggered more than 5 cascading flushes FT_FLUSHER_SPLIT_LEAF, // number of leaf nodes split FT_FLUSHER_SPLIT_NONLEAF, // number of nonleaf nodes split FT_FLUSHER_MERGE_LEAF, // number of times leaf nodes are merged FT_FLUSHER_MERGE_NONLEAF, // number of times nonleaf nodes are merged FT_FLUSHER_BALANCE_LEAF, // number of times a leaf node is balanced inside brt FT_FLUSHER_STATUS_NUM_ROWS } ft_flusher_status_entry; typedef struct { bool initialized; TOKU_ENGINE_STATUS_ROW_S status[FT_FLUSHER_STATUS_NUM_ROWS]; } FT_FLUSHER_STATUS_S, *FT_FLUSHER_STATUS; void toku_ft_flusher_status_init(void) __attribute__((__constructor__)); void toku_ft_flusher_get_status(FT_FLUSHER_STATUS); /** * Only for testing, not for production. * * Set a callback the flusher thread will use to signal various points * during its execution. */ void toku_flusher_thread_set_callback( void (*callback_f)(int, void*), void* extra ); /** * Puts a workitem on the flusher thread queue, scheduling the node to be * flushed by flush_some_child. */ void flush_node_on_background_thread( FT h, FTNODE parent ); /** * Effect: Split a leaf node. * Argument "node" is node to be split. * Upon return: * nodea and nodeb point to new nodes that result from split of "node" * nodea is the left node that results from the split * splitk is the right-most key of nodea */ void ftleaf_split( FT h, FTNODE node, FTNODE *nodea, FTNODE *nodeb, DBT *splitk, bool create_new_node, enum split_mode split_mode, uint32_t num_dependent_nodes, FTNODE* dependent_nodes ); /** * Effect: node must be a node-leaf node. It is split into two nodes, and * the fanout is split between them. * Sets splitk->data pointer to a malloc'd value * Sets nodea, and nodeb to the two new nodes. * The caller must replace the old node with the two new nodes. * This function will definitely reduce the number of children for the node, * but it does not guarantee that the resulting nodes are smaller than nodesize. */ void ft_nonleaf_split( FT h, FTNODE node, FTNODE *nodea, FTNODE *nodeb, DBT *splitk, uint32_t num_dependent_nodes, FTNODE* dependent_nodes ); /************************************************************************ * HOT optimize, should perhaps be factored out to its own header file * ************************************************************************ */ typedef enum { FT_HOT_NUM_STARTED = 0, // number of HOT operations that have begun FT_HOT_NUM_COMPLETED, // number of HOT operations that have successfully completed FT_HOT_NUM_ABORTED, // number of HOT operations that have been aborted FT_HOT_MAX_ROOT_FLUSH_COUNT, // max number of flushes from root ever required to optimize a tree FT_HOT_STATUS_NUM_ROWS } ft_hot_status_entry; typedef struct { bool initialized; TOKU_ENGINE_STATUS_ROW_S status[FT_HOT_STATUS_NUM_ROWS]; } FT_HOT_STATUS_S, *FT_HOT_STATUS; void toku_ft_hot_status_init(void) __attribute__((__constructor__)); void toku_ft_hot_get_status(FT_HOT_STATUS); /** * Takes given FT and pushes all pending messages to the leaf nodes. */ int toku_ft_hot_optimize(FT_HANDLE brt, int (*progress_callback)(void *extra, float progress), void *progress_extra); #endif // End of header guardian.