2005-12-16 06:31:24 +08:00
|
|
|
/* -*- mode: c; c-basic-offset: 8; -*-
|
|
|
|
* vim: noexpandtab sw=8 ts=8 sts=0:
|
|
|
|
*
|
|
|
|
* suballoc.h
|
|
|
|
*
|
|
|
|
* Defines sub allocator api
|
|
|
|
*
|
|
|
|
* Copyright (C) 2003, 2004 Oracle. All rights reserved.
|
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
* version 2 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public
|
|
|
|
* License along with this program; if not, write to the
|
|
|
|
* Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
|
|
* Boston, MA 02111-1307, USA.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef _CHAINALLOC_H_
|
|
|
|
#define _CHAINALLOC_H_
|
|
|
|
|
|
|
|
typedef int (group_search_t)(struct inode *,
|
|
|
|
struct buffer_head *,
|
2008-09-04 11:03:39 +08:00
|
|
|
u32, /* bits_wanted */
|
|
|
|
u32, /* min_bits */
|
|
|
|
u64, /* max_block */
|
|
|
|
u16 *, /* *bit_off */
|
|
|
|
u16 *); /* *bits_found */
|
2005-12-16 06:31:24 +08:00
|
|
|
|
|
|
|
struct ocfs2_alloc_context {
|
|
|
|
struct inode *ac_inode; /* which bitmap are we allocating from? */
|
|
|
|
struct buffer_head *ac_bh; /* file entry bh */
|
2008-03-03 17:12:30 +08:00
|
|
|
u32 ac_alloc_slot; /* which slot are we allocating from? */
|
2005-12-16 06:31:24 +08:00
|
|
|
u32 ac_bits_wanted;
|
|
|
|
u32 ac_bits_given;
|
|
|
|
#define OCFS2_AC_USE_LOCAL 1
|
|
|
|
#define OCFS2_AC_USE_MAIN 2
|
|
|
|
#define OCFS2_AC_USE_INODE 3
|
|
|
|
#define OCFS2_AC_USE_META 4
|
|
|
|
u32 ac_which;
|
|
|
|
|
|
|
|
/* these are used by the chain search */
|
|
|
|
u16 ac_chain;
|
|
|
|
int ac_allow_chain_relink;
|
|
|
|
group_search_t *ac_group_search;
|
2006-06-06 04:41:00 +08:00
|
|
|
|
|
|
|
u64 ac_last_group;
|
2008-09-04 11:03:39 +08:00
|
|
|
u64 ac_max_block; /* Highest block number to allocate. 0 is
|
|
|
|
is the same as ~0 - unlimited */
|
2005-12-16 06:31:24 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * Declaration only; the definition is not part of this header.
 * NOTE(review): by its name this releases an allocation context --
 * confirm ownership rules for ac against the implementation.
 */
void ocfs2_free_alloc_context(struct ocfs2_alloc_context *ac);
|
|
|
|
static inline int ocfs2_alloc_context_bits_left(struct ocfs2_alloc_context *ac)
|
|
|
|
{
|
|
|
|
return ac->ac_bits_wanted - ac->ac_bits_given;
|
|
|
|
}
|
|
|
|
|
2008-08-18 17:38:43 +08:00
|
|
|
/*
 * Please note that the caller must make sure that root_el is the root
 * of the extent tree. So for an inode, it should be &fe->id2.i_list.
 * Otherwise the result may be wrong.
 */
int ocfs2_reserve_new_metadata(struct ocfs2_super *osb,
			       struct ocfs2_extent_list *root_el,
			       struct ocfs2_alloc_context **ac);
|
2008-08-18 17:11:00 +08:00
|
|
|
/*
 * Metadata reservation that takes an explicit block count rather than
 * an extent list.  Declaration only -- the exact semantics of blocks
 * and of *ac on failure should be confirmed against the definition.
 */
int ocfs2_reserve_new_metadata_blocks(struct ocfs2_super *osb,
				      int blocks,
				      struct ocfs2_alloc_context **ac);
|
2005-12-16 06:31:24 +08:00
|
|
|
/*
 * Declaration only.  NOTE(review): by its name this sets up *ac for a
 * new inode allocation -- confirm against the definition.
 */
int ocfs2_reserve_new_inode(struct ocfs2_super *osb,
			    struct ocfs2_alloc_context **ac);
|
|
|
|
int ocfs2_reserve_clusters(struct ocfs2_super *osb,
|
|
|
|
u32 bits_wanted,
|
|
|
|
struct ocfs2_alloc_context **ac);
|
|
|
|
|
|
|
|
int ocfs2_claim_metadata(struct ocfs2_super *osb,
|
2006-10-10 09:11:45 +08:00
|
|
|
handle_t *handle,
|
2005-12-16 06:31:24 +08:00
|
|
|
struct ocfs2_alloc_context *ac,
|
|
|
|
u32 bits_wanted,
|
|
|
|
u16 *suballoc_bit_start,
|
|
|
|
u32 *num_bits,
|
|
|
|
u64 *blkno_start);
|
|
|
|
int ocfs2_claim_new_inode(struct ocfs2_super *osb,
|
2006-10-10 09:11:45 +08:00
|
|
|
handle_t *handle,
|
2005-12-16 06:31:24 +08:00
|
|
|
struct ocfs2_alloc_context *ac,
|
|
|
|
u16 *suballoc_bit,
|
|
|
|
u64 *fe_blkno);
|
|
|
|
int ocfs2_claim_clusters(struct ocfs2_super *osb,
|
2006-10-10 09:11:45 +08:00
|
|
|
handle_t *handle,
|
2005-12-16 06:31:24 +08:00
|
|
|
struct ocfs2_alloc_context *ac,
|
|
|
|
u32 min_clusters,
|
|
|
|
u32 *cluster_start,
|
|
|
|
u32 *num_clusters);
|
2007-09-17 11:10:16 +08:00
|
|
|
/*
|
|
|
|
* Use this variant of ocfs2_claim_clusters to specify a maxiumum
|
|
|
|
* number of clusters smaller than the allocation reserved.
|
|
|
|
*/
|
|
|
|
int __ocfs2_claim_clusters(struct ocfs2_super *osb,
|
|
|
|
handle_t *handle,
|
|
|
|
struct ocfs2_alloc_context *ac,
|
|
|
|
u32 min_clusters,
|
|
|
|
u32 max_clusters,
|
|
|
|
u32 *cluster_start,
|
|
|
|
u32 *num_clusters);
|
2005-12-16 06:31:24 +08:00
|
|
|
|
2007-06-23 06:45:27 +08:00
|
|
|
int ocfs2_free_suballoc_bits(handle_t *handle,
|
|
|
|
struct inode *alloc_inode,
|
|
|
|
struct buffer_head *alloc_bh,
|
|
|
|
unsigned int start_bit,
|
|
|
|
u64 bg_blkno,
|
|
|
|
unsigned int count);
|
2006-10-10 09:11:45 +08:00
|
|
|
/*
 * Declaration only.  NOTE(review): presumably returns the on-disk inode
 * di to the inode allocator given by inode_alloc_inode/inode_alloc_bh --
 * confirm against the definition.
 */
int ocfs2_free_dinode(handle_t *handle,
		      struct inode *inode_alloc_inode,
		      struct buffer_head *inode_alloc_bh,
		      struct ocfs2_dinode *di);
|
2006-10-10 09:11:45 +08:00
|
|
|
int ocfs2_free_clusters(handle_t *handle,
|
2005-12-16 06:31:24 +08:00
|
|
|
struct inode *bitmap_inode,
|
|
|
|
struct buffer_head *bitmap_bh,
|
|
|
|
u64 start_blk,
|
|
|
|
unsigned int num_clusters);
|
|
|
|
|
2007-06-23 06:45:27 +08:00
|
|
|
/*
 * Returns block minus bit, with bit widened to u64 first.
 * NOTE(review): presumably block is the block number of a suballocated
 * item and bit its bit offset within the group, making the result the
 * group descriptor's block number -- confirm with callers.
 */
static inline u64 ocfs2_which_suballoc_group(u64 block, unsigned int bit)
{
	return block - (u64) bit;
}
|
|
|
|
|
2005-12-16 06:31:24 +08:00
|
|
|
static inline u32 ocfs2_cluster_from_desc(struct ocfs2_super *osb,
|
|
|
|
u64 bg_blkno)
|
|
|
|
{
|
|
|
|
/* This should work for all block group descriptors as only
|
|
|
|
* the 1st group descriptor of the cluster bitmap is
|
|
|
|
* different. */
|
|
|
|
|
|
|
|
if (bg_blkno == osb->first_cluster_group_blkno)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
/* the rest of the block groups are located at the beginning
|
|
|
|
* of their 1st cluster, so a direct translation just
|
|
|
|
* works. */
|
|
|
|
return ocfs2_blocks_to_clusters(osb->sb, bg_blkno);
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline int ocfs2_is_cluster_bitmap(struct inode *inode)
|
|
|
|
{
|
|
|
|
struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
|
|
|
|
return osb->bitmap_blkno == OCFS2_I(inode)->ip_blkno;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* This is for local alloc ONLY. Others should use the task-specific
 * apis above. */
int ocfs2_reserve_cluster_bitmap_bits(struct ocfs2_super *osb,
				      struct ocfs2_alloc_context *ac);
|
ocfs2: throttle back local alloc when low on disk space
Ocfs2's local allocator disables itself for the duration of a mount point
when it has trouble allocating a large enough area from the primary bitmap.
That can cause performance problems, especially for disks which were only
temporarily full or fragmented. This patch allows for the allocator to
shrink its window first, before being disabled. Later, it can also be
re-enabled so that any performance drop is minimized.
To do this, we allow the value of osb->local_alloc_bits to be shrunk when
needed. The default value is recorded in a mostly read-only variable so that
we can re-initialize when required.
Locking had to be updated so that we could protect changes to
local_alloc_bits. Mostly this involves protecting various local alloc values
with the osb spinlock. A new state is also added, OCFS2_LA_THROTTLED, which
is used when the local allocator has shrunk, but is not disabled. If the
available space dips below 1 megabyte, the local alloc file is disabled. In
either case, local alloc is re-enabled 30 seconds after the event, or when
an appropriate amount of bits is seen in the primary bitmap.
Signed-off-by: Mark Fasheh <mfasheh@suse.com>
2008-07-29 09:02:53 +08:00
|
|
|
/*
 * Declaration only; the definition is not part of this header.
 * NOTE(review): by its name this releases what ac holds rather than ac
 * itself -- confirm against the implementation.
 */
void ocfs2_free_ac_resource(struct ocfs2_alloc_context *ac);
|
2005-12-16 06:31:24 +08:00
|
|
|
|
2007-12-18 15:47:03 +08:00
|
|
|
/* given a cluster offset, calculate which block group it belongs to
|
|
|
|
* and return that block offset. */
|
|
|
|
u64 ocfs2_which_cluster_group(struct inode *inode, u32 cluster);
|
|
|
|
|
2008-11-14 06:49:13 +08:00
|
|
|
/*
 * By default, ocfs2_validate_group_descriptor() calls ocfs2_error() when it
 * finds a problem.  A caller that wants to check a group descriptor
 * without going readonly passes a nonzero clean_error.  This is only
 * resize, really.  Everyone else should be using
 * ocfs2_read_group_descriptor().
 */
int ocfs2_validate_group_descriptor(struct super_block *sb,
				    struct ocfs2_dinode *di,
				    struct buffer_head *bh,
				    int clean_error);
|
2008-11-14 06:49:14 +08:00
|
|
|
/*
|
|
|
|
* Read a group descriptor block into *bh. If *bh is NULL, a bh will be
|
|
|
|
* allocated. This is a cached read. The descriptor will be validated with
|
|
|
|
* ocfs2_validate_group_descriptor().
|
|
|
|
*/
|
|
|
|
int ocfs2_read_group_descriptor(struct inode *inode, struct ocfs2_dinode *di,
|
|
|
|
u64 gd_blkno, struct buffer_head **bh);
|
2008-11-14 06:49:13 +08:00
|
|
|
|
2008-08-21 10:36:33 +08:00
|
|
|
/*
 * Declaration only.  Takes an extent tree, the number of clusters to
 * add and extents to split, and two allocation-context out-pointers.
 * NOTE(review): presumably fills *data_ac and *meta_ac with the
 * contexts needed for that change -- confirm, including whether either
 * may be left NULL, against the definition.
 */
int ocfs2_lock_allocators(struct inode *inode, struct ocfs2_extent_tree *et,
			  u32 clusters_to_add, u32 extents_to_split,
			  struct ocfs2_alloc_context **data_ac,
			  struct ocfs2_alloc_context **meta_ac);
|
2005-12-16 06:31:24 +08:00
|
|
|
#endif /* _CHAINALLOC_H_ */
|