[PATCH] per-task-delay-accounting: sync block I/O and swapin delay collection
Unlike earlier iterations of the delay accounting patches, now delays are only collected for the actual I/O waits rather than try and cover the delays seen in I/O submission paths. Account separately for block I/O delays incurred as a result of swapin page faults whose frequency can be affected by the task/process' rss limit. Hence swapin delays can act as feedback for rss limit changes independent of I/O priority changes. Signed-off-by: Shailabh Nagar <nagar@watson.ibm.com> Signed-off-by: Balbir Singh <balbir@in.ibm.com> Cc: Jes Sorensen <jes@sgi.com> Cc: Peter Chubb <peterc@gelato.unsw.edu.au> Cc: Erich Focht <efocht@ess.nec.de> Cc: Levent Serinol <lserinol@gmail.com> Cc: Jay Lan <jlan@engr.sgi.com> Signed-off-by: Andrew Morton <akpm@osdl.org> Signed-off-by: Linus Torvalds <torvalds@osdl.org>
This commit is contained in:
parent
ca74e92b46
commit
0ff922452d
@ -19,6 +19,13 @@
|
|||||||
|
|
||||||
#include <linux/sched.h>
|
#include <linux/sched.h>
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Per-task flags relevant to delay accounting
|
||||||
|
* maintained privately to avoid exhausting similar flags in sched.h:PF_*
|
||||||
|
* Used to set current->delays->flags
|
||||||
|
*/
|
||||||
|
#define DELAYACCT_PF_SWAPIN 0x00000001 /* I am doing a swapin */
|
||||||
|
|
||||||
#ifdef CONFIG_TASK_DELAY_ACCT
|
#ifdef CONFIG_TASK_DELAY_ACCT
|
||||||
|
|
||||||
extern int delayacct_on; /* Delay accounting turned on/off */
|
extern int delayacct_on; /* Delay accounting turned on/off */
|
||||||
@ -26,6 +33,8 @@ extern kmem_cache_t *delayacct_cache;
|
|||||||
extern void delayacct_init(void);
|
extern void delayacct_init(void);
|
||||||
extern void __delayacct_tsk_init(struct task_struct *);
|
extern void __delayacct_tsk_init(struct task_struct *);
|
||||||
extern void __delayacct_tsk_exit(struct task_struct *);
|
extern void __delayacct_tsk_exit(struct task_struct *);
|
||||||
|
extern void __delayacct_blkio_start(void);
|
||||||
|
extern void __delayacct_blkio_end(void);
|
||||||
|
|
||||||
static inline void delayacct_set_flag(int flag)
|
static inline void delayacct_set_flag(int flag)
|
||||||
{
|
{
|
||||||
@ -53,6 +62,18 @@ static inline void delayacct_tsk_exit(struct task_struct *tsk)
|
|||||||
__delayacct_tsk_exit(tsk);
|
__delayacct_tsk_exit(tsk);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static inline void delayacct_blkio_start(void)
|
||||||
|
{
|
||||||
|
if (current->delays)
|
||||||
|
__delayacct_blkio_start();
|
||||||
|
}
|
||||||
|
|
||||||
|
static inline void delayacct_blkio_end(void)
|
||||||
|
{
|
||||||
|
if (current->delays)
|
||||||
|
__delayacct_blkio_end();
|
||||||
|
}
|
||||||
|
|
||||||
#else
|
#else
|
||||||
static inline void delayacct_set_flag(int flag)
|
static inline void delayacct_set_flag(int flag)
|
||||||
{}
|
{}
|
||||||
@ -64,6 +85,10 @@ static inline void delayacct_tsk_init(struct task_struct *tsk)
|
|||||||
{}
|
{}
|
||||||
static inline void delayacct_tsk_exit(struct task_struct *tsk)
|
static inline void delayacct_tsk_exit(struct task_struct *tsk)
|
||||||
{}
|
{}
|
||||||
|
static inline void delayacct_blkio_start(void)
|
||||||
|
{}
|
||||||
|
static inline void delayacct_blkio_end(void)
|
||||||
|
{}
|
||||||
#endif /* CONFIG_TASK_DELAY_ACCT */
|
#endif /* CONFIG_TASK_DELAY_ACCT */
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
@ -566,6 +566,19 @@ struct task_delay_info {
|
|||||||
* Atomicity of updates to XXX_delay, XXX_count protected by
|
* Atomicity of updates to XXX_delay, XXX_count protected by
|
||||||
* single lock above (split into XXX_lock if contention is an issue).
|
* single lock above (split into XXX_lock if contention is an issue).
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
/*
|
||||||
|
* XXX_count is incremented on every XXX operation, the delay
|
||||||
|
* associated with the operation is added to XXX_delay.
|
||||||
|
* XXX_delay contains the accumulated delay time in nanoseconds.
|
||||||
|
*/
|
||||||
|
struct timespec blkio_start, blkio_end; /* Shared by blkio, swapin */
|
||||||
|
u64 blkio_delay; /* wait for sync block io completion */
|
||||||
|
u64 swapin_delay; /* wait for swapin block io completion */
|
||||||
|
u32 blkio_count; /* total count of the number of sync block */
|
||||||
|
/* io operations performed */
|
||||||
|
u32 swapin_count; /* total count of the number of swapin block */
|
||||||
|
/* io operations performed */
|
||||||
};
|
};
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
@ -85,3 +85,22 @@ static void delayacct_end(struct timespec *start, struct timespec *end,
|
|||||||
spin_unlock(¤t->delays->lock);
|
spin_unlock(¤t->delays->lock);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
void __delayacct_blkio_start(void)
|
||||||
|
{
|
||||||
|
delayacct_start(¤t->delays->blkio_start);
|
||||||
|
}
|
||||||
|
|
||||||
|
void __delayacct_blkio_end(void)
|
||||||
|
{
|
||||||
|
if (current->delays->flags & DELAYACCT_PF_SWAPIN)
|
||||||
|
/* Swapin block I/O */
|
||||||
|
delayacct_end(¤t->delays->blkio_start,
|
||||||
|
¤t->delays->blkio_end,
|
||||||
|
¤t->delays->swapin_delay,
|
||||||
|
¤t->delays->swapin_count);
|
||||||
|
else /* Other block I/O */
|
||||||
|
delayacct_end(¤t->delays->blkio_start,
|
||||||
|
¤t->delays->blkio_end,
|
||||||
|
¤t->delays->blkio_delay,
|
||||||
|
¤t->delays->blkio_count);
|
||||||
|
}
|
||||||
|
@ -51,6 +51,7 @@
|
|||||||
#include <linux/times.h>
|
#include <linux/times.h>
|
||||||
#include <linux/acct.h>
|
#include <linux/acct.h>
|
||||||
#include <linux/kprobes.h>
|
#include <linux/kprobes.h>
|
||||||
|
#include <linux/delayacct.h>
|
||||||
#include <asm/tlb.h>
|
#include <asm/tlb.h>
|
||||||
|
|
||||||
#include <asm/unistd.h>
|
#include <asm/unistd.h>
|
||||||
@ -4534,9 +4535,11 @@ void __sched io_schedule(void)
|
|||||||
{
|
{
|
||||||
struct rq *rq = &__raw_get_cpu_var(runqueues);
|
struct rq *rq = &__raw_get_cpu_var(runqueues);
|
||||||
|
|
||||||
|
delayacct_blkio_start();
|
||||||
atomic_inc(&rq->nr_iowait);
|
atomic_inc(&rq->nr_iowait);
|
||||||
schedule();
|
schedule();
|
||||||
atomic_dec(&rq->nr_iowait);
|
atomic_dec(&rq->nr_iowait);
|
||||||
|
delayacct_blkio_end();
|
||||||
}
|
}
|
||||||
EXPORT_SYMBOL(io_schedule);
|
EXPORT_SYMBOL(io_schedule);
|
||||||
|
|
||||||
@ -4545,9 +4548,11 @@ long __sched io_schedule_timeout(long timeout)
|
|||||||
struct rq *rq = &__raw_get_cpu_var(runqueues);
|
struct rq *rq = &__raw_get_cpu_var(runqueues);
|
||||||
long ret;
|
long ret;
|
||||||
|
|
||||||
|
delayacct_blkio_start();
|
||||||
atomic_inc(&rq->nr_iowait);
|
atomic_inc(&rq->nr_iowait);
|
||||||
ret = schedule_timeout(timeout);
|
ret = schedule_timeout(timeout);
|
||||||
atomic_dec(&rq->nr_iowait);
|
atomic_dec(&rq->nr_iowait);
|
||||||
|
delayacct_blkio_end();
|
||||||
return ret;
|
return ret;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -47,6 +47,7 @@
|
|||||||
#include <linux/pagemap.h>
|
#include <linux/pagemap.h>
|
||||||
#include <linux/rmap.h>
|
#include <linux/rmap.h>
|
||||||
#include <linux/module.h>
|
#include <linux/module.h>
|
||||||
|
#include <linux/delayacct.h>
|
||||||
#include <linux/init.h>
|
#include <linux/init.h>
|
||||||
|
|
||||||
#include <asm/pgalloc.h>
|
#include <asm/pgalloc.h>
|
||||||
@ -1934,6 +1935,7 @@ static int do_swap_page(struct mm_struct *mm, struct vm_area_struct *vma,
|
|||||||
migration_entry_wait(mm, pmd, address);
|
migration_entry_wait(mm, pmd, address);
|
||||||
goto out;
|
goto out;
|
||||||
}
|
}
|
||||||
|
delayacct_set_flag(DELAYACCT_PF_SWAPIN);
|
||||||
page = lookup_swap_cache(entry);
|
page = lookup_swap_cache(entry);
|
||||||
if (!page) {
|
if (!page) {
|
||||||
swapin_readahead(entry, address, vma);
|
swapin_readahead(entry, address, vma);
|
||||||
@ -1946,6 +1948,7 @@ static int do_swap_page(struct mm_struct *mm, struct vm_area_struct *vma,
|
|||||||
page_table = pte_offset_map_lock(mm, pmd, address, &ptl);
|
page_table = pte_offset_map_lock(mm, pmd, address, &ptl);
|
||||||
if (likely(pte_same(*page_table, orig_pte)))
|
if (likely(pte_same(*page_table, orig_pte)))
|
||||||
ret = VM_FAULT_OOM;
|
ret = VM_FAULT_OOM;
|
||||||
|
delayacct_clear_flag(DELAYACCT_PF_SWAPIN);
|
||||||
goto unlock;
|
goto unlock;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -1955,6 +1958,7 @@ static int do_swap_page(struct mm_struct *mm, struct vm_area_struct *vma,
|
|||||||
grab_swap_token();
|
grab_swap_token();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
delayacct_clear_flag(DELAYACCT_PF_SWAPIN);
|
||||||
mark_page_accessed(page);
|
mark_page_accessed(page);
|
||||||
lock_page(page);
|
lock_page(page);
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user