Subject: zoned vm counters: conversion of nr_dirty to per zone counter From: Christoph Lameter This makes nr_dirty a per zone counter. Looping over all processors is avoided during writeback state determination. The counter aggregation for nr_dirty had to be undone in the NFS layer since we summed up the page counts from multiple zones. Someone more familiar with NFS should probably review what I have done. Signed-off-by: Christoph Lameter Signed-off-by: Andrew Morton Index: linux-2.6.17-rc6-cl/arch/i386/mm/pgtable.c =================================================================== --- linux-2.6.17-rc6-cl.orig/arch/i386/mm/pgtable.c 2006-06-13 17:14:25.000611421 -0700 +++ linux-2.6.17-rc6-cl/arch/i386/mm/pgtable.c 2006-06-13 17:14:28.824593774 -0700 @@ -59,7 +59,7 @@ void show_mem(void) printk(KERN_INFO "%d pages swap cached\n", cached); get_page_state(&ps); - printk(KERN_INFO "%lu pages dirty\n", ps.nr_dirty); + printk(KERN_INFO "%lu pages dirty\n", global_page_state(NR_DIRTY)); printk(KERN_INFO "%lu pages writeback\n", ps.nr_writeback); printk(KERN_INFO "%lu pages mapped\n", global_page_state(NR_MAPPED)); printk(KERN_INFO "%lu pages slab\n", global_page_state(NR_SLAB)); Index: linux-2.6.17-rc6-cl/drivers/base/node.c =================================================================== --- linux-2.6.17-rc6-cl.orig/drivers/base/node.c 2006-06-13 17:14:05.953937307 -0700 +++ linux-2.6.17-rc6-cl/drivers/base/node.c 2006-06-13 17:14:28.825570276 -0700 @@ -50,8 +50,6 @@ static ssize_t node_read_meminfo(struct __get_zone_counts(&active, &inactive, &free, NODE_DATA(nid)); /* Check for negative values in these approximate counters */ - if ((long)ps.nr_dirty < 0) - ps.nr_dirty = 0; if ((long)ps.nr_writeback < 0) ps.nr_writeback = 0; @@ -81,7 +79,7 @@ static ssize_t node_read_meminfo(struct nid, K(i.freehigh), nid, K(i.totalram - i.totalhigh), nid, K(i.freeram - i.freehigh), - nid, K(ps.nr_dirty), + nid, K(node_page_state(nid, NR_DIRTY)), nid, K(ps.nr_writeback), nid, K(node_page_state(nid, NR_PAGECACHE)), nid, K(node_page_state(nid, NR_MAPPED)), Index: linux-2.6.17-rc6-cl/fs/buffer.c =================================================================== --- linux-2.6.17-rc6-cl.orig/fs/buffer.c 2006-06-12 12:42:47.348762564 -0700 +++ linux-2.6.17-rc6-cl/fs/buffer.c 2006-06-13 17:14:28.827523281 -0700 @@ -854,7 +854,7 @@ int __set_page_dirty_buffers(struct page write_lock_irq(&mapping->tree_lock); if (page->mapping) { /* Race with truncate? */ if (mapping_cap_account_dirty(mapping)) - inc_page_state(nr_dirty); + __inc_zone_page_state(page, NR_DIRTY); radix_tree_tag_set(&mapping->page_tree, page_index(page), PAGECACHE_TAG_DIRTY); Index: linux-2.6.17-rc6-cl/fs/fs-writeback.c =================================================================== --- linux-2.6.17-rc6-cl.orig/fs/fs-writeback.c 2006-06-12 12:42:47.502073390 -0700 +++ linux-2.6.17-rc6-cl/fs/fs-writeback.c 2006-06-13 17:14:28.828499783 -0700 @@ -472,7 +472,7 @@ void sync_inodes_sb(struct super_block * .range_start = 0, .range_end = LLONG_MAX, }; - unsigned long nr_dirty = read_page_state(nr_dirty); + unsigned long nr_dirty = global_page_state(NR_DIRTY); unsigned long nr_unstable = read_page_state(nr_unstable); wbc.nr_to_write = nr_dirty + nr_unstable + Index: linux-2.6.17-rc6-cl/fs/nfs/pagelist.c =================================================================== --- linux-2.6.17-rc6-cl.orig/fs/nfs/pagelist.c 2006-06-05 17:57:02.000000000 -0700 +++ linux-2.6.17-rc6-cl/fs/nfs/pagelist.c 2006-06-13 17:14:28.828499783 -0700 @@ -315,6 +315,7 @@ nfs_scan_lock_dirty(struct nfs_inode *nf req->wb_index, NFS_PAGE_TAG_DIRTY); nfs_list_remove_request(req); nfs_list_add_request(req, dst); + dec_zone_page_state(req->wb_page, NR_DIRTY); res++; } } Index: linux-2.6.17-rc6-cl/fs/nfs/write.c =================================================================== --- linux-2.6.17-rc6-cl.orig/fs/nfs/write.c 2006-06-12 12:42:48.111410682 -0700 +++ linux-2.6.17-rc6-cl/fs/nfs/write.c 2006-06-13 17:14:28.829476285 -0700 @@ -497,7 +497,7 @@ nfs_mark_request_dirty(struct nfs_page * nfs_list_add_request(req, &nfsi->dirty); nfsi->ndirty++; spin_unlock(&nfsi->req_lock); - inc_page_state(nr_dirty); + inc_zone_page_state(req->wb_page, NR_DIRTY); mark_inode_dirty(inode); } @@ -598,7 +598,6 @@ nfs_scan_dirty(struct inode *inode, stru if (nfsi->ndirty != 0) { res = nfs_scan_lock_dirty(nfsi, dst, idx_start, npages); nfsi->ndirty -= res; - sub_page_state(nr_dirty,res); if ((nfsi->ndirty == 0) != list_empty(&nfsi->dirty)) printk(KERN_ERR "NFS: desynchronized value of nfs_i.ndirty.\n"); } Index: linux-2.6.17-rc6-cl/fs/proc/proc_misc.c =================================================================== --- linux-2.6.17-rc6-cl.orig/fs/proc/proc_misc.c 2006-06-13 17:14:05.949054797 -0700 +++ linux-2.6.17-rc6-cl/fs/proc/proc_misc.c 2006-06-13 17:14:28.830452787 -0700 @@ -190,7 +190,7 @@ static int meminfo_read_proc(char *page, K(i.freeram-i.freehigh), K(i.totalswap), K(i.freeswap), - K(ps.nr_dirty), + K(global_page_state(NR_DIRTY)), K(ps.nr_writeback), K(global_page_state(NR_ANON)), K(global_page_state(NR_MAPPED)), Index: linux-2.6.17-rc6-cl/include/linux/mmzone.h =================================================================== --- linux-2.6.17-rc6-cl.orig/include/linux/mmzone.h 2006-06-13 17:14:05.950031299 -0700 +++ linux-2.6.17-rc6-cl/include/linux/mmzone.h 2006-06-13 17:14:28.831429289 -0700 @@ -53,6 +53,7 @@ enum zone_stat_item { NR_PAGECACHE, NR_SLAB, /* Pages used by slab allocator */ NR_PAGETABLE, /* used for pagetables */ + NR_DIRTY, NR_VM_ZONE_STAT_ITEMS }; struct per_cpu_pages { Index: linux-2.6.17-rc6-cl/mm/page_alloc.c =================================================================== --- linux-2.6.17-rc6-cl.orig/mm/page_alloc.c 2006-06-13 17:14:05.952960805 -0700 +++ linux-2.6.17-rc6-cl/mm/page_alloc.c 2006-06-13 17:14:28.833382294 -0700 @@ -1404,7 +1404,7 @@ void show_free_areas(void) "unstable:%lu free:%u slab:%lu mapped:%lu pagetables:%lu\n", active, inactive, - ps.nr_dirty, + global_page_state(NR_DIRTY), ps.nr_writeback, ps.nr_unstable, nr_free_pages(), Index: linux-2.6.17-rc6-cl/mm/page-writeback.c =================================================================== --- linux-2.6.17-rc6-cl.orig/mm/page-writeback.c 2006-06-13 17:13:02.930489551 -0700 +++ linux-2.6.17-rc6-cl/mm/page-writeback.c 2006-06-13 17:14:28.833382294 -0700 @@ -109,7 +109,7 @@ struct writeback_state static void get_writeback_state(struct writeback_state *wbs) { - wbs->nr_dirty = read_page_state(nr_dirty); + wbs->nr_dirty = global_page_state(NR_DIRTY); wbs->nr_unstable = read_page_state(nr_unstable); wbs->nr_mapped = global_page_state(NR_MAPPED) + global_page_state(NR_ANON); @@ -641,7 +641,7 @@ int __set_page_dirty_nobuffers(struct pa if (mapping2) { /* Race with truncate? */ BUG_ON(mapping2 != mapping); if (mapping_cap_account_dirty(mapping)) - inc_page_state(nr_dirty); + __inc_zone_page_state(page, NR_DIRTY); radix_tree_tag_set(&mapping->page_tree, page_index(page), PAGECACHE_TAG_DIRTY); } @@ -728,9 +728,9 @@ int test_clear_page_dirty(struct page *p radix_tree_tag_clear(&mapping->page_tree, page_index(page), PAGECACHE_TAG_DIRTY); - write_unlock_irqrestore(&mapping->tree_lock, flags); if (mapping_cap_account_dirty(mapping)) - dec_page_state(nr_dirty); + __dec_zone_page_state(page, NR_DIRTY); + write_unlock_irqrestore(&mapping->tree_lock, flags); return 1; } write_unlock_irqrestore(&mapping->tree_lock, flags); @@ -761,7 +761,7 @@ int clear_page_dirty_for_io(struct page if (mapping) { if (TestClearPageDirty(page)) { if (mapping_cap_account_dirty(mapping)) - dec_page_state(nr_dirty); + dec_zone_page_state(page, NR_DIRTY); return 1; } return 0; Index: linux-2.6.17-rc6-cl/mm/vmstat.c =================================================================== --- linux-2.6.17-rc6-cl.orig/mm/vmstat.c 2006-06-13 17:14:05.955890311 -0700 +++ linux-2.6.17-rc6-cl/mm/vmstat.c 2006-06-13 17:14:28.834358796 -0700 @@ -462,9 +462,9 @@ static char *vmstat_text[] = { "nr_pagecache", "nr_slab", "nr_page_table_pages", + "nr_dirty", /* Page state */ - "nr_dirty", "nr_writeback", "nr_unstable",