From 328f263a571c5561f933b89152984a263145f7e8 Mon Sep 17 00:00:00 2001 From: Christoph Lameter Date: Wed, 25 Jul 2007 20:39:08 -0700 Subject: [PATCH] Large page order operations, zeroing and flushing We may have to zero and flush higher order pages. Implement clear_mapping_page and flush_mapping_page to do that job. Replace the flushing and clearing at some key locations for the pagecache. In some places it is necessary to determine the page order in use from the page struct since no mapping is available. Add a series of page_cache_page_xx functions: page_cache_head(page) -> Determine head page from a tail page page_cache_base_pages(page) -> Number of base pages of a page page_cache_page_order(page) -> Determine page order of a page page_cache_page_size(page) -> Determine page size of a page page_cache_page_shift(page) -> Determine page shift of a page Signed-off-by: Christoph Lameter --- fs/libfs.c | 4 +-- include/linux/highmem.h | 5 ++-- include/linux/pagemap.h | 54 +++++++++++++++++++++++++++++++++++++++++++++++- mm/filemap.c | 8 +++---- mm/filemap_xip.c | 4 +-- 5 files changed, 64 insertions(+), 11 deletions(-) Index: mm/include/linux/pagemap.h =================================================================== --- mm.orig/include/linux/pagemap.h 2007-11-28 14:10:28.745227175 -0800 +++ mm/include/linux/pagemap.h 2007-11-28 14:15:15.441727161 -0800 @@ -91,6 +91,31 @@ static inline unsigned int page_cache_of return pos & ~PAGE_MASK; } +static inline struct page *page_cache_head(struct page *page) +{ + return page; +} + +static inline int page_cache_base_pages(struct page *page) +{ + return 1; +} + +static inline unsigned long page_cache_page_order(struct page *page) +{ + return 0; +} + +static inline unsigned long page_cache_page_size(struct page *page) +{ + return PAGE_SIZE; +} + +static inline unsigned long page_cache_page_shift(struct page *page) +{ + return PAGE_SHIFT; +} + static inline pgoff_t page_cache_index(struct address_space *a, loff_t pos) { @@
-330,4 +355,31 @@ static inline int fault_in_pages_readabl return ret; } -#endif /* _LINUX_PAGEMAP_H */ +/* + * Clear a higher order page + */ +static inline void clear_mapping_page(struct page *page) +{ + int nr_pages = page_cache_base_pages(page); + int i; + + for (i = 0; i < nr_pages; i++) + clear_highpage(page + i); +} + +/* + * Primitive support for flushing higher order pages. + * + * A bit stupid: On many platforms flushing the first page + * will flush any TLB starting there + */ +static inline void flush_mapping_page(struct page *page) +{ + int nr_pages = page_cache_base_pages(page); + int i; + + for (i = 0; i < nr_pages; i++) + flush_dcache_page(page + i); +} + + Index: mm/fs/libfs.c =================================================================== --- mm.orig/fs/libfs.c 2007-11-28 14:10:51.773477763 -0800 +++ mm/fs/libfs.c 2007-11-28 14:15:15.441727161 -0800 @@ -331,8 +331,8 @@ int simple_rename(struct inode *old_dir, int simple_readpage(struct file *file, struct page *page) { - clear_highpage(page); - flush_dcache_page(page); + clear_mapping_page(page); + flush_mapping_page(page); SetPageUptodate(page); unlock_page(page); return 0; Index: mm/mm/filemap.c =================================================================== --- mm.orig/mm/filemap.c 2007-11-28 14:10:29.408977142 -0800 +++ mm/mm/filemap.c 2007-11-28 14:15:15.441727161 -0800 @@ -960,7 +960,7 @@ page_ok: * before reading the page on the kernel side. 
*/ if (mapping_writably_mapped(mapping)) - flush_dcache_page(page); + flush_mapping_page(page); /* * When a sequential read accesses a page several times, @@ -1948,7 +1948,7 @@ int pagecache_write_end(struct file *fil unsigned offset = page_cache_offset(mapping, pos); struct inode *inode = mapping->host; - flush_dcache_page(page); + flush_mapping_page(page); ret = aops->commit_write(file, page, offset, offset+len); unlock_page(page); mark_page_accessed(page); @@ -2161,7 +2161,7 @@ static ssize_t generic_perform_write_2co kunmap_atomic(src, KM_USER0); copied = bytes; } - flush_dcache_page(page); + flush_mapping_page(page); status = a_ops->commit_write(file, page, offset, offset+bytes); if (unlikely(status < 0)) @@ -2256,7 +2256,7 @@ again: pagefault_disable(); copied = iov_iter_copy_from_user_atomic(page, i, offset, bytes); pagefault_enable(); - flush_dcache_page(page); + flush_mapping_page(page); status = a_ops->write_end(file, mapping, pos, bytes, copied, page, fsdata); Index: mm/mm/filemap_xip.c =================================================================== --- mm.orig/mm/filemap_xip.c 2007-11-28 14:10:46.124978450 -0800 +++ mm/mm/filemap_xip.c 2007-11-28 14:15:15.441727161 -0800 @@ -103,7 +103,7 @@ do_xip_mapping_read(struct address_space * before reading the page on the kernel side. */ if (mapping_writably_mapped(mapping)) - flush_dcache_page(page); + flush_mapping_page(page); /* * Ok, we have the page, so now we can copy it to user space... 
@@ -316,7 +316,7 @@ __xip_file_write(struct file *filp, cons copied = bytes - __copy_from_user_inatomic_nocache(kaddr, buf, bytes); kunmap_atomic(kaddr, KM_USER0); - flush_dcache_page(page); + flush_mapping_page(page); if (likely(copied > 0)) { status = copied; Index: mm/include/linux/highmem.h =================================================================== --- mm.orig/include/linux/highmem.h 2007-11-28 12:26:49.652967040 -0800 +++ mm/include/linux/highmem.h 2007-11-28 14:15:15.441727161 -0800 @@ -130,7 +130,8 @@ static inline void zero_user_segments(st { void *kaddr = kmap_atomic(page, KM_USER0); - BUG_ON(end1 > PAGE_SIZE || end2 > PAGE_SIZE); + BUG_ON(end1 > page_cache_page_size(page) || + end2 > page_cache_page_size(page)); if (end1 > start1) memset(kaddr + start1, 0, end1 - start1); @@ -139,7 +140,7 @@ static inline void zero_user_segments(st memset(kaddr + start2, 0, end2 - start2); kunmap_atomic(kaddr, KM_USER0); - flush_dcache_page(page); + flush_mapping_page(page); } static inline void zero_user_segment(struct page *page,