blob: 1332adc0b9fae2b8ede59c9b30d2dcffe9d6a366 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
Dave Kleikamp7fab4792005-05-02 12:25:02 -06002 * Copyright (C) International Business Machines Corp., 2000-2005
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 * Portions Copyright (C) Christoph Hellwig, 2001-2002
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
Dave Kleikamp63f83c92006-10-02 09:55:27 -05007 * the Free Software Foundation; either version 2 of the License, or
Linus Torvalds1da177e2005-04-16 15:20:36 -07008 * (at your option) any later version.
Dave Kleikamp63f83c92006-10-02 09:55:27 -05009 *
Linus Torvalds1da177e2005-04-16 15:20:36 -070010 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
13 * the GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License
Dave Kleikamp63f83c92006-10-02 09:55:27 -050016 * along with this program; if not, write to the Free Software
Linus Torvalds1da177e2005-04-16 15:20:36 -070017 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
18 */
19
20#include <linux/fs.h>
Dave Kleikamp7fab4792005-05-02 12:25:02 -060021#include <linux/mm.h>
22#include <linux/bio.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070023#include <linux/init.h>
24#include <linux/buffer_head.h>
25#include <linux/mempool.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070026#include "jfs_incore.h"
27#include "jfs_superblock.h"
28#include "jfs_filsys.h"
29#include "jfs_metapage.h"
30#include "jfs_txnmgr.h"
31#include "jfs_debug.h"
32
#ifdef CONFIG_JFS_STATISTICS
/* Event counters for the metapage layer, reported by jfs_mpstat_read() */
static struct {
	uint pagealloc;		/* metapage structures allocated */
	uint pagefree;		/* metapage structures freed */
	uint lockwait;		/* lock_metapage() calls that had to sleep */
} mpStat;
#endif
40
/* Non-zero while the META_locked bit of the metapage is set */
#define metapage_locked(mp) test_bit(META_locked, &(mp)->flag)
/*
 * Try to take the metapage lock bit.  Evaluates to the previous value of
 * the bit, so a non-zero result means the lock was NOT obtained.
 */
#define trylock_metapage(mp) test_and_set_bit(META_locked, &(mp)->flag)
Linus Torvalds1da177e2005-04-16 15:20:36 -070043
44static inline void unlock_metapage(struct metapage *mp)
45{
46 clear_bit(META_locked, &mp->flag);
47 wake_up(&mp->wait);
48}
49
Dave Kleikamp7fab4792005-05-02 12:25:02 -060050static inline void __lock_metapage(struct metapage *mp)
Linus Torvalds1da177e2005-04-16 15:20:36 -070051{
52 DECLARE_WAITQUEUE(wait, current);
Linus Torvalds1da177e2005-04-16 15:20:36 -070053 INCREMENT(mpStat.lockwait);
Linus Torvalds1da177e2005-04-16 15:20:36 -070054 add_wait_queue_exclusive(&mp->wait, &wait);
55 do {
56 set_current_state(TASK_UNINTERRUPTIBLE);
57 if (metapage_locked(mp)) {
Dave Kleikamp7fab4792005-05-02 12:25:02 -060058 unlock_page(mp->page);
Dave Kleikamp4aa0d232007-01-17 21:18:35 -060059 io_schedule();
Dave Kleikamp7fab4792005-05-02 12:25:02 -060060 lock_page(mp->page);
Linus Torvalds1da177e2005-04-16 15:20:36 -070061 }
62 } while (trylock_metapage(mp));
63 __set_current_state(TASK_RUNNING);
64 remove_wait_queue(&mp->wait, &wait);
65}
66
/*
 * Take the metapage lock, sleeping in __lock_metapage() if it is contended.
 * The caller must hold the page lock on mp->page.
 */
static inline void lock_metapage(struct metapage *mp)
{
	if (!trylock_metapage(mp))
		return;		/* uncontended: lock bit is now ours */
	__lock_metapage(mp);
}
75
76#define METAPOOL_MIN_PAGES 32
Christoph Lametere18b8902006-12-06 20:33:20 -080077static struct kmem_cache *metapage_cache;
Linus Torvalds1da177e2005-04-16 15:20:36 -070078static mempool_t *metapage_mempool;
79
Dave Kleikamp7fab4792005-05-02 12:25:02 -060080#define MPS_PER_PAGE (PAGE_CACHE_SIZE >> L2PSIZE)
81
82#if MPS_PER_PAGE > 1
83
84struct meta_anchor {
85 int mp_count;
86 atomic_t io_count;
87 struct metapage *mp[MPS_PER_PAGE];
88};
Hugh Dickins4c21e2f2005-10-29 18:16:40 -070089#define mp_anchor(page) ((struct meta_anchor *)page_private(page))
Dave Kleikamp7fab4792005-05-02 12:25:02 -060090
91static inline struct metapage *page_to_mp(struct page *page, uint offset)
92{
93 if (!PagePrivate(page))
94 return NULL;
95 return mp_anchor(page)->mp[offset >> L2PSIZE];
96}
97
98static inline int insert_metapage(struct page *page, struct metapage *mp)
99{
100 struct meta_anchor *a;
101 int index;
102 int l2mp_blocks; /* log2 blocks per metapage */
103
104 if (PagePrivate(page))
105 a = mp_anchor(page);
106 else {
Eric Sesterhenn5b3030e2006-02-23 09:47:13 -0600107 a = kzalloc(sizeof(struct meta_anchor), GFP_NOFS);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600108 if (!a)
109 return -ENOMEM;
Hugh Dickins4c21e2f2005-10-29 18:16:40 -0700110 set_page_private(page, (unsigned long)a);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600111 SetPagePrivate(page);
112 kmap(page);
113 }
114
115 if (mp) {
116 l2mp_blocks = L2PSIZE - page->mapping->host->i_blkbits;
117 index = (mp->index >> l2mp_blocks) & (MPS_PER_PAGE - 1);
118 a->mp_count++;
119 a->mp[index] = mp;
120 }
121
122 return 0;
123}
124
125static inline void remove_metapage(struct page *page, struct metapage *mp)
126{
127 struct meta_anchor *a = mp_anchor(page);
128 int l2mp_blocks = L2PSIZE - page->mapping->host->i_blkbits;
129 int index;
130
131 index = (mp->index >> l2mp_blocks) & (MPS_PER_PAGE - 1);
132
133 BUG_ON(a->mp[index] != mp);
134
135 a->mp[index] = NULL;
136 if (--a->mp_count == 0) {
137 kfree(a);
Hugh Dickins4c21e2f2005-10-29 18:16:40 -0700138 set_page_private(page, 0);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600139 ClearPagePrivate(page);
140 kunmap(page);
141 }
142}
143
144static inline void inc_io(struct page *page)
145{
146 atomic_inc(&mp_anchor(page)->io_count);
147}
148
149static inline void dec_io(struct page *page, void (*handler) (struct page *))
150{
151 if (atomic_dec_and_test(&mp_anchor(page)->io_count))
152 handler(page);
153}
154
155#else
156static inline struct metapage *page_to_mp(struct page *page, uint offset)
157{
Hugh Dickins4c21e2f2005-10-29 18:16:40 -0700158 return PagePrivate(page) ? (struct metapage *)page_private(page) : NULL;
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600159}
160
/*
 * Attach @mp to @page by storing it in page_private().
 * A NULL @mp is a no-op.  Always returns 0.
 */
static inline int insert_metapage(struct page *page, struct metapage *mp)
{
	if (!mp)
		return 0;

	set_page_private(page, (unsigned long)mp);
	SetPagePrivate(page);
	/* paired with the kunmap() in remove_metapage() */
	kmap(page);
	return 0;
}
170
/*
 * Detach the metapage from @page: clear the private pointer and flag and
 * drop the kernel mapping.  @mp is unused in this configuration.
 */
static inline void remove_metapage(struct page *page, struct metapage *mp)
{
	set_page_private(page, 0);
	ClearPagePrivate(page);
	kunmap(page);
}
177
/*
 * One metapage per page: no I/O counting is done, so the completion
 * handler is invoked directly on every dec_io().
 */
#define inc_io(page) do {} while(0)
#define dec_io(page, handler) handler(page)
180
181#endif
182
Christoph Lametere18b8902006-12-06 20:33:20 -0800183static void init_once(void *foo, struct kmem_cache *cachep, unsigned long flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184{
185 struct metapage *mp = (struct metapage *)foo;
186
Christoph Lametera35afb82007-05-16 22:10:57 -0700187 mp->lid = 0;
188 mp->lsn = 0;
189 mp->flag = 0;
190 mp->data = NULL;
191 mp->clsn = 0;
192 mp->log = NULL;
193 set_bit(META_free, &mp->flag);
194 init_waitqueue_head(&mp->wait);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700195}
196
Al Viro27496a82005-10-21 03:20:48 -0400197static inline struct metapage *alloc_metapage(gfp_t gfp_mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700198{
199 return mempool_alloc(metapage_mempool, gfp_mask);
200}
201
202static inline void free_metapage(struct metapage *mp)
203{
204 mp->flag = 0;
205 set_bit(META_free, &mp->flag);
206
207 mempool_free(mp, metapage_mempool);
208}
209
210int __init metapage_init(void)
211{
212 /*
213 * Allocate the metapage structures
214 */
215 metapage_cache = kmem_cache_create("jfs_mp", sizeof(struct metapage),
Paul Mundt20c2df82007-07-20 10:11:58 +0900216 0, 0, init_once);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217 if (metapage_cache == NULL)
218 return -ENOMEM;
219
Matthew Dobson93d23412006-03-26 01:37:50 -0800220 metapage_mempool = mempool_create_slab_pool(METAPOOL_MIN_PAGES,
221 metapage_cache);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700222
223 if (metapage_mempool == NULL) {
224 kmem_cache_destroy(metapage_cache);
225 return -ENOMEM;
226 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227
228 return 0;
229}
230
231void metapage_exit(void)
232{
233 mempool_destroy(metapage_mempool);
234 kmem_cache_destroy(metapage_cache);
235}
236
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600237static inline void drop_metapage(struct page *page, struct metapage *mp)
238{
239 if (mp->count || mp->nohomeok || test_bit(META_dirty, &mp->flag) ||
240 test_bit(META_io, &mp->flag))
241 return;
242 remove_metapage(page, mp);
243 INCREMENT(mpStat.pagefree);
244 free_metapage(mp);
245}
246
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247/*
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600248 * Metapage address space operations
Linus Torvalds1da177e2005-04-16 15:20:36 -0700249 */
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600250
251static sector_t metapage_get_blocks(struct inode *inode, sector_t lblock,
252 unsigned int *len)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253{
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600254 int rc = 0;
255 int xflag;
256 s64 xaddr;
Theodore Ts'oba52de12006-09-27 01:50:49 -0700257 sector_t file_blocks = (inode->i_size + inode->i_sb->s_blocksize - 1) >>
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600258 inode->i_blkbits;
259
260 if (lblock >= file_blocks)
261 return 0;
262 if (lblock + *len > file_blocks)
263 *len = file_blocks - lblock;
264
265 if (inode->i_ino) {
266 rc = xtLookup(inode, (s64)lblock, *len, &xflag, &xaddr, len, 0);
267 if ((rc == 0) && *len)
268 lblock = (sector_t)xaddr;
269 else
270 lblock = 0;
271 } /* else no mapping */
272
273 return lblock;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274}
275
/*
 * Called once all read I/O on @page has finished: mark the page up to date
 * unless an error was recorded, then unlock it.
 */
static void last_read_complete(struct page *page)
{
	int failed = PageError(page);

	if (!failed)
		SetPageUptodate(page);
	unlock_page(page);
}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700282
NeilBrown6712ecf2007-09-27 12:47:43 +0200283static void metapage_read_end_io(struct bio *bio, int err)
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600284{
285 struct page *page = bio->bi_private;
286
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600287 if (!test_bit(BIO_UPTODATE, &bio->bi_flags)) {
288 printk(KERN_ERR "metapage_read_end_io: I/O error\n");
289 SetPageError(page);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290 }
291
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600292 dec_io(page, last_read_complete);
293 bio_put(bio);
294
295 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700296}
297
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600298static void remove_from_logsync(struct metapage *mp)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700299{
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600300 struct jfs_log *log = mp->log;
301 unsigned long flags;
302/*
303 * This can race. Recheck that log hasn't been set to null, and after
304 * acquiring logsync lock, recheck lsn
305 */
306 if (!log)
307 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700308
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600309 LOGSYNC_LOCK(log, flags);
310 if (mp->lsn) {
311 mp->log = NULL;
312 mp->lsn = 0;
313 mp->clsn = 0;
314 log->count--;
315 list_del(&mp->synclist);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700316 }
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600317 LOGSYNC_UNLOCK(log, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700318}
319
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600320static void last_write_complete(struct page *page)
321{
322 struct metapage *mp;
323 unsigned int offset;
324
325 for (offset = 0; offset < PAGE_CACHE_SIZE; offset += PSIZE) {
326 mp = page_to_mp(page, offset);
327 if (mp && test_bit(META_io, &mp->flag)) {
328 if (mp->lsn)
329 remove_from_logsync(mp);
330 clear_bit(META_io, &mp->flag);
331 }
332 /*
333 * I'd like to call drop_metapage here, but I don't think it's
334 * safe unless I have the page locked
335 */
336 }
337 end_page_writeback(page);
338}
339
NeilBrown6712ecf2007-09-27 12:47:43 +0200340static void metapage_write_end_io(struct bio *bio, int err)
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600341{
342 struct page *page = bio->bi_private;
343
344 BUG_ON(!PagePrivate(page));
345
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600346 if (! test_bit(BIO_UPTODATE, &bio->bi_flags)) {
347 printk(KERN_ERR "metapage_write_end_io: I/O error\n");
348 SetPageError(page);
349 }
350 dec_io(page, last_write_complete);
351 bio_put(bio);
352 return 0;
353}
354
/*
 * metapage_writepage - write out the dirty metapages held in a page
 *
 * @page: page to write; must be locked and not under writeback (BUG_ON)
 * @wbc:  writeback control, only used to redirty the page
 *
 * Walks every PSIZE-sized slot of the page.  Dirty metapages are written;
 * metapages that are contiguous both in the page and on disk are merged
 * into a single bio segment, otherwise the pending bio is submitted and a
 * new one is started.  A metapage with nohomeok set is skipped unless
 * META_forcewrite is set; the page is then redirtied and the journal is
 * flushed if it is not already paging out.
 *
 * The page is unlocked before returning.  Returns 0 on the normal path and
 * -EIO when bio_add_page() adds less than requested or a bio ends up with
 * a zero size.
 */
355static int metapage_writepage(struct page *page, struct writeback_control *wbc)
356{
357 struct bio *bio = NULL;
358 unsigned int block_offset; /* block offset of mp within page */
359 struct inode *inode = page->mapping->host;
360 unsigned int blocks_per_mp = JFS_SBI(inode->i_sb)->nbperpage;
361 unsigned int len;
362 unsigned int xlen;
363 struct metapage *mp;
364 int redirty = 0;
365 sector_t lblock;
366 sector_t pblock;
367 sector_t next_block = 0;
368 sector_t page_start;
369 unsigned long bio_bytes = 0;
370 unsigned long bio_offset = 0;
371 unsigned int offset;
372
/* First fs block covered by this page */
373 page_start = (sector_t)page->index <<
374 (PAGE_CACHE_SHIFT - inode->i_blkbits);
375 BUG_ON(!PageLocked(page));
376 BUG_ON(PageWriteback(page));
377
378 for (offset = 0; offset < PAGE_CACHE_SIZE; offset += PSIZE) {
379 mp = page_to_mp(page, offset);
380
381 if (!mp || !test_bit(META_dirty, &mp->flag))
382 continue;
383
384 if (mp->nohomeok && !test_bit(META_forcewrite, &mp->flag)) {
385 redirty = 1;
Dave Kleikampac17b8b2005-10-03 15:32:11 -0500386 /*
387 * Make sure this page isn't blocked indefinitely.
388 * If the journal isn't undergoing I/O, push it
389 */
390 if (mp->log && !(mp->log->cflag & logGC_PAGEOUT))
391 jfs_flush_journal(mp->log, 0);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600392 continue;
393 }
394
395 clear_bit(META_dirty, &mp->flag);
396 block_offset = offset >> inode->i_blkbits;
397 lblock = page_start + block_offset;
/*
 * A bio is already being built: extend its byte count if this metapage
 * continues it, otherwise add the accumulated range and submit it.
 */
398 if (bio) {
399 if (xlen && lblock == next_block) {
400 /* Contiguous, in memory & on disk */
401 len = min(xlen, blocks_per_mp);
402 xlen -= len;
403 bio_bytes += len << inode->i_blkbits;
404 set_bit(META_io, &mp->flag);
405 continue;
406 }
407 /* Not contiguous */
408 if (bio_add_page(bio, page, bio_bytes, bio_offset) <
409 bio_bytes)
410 goto add_failed;
411 /*
412 * Increment counter before submitting i/o to keep
413 * count from hitting zero before we're through
414 */
415 inc_io(page);
416 if (!bio->bi_size)
417 goto dump_bio;
418 submit_bio(WRITE, bio);
419 bio = NULL;
420 } else {
/* First metapage to be written: the page enters writeback here */
421 set_page_writeback(page);
422 inc_io(page);
423 }
/* Look up the on-disk location of this metapage */
424 xlen = (PAGE_CACHE_SIZE - offset) >> inode->i_blkbits;
425 pblock = metapage_get_blocks(inode, lblock, &xlen);
426 if (!pblock) {
427 /* Need better error handling */
428 printk(KERN_ERR "JFS: metapage_get_blocks failed\n");
429 dec_io(page, last_write_complete);
430 continue;
431 }
432 set_bit(META_io, &mp->flag);
433 len = min(xlen, (uint) JFS_SBI(inode->i_sb)->nbperpage);
434
435 bio = bio_alloc(GFP_NOFS, 1);
436 bio->bi_bdev = inode->i_sb->s_bdev;
437 bio->bi_sector = pblock << (inode->i_blkbits - 9);
438 bio->bi_end_io = metapage_write_end_io;
439 bio->bi_private = page;
440
441 /* Don't call bio_add_page yet, we may add to this vec */
442 bio_offset = offset;
443 bio_bytes = len << inode->i_blkbits;
444
445 xlen -= len;
446 next_block = lblock + len;
447 }
/* Submit the bio that is still pending after the loop, if any */
448 if (bio) {
449 if (bio_add_page(bio, page, bio_bytes, bio_offset) < bio_bytes)
450 goto add_failed;
451 if (!bio->bi_size)
452 goto dump_bio;
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500453
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600454 submit_bio(WRITE, bio);
455 }
456 if (redirty)
457 redirty_page_for_writepage(wbc, page);
458
459 unlock_page(page);
460
461 return 0;
462add_failed:
463 /* We should never reach here, since we're only adding one vec */
464 printk(KERN_ERR "JFS: bio_add_page failed unexpectedly\n");
465 goto skip;
466dump_bio:
Dave Kleikamp288e4d82007-06-13 10:17:50 -0500467 print_hex_dump(KERN_ERR, "JFS: dump of bio: ", DUMP_PREFIX_ADDRESS, 16,
468 4, bio, sizeof(*bio), 0);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600469skip:
/* Error exit: discard the unsubmitted bio and drop its I/O count */
470 bio_put(bio);
471 unlock_page(page);
472 dec_io(page, last_write_complete);
473
474 return -EIO;
475}
476
477static int metapage_readpage(struct file *fp, struct page *page)
478{
479 struct inode *inode = page->mapping->host;
480 struct bio *bio = NULL;
481 unsigned int block_offset;
482 unsigned int blocks_per_page = PAGE_CACHE_SIZE >> inode->i_blkbits;
483 sector_t page_start; /* address of page in fs blocks */
484 sector_t pblock;
485 unsigned int xlen;
486 unsigned int len;
487 unsigned int offset;
488
489 BUG_ON(!PageLocked(page));
490 page_start = (sector_t)page->index <<
491 (PAGE_CACHE_SHIFT - inode->i_blkbits);
492
493 block_offset = 0;
494 while (block_offset < blocks_per_page) {
495 xlen = blocks_per_page - block_offset;
496 pblock = metapage_get_blocks(inode, page_start + block_offset,
497 &xlen);
498 if (pblock) {
499 if (!PagePrivate(page))
500 insert_metapage(page, NULL);
501 inc_io(page);
502 if (bio)
503 submit_bio(READ, bio);
504
505 bio = bio_alloc(GFP_NOFS, 1);
506 bio->bi_bdev = inode->i_sb->s_bdev;
507 bio->bi_sector = pblock << (inode->i_blkbits - 9);
508 bio->bi_end_io = metapage_read_end_io;
509 bio->bi_private = page;
510 len = xlen << inode->i_blkbits;
511 offset = block_offset << inode->i_blkbits;
512 if (bio_add_page(bio, page, len, offset) < len)
513 goto add_failed;
514 block_offset += xlen;
515 } else
516 block_offset++;
517 }
518 if (bio)
519 submit_bio(READ, bio);
520 else
521 unlock_page(page);
522
523 return 0;
524
525add_failed:
526 printk(KERN_ERR "JFS: bio_add_page failed unexpectedly\n");
527 bio_put(bio);
528 dec_io(page, last_read_complete);
529 return -EIO;
530}
531
Al Viro27496a82005-10-21 03:20:48 -0400532static int metapage_releasepage(struct page *page, gfp_t gfp_mask)
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600533{
534 struct metapage *mp;
Dave Kleikampb9646382006-05-24 07:43:38 -0500535 int ret = 1;
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600536 unsigned int offset;
537
538 for (offset = 0; offset < PAGE_CACHE_SIZE; offset += PSIZE) {
539 mp = page_to_mp(page, offset);
540
541 if (!mp)
542 continue;
543
544 jfs_info("metapage_releasepage: mp = 0x%p", mp);
Dave Kleikampb9646382006-05-24 07:43:38 -0500545 if (mp->count || mp->nohomeok ||
546 test_bit(META_dirty, &mp->flag)) {
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600547 jfs_info("count = %ld, nohomeok = %d", mp->count,
548 mp->nohomeok);
Dave Kleikampb9646382006-05-24 07:43:38 -0500549 ret = 0;
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600550 continue;
551 }
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600552 if (mp->lsn)
553 remove_from_logsync(mp);
554 remove_metapage(page, mp);
555 INCREMENT(mpStat.pagefree);
556 free_metapage(mp);
557 }
Dave Kleikampb9646382006-05-24 07:43:38 -0500558 return ret;
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600559}
560
/*
 * metapage_invalidatepage - release the metapages of a page being
 * invalidated.  Only whole-page invalidation (@offset == 0) of a page that
 * is not under writeback is supported; anything else is a BUG.
 */
static void metapage_invalidatepage(struct page *page, unsigned long offset)
{
	BUG_ON(offset);
	BUG_ON(PageWriteback(page));

	metapage_releasepage(page, 0);
}
569
Christoph Hellwigf5e54d62006-06-28 04:26:44 -0700570const struct address_space_operations jfs_metapage_aops = {
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600571 .readpage = metapage_readpage,
572 .writepage = metapage_writepage,
573 .sync_page = block_sync_page,
574 .releasepage = metapage_releasepage,
575 .invalidatepage = metapage_invalidatepage,
576 .set_page_dirty = __set_page_dirty_nobuffers,
577};
578
/*
 * __get_metapage - find or create the metapage for a logical block
 *
 * @inode:    inode the metadata belongs to
 * @lblock:   logical block number of the metadata
 * @size:     logical size in bytes; the data must not cross a page boundary
 * @absolute: non-zero to use the mapping of the superblock's direct_inode,
 *            zero to use the inode's own mapping
 * @new:      non-zero when the caller will initialise the data: the
 *            metapage's data is zeroed and, when a metapage fills a whole
 *            page, the page is not read from disk
 *
 * Returns the metapage with its count raised and the metapage lock held,
 * or NULL on failure.  The page lock is taken while the metapage is looked
 * up or created and is dropped again before returning.
 *
 * NOTE(review): the exits through the "unlock" label only unlock the page;
 * whether the page reference obtained from grab_cache_page() or
 * read_mapping_page() also has to be dropped there could not be determined
 * from this file - confirm.
 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700579struct metapage *__get_metapage(struct inode *inode, unsigned long lblock,
580 unsigned int size, int absolute,
581 unsigned long new)
582{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700583 int l2BlocksPerPage;
584 int l2bsize;
585 struct address_space *mapping;
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600586 struct metapage *mp = NULL;
587 struct page *page;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 unsigned long page_index;
589 unsigned long page_offset;
590
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600591 jfs_info("__get_metapage: ino = %ld, lblock = 0x%lx, abs=%d",
592 inode->i_ino, lblock, absolute);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593
/* Split lblock into a page-cache index and a byte offset in that page */
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600594 l2bsize = inode->i_blkbits;
595 l2BlocksPerPage = PAGE_CACHE_SHIFT - l2bsize;
596 page_index = lblock >> l2BlocksPerPage;
597 page_offset = (lblock - (page_index << l2BlocksPerPage)) << l2bsize;
598 if ((page_offset + size) > PAGE_CACHE_SIZE) {
599 jfs_err("MetaData crosses page boundary!!");
600 jfs_err("lblock = %lx, size = %d", lblock, size);
601 dump_stack();
602 return NULL;
603 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700604 if (absolute)
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600605 mapping = JFS_SBI(inode->i_sb)->direct_inode->i_mapping;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700606 else {
607 /*
608 * If an nfs client tries to read an inode that is larger
609 * than any existing inodes, we may try to read past the
610 * end of the inode map
611 */
612 if ((lblock << inode->i_blkbits) >= inode->i_size)
613 return NULL;
614 mapping = inode->i_mapping;
615 }
616
/*
 * A new metapage that fills the whole page is not read from disk; the
 * page is simply grabbed and marked up to date.
 */
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600617 if (new && (PSIZE == PAGE_CACHE_SIZE)) {
618 page = grab_cache_page(mapping, page_index);
619 if (!page) {
620 jfs_err("grab_cache_page failed!");
621 return NULL;
622 }
623 SetPageUptodate(page);
624 } else {
Pekka Enberg090d2b12006-06-23 02:05:08 -0700625 page = read_mapping_page(mapping, page_index, NULL);
Dave Kleikampc40c20242005-07-22 11:08:44 -0500626 if (IS_ERR(page) || !PageUptodate(page)) {
Pekka Enberg090d2b12006-06-23 02:05:08 -0700627 jfs_err("read_mapping_page failed!");
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600628 return NULL;
629 }
630 lock_page(page);
631 }
632
/* Reuse the metapage already attached to the page, or create one */
633 mp = page_to_mp(page, page_offset);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700634 if (mp) {
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600635 if (mp->logical_size != size) {
636 jfs_error(inode->i_sb,
637 "__get_metapage: mp->logical_size != size");
638 jfs_err("logical_size = %d, size = %d",
639 mp->logical_size, size);
640 dump_stack();
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500641 goto unlock;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700642 }
643 mp->count++;
644 lock_metapage(mp);
/* A discarded metapage may only be handed out again as a new one */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700645 if (test_bit(META_discard, &mp->flag)) {
646 if (!new) {
647 jfs_error(inode->i_sb,
648 "__get_metapage: using a "
649 "discarded metapage");
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600650 discard_metapage(mp);
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500651 goto unlock;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652 }
653 clear_bit(META_discard, &mp->flag);
654 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700655 } else {
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600656 INCREMENT(mpStat.pagealloc);
657 mp = alloc_metapage(GFP_NOFS);
658 mp->page = page;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700659 mp->flag = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700660 mp->xflag = COMMIT_PAGE;
661 mp->count = 1;
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600662 mp->nohomeok = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700663 mp->logical_size = size;
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600664 mp->data = page_address(page) + page_offset;
665 mp->index = lblock;
666 if (unlikely(insert_metapage(page, mp))) {
667 free_metapage(mp);
668 goto unlock;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700669 }
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600670 lock_metapage(mp);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700671 }
672
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600673 if (new) {
674 jfs_info("zeroing mp = 0x%p", mp);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700675 memset(mp->data, 0, PSIZE);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600676 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700677
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600678 unlock_page(page);
679 jfs_info("__get_metapage: returning = 0x%p data = 0x%p", mp, mp->data);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700680 return mp;
681
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600682unlock:
683 unlock_page(page);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700684 return NULL;
685}
686
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600687void grab_metapage(struct metapage * mp)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700688{
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600689 jfs_info("grab_metapage: mp = 0x%p", mp);
690 page_cache_get(mp->page);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700691 lock_page(mp->page);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600692 mp->count++;
693 lock_metapage(mp);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700694 unlock_page(mp->page);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700695}
696
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600697void force_metapage(struct metapage *mp)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700698{
699 struct page *page = mp->page;
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600700 jfs_info("force_metapage: mp = 0x%p", mp);
701 set_bit(META_forcewrite, &mp->flag);
702 clear_bit(META_sync, &mp->flag);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700703 page_cache_get(page);
704 lock_page(page);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600705 set_page_dirty(page);
706 write_one_page(page, 1);
707 clear_bit(META_forcewrite, &mp->flag);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700708 page_cache_release(page);
709}
710
Dave Kleikamp1868f4a2005-05-04 15:29:35 -0500711void hold_metapage(struct metapage *mp)
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600712{
713 lock_page(mp->page);
714}
715
Dave Kleikamp1868f4a2005-05-04 15:29:35 -0500716void put_metapage(struct metapage *mp)
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600717{
718 if (mp->count || mp->nohomeok) {
719 /* Someone else will release this */
720 unlock_page(mp->page);
721 return;
722 }
723 page_cache_get(mp->page);
724 mp->count++;
725 lock_metapage(mp);
726 unlock_page(mp->page);
727 release_metapage(mp);
728}
729
Linus Torvalds1da177e2005-04-16 15:20:36 -0700730void release_metapage(struct metapage * mp)
731{
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600732 struct page *page = mp->page;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700733 jfs_info("release_metapage: mp = 0x%p, flag = 0x%lx", mp, mp->flag);
734
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600735 BUG_ON(!page);
736
737 lock_page(page);
738 unlock_metapage(mp);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700739
740 assert(mp->count);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600741 if (--mp->count || mp->nohomeok) {
742 unlock_page(page);
743 page_cache_release(page);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700744 return;
745 }
746
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600747 if (test_bit(META_dirty, &mp->flag)) {
748 set_page_dirty(page);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700749 if (test_bit(META_sync, &mp->flag)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700750 clear_bit(META_sync, &mp->flag);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600751 write_one_page(page, 1);
752 lock_page(page); /* write_one_page unlocks the page */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700753 }
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600754 } else if (mp->lsn) /* discard_metapage doesn't remove it */
755 remove_from_logsync(mp);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700756
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600757 /* Try to keep metapages from using up too much memory */
758 drop_metapage(page, mp);
Dave Kleikampd0e671a2006-12-20 15:55:35 -0600759
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600760 unlock_page(page);
761 page_cache_release(page);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700762}
763
764void __invalidate_metapages(struct inode *ip, s64 addr, int len)
765{
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600766 sector_t lblock;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700767 int l2BlocksPerPage = PAGE_CACHE_SHIFT - ip->i_blkbits;
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600768 int BlocksPerPage = 1 << l2BlocksPerPage;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700769 /* All callers are interested in block device's mapping */
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600770 struct address_space *mapping =
771 JFS_SBI(ip->i_sb)->direct_inode->i_mapping;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700772 struct metapage *mp;
773 struct page *page;
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600774 unsigned int offset;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700775
776 /*
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600777 * Mark metapages to discard. They will eventually be
Linus Torvalds1da177e2005-04-16 15:20:36 -0700778 * released, but should not be written.
779 */
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600780 for (lblock = addr & ~(BlocksPerPage - 1); lblock < addr + len;
781 lblock += BlocksPerPage) {
782 page = find_lock_page(mapping, lblock >> l2BlocksPerPage);
783 if (!page)
784 continue;
785 for (offset = 0; offset < PAGE_CACHE_SIZE; offset += PSIZE) {
786 mp = page_to_mp(page, offset);
787 if (!mp)
788 continue;
789 if (mp->index < addr)
790 continue;
791 if (mp->index >= addr + len)
792 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700793
794 clear_bit(META_dirty, &mp->flag);
795 set_bit(META_discard, &mp->flag);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600796 if (mp->lsn)
797 remove_from_logsync(mp);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700798 }
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600799 unlock_page(page);
800 page_cache_release(page);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700801 }
802}
803
804#ifdef CONFIG_JFS_STATISTICS
805int jfs_mpstat_read(char *buffer, char **start, off_t offset, int length,
806 int *eof, void *data)
807{
808 int len = 0;
809 off_t begin;
810
811 len += sprintf(buffer,
812 "JFS Metapage statistics\n"
813 "=======================\n"
814 "page allocations = %d\n"
815 "page frees = %d\n"
816 "lock waits = %d\n",
817 mpStat.pagealloc,
818 mpStat.pagefree,
819 mpStat.lockwait);
820
821 begin = offset;
822 *start = buffer + begin;
823 len -= begin;
824
825 if (len > length)
826 len = length;
827 else
828 *eof = 1;
829
830 if (len < 0)
831 len = 0;
832
833 return len;
834}
835#endif