diff options
Diffstat (limited to 'packages/linux/openzaurus-pxa27x-2.4.20-rmk2-embedix20050602/P14-lowlatency_041221.patch')
-rw-r--r-- | packages/linux/openzaurus-pxa27x-2.4.20-rmk2-embedix20050602/P14-lowlatency_041221.patch | 1677 |
1 files changed, 0 insertions, 1677 deletions
diff --git a/packages/linux/openzaurus-pxa27x-2.4.20-rmk2-embedix20050602/P14-lowlatency_041221.patch b/packages/linux/openzaurus-pxa27x-2.4.20-rmk2-embedix20050602/P14-lowlatency_041221.patch deleted file mode 100644 index edd63fb13b..0000000000 --- a/packages/linux/openzaurus-pxa27x-2.4.20-rmk2-embedix20050602/P14-lowlatency_041221.patch +++ /dev/null @@ -1,1677 +0,0 @@ -diff -Nur c3000_pre/linux/arch/arm/config.in c3000_test/linux/arch/arm/config.in ---- c3000_pre/linux/arch/arm/config.in 2004-12-16 22:55:34.000000000 +0900 -+++ c3000_test/linux/arch/arm/config.in 2004-12-20 23:23:28.000000000 +0900 -@@ -574,6 +574,8 @@ - fi - fi - dep_bool 'Preemptible Kernel support' CONFIG_PREEMPT $CONFIG_CPU_32 -+bool 'Low latency scheduling' CONFIG_LOLAT -+dep_bool 'Control low latency with sysctl' CONFIG_LOLAT_SYSCTL $CONFIG_LOLAT - - endmenu - -diff -Nur c3000_pre/linux/arch/i386/config.in c3000_test/linux/arch/i386/config.in ---- c3000_pre/linux/arch/i386/config.in 2004-08-21 09:48:09.000000000 +0900 -+++ c3000_test/linux/arch/i386/config.in 2004-12-20 22:56:21.000000000 +0900 -@@ -25,6 +25,9 @@ - - mainmenu_option next_comment - comment 'Processor type and features' -+bool 'Low latency scheduling' CONFIG_LOLAT -+dep_bool 'Control low latency with sysctl' CONFIG_LOLAT_SYSCTL $CONFIG_LOLAT -+ - choice 'Processor family' \ - "386 CONFIG_M386 \ - 486 CONFIG_M486 \ -diff -Nur c3000_pre/linux/drivers/block/ll_rw_blk.c c3000_test/linux/drivers/block/ll_rw_blk.c ---- c3000_pre/linux/drivers/block/ll_rw_blk.c 2004-08-21 09:48:24.000000000 +0900 -+++ c3000_test/linux/drivers/block/ll_rw_blk.c 2004-12-20 22:56:21.000000000 +0900 -@@ -1211,6 +1211,7 @@ - kstat.pgpgin += count; - break; - } -+ conditional_schedule(); - } - - /** -diff -Nur c3000_pre/linux/drivers/char/mem.c c3000_test/linux/drivers/char/mem.c ---- c3000_pre/linux/drivers/char/mem.c 2004-08-21 09:48:25.000000000 +0900 -+++ c3000_test/linux/drivers/char/mem.c 2004-12-20 22:56:21.000000000 +0900 -@@ -422,7 +422,7 @@ - if (count > size) - count = size; - -- zap_page_range(mm, addr, count); -+ zap_page_range(mm, addr, count, 0); - zeromap_page_range(addr, count, PAGE_COPY); - - size -= count; -diff -Nur c3000_pre/linux/drivers/char/random.c c3000_test/linux/drivers/char/random.c ---- c3000_pre/linux/drivers/char/random.c 2004-08-21 09:48:25.000000000 +0900 -+++ c3000_test/linux/drivers/char/random.c 2004-12-20 22:56:21.000000000 +0900 -@@ -1374,6 +1374,11 @@ - buf += i; - ret += i; - add_timer_randomness(&extract_timer_state, nbytes); -+#if LOWLATENCY_NEEDED -+ /* This can happen in softirq's, but that's what we want */ -+ if (conditional_schedule_needed()) -+ break; -+#endif - } - - /* Wipe data just returned from memory */ -diff -Nur c3000_pre/linux/drivers/i2c/i2c-core.c c3000_test/linux/drivers/i2c/i2c-core.c ---- c3000_pre/linux/drivers/i2c/i2c-core.c 2004-08-21 09:48:34.000000000 +0900 -+++ c3000_test/linux/drivers/i2c/i2c-core.c 2004-12-20 22:56:21.000000000 +0900 -@@ -761,6 +761,8 @@ - { - int ret; - -+ conditional_schedule(); -+ - if (adap->algo->master_xfer) { - DEB2(printk("i2c-core.o: master_xfer: %s with %d msgs.\n", - adap->name,num)); -@@ -783,6 +785,8 @@ - struct i2c_adapter *adap=client->adapter; - struct i2c_msg msg; - -+ conditional_schedule(); -+ - if (client->adapter->algo->master_xfer) { - msg.addr = client->addr; - msg.flags = client->flags & I2C_M_TEN; -@@ -812,6 +816,9 @@ - struct i2c_adapter *adap=client->adapter; - struct i2c_msg msg; - int ret; -+ -+ conditional_schedule(); -+ - if (client->adapter->algo->master_xfer) { - msg.addr = client->addr; - msg.flags = client->flags & I2C_M_TEN; -diff -Nur c3000_pre/linux/fs/buffer.c c3000_test/linux/fs/buffer.c ---- c3000_pre/linux/fs/buffer.c 2004-08-21 09:48:58.000000000 +0900 -+++ c3000_test/linux/fs/buffer.c 2004-12-20 22:56:21.000000000 +0900 -@@ -216,8 +216,10 @@ - - if (dev != NODEV && bh->b_dev != dev) - continue; -- if (test_and_set_bit(BH_Lock, &bh->b_state)) -+ if (test_and_set_bit(BH_Lock, &bh->b_state)) { -+ __refile_buffer(bh); - continue; -+ } - if (atomic_set_buffer_clean(bh)) { - __refile_buffer(bh); - get_bh(bh); -@@ -227,6 +229,7 @@ - - spin_unlock(&lru_list_lock); - write_locked_buffers(array, count); -+ conditional_schedule(); - return -EAGAIN; - } - unlock_buffer(bh); -@@ -260,12 +263,19 @@ - struct buffer_head * next; - int nr; - -- next = lru_list[index]; - nr = nr_buffers_type[index]; -+repeat: -+ next = lru_list[index]; - while (next && --nr >= 0) { - struct buffer_head *bh = next; - next = bh->b_next_free; - -+ if (conditional_schedule_needed()) { -+ spin_unlock(&lru_list_lock); -+ unconditional_schedule(); -+ spin_lock(&lru_list_lock); -+ goto repeat; -+ } - if (!buffer_locked(bh)) { - if (refile) - __refile_buffer(bh); -@@ -273,7 +283,6 @@ - } - if (dev != NODEV && bh->b_dev != dev) - continue; -- - get_bh(bh); - spin_unlock(&lru_list_lock); - wait_on_buffer (bh); -@@ -306,6 +315,15 @@ - { - int err = 0; - -+#if LOWLATENCY_NEEDED -+ /* -+ * syncing devA when there are lots of buffers dirty against -+ * devB is expensive. -+ */ -+ if (enable_lowlatency) -+ dev = NODEV; -+#endif -+ - /* One pass for no-wait, three for wait: - * 0) write out all dirty, unlocked buffers; - * 1) wait for all dirty locked buffers; -@@ -697,6 +715,16 @@ - /* Not hashed? */ - if (!bh->b_pprev) - continue; -+ -+ if (conditional_schedule_needed()) { -+ get_bh(bh); -+ spin_unlock(&lru_list_lock); -+ unconditional_schedule(); -+ spin_lock(&lru_list_lock); -+ put_bh(bh); -+ slept = 1; -+ } -+ - if (buffer_locked(bh)) { - get_bh(bh); - spin_unlock(&lru_list_lock); -@@ -848,12 +876,19 @@ - struct buffer_head *bh; - struct inode tmp; - int err = 0, err2; -- -+ DEFINE_RESCHED_COUNT; -+ - INIT_LIST_HEAD(&tmp.i_dirty_buffers); -- -+ -+repeat: - spin_lock(&lru_list_lock); - - while (!list_empty(list)) { -+ if (conditional_schedule_needed()) { -+ spin_unlock(&lru_list_lock); -+ unconditional_schedule(); -+ goto repeat; -+ } - bh = BH_ENTRY(list->next); - list_del(&bh->b_inode_buffers); - if (!buffer_dirty(bh) && !buffer_locked(bh)) -@@ -878,8 +913,18 @@ - spin_lock(&lru_list_lock); - } - } -+ if (TEST_RESCHED_COUNT(32)) { -+ RESET_RESCHED_COUNT(); -+ if (conditional_schedule_needed()) { -+ spin_unlock(&lru_list_lock); -+ unconditional_schedule(); /* Syncing many dirty buffers */ -+ spin_lock(&lru_list_lock); -+ } -+ } - } - -+ RESET_RESCHED_COUNT(); -+ - while (!list_empty(&tmp.i_dirty_buffers)) { - bh = BH_ENTRY(tmp.i_dirty_buffers.prev); - remove_inode_queue(bh); -@@ -889,6 +934,7 @@ - if (!buffer_uptodate(bh)) - err = -EIO; - brelse(bh); -+ conditional_schedule(); - spin_lock(&lru_list_lock); - } - -@@ -916,11 +962,20 @@ - struct buffer_head *bh; - struct list_head *p; - int err = 0; -+ DEFINE_RESCHED_COUNT; - -+repeat: -+ conditional_schedule(); - spin_lock(&lru_list_lock); - -- repeat: - list_for_each_prev(p, list) { -+ if (TEST_RESCHED_COUNT(32)) { -+ RESET_RESCHED_COUNT(); -+ if (conditional_schedule_needed()) { -+ spin_unlock(&lru_list_lock); -+ goto repeat; -+ } -+ } - bh = BH_ENTRY(p); - if (buffer_locked(bh)) { - get_bh(bh); -@@ -929,7 +984,6 @@ - if (!buffer_uptodate(bh)) - err = -EIO; - brelse(bh); -- spin_lock(&lru_list_lock); - goto repeat; - } - } -@@ -946,12 +1000,24 @@ - void invalidate_inode_buffers(struct inode *inode) - { - struct list_head * entry; -- -+ -+repeat: -+ conditional_schedule(); - spin_lock(&lru_list_lock); -- while ((entry = inode->i_dirty_buffers.next) != &inode->i_dirty_buffers) -+ while ((entry = inode->i_dirty_buffers.next) != &inode->i_dirty_buffers) { -+ if (conditional_schedule_needed()) { -+ spin_unlock(&lru_list_lock); -+ goto repeat; -+ } - remove_inode_queue(BH_ENTRY(entry)); -- while ((entry = inode->i_dirty_data_buffers.next) != &inode->i_dirty_data_buffers) -+ } -+ while ((entry = inode->i_dirty_data_buffers.next) != &inode->i_dirty_data_buffers) { -+ if (conditional_schedule_needed()) { -+ spin_unlock(&lru_list_lock); -+ goto repeat; -+ } - remove_inode_queue(BH_ENTRY(entry)); -+ } - spin_unlock(&lru_list_lock); - } - -@@ -974,6 +1040,7 @@ - bh = get_hash_table(dev, block, size); - if (bh) { - touch_buffer(bh); -+ conditional_schedule(); - return bh; - } - -@@ -2831,7 +2898,7 @@ - - DECLARE_WAIT_QUEUE_HEAD(bdflush_wait); - --void wakeup_bdflush(void) -+void wakeup_bdflush(void) - { - wake_up_interruptible(&bdflush_wait); - } -diff -Nur c3000_pre/linux/fs/dcache.c c3000_test/linux/fs/dcache.c ---- c3000_pre/linux/fs/dcache.c 2004-08-21 09:48:58.000000000 +0900 -+++ c3000_test/linux/fs/dcache.c 2004-12-20 22:56:21.000000000 +0900 -@@ -320,11 +320,23 @@ - - void prune_dcache(int count) - { -+ DEFINE_RESCHED_COUNT; -+ -+redo: - spin_lock(&dcache_lock); - for (;;) { - struct dentry *dentry; - struct list_head *tmp; - -+ if (TEST_RESCHED_COUNT(100)) { -+ RESET_RESCHED_COUNT(); -+ if (conditional_schedule_needed()) { -+ spin_unlock(&dcache_lock); -+ unconditional_schedule(); -+ goto redo; -+ } -+ } -+ - tmp = dentry_unused.prev; - - if (tmp == &dentry_unused) -@@ -479,6 +491,7 @@ - struct dentry *this_parent = parent; - struct list_head *next; - int found = 0; -+ DEFINE_RESCHED_COUNT; - - spin_lock(&dcache_lock); - repeat: -@@ -493,6 +506,13 @@ - list_add(&dentry->d_lru, dentry_unused.prev); - found++; - } -+ -+ if (TEST_RESCHED_COUNT(500) && found > 10) { -+ if (conditional_schedule_needed()) /* Typically sys_rmdir() */ -+ goto out; -+ RESET_RESCHED_COUNT(); -+ } -+ - /* - * Descend a level if the d_subdirs list is non-empty. - */ -@@ -517,6 +537,7 @@ - #endif - goto resume; - } -+out: - spin_unlock(&dcache_lock); - return found; - } -@@ -532,8 +553,10 @@ - { - int found; - -- while ((found = select_parent(parent)) != 0) -+ while ((found = select_parent(parent)) != 0) { - prune_dcache(found); -+ conditional_schedule(); /* Typically sys_rmdir() */ -+ } - } - - /* -diff -Nur c3000_pre/linux/fs/exec.c c3000_test/linux/fs/exec.c ---- c3000_pre/linux/fs/exec.c 2004-08-21 09:48:58.000000000 +0900 -+++ c3000_test/linux/fs/exec.c 2004-12-20 22:56:21.000000000 +0900 -@@ -249,7 +249,7 @@ - memset(kaddr+offset+len, 0, - PAGE_SIZE-offset-len); - } -- err = copy_from_user(kaddr+offset, str, bytes_to_copy); -+ err = ll_copy_from_user(kaddr+offset, str, bytes_to_copy); - if (err) { - ret = -EFAULT; - goto out; -diff -Nur c3000_pre/linux/fs/ext2/dir.c c3000_test/linux/fs/ext2/dir.c ---- c3000_pre/linux/fs/ext2/dir.c 2004-08-21 09:48:59.000000000 +0900 -+++ c3000_test/linux/fs/ext2/dir.c 2004-12-20 22:56:21.000000000 +0900 -@@ -153,6 +153,7 @@ - struct address_space *mapping = dir->i_mapping; - struct page *page = read_cache_page(mapping, n, - (filler_t*)mapping->a_ops->readpage, NULL); -+ conditional_schedule(); /* Scanning large directories */ - if (!IS_ERR(page)) { - wait_on_page(page); - kmap(page); -diff -Nur c3000_pre/linux/fs/ext2/inode.c c3000_test/linux/fs/ext2/inode.c ---- c3000_pre/linux/fs/ext2/inode.c 2004-08-21 09:48:59.000000000 +0900 -+++ c3000_test/linux/fs/ext2/inode.c 2004-12-20 22:56:21.000000000 +0900 -@@ -715,8 +715,13 @@ - { - unsigned long block_to_free = 0, count = 0; - unsigned long nr; -+ DEFINE_RESCHED_COUNT; - - for ( ; p < q ; p++) { -+ if (TEST_RESCHED_COUNT(32)) { -+ RESET_RESCHED_COUNT(); -+ conditional_schedule(); -+ } - nr = le32_to_cpu(*p); - if (nr) { - *p = 0; -@@ -759,6 +764,7 @@ - if (depth--) { - int addr_per_block = EXT2_ADDR_PER_BLOCK(inode->i_sb); - for ( ; p < q ; p++) { -+ conditional_schedule(); /* Deleting large files */ - nr = le32_to_cpu(*p); - if (!nr) - continue; -diff -Nur c3000_pre/linux/fs/ext3/balloc.c c3000_test/linux/fs/ext3/balloc.c ---- c3000_pre/linux/fs/ext3/balloc.c 2004-08-21 09:48:59.000000000 +0900 -+++ c3000_test/linux/fs/ext3/balloc.c 2004-12-20 22:56:21.000000000 +0900 -@@ -363,6 +363,9 @@ - } - } - #endif -+ /* superblock lock is held, so this is safe */ -+ conditional_schedule(); -+ - BUFFER_TRACE(bitmap_bh, "clear bit"); - if (!ext3_clear_bit (bit + i, bitmap_bh->b_data)) { - ext3_error (sb, __FUNCTION__, -diff -Nur c3000_pre/linux/fs/ext3/inode.c c3000_test/linux/fs/ext3/inode.c ---- c3000_pre/linux/fs/ext3/inode.c 2004-08-21 09:48:59.000000000 +0900 -+++ c3000_test/linux/fs/ext3/inode.c 2004-12-20 22:56:21.000000000 +0900 -@@ -902,6 +902,8 @@ - - prev_blocks = inode->i_blocks; - -+ conditional_schedule(); /* Reading large directories */ -+ - bh = ext3_getblk (handle, inode, block, create, err); - if (!bh) - return bh; -@@ -1605,6 +1607,7 @@ - */ - for (p = first; p < last; p++) { - u32 nr = le32_to_cpu(*p); -+ conditional_schedule(); - if (nr) { - struct buffer_head *bh; - -@@ -1659,6 +1662,7 @@ - } - - for (p = first; p < last; p++) { -+ conditional_schedule(); - nr = le32_to_cpu(*p); - if (nr) { - /* accumulate blocks to free if they're contiguous */ -diff -Nur c3000_pre/linux/fs/ext3/namei.c c3000_test/linux/fs/ext3/namei.c ---- c3000_pre/linux/fs/ext3/namei.c 2004-08-21 09:48:59.000000000 +0900 -+++ c3000_test/linux/fs/ext3/namei.c 2004-12-20 22:56:21.000000000 +0900 -@@ -157,6 +157,7 @@ - if ((bh = bh_use[ra_ptr++]) == NULL) - goto next; - wait_on_buffer(bh); -+ conditional_schedule(); - if (!buffer_uptodate(bh)) { - /* read error, skip block & hope for the best */ - brelse(bh); -diff -Nur c3000_pre/linux/fs/inode.c c3000_test/linux/fs/inode.c ---- c3000_pre/linux/fs/inode.c 2004-08-21 09:48:58.000000000 +0900 -+++ c3000_test/linux/fs/inode.c 2004-12-20 23:00:06.000000000 +0900 -@@ -251,6 +251,8 @@ - - filemap_fdatawait(inode->i_mapping); - -+ conditional_schedule(); -+ - spin_lock(&inode_lock); - inode->i_state &= ~I_LOCK; - if (!(inode->i_state & I_FREEING)) { -@@ -561,6 +563,7 @@ - - while ((inode_entry = head->next) != head) - { -+ conditional_schedule(); - list_del(inode_entry); - - inode = list_entry(inode_entry, struct inode, i_list); -@@ -589,9 +592,22 @@ - if (tmp == head) - break; - inode = list_entry(tmp, struct inode, i_list); -+ -+ if (conditional_schedule_needed()) { -+ atomic_inc(&inode->i_count); -+ spin_unlock(&inode_lock); -+ unconditional_schedule(); -+ spin_lock(&inode_lock); -+ atomic_dec(&inode->i_count); -+ } -+ - if (inode->i_sb != sb) - continue; -+ atomic_inc(&inode->i_count); -+ spin_unlock(&inode_lock); - invalidate_inode_buffers(inode); -+ spin_lock(&inode_lock); -+ atomic_dec(&inode->i_count); - if (!atomic_read(&inode->i_count)) { - list_del_init(&inode->i_hash); - list_del(&inode->i_list); -@@ -896,6 +912,8 @@ - if (inode) { - struct inode * old; - -+ conditional_schedule(); /* sync_old_buffers */ -+ - spin_lock(&inode_lock); - /* We released the lock, so.. */ - old = find_inode(sb, ino, head, find_actor, opaque); -@@ -1313,18 +1331,32 @@ - int request=goal; - int loop=0; - #endif -+ int nr_to_scan = inodes_stat.nr_unused; - -+resume: - spin_lock(&inode_lock); - - count = 0; - entry = inode_unused.prev; -- while (entry != &inode_unused) -- { -+ while (entry != &inode_unused && nr_to_scan--) { - struct list_head *tmp = entry; - - #ifdef JFFS2_INODE_DEBUG - loop++; - #endif -+ if (conditional_schedule_needed()) { -+ /* -+ * Need to drop the lock. Reposition -+ * the list head so we start here next time. -+ * This can corrupt the LRU nature of the -+ * unused list, but this isn't very important. -+ */ -+ list_del(&inode_unused); -+ list_add(&inode_unused, entry); -+ spin_unlock(&inode_lock); -+ unconditional_schedule(); -+ goto resume; -+ } - entry = entry->prev; - inode = INODE(tmp); - if (inode->i_state & (I_FREEING|I_CLEAR|I_LOCK)) -diff -Nur c3000_pre/linux/fs/jbd/checkpoint.c c3000_test/linux/fs/jbd/checkpoint.c ---- c3000_pre/linux/fs/jbd/checkpoint.c 2004-08-21 09:48:59.000000000 +0900 -+++ c3000_test/linux/fs/jbd/checkpoint.c 2004-12-20 22:56:21.000000000 +0900 -@@ -431,7 +431,11 @@ - { - transaction_t *transaction, *last_transaction, *next_transaction; - int ret = 0; -+ int ll_retries = 4; /* lowlatency addition */ - -+restart: -+ if (ll_retries-- == 0) -+ goto out; - transaction = journal->j_checkpoint_transactions; - if (transaction == 0) - goto out; -@@ -451,6 +455,12 @@ - jh = next_jh; - next_jh = jh->b_cpnext; - ret += __try_to_free_cp_buf(jh); -+ if (conditional_schedule_needed()) { -+ spin_unlock(&journal_datalist_lock); -+ unconditional_schedule(); -+ spin_lock(&journal_datalist_lock); -+ goto restart; -+ } - } while (jh != last_jh); - } - } while (transaction != last_transaction); -diff -Nur c3000_pre/linux/fs/jbd/commit.c c3000_test/linux/fs/jbd/commit.c ---- c3000_pre/linux/fs/jbd/commit.c 2004-08-21 09:48:59.000000000 +0900 -+++ c3000_test/linux/fs/jbd/commit.c 2004-12-20 22:56:21.000000000 +0900 -@@ -212,6 +212,16 @@ - __journal_remove_journal_head(bh); - refile_buffer(bh); - __brelse(bh); -+ if (conditional_schedule_needed()) { -+ if (commit_transaction->t_sync_datalist) -+ commit_transaction->t_sync_datalist = -+ next_jh; -+ if (bufs) -+ break; -+ spin_unlock(&journal_datalist_lock); -+ unconditional_schedule(); -+ goto write_out_data; -+ } - } - } - if (bufs == ARRAY_SIZE(wbuf)) { -@@ -235,8 +245,7 @@ - journal_brelse_array(wbuf, bufs); - lock_journal(journal); - spin_lock(&journal_datalist_lock); -- if (bufs) -- goto write_out_data_locked; -+ goto write_out_data_locked; - } - - /* -@@ -272,6 +281,14 @@ - */ - while ((jh = commit_transaction->t_async_datalist)) { - struct buffer_head *bh = jh2bh(jh); -+ if (conditional_schedule_needed()) { -+ spin_unlock(&journal_datalist_lock); -+ unlock_journal(journal); -+ unconditional_schedule(); -+ lock_journal(journal); -+ spin_lock(&journal_datalist_lock); -+ continue; /* List may have changed */ -+ } - if (buffer_locked(bh)) { - spin_unlock(&journal_datalist_lock); - unlock_journal(journal); -@@ -486,6 +503,8 @@ - wait_for_iobuf: - while (commit_transaction->t_iobuf_list != NULL) { - struct buffer_head *bh; -+ -+ conditional_schedule(); - jh = commit_transaction->t_iobuf_list->b_tprev; - bh = jh2bh(jh); - if (buffer_locked(bh)) { -@@ -644,6 +663,8 @@ - transaction_t *cp_transaction; - struct buffer_head *bh; - -+ conditional_schedule(); /* journal is locked */ -+ - jh = commit_transaction->t_forget; - J_ASSERT_JH(jh, jh->b_transaction == commit_transaction || - jh->b_transaction == journal->j_running_transaction); -diff -Nur c3000_pre/linux/fs/proc/array.c c3000_test/linux/fs/proc/array.c ---- c3000_pre/linux/fs/proc/array.c 2004-08-21 09:49:01.000000000 +0900 -+++ c3000_test/linux/fs/proc/array.c 2004-12-20 22:56:21.000000000 +0900 -@@ -498,9 +498,11 @@ - if (end > PMD_SIZE) - end = PMD_SIZE; - do { -- pte_t page = *pte; -+ pte_t page; - struct page *ptpage; - -+ conditional_schedule(); /* For `top' and `ps' */ -+ page = *pte; - address += PAGE_SIZE; - pte++; - if (pte_none(page)) -diff -Nur c3000_pre/linux/fs/proc/generic.c c3000_test/linux/fs/proc/generic.c ---- c3000_pre/linux/fs/proc/generic.c 2004-08-21 09:49:01.000000000 +0900 -+++ c3000_test/linux/fs/proc/generic.c 2004-12-20 22:56:21.000000000 +0900 -@@ -98,6 +98,8 @@ - retval = n; - break; - } -+ -+ conditional_schedule(); /* Some /proc files are large */ - - /* This is a hack to allow mangling of file pos independent - * of actual bytes read. Simply place the data at page, -diff -Nur c3000_pre/linux/fs/reiserfs/buffer2.c c3000_test/linux/fs/reiserfs/buffer2.c ---- c3000_pre/linux/fs/reiserfs/buffer2.c 2004-08-21 09:49:01.000000000 +0900 -+++ c3000_test/linux/fs/reiserfs/buffer2.c 2004-12-20 22:56:21.000000000 +0900 -@@ -54,6 +54,7 @@ - PROC_EXP( unsigned int ctx_switches = kstat.context_swtch ); - - result = bread (super -> s_dev, n_block, n_size); -+ conditional_schedule(); - PROC_INFO_INC( super, breads ); - PROC_EXP( if( kstat.context_swtch != ctx_switches ) - PROC_INFO_INC( super, bread_miss ) ); -diff -Nur c3000_pre/linux/fs/reiserfs/journal.c c3000_test/linux/fs/reiserfs/journal.c ---- c3000_pre/linux/fs/reiserfs/journal.c 2004-08-21 09:49:01.000000000 +0900 -+++ c3000_test/linux/fs/reiserfs/journal.c 2004-12-20 22:56:21.000000000 +0900 -@@ -573,6 +573,7 @@ - /* lock the current transaction */ - inline static void lock_journal(struct super_block *p_s_sb) { - PROC_INFO_INC( p_s_sb, journal.lock_journal ); -+ conditional_schedule(); - while(atomic_read(&(SB_JOURNAL(p_s_sb)->j_wlock)) > 0) { - PROC_INFO_INC( p_s_sb, journal.lock_journal_wait ); - sleep_on(&(SB_JOURNAL(p_s_sb)->j_wait)) ; -@@ -703,6 +704,7 @@ - mark_buffer_dirty(tbh) ; - } - ll_rw_block(WRITE, 1, &tbh) ; -+ conditional_schedule(); - count++ ; - put_bh(tbh) ; /* once for our get_hash */ - } -@@ -832,6 +834,7 @@ - set_bit(BH_Dirty, &(SB_JOURNAL(p_s_sb)->j_header_bh->b_state)) ; - ll_rw_block(WRITE, 1, &(SB_JOURNAL(p_s_sb)->j_header_bh)) ; - wait_on_buffer((SB_JOURNAL(p_s_sb)->j_header_bh)) ; -+ conditional_schedule(); - if (!buffer_uptodate(SB_JOURNAL(p_s_sb)->j_header_bh)) { - printk( "reiserfs: journal-837: IO error during journal replay\n" ); - return -EIO ; -@@ -2125,6 +2128,7 @@ - } - - int journal_begin(struct reiserfs_transaction_handle *th, struct super_block * p_s_sb, unsigned long nblocks) { -+ conditional_schedule(); - return do_journal_begin_r(th, p_s_sb, nblocks, 0) ; - } - -@@ -2265,6 +2269,7 @@ - } - - int journal_end(struct reiserfs_transaction_handle *th, struct super_block *p_s_sb, unsigned long nblocks) { -+ conditional_schedule(); - return do_journal_end(th, p_s_sb, nblocks, 0) ; - } - -@@ -2716,6 +2721,7 @@ - RFALSE( buffer_locked(bh) && cur_tb != NULL, - "waiting while do_balance was running\n") ; - wait_on_buffer(bh) ; -+ conditional_schedule(); - } - PROC_INFO_INC( p_s_sb, journal.prepare_retry ); - retry_count++ ; -@@ -2888,6 +2894,7 @@ - /* copy all the real blocks into log area. dirty log blocks */ - if (test_bit(BH_JDirty, &cn->bh->b_state)) { - struct buffer_head *tmp_bh ; -+ conditional_schedule(); - tmp_bh = sb_getblk(p_s_sb, reiserfs_get_journal_block(p_s_sb) + - ((cur_write_start + jindex) % JOURNAL_BLOCK_COUNT)) ; - mark_buffer_uptodate(tmp_bh, 1) ; -diff -Nur c3000_pre/linux/fs/reiserfs/stree.c c3000_test/linux/fs/reiserfs/stree.c ---- c3000_pre/linux/fs/reiserfs/stree.c 2004-08-21 09:49:01.000000000 +0900 -+++ c3000_test/linux/fs/reiserfs/stree.c 2004-12-20 22:56:21.000000000 +0900 -@@ -652,9 +652,8 @@ - stop at leaf level - set to - DISK_LEAF_NODE_LEVEL */ - ) { -- int n_block_number = SB_ROOT_BLOCK (p_s_sb), -- expected_level = SB_TREE_HEIGHT (p_s_sb), -- n_block_size = p_s_sb->s_blocksize; -+ int n_block_number, expected_level; -+ int n_block_size = p_s_sb->s_blocksize; - struct buffer_head * p_s_bh; - struct path_element * p_s_last_element; - int n_node_level, n_retval; -@@ -666,7 +665,8 @@ - #endif - - PROC_INFO_INC( p_s_sb, search_by_key ); -- -+ conditional_schedule(); -+ - /* As we add each node to a path we increase its count. This means that - we must be careful to release all nodes in a path before we either - discard the path struct or re-use the path struct, as we do here. */ -@@ -678,6 +678,8 @@ - /* With each iteration of this loop we search through the items in the - current node, and calculate the next current node(next path element) - for the next iteration of this loop.. */ -+ n_block_number = SB_ROOT_BLOCK (p_s_sb); -+ expected_level = SB_TREE_HEIGHT (p_s_sb); - while ( 1 ) { - - #ifdef CONFIG_REISERFS_CHECK -@@ -1104,6 +1106,8 @@ - for (n_counter = *p_n_removed; - n_counter < n_unfm_number; n_counter++, p_n_unfm_pointer-- ) { - -+ conditional_schedule(); -+ - if (item_moved (&s_ih, p_s_path)) { - need_research = 1 ; - break; -diff -Nur c3000_pre/linux/include/linux/low-latency.h c3000_test/linux/include/linux/low-latency.h ---- c3000_pre/linux/include/linux/low-latency.h 1970-01-01 09:00:00.000000000 +0900 -+++ c3000_test/linux/include/linux/low-latency.h 2004-12-20 22:56:21.000000000 +0900 -@@ -0,0 +1,109 @@ -+/* -+ * include/linux/low-latency.h -+ * -+ * Andrew Morton <akpm@zip.com.au> -+ */ -+ -+#ifndef LOW_LATENCY_H_INCLUDED -+#define LOW_LATENCY_H_INCLUDED -+ -+#if defined(CONFIG_LOLAT) -+#define LOWLATENCY_NEEDED 1 -+#else -+#define LOWLATENCY_NEEDED 0 -+#endif -+ -+#if LOWLATENCY_NEEDED -+ -+#include <linux/cache.h> /* For ____cacheline_aligned */ -+ -+#ifdef CONFIG_LOLAT_SYSCTL -+extern struct low_latency_enable_struct { -+ int yep; -+} ____cacheline_aligned __enable_lowlatency; -+#define enable_lowlatency __enable_lowlatency.yep -+ -+#else -+#define enable_lowlatency 1 -+#endif -+ -+/* -+ * Set this non-zero to generate low-latency instrumentation -+ */ -+#define LOWLATENCY_DEBUG 0 -+ -+/* -+ * Set this non-zero for robustness testing -+ */ -+#define LOWLATENCY_ALWAYS_SCHEDULE 0 -+ -+#if LOWLATENCY_DEBUG -+ -+#if LOWLATENCY_ALWAYS_SCHEDULE -+#define conditional_schedule_needed() ((enable_lowlatency == 2) || (enable_lowlatency && current->need_resched)) -+#else -+#define conditional_schedule_needed() (enable_lowlatency && current->need_resched) -+#endif -+ -+struct lolat_stats_t { -+ unsigned long count; -+ int visited; -+ const char *file; -+ int line; -+ struct lolat_stats_t *next; -+}; -+ -+void set_running_and_schedule(struct lolat_stats_t *stats); -+ -+#define unconditional_schedule() \ -+ do { \ -+ static struct lolat_stats_t stats = { \ -+ file: __FILE__, \ -+ line: __LINE__, \ -+ }; \ -+ set_running_and_schedule(&stats); \ -+ } while (0) -+ -+extern void show_lolat_stats(void); -+ -+#else /* LOWLATENCY_DEBUG */ -+ -+#if LOWLATENCY_ALWAYS_SCHEDULE -+#define conditional_schedule_needed() 1 -+#else -+#define conditional_schedule_needed() (current->need_resched) -+#endif -+ -+void set_running_and_schedule(void); -+#define unconditional_schedule() set_running_and_schedule() -+ -+#endif /* LOWLATENCY_DEBUG */ -+ -+#define conditional_schedule() \ -+ do { \ -+ if (conditional_schedule_needed()) \ -+ unconditional_schedule(); \ -+ } while (0) -+ -+#define DEFINE_RESCHED_COUNT int resched_count = 0 -+#define TEST_RESCHED_COUNT(n) (enable_lowlatency && (++resched_count > (n))) -+#define RESET_RESCHED_COUNT() resched_count = 0 -+extern int ll_copy_to_user(void *to_user, const void *from, unsigned long len); -+extern int ll_copy_from_user(void *to, const void *from_user, unsigned long len); -+ -+#else /* LOWLATENCY_NEEDED */ -+ -+#define conditional_schedule_needed() 0 -+#define conditional_schedule() -+#define unconditional_schedule() -+ -+#define DEFINE_RESCHED_COUNT -+#define TEST_RESCHED_COUNT(n) 0 -+#define RESET_RESCHED_COUNT() -+#define ll_copy_to_user(to_user, from, len) copy_to_user((to_user), (from), (len)) -+#define ll_copy_from_user(to, from_user, len) copy_from_user((to), (from_user), (len)) -+ -+#endif /* LOWLATENCY_NEEDED */ -+ -+#endif /* LOW_LATENCY_H_INCLUDED */ -+ -diff -Nur c3000_pre/linux/include/linux/mm.h c3000_test/linux/include/linux/mm.h ---- c3000_pre/linux/include/linux/mm.h 2004-08-21 09:49:13.000000000 +0900 -+++ c3000_test/linux/include/linux/mm.h 2004-12-20 22:56:21.000000000 +0900 -@@ -149,6 +149,8 @@ - */ - extern pgprot_t protection_map[16]; - -+/* Actions for zap_page_range() */ -+#define ZPR_COND_RESCHED 1 /* Do a conditional_schedule() occasionally */ - - /* - * These are the virtual MM functions - opening of an area, closing and -@@ -500,7 +502,7 @@ - extern void shmem_lock(struct file * file, int lock); - extern int shmem_zero_setup(struct vm_area_struct *); - --extern void zap_page_range(struct mm_struct *mm, unsigned long address, unsigned long size); -+extern void zap_page_range(struct mm_struct *mm, unsigned long address, unsigned long size, int actions); - extern int copy_page_range(struct mm_struct *dst, struct mm_struct *src, struct vm_area_struct *vma); - extern int remap_page_range(unsigned long from, unsigned long to, unsigned long size, pgprot_t prot); - extern int zeromap_page_range(unsigned long from, unsigned long size, pgprot_t prot); -diff -Nur c3000_pre/linux/include/linux/reiserfs_fs.h c3000_test/linux/include/linux/reiserfs_fs.h ---- c3000_pre/linux/include/linux/reiserfs_fs.h 2004-08-21 09:49:13.000000000 +0900 -+++ c3000_test/linux/include/linux/reiserfs_fs.h 2004-12-20 22:56:21.000000000 +0900 -@@ -1197,8 +1197,8 @@ - #define fs_generation(s) ((s)->u.reiserfs_sb.s_generation_counter) - #define get_generation(s) atomic_read (&fs_generation(s)) - #define FILESYSTEM_CHANGED_TB(tb) (get_generation((tb)->tb_sb) != (tb)->fs_gen) --#define fs_changed(gen,s) (gen != get_generation (s)) -- -+#define __fs_changed(gen,s) (gen != get_generation (s)) -+#define fs_changed(gen,s) ({conditional_schedule(); __fs_changed(gen,s);}) - - /***************************************************************************/ - /* FIXATE NODES */ -diff -Nur c3000_pre/linux/include/linux/sched.h c3000_test/linux/include/linux/sched.h ---- c3000_pre/linux/include/linux/sched.h 2004-08-21 09:49:13.000000000 +0900 -+++ c3000_test/linux/include/linux/sched.h 2004-12-20 22:56:21.000000000 +0900 -@@ -1092,6 +1092,7 @@ - #include <linux/dcache.h> - #include <linux/tqueue.h> - #include <linux/fs_struct.h> -+#include <linux/low-latency.h> - - #endif /* __KERNEL__ */ - #endif -diff -Nur c3000_pre/linux/include/linux/sysctl.h c3000_test/linux/include/linux/sysctl.h ---- c3000_pre/linux/include/linux/sysctl.h 2004-08-21 09:49:13.000000000 +0900 -+++ c3000_test/linux/include/linux/sysctl.h 2004-12-20 22:56:21.000000000 +0900 -@@ -131,6 +131,7 @@ - KERN_CORE_USES_PID=52, /* int: use core or core.%pid */ - KERN_TAINTED=53, /* int: various kernel tainted flags */ - KERN_CADPID=54, /* int: PID of the process to notify on CAD */ -+ KERN_LOWLATENCY=55, /* int: enable low latency scheduling */ - }; - - -diff -Nur c3000_pre/linux/kernel/exit.c c3000_test/linux/kernel/exit.c ---- c3000_pre/linux/kernel/exit.c 2004-08-21 09:49:14.000000000 +0900 -+++ c3000_test/linux/kernel/exit.c 2004-12-20 22:56:21.000000000 +0900 -@@ -196,6 +196,7 @@ - } - i++; - set >>= 1; -+ conditional_schedule(); /* sys_exit, many files open */ - } - } - } -diff -Nur c3000_pre/linux/kernel/ksyms.c c3000_test/linux/kernel/ksyms.c ---- c3000_pre/linux/kernel/ksyms.c 2004-12-19 00:35:59.000000000 +0900 -+++ c3000_test/linux/kernel/ksyms.c 2004-12-20 23:07:26.000000000 +0900 -@@ -481,6 +481,13 @@ - EXPORT_SYMBOL(do_gettimeofday); - EXPORT_SYMBOL(do_settimeofday); - -+#if LOWLATENCY_NEEDED -+EXPORT_SYMBOL(set_running_and_schedule); -+#ifdef CONFIG_LOLAT_SYSCTL -+EXPORT_SYMBOL(__enable_lowlatency); -+#endif -+#endif -+ - #if !defined(__ia64__) - EXPORT_SYMBOL(loops_per_jiffy); - #endif -diff -Nur c3000_pre/linux/kernel/module.c c3000_test/linux/kernel/module.c ---- c3000_pre/linux/kernel/module.c 2004-08-21 09:49:14.000000000 +0900 -+++ c3000_test/linux/kernel/module.c 2004-12-20 22:56:21.000000000 +0900 -@@ -1174,6 +1174,11 @@ - return ERR_PTR(-ENOMEM); - lock_kernel(); - for (v = module_list, n = *pos; v; n -= v->nsyms, v = v->next) { -+#if 0 -+ /* We can't actually do this, because we'd create a -+ * race against module unload. Need a semaphore. */ -+ conditional_schedule(); -+#endif - if (n < v->nsyms) { - p->mod = v; - p->index = n; -diff -Nur c3000_pre/linux/kernel/sched.c c3000_test/linux/kernel/sched.c ---- c3000_pre/linux/kernel/sched.c 2004-08-21 09:49:14.000000000 +0900 -+++ c3000_test/linux/kernel/sched.c 2004-12-20 22:56:21.000000000 +0900 -@@ -302,6 +302,17 @@ - if (tsk->processor != this_cpu) - smp_send_reschedule(tsk->processor); - } -+#if LOWLATENCY_NEEDED -+ if (enable_lowlatency && (p->policy != SCHED_OTHER)) { -+ struct task_struct *t; -+ for (i = 0; i < smp_num_cpus; i++) { -+ cpu = cpu_logical_map(i); -+ t = cpu_curr(cpu); -+ if (t != tsk) -+ t->need_resched = 1; -+ } -+ } -+#endif - return; - - -@@ -1429,3 +1440,93 @@ - atomic_inc(&init_mm.mm_count); - enter_lazy_tlb(&init_mm, current, cpu); - } -+ -+#if LOWLATENCY_NEEDED -+#if LOWLATENCY_DEBUG -+ -+static struct lolat_stats_t *lolat_stats_head; -+static spinlock_t lolat_stats_lock = SPIN_LOCK_UNLOCKED; -+ -+void set_running_and_schedule(struct lolat_stats_t *stats) -+{ -+ spin_lock(&lolat_stats_lock); -+ if (stats->visited == 0) { -+ stats->visited = 1; -+ stats->next = lolat_stats_head; -+ lolat_stats_head = stats; -+ } -+ stats->count++; -+ spin_unlock(&lolat_stats_lock); -+ -+ if (current->state != TASK_RUNNING) -+ set_current_state(TASK_RUNNING); -+ schedule(); -+} -+ -+void show_lolat_stats(void) -+{ -+ struct lolat_stats_t *stats = lolat_stats_head; -+ -+ printk("Low latency scheduling stats:\n"); -+ while (stats) { -+ printk("%s:%d: %lu\n", stats->file, stats->line, stats->count); -+ stats->count = 0; -+ stats = stats->next; -+ } -+} -+ -+#else /* LOWLATENCY_DEBUG */ -+ -+void set_running_and_schedule() -+{ -+ if (current->state != TASK_RUNNING) -+ __set_current_state(TASK_RUNNING); -+ schedule(); -+} -+ -+#endif /* LOWLATENCY_DEBUG */ -+ -+int ll_copy_to_user(void *to_user, const void *from, unsigned long len) -+{ -+ while (len) { -+ unsigned long n_to_copy = len; -+ unsigned long remainder; -+ -+ if (n_to_copy > 4096) -+ n_to_copy = 4096; -+ remainder = copy_to_user(to_user, from, n_to_copy); -+ if (remainder) -+ return remainder + len; -+ to_user = ((char *)to_user) + n_to_copy; -+ from = ((char *)from) + n_to_copy; -+ len -= n_to_copy; -+ conditional_schedule(); -+ } -+ return 0; -+} -+ -+int ll_copy_from_user(void *to, const void *from_user, unsigned long len) -+{ -+ while (len) { -+ unsigned long n_to_copy = len; -+ unsigned long remainder; -+ -+ if (n_to_copy > 4096) -+ n_to_copy = 4096; -+ remainder = copy_from_user(to, from_user, n_to_copy); -+ if (remainder) -+ return remainder + len; -+ to = ((char *)to) + n_to_copy; -+ from_user = ((char *)from_user) + n_to_copy; -+ len -= n_to_copy; -+ conditional_schedule(); -+ } -+ return 0; -+} -+ -+#ifdef CONFIG_LOLAT_SYSCTL -+struct low_latency_enable_struct __enable_lowlatency = { 0, }; -+#endif -+ -+#endif /* LOWLATENCY_NEEDED */ -+ -diff -Nur c3000_pre/linux/kernel/sysctl.c c3000_test/linux/kernel/sysctl.c ---- c3000_pre/linux/kernel/sysctl.c 2004-08-21 09:49:14.000000000 +0900 -+++ c3000_test/linux/kernel/sysctl.c 2004-12-20 22:56:21.000000000 +0900 -@@ -271,6 +271,10 @@ - {KERN_S390_USER_DEBUG_LOGGING,"userprocess_debug", - &sysctl_userprocess_debug,sizeof(int),0644,NULL,&proc_dointvec}, - #endif -+#ifdef CONFIG_LOLAT_SYSCTL -+ {KERN_LOWLATENCY, "lowlatency", &enable_lowlatency, sizeof (int), -+ 0644, NULL, &proc_dointvec}, -+#endif - {0} - }; - -diff -Nur c3000_pre/linux/mm/filemap.c c3000_test/linux/mm/filemap.c ---- c3000_pre/linux/mm/filemap.c 2004-08-21 09:49:15.000000000 +0900 -+++ c3000_test/linux/mm/filemap.c 2004-12-20 22:56:21.000000000 +0900 -@@ -179,7 +179,9 @@ - { - struct list_head *head, *curr; - struct page * page; -+ int ll_count = 100; - -+restart: - head = &inode->i_mapping->clean_pages; - - spin_lock(&pagemap_lru_lock); -@@ -190,6 +192,14 @@ - page = list_entry(curr, struct page, list); - curr = curr->next; - -+ if (conditional_schedule_needed() && ll_count) { -+ spin_unlock(&pagecache_lock); -+ spin_unlock(&pagemap_lru_lock); -+ unconditional_schedule(); -+ ll_count--; -+ goto restart; -+ } -+ - /* We cannot invalidate something in dirty.. */ - if (PageDirty(page)) - continue; -@@ -253,8 +263,7 @@ - page_cache_release(page); - } - --static int FASTCALL(truncate_list_pages(struct list_head *, unsigned long, unsigned *)); --static int truncate_list_pages(struct list_head *head, unsigned long start, unsigned *partial) -+static int truncate_list_pages(struct list_head *head, unsigned long start, unsigned *partial, int *restart_count) - { - struct list_head *curr; - struct page * page; -@@ -265,6 +274,17 @@ - while (curr != head) { - unsigned long offset; - -+ if (conditional_schedule_needed() && *restart_count) { -+ (*restart_count)--; -+ list_del(head); -+ list_add(head, curr); /* Restart on this page */ -+ spin_unlock(&pagecache_lock); -+ unconditional_schedule(); -+ spin_lock(&pagecache_lock); -+ unlocked = 1; -+ goto restart; -+ } -+ - page = list_entry(curr, struct page, list); - offset = page->index; - -@@ -297,13 +317,11 @@ - } else - wait_on_page(page); - -- page_cache_release(page); -- -- if (current->need_resched) { -- __set_current_state(TASK_RUNNING); -- schedule(); -+ if (LOWLATENCY_NEEDED) { -+ *restart_count = 4; /* We made progress */ - } - -+ page_cache_release(page); - spin_lock(&pagecache_lock); - goto restart; - } -@@ -326,13 +344,14 @@ - { - unsigned long start = (lstart + PAGE_CACHE_SIZE - 1) >> PAGE_CACHE_SHIFT; - unsigned partial = lstart & (PAGE_CACHE_SIZE - 1); -+ int restart_count = 4; - int unlocked; - - spin_lock(&pagecache_lock); - do { -- unlocked = truncate_list_pages(&mapping->clean_pages, start, &partial); -- unlocked |= truncate_list_pages(&mapping->dirty_pages, start, &partial); -- unlocked |= truncate_list_pages(&mapping->locked_pages, start, &partial); -+ unlocked = truncate_list_pages(&mapping->clean_pages, start, &partial, &restart_count); -+ unlocked |= truncate_list_pages(&mapping->dirty_pages, start, &partial, &restart_count); -+ unlocked |= truncate_list_pages(&mapping->locked_pages, start, &partial, &restart_count); - } while (unlocked); - /* Traversed all three lists without dropping the lock */ - spin_unlock(&pagecache_lock); -@@ -477,6 +496,7 @@ - - page_cache_get(page); - spin_unlock(&pagecache_lock); -+ conditional_schedule(); /* sys_msync() (only used by minixfs, udf) */ - lock_page(page); - - /* The buffers could have been free'd while we waited for the page lock */ -@@ -563,12 +583,14 @@ - list_del(&page->list); - list_add(&page->list, &mapping->locked_pages); - -- if (!PageDirty(page)) -- continue; -- - page_cache_get(page); - spin_unlock(&pagecache_lock); - -+ conditional_schedule(); /* sys_msync() */ -+ -+ if (!PageDirty(page)) -+ goto clean; -+ - lock_page(page); - - if (PageDirty(page)) { -@@ -579,7 +601,7 @@ - ret = err; - } else - UnlockPage(page); -- -+clean: - page_cache_release(page); - spin_lock(&pagecache_lock); - } -@@ -597,7 +619,8 @@ - int filemap_fdatawait(struct address_space * mapping) - { - int ret = 0; -- -+ DEFINE_RESCHED_COUNT; -+restart: - spin_lock(&pagecache_lock); - - while (!list_empty(&mapping->locked_pages)) { -@@ -606,6 +629,17 @@ - list_del(&page->list); - list_add(&page->list, &mapping->clean_pages); - -+ if (TEST_RESCHED_COUNT(32)) { -+ RESET_RESCHED_COUNT(); -+ if (conditional_schedule_needed()) { -+ page_cache_get(page); -+ spin_unlock(&pagecache_lock); -+ unconditional_schedule(); -+ page_cache_release(page); -+ goto restart; -+ } -+ } -+ - if (!PageLocked(page)) - continue; - -@@ -706,8 +740,10 @@ - spin_lock(&pagecache_lock); - page = __find_page_nolock(mapping, offset, *hash); - spin_unlock(&pagecache_lock); -- if (page) -+ if (page) { -+ conditional_schedule(); - return 0; -+ } - - page = page_cache_alloc(mapping); - if (!page) -@@ -963,6 +999,11 @@ - * the hash-list needs a held write-lock. - */ - repeat: -+ if (conditional_schedule_needed()) { -+ spin_unlock(&pagecache_lock); -+ unconditional_schedule(); -+ spin_lock(&pagecache_lock); -+ } - page = __find_page_nolock(mapping, offset, hash); - if (page) { - page_cache_get(page); -@@ -1413,6 +1454,8 @@ - page_cache_get(page); - spin_unlock(&pagecache_lock); - -+ conditional_schedule(); /* sys_read() */ -+ - if (!Page_Uptodate(page)) - goto page_not_up_to_date; - generic_file_readahead(reada_ok, filp, inode, page); -@@ -2114,6 +2157,12 @@ - address += PAGE_SIZE; - pte++; - } while (address && (address < end)); -+ -+ if (conditional_schedule_needed()) { -+ spin_unlock(&vma->vm_mm->page_table_lock); -+ unconditional_schedule(); /* syncing large mapped files */ -+ spin_lock(&vma->vm_mm->page_table_lock); -+ } - return error; - } - -@@ -2530,7 +2579,9 @@ - if (vma->vm_flags & VM_LOCKED) - return -EINVAL; - -- zap_page_range(vma->vm_mm, start, end - start); -+ zap_page_range(vma->vm_mm, start, end - start, -+ ZPR_COND_RESCHED); /* sys_madvise(MADV_DONTNEED) */ -+ - return 0; - } - -@@ -3095,6 +3146,9 @@ - goto sync_failure; - page_fault = __copy_from_user(kaddr+offset, buf, bytes); - flush_dcache_page(page); -+ -+ conditional_schedule(); -+ - status = mapping->a_ops->commit_write(file, page, offset, offset+bytes); - if (page_fault) - goto fail_write; -diff -Nur c3000_pre/linux/mm/memory.c c3000_test/linux/mm/memory.c ---- c3000_pre/linux/mm/memory.c 2004-08-21 09:49:15.000000000 +0900 -+++ c3000_test/linux/mm/memory.c 2004-12-20 22:56:21.000000000 +0900 -@@ -370,7 +370,7 @@ - /* - * remove user pages in a given range. - */ --void zap_page_range(struct mm_struct *mm, unsigned long address, unsigned long size) -+static void do_zap_page_range(struct mm_struct *mm, unsigned long address, unsigned long size) - { - mmu_gather_t *tlb; - pgd_t * dir; -@@ -494,6 +494,10 @@ - struct page *map; - while (!(map = follow_page(mm, start, write))) { - spin_unlock(&mm->page_table_lock); -+ -+ /* Pinning down many physical pages (kiobufs, mlockall) */ -+ conditional_schedule(); -+ - switch (handle_mm_fault(mm, vma, start, write)) { - case 1: - tsk->min_flt++; -@@ -655,6 +659,21 @@ - iobuf->locked = 0; - } - -+#define MAX_ZAP_BYTES 256*PAGE_SIZE -+ -+void zap_page_range(struct mm_struct *mm, unsigned long address, unsigned long size, int actions) -+{ -+ while (size) { -+ unsigned long chunk = size; -+ if (actions & ZPR_COND_RESCHED && chunk > MAX_ZAP_BYTES) -+ chunk = MAX_ZAP_BYTES; -+ do_zap_page_range(mm, address, chunk); -+ if (actions & ZPR_COND_RESCHED) -+ conditional_schedule(); -+ address += chunk; -+ size -= chunk; -+ } -+} - - /* - * Lock down all of the pages of a kiovec for IO. -@@ -764,11 +783,18 @@ - return 0; - } - --static inline void zeromap_pte_range(pte_t * pte, unsigned long address, -- unsigned long size, pgprot_t prot) -+static inline void zeromap_pte_range(struct mm_struct *mm, pte_t * pte, -+ unsigned long address, unsigned long size, -+ pgprot_t prot) - { - unsigned long end; - -+ if (conditional_schedule_needed()) { -+ spin_unlock(&mm->page_table_lock); -+ unconditional_schedule(); /* mmap(/dev/zero) */ -+ spin_lock(&mm->page_table_lock); -+ } -+ - address &= ~PMD_MASK; - end = address + size; - if (end > PMD_SIZE) -@@ -796,7 +822,7 @@ - pte_t * pte = pte_alloc(mm, pmd, address); - if (!pte) - return -ENOMEM; -- zeromap_pte_range(pte, address, end - address, prot); -+ zeromap_pte_range(mm, pte, address, end - address, prot); - address = (address + PMD_SIZE) & PMD_MASK; - pmd++; - } while (address && (address < end)); -@@ -1044,7 +1070,7 @@ - - /* mapping wholly truncated? */ - if (mpnt->vm_pgoff >= pgoff) { -- zap_page_range(mm, start, len); -+ zap_page_range(mm, start, len, 0); - continue; - } - -@@ -1057,7 +1083,7 @@ - /* Ok, partially affected.. */ - start += diff << PAGE_SHIFT; - len = (len - diff) << PAGE_SHIFT; -- zap_page_range(mm, start, len); -+ zap_page_range(mm, start, len, 0); - } while ((mpnt = mpnt->vm_next_share) != NULL); - } - -diff -Nur c3000_pre/linux/mm/mmap.c c3000_test/linux/mm/mmap.c ---- c3000_pre/linux/mm/mmap.c 2004-12-16 22:55:54.000000000 +0900 -+++ c3000_test/linux/mm/mmap.c 2004-12-20 23:07:25.000000000 +0900 -@@ -598,7 +598,7 @@ - fput(file); - - /* Undo any partial mapping done by a device driver. */ -- zap_page_range(mm, vma->vm_start, vma->vm_end - vma->vm_start); -+ zap_page_range(mm, vma->vm_start, vma->vm_end - vma->vm_start, 0); - free_vma: - kmem_cache_free(vm_area_cachep, vma); - return error; -@@ -998,7 +998,7 @@ - remove_shared_vm_struct(mpnt); - mm->map_count--; - -- zap_page_range(mm, st, size); -+ zap_page_range(mm, st, size, ZPR_COND_RESCHED); /* sys_munmap() */ - - /* - * Fix the mapping, and free the old area if it wasn't reused. -@@ -1158,7 +1158,7 @@ - } - mm->map_count--; - remove_shared_vm_struct(mpnt); -- zap_page_range(mm, start, size); -+ zap_page_range(mm, start, size, ZPR_COND_RESCHED); /* sys_exit() */ - if (mpnt->vm_file) - fput(mpnt->vm_file); - kmem_cache_free(vm_area_cachep, mpnt); -diff -Nur c3000_pre/linux/mm/mremap.c c3000_test/linux/mm/mremap.c ---- c3000_pre/linux/mm/mremap.c 2004-12-16 22:55:54.000000000 +0900 -+++ c3000_test/linux/mm/mremap.c 2004-12-20 23:07:25.000000000 +0900 -@@ -121,7 +121,7 @@ - flush_cache_range(mm, new_addr, new_addr + len); - while ((offset += PAGE_SIZE) < len) - move_one_page(mm, new_addr + offset, old_addr + offset); -- zap_page_range(mm, new_addr, len); -+ zap_page_range(mm, new_addr, len, 0); - #ifdef __arm__ - memc_update_mm(mm); - #endif -diff -Nur c3000_pre/linux/mm/slab.c c3000_test/linux/mm/slab.c ---- c3000_pre/linux/mm/slab.c 2004-11-16 15:31:09.000000000 +0900 -+++ c3000_test/linux/mm/slab.c 2004-12-20 22:56:21.000000000 +0900 -@@ -940,6 +940,7 @@ - list_del(&slabp->list); - - spin_unlock_irq(&cachep->spinlock); -+ conditional_schedule(); - kmem_slab_destroy(cachep, slabp); - ret++; - spin_lock_irq(&cachep->spinlock); -@@ -1853,6 +1854,7 @@ - */ - spin_unlock_irq(&best_cachep->spinlock); - kmem_slab_destroy(best_cachep, slabp); -+ conditional_schedule(); /* try_to_free_pages() */ - spin_lock_irq(&best_cachep->spinlock); - } - spin_unlock_irq(&best_cachep->spinlock); -diff -Nur c3000_pre/linux/mm/swapfile.c c3000_test/linux/mm/swapfile.c ---- c3000_pre/linux/mm/swapfile.c 2004-08-21 09:49:16.000000000 +0900 -+++ c3000_test/linux/mm/swapfile.c 2004-12-20 22:56:21.000000000 +0900 -@@ -819,7 +819,7 @@ - len += sprintf(buf + len, "partition\t"); - - usedswap = 0; -- for (j = 0; j < ptr->max; ++j) -+ for (j = 0; j < ptr->max; ++j) { - switch (ptr->swap_map[j]) { - case SWAP_MAP_BAD: - case 0: -@@ -827,6 +827,8 @@ - default: - usedswap++; - } -+ conditional_schedule(); -+ } - len += sprintf(buf + len, "%d\t%d\t%d\n", ptr->pages << (PAGE_SHIFT - 10), - usedswap << (PAGE_SHIFT - 10), ptr->prio); - } -@@ -1120,6 +1122,11 @@ - if (swap_info[i].flags != SWP_USED) - continue; - for (j = 0; j < swap_info[i].max; ++j) { -+ if (conditional_schedule_needed()) { -+ swap_list_unlock(); -+ conditional_schedule(); -+ swap_list_lock(); -+ } - switch (swap_info[i].swap_map[j]) { - case 0: - case SWAP_MAP_BAD: -diff -Nur c3000_pre/linux/mm/vmscan.c c3000_test/linux/mm/vmscan.c ---- c3000_pre/linux/mm/vmscan.c 2004-08-21 09:49:16.000000000 +0900 -+++ c3000_test/linux/mm/vmscan.c 2004-12-20 22:56:21.000000000 +0900 -@@ -173,6 +173,7 @@ - { - pte_t * pte; - unsigned long pmd_end; -+ DEFINE_RESCHED_COUNT; - - if (pmd_none(*dir)) - return count; -@@ -198,11 +199,17 @@ - address += PAGE_SIZE; - break; - } -+ if (TEST_RESCHED_COUNT(4)) { -+ if (conditional_schedule_needed()) -+ goto out; -+ RESET_RESCHED_COUNT(); -+ } - } - } - address += PAGE_SIZE; - pte++; - } while (address && (address < end)); -+out: - mm->swap_address = address; - return count; - } -@@ -231,6 +238,8 @@ - count = swap_out_pmd(mm, vma, pmd, address, end, count, classzone); - if (!count) - break; -+ if (conditional_schedule_needed()) -+ return count; - address = (address + PMD_SIZE) & PMD_MASK; - pmd++; - } while (address && (address < end)); -@@ -255,6 +264,8 @@ - count = swap_out_pgd(mm, vma, pgdir, address, end, count, classzone); - if (!count) - break; -+ if (conditional_schedule_needed()) -+ return count; - address = (address + PGDIR_SIZE) & PGDIR_MASK; - pgdir++; - } while (address && (address < end)); -@@ -276,6 +287,7 @@ - * Find the proper vm-area after freezing the vma chain - * and ptes. - */ -+continue_scan: - spin_lock(&mm->page_table_lock); - address = mm->swap_address; - if (address == TASK_SIZE || swap_mm != mm) { -@@ -293,6 +305,12 @@ - vma = vma->vm_next; - if (!vma) - break; -+ if (conditional_schedule_needed()) { /* Scanning a large vma */ -+ spin_unlock(&mm->page_table_lock); -+ unconditional_schedule(); -+ /* Continue from where we left off */ -+ goto continue_scan; -+ } - if (!count) - goto out_unlock; - address = vma->vm_start; -diff -Nur c3000_pre/linux/net/core/iovec.c c3000_test/linux/net/core/iovec.c ---- c3000_pre/linux/net/core/iovec.c 2004-08-21 11:23:13.000000000 +0900 -+++ c3000_test/linux/net/core/iovec.c 2004-12-20 22:56:21.000000000 +0900 -@@ -88,7 +88,7 @@ - if(iov->iov_len) - { - int copy = min_t(unsigned int, iov->iov_len, len); -- if (copy_to_user(iov->iov_base, kdata, copy)) -+ if (ll_copy_to_user(iov->iov_base, kdata, copy)) - goto out; - kdata+=copy; - len-=copy; -diff -Nur c3000_pre/linux/net/ipv4/tcp_minisocks.c c3000_test/linux/net/ipv4/tcp_minisocks.c ---- c3000_pre/linux/net/ipv4/tcp_minisocks.c 2004-08-21 09:49:22.000000000 +0900 -+++ c3000_test/linux/net/ipv4/tcp_minisocks.c 2004-12-20 22:56:21.000000000 +0900 -@@ -440,6 +440,9 @@ - { - struct tcp_tw_bucket *tw; - int killed = 0; -+#if LOWLATENCY_NEEDED -+ int max_killed = 0; -+#endif - - /* NOTE: compare this to previous version where lock - * was released after detaching chain. It was racy, -@@ -453,6 +456,13 @@ - goto out; - - while((tw = tcp_tw_death_row[tcp_tw_death_row_slot]) != NULL) { -+#if LOWLATENCY_NEEDED -+ /* This loop takes ~6 usecs per iteration. */ -+ if (killed > 100) { -+ max_killed = 1; -+ break; -+ } -+#endif - tcp_tw_death_row[tcp_tw_death_row_slot] = tw->next_death; - tw->pprev_death = NULL; - spin_unlock(&tw_death_lock); -@@ -463,12 +473,24 @@ - killed++; - - spin_lock(&tw_death_lock); -+ -+ } -+ -+#if LOWLATENCY_NEEDED -+ if (max_killed) { /* More to do: do it soon */ -+ mod_timer(&tcp_tw_timer, jiffies+2); -+ tcp_tw_count -= killed; -+ } -+ else -+#endif -+ { -+ tcp_tw_death_row_slot = -+ ((tcp_tw_death_row_slot + 1) & (TCP_TWKILL_SLOTS - 1)); -+ -+ if ((tcp_tw_count -= killed) != 0) -+ mod_timer(&tcp_tw_timer, jiffies+TCP_TWKILL_PERIOD); - } -- tcp_tw_death_row_slot = -- ((tcp_tw_death_row_slot + 1) & (TCP_TWKILL_SLOTS - 1)); - -- if ((tcp_tw_count -= killed) != 0) -- mod_timer(&tcp_tw_timer, jiffies+TCP_TWKILL_PERIOD); - net_statistics[smp_processor_id()*2].TimeWaited += killed; - out: - spin_unlock(&tw_death_lock); |