Merge into 1.0.07-rc : pbxt-07-low-disk-index-flush : Code : PBXT

Status:	Rejected
Rejected by:	Paul McCullagh on 2010-03-17
Proposed branch:	lp:~vkolesnikov/pbxt/pbxt-07-low-disk-index-flush
Merge into:	lp:pbxt/1.0.07-rc
Diff against target:	None lines
To merge this branch:	bzr merge lp:~vkolesnikov/pbxt/pbxt-07-low-disk-index-flush
Related bugs:	Link a bug report

Reviewer	Review Type	Date Requested	Status
Paul McCullagh		2009-08-14	Abstain on 2010-03-17
Review via email: mp+10141@code.launchpad.net

Revision history for this message

Paul McCullagh (paul-mccullagh) wrote on 2009-08-17:

#

Download full text (4.8 KiB)

Hi Vlad,

There is a problem with this change. Actually a serious bug.

See below:

On Aug 14, 2009, at 11:30 AM, Vladimir Kolesnikov wrote:

> Vladimir Kolesnikov has proposed merging lp:~vkolesnikov/pbxt/
> pbxt-07-low-disk-index-flush into lp:pbxt/1.0.07-rc.
>
> Requested reviews:
> PBXT Core (pbxt-core)
> --
> https://code.launchpad.net/~vkolesnikov/pbxt/pbxt-07-low-disk-index-
> flush/+merge/10141
> Your team PBXT Core is subscribed to branch lp:pbxt/1.0.07-rc.
> === modified file 'ChangeLog'
> --- ChangeLog 2009-08-11 09:17:53 +0000
> +++ ChangeLog 2009-08-14 09:23:20 +0000
> @@ -1,6 +1,10 @@
> PBXT Release Notes
> ==================
>
> +------- 1.0.07r RC - 2009-08-14
> +
> +RN267: Fixed an assertion failure: if checkpointer failed to
> successully flush indices (e.g. due to low disk state) then next
> time xt_flush_indices is called it would generate an assertion failure
> +
> RN266: Fixed a crash: when initialization failed with an exception
> THD structure was released twice
>
> ------- 1.0.07q RC - 2009-08-09
>
> === modified file 'src/index_xt.cc'
> --- src/index_xt.cc 2009-07-07 14:21:07 +0000
> +++ src/index_xt.cc 2009-08-13 13:49:21 +0000
> @@ -2785,7 +2785,6 @@
> *bytes_flushed += (dirty_blocks * XT_INDEX_PAGE_SIZE);
>
> curr_flush_seq = tab->tab_ind_flush_seq;
> - tab->tab_ind_flush_seq++;
>
> /* Write the dirty pages: */
> indp = tab->tab_dic.dic_keys;
> @@ -2981,6 +2980,13 @@
> }
> }
>
> + /* At this point all dirty blocks should have been successully
> flushed to disk,
> + * otherwise we must not increment this value as an assertion
> above in this
> + * function ASSERT_NS(block->cp_flush_seq == curr_flush_seq)
> + * will fail.
> + */
> + tab->tab_ind_flush_seq++;
> +
> indp = tab->tab_dic.dic_keys;
> for (i=0; i<tab->tab_dic.dic_key_count; i++, indp++) {
> ind = *indp;

I think you have moved tab_ind_flush_seq++ too far down. All locks on
the index are released before the if (wrote_something) block:

indp = tab->tab_dic.dic_keys;
for (i=0; i<tab->tab_dic.dic_key_count; i++, indp++) {
ind = *indp;
XT_INDEX_UNLOCK(ind, ot);
}

if (wrote_something) {
....

After that point, the index can be updated again. Then it is important
that the updates use a different flush sequence number. If not, the
page will be freed by the code that occurred just above this point:

  /* Free up flushed pages: */
  indp = tab->tab_dic.dic_keys;
  for (i=0; i<tab->tab_dic.dic_key_count; i++, indp++) {
                    ...

And the changes in the cache will be lost!

>
> === modified file 'src/lock_xt.h'
> --- src/lock_xt.h 2008-11-17 10:14:17 +0000
> +++ src/lock_xt.h 2009-08-13 13:49:21 +0000
> @@ -234,6 +234,38 @@
> return val;
> }
>
> +inline void xt_atomic_inc4(volatile xtWord4 *mptr)
> +{
> +#ifdef XT_ATOMIC_WIN32_X86
> + __asm MOV ECX, mptr
> + __asm LOCK INC DWORD PTR [ECX]
> +#elif defined(XT_ATOMIC_GNUC_X86)
> + asm volatile ("lock; incl %0" : : "m" (*mptr) : "memory");
> +#elif defined(XT_ATOMIC_GCC_OPS)
> + __sync_fetch_and_add(mptr, 1);
> +#elif defined(XT_ATOMIC_SOLARIS_LIB)
> + atomic_inc_32_nv(mptr);
> +#else
> + ++(*mptr);
> +#endif
> +}
> +
> +inline void x...

Hi Vlad,

There is a problem with this change. Actually a serious bug.

See below:

On Aug 14, 2009, at 11:30 AM, Vladimir Kolesnikov wrote:

> Vladimir Kolesnikov has proposed merging lp:~vkolesnikov/pbxt/ 
> pbxt-07-low-disk-index-flush into lp:pbxt/1.0.07-rc.
>
> Requested reviews:
>    PBXT Core (pbxt-core)
> -- 
> https://code.launchpad.net/~vkolesnikov/pbxt/pbxt-07-low-disk-index- 
> flush/+merge/10141
> Your team PBXT Core is subscribed to branch lp:pbxt/1.0.07-rc.
> === modified file 'ChangeLog'
> --- ChangeLog	2009-08-11 09:17:53 +0000
> +++ ChangeLog	2009-08-14 09:23:20 +0000
> @@ -1,6 +1,10 @@
> PBXT Release Notes
> ==================
>
> +------- 1.0.07r RC - 2009-08-14
> +
> +RN267: Fixed an assertion failure: if checkpointer failed to  
> successully flush indices (e.g. due to low disk state) then next  
> time xt_flush_indices is called it would generate an assertion failure
> +
> RN266: Fixed a crash: when initialization failed with an exception  
> THD structure was released twice
>
> ------- 1.0.07q RC - 2009-08-09
>
> === modified file 'src/index_xt.cc'
> --- src/index_xt.cc	2009-07-07 14:21:07 +0000
> +++ src/index_xt.cc	2009-08-13 13:49:21 +0000
> @@ -2785,7 +2785,6 @@
> 		*bytes_flushed += (dirty_blocks * XT_INDEX_PAGE_SIZE);
>
> 	curr_flush_seq = tab->tab_ind_flush_seq;
> -	tab->tab_ind_flush_seq++;
>
> 	/* Write the dirty pages: */
> 	indp = tab->tab_dic.dic_keys;
> @@ -2981,6 +2980,13 @@
> 			}
> 		}
>
> +		/* At this point all dirty blocks should have been successully  
> flushed to disk,
> +		 * otherwise we must not increment this value as an assertion  
> above in this
> +		 * function ASSERT_NS(block->cp_flush_seq == curr_flush_seq)
> +		 * will fail.
> +		 */
> +		tab->tab_ind_flush_seq++;
> +
> 		indp = tab->tab_dic.dic_keys;
> 		for (i=0; i<tab->tab_dic.dic_key_count; i++, indp++) {
> 			ind = *indp;

I think you have moved tab_ind_flush_seq++ too far down. All locks on  
the index are released before the if (wrote_something) block:

indp = tab->tab_dic.dic_keys;
	for (i=0; i<tab->tab_dic.dic_key_count; i++, indp++) {
		ind = *indp;
		XT_INDEX_UNLOCK(ind, ot);
	}

if (wrote_something) {
            ....

After that point, the index can be updated again. Then it is important  
that the updates use a different flush sequence number. If not, the  
page will be freed by the code that occurred just above this point:

/* Free up flushed pages: */
		indp = tab->tab_dic.dic_keys;
		for (i=0; i<tab->tab_dic.dic_key_count; i++, indp++) {
                    ...

And the changes in the cache will be lost!

>
> === modified file 'src/lock_xt.h'
> --- src/lock_xt.h	2008-11-17 10:14:17 +0000
> +++ src/lock_xt.h	2009-08-13 13:49:21 +0000
> @@ -234,6 +234,38 @@
> 	return val;
> }
>
> +inline void xt_atomic_inc4(volatile xtWord4 *mptr)
> +{
> +#ifdef XT_ATOMIC_WIN32_X86
> +	__asm MOV  ECX, mptr
> +	__asm LOCK INC	DWORD PTR [ECX]
> +#elif defined(XT_ATOMIC_GNUC_X86)
> +	asm volatile ("lock; incl %0" : : "m" (*mptr) : "memory");
> +#elif defined(XT_ATOMIC_GCC_OPS)
> +	__sync_fetch_and_add(mptr, 1);
> +#elif defined(XT_ATOMIC_SOLARIS_LIB)
> +	atomic_inc_32_nv(mptr);
> +#else
> +	++(*mptr);
> +#endif
> +}
> +
> +inline void xt_atomic_dec4(volatile xtWord4 *mptr)
> +{
> +#ifdef XT_ATOMIC_WIN32_X86
> +	__asm MOV  ECX, mptr
> +	__asm LOCK DEC	DWORD PTR [ECX]
> +#elif defined(XT_ATOMIC_GNUC_X86)
> +	asm volatile ("lock; decl %0" : : "m" (*mptr) : "memory");
> +#elif defined(XT_ATOMIC_GCC_OPS)
> +	__sync_fetch_and_sub(mptr, 1);
> +#elif defined(XT_ATOMIC_SOLARIS_LIB)
> +	atomic_dec_32_nv(mptr);
> +#else
> +	--(*mptr);
> +#endif
> +}
> +

Please check your merge, I have blank lines between each line in the  
code above.

>
> inline void xt_atomic_set4(volatile xtWord4 *mptr, xtWord4 val)
> {
> #ifdef XT_SPL_WIN32_ASM
>
> === modified file 'src/strutil_xt.cc'
> --- src/strutil_xt.cc	2009-08-09 15:46:45 +0000
> +++ src/strutil_xt.cc	2009-08-14 09:23:20 +0000
> @@ -367,7 +367,7 @@
>
> xtPublic c_char *xt_get_version(void)
> {
> -	return "1.0.07q RC";
> +	return "1.0.07r RC";
> }
>
> /* Copy and URL decode! */
>
> === modified file 'src/tabcache_xt.cc'
> --- src/tabcache_xt.cc	2009-01-30 10:23:54 +0000
> +++ src/tabcache_xt.cc	2009-08-13 13:49:21 +0000
> @@ -345,7 +345,7 @@
> 	if (!tc_fetch(file, ref_id, &seg, &page, offset, thread))
> 		return FAILED;
> #endif
> -	page->tcp_lock_count++;
> +	xt_atomic_inc4(&page->tcp_lock_count);

An atomic operation is not required here because the page is locked.

Question: is it required because of on chip cache co-ordination  
problems?

> 	xt_rwmutex_unlock(&seg->tcs_lock, thread->t_id);
> 	*ret_page = page;
> 	return OK;
> @@ -376,7 +376,7 @@
> #endif
>
> 	if (page->tcp_lock_count > 0)
> -		page->tcp_lock_count--;
> +		xt_atomic_dec4(&page->tcp_lock_count);
>
> 	xt_rwmutex_unlock(&seg->tcs_lock, thread->t_id);
> }
>

--
Paul McCullagh
PrimeBase Technologies
www.primebase.org
www.blobstreaming.org
pbxt.blogspot.com

Revision history for this message

Vladimir Kolesnikov (vkolesnikov) wrote on 2009-08-18:

#

Hi Paul,

I pushed fix update. Please check the latest rev.

lp:~vkolesnikov/pbxt/pbxt-07-low-disk-index-flush updated on 2009-08-18

558. By Vladimir Kolesnikov on 2009-08-18: out-of-disk handling improvements: keep and retry ilog

Revision history for this message

Paul McCullagh (paul-mccullagh) wrote on 2009-08-19:

#

Download full text (3.2 KiB)

Hi Vlad,

Some points to look at. I have pasted the code below, and added
references.

(1) The variable "curr_flush_seq" is now only used for debug code. It
should probably be placed inside an #ifdef DEBUG block.

(2) The tab_ind_flush_lock should not be held across calls to this
function, because there is no guarantee that the thread that failed
the first flush will return.

(3) goto failed_2 here is way too early to save the il!

(4) The il should be saved at this point. I recommend setting
tab->tab_ind_unflushed_ilog = il at this point, and setting
tab->tab_ind_unflushed_ilog = NULL later, after success.

(5) This must be done before the checkpoint is ended.

-----------------------------
(1) xtWord2 curr_flush_seq;
XTIndFreeListPtr list_ptr;
u_int dirty_blocks;
XTCheckPointTablePtr cp_tab;
XTCheckPointStatePtr cp = NULL;
xtBool retry_old_ilog = FALSE;

restart:
if (!xt_begin_checkpoint(tab->tab_db, have_table_lock, ot->ot_thread))
return FAILED;

if (tab->tab_ind_unflushed_ilog) {
  wrote_something = TRUE;
  retry_old_ilog = TRUE;
  il = tab->tab_ind_unflushed_ilog;
  goto previous_ilog;
}

#ifdef DEBUG_CHECK_IND_CACHE
xt_ind_check_cache(NULL);
#endif
xt_lock_mutex_ns(&tab->tab_ind_flush_lock);

if (!tab->tab_db->db_indlogs.ilp_get_log(&il, ot->ot_thread))
goto failed_3;

il->il_reset(tab);
if (!il->il_write_byte(ot, XT_DT_FREE_LIST))
goto failed_2;
if (!il->il_write_word4(ot, tab->tab_id))
goto failed_2;
if (!il->il_write_word4(ot, 0))
(3) goto failed_2;

----------------------

previous_ilog:
if (wrote_something) {
(4) tab->tab_ind_unflushed_ilog = il;
il = NULL;

----------------------
if (!retry_old_ilog)
xt_unlock_mutex_ns(&tab->tab_ind_flush_lock);

#ifdef DEBUG_CHECK_IND_CACHE
xt_ind_check_cache((XTIndex *) 1);
#endif
#ifdef TRACE_FLUSH
printf("FLUSH --end-- %s\n", tab->tab_name->ps_path);
fflush(stdout);
#endif
if (!xt_end_checkpoint(tab->tab_db, ot->ot_thread, NULL))
return FAILED;

(5) if (retry_old_ilog) {
  tab->tab_ind_unflushed_ilog = NULL;
  retry_old_ilog = FALSE;
  goto restart;
}

return OK;

failed:
indp = tab->tab_dic.dic_keys;
for (i=0; i<tab->tab_dic.dic_key_count; i++, indp++) {
ind = *indp;
XT_INDEX_UNLOCK(ind, ot);
}

/* we failed with a partially written ilog. keep it and try to write
it next time this function is called */
failed_2:
ASSERT_NS(il);
/* either there was no unflushed ilog, or our current ilog is the
unflushed one */
ASSERT_NS(tab->tab_ind_unflushed_ilog == NULL || tab-
>tab_ind_unflushed_ilog == il);
tab->tab_ind_unflushed_ilog = il;

/* this label is for the case when there's no [yet] ilog, otherwise
must preserve ilog to be flushed later
  * (see failed_2)
  */
failed_3:
(2) if (!retry_old_ilog)
  xt_unlock_mutex_ns(&tab->tab_ind_flush_lock);
#ifdef DEBUG_CHECK_IND_CACHE
xt_ind_check_cache(NULL);
#endif
return FAILED;
---------------------------

On Aug 18, 2009, at 10:40 PM, Vladimir Kolesnikov wrote:

> Hi Paul,
>
> I pushed fix update. Please check the latest rev.
> --
> https://code.launchpad.net/~vkolesnikov/pbxt/pbxt-07-low-disk-index-
> flush/+merge/10141
> Your team PBXT Core is subscribed to branch lp:p...

Hi Vlad,

Some points to look at. I have pasted the code below, and added  
references.

(1) The variable "curr_flush_seq" is now only used for debug code. It
should probably be placed inside an #ifdef DEBUG block.

(2) The tab_ind_flush_lock should not be held across calls to this  
function, because there is no guarantee that the thread that failed  
the first flush will return.

(3) goto failed_2 here is way too early to save the il!

(4) The il should be saved at this point. I recommend setting
tab->tab_ind_unflushed_ilog = il at this point, and setting
tab->tab_ind_unflushed_ilog = NULL later, after success.

(5) This must be done before the checkpoint is ended.

-----------------------------
(1)	xtWord2					curr_flush_seq;
	XTIndFreeListPtr		list_ptr;
	u_int					dirty_blocks;
	XTCheckPointTablePtr	cp_tab;
	XTCheckPointStatePtr	cp = NULL;
	xtBool					retry_old_ilog = FALSE;

restart:
	if (!xt_begin_checkpoint(tab->tab_db, have_table_lock, ot->ot_thread))
		return FAILED;

if (tab->tab_ind_unflushed_ilog) {
		wrote_something = TRUE;
		retry_old_ilog = TRUE;
		il = tab->tab_ind_unflushed_ilog;
		goto previous_ilog;
	}

#ifdef DEBUG_CHECK_IND_CACHE
	xt_ind_check_cache(NULL);
#endif
	xt_lock_mutex_ns(&tab->tab_ind_flush_lock);

if (!tab->tab_db->db_indlogs.ilp_get_log(&il, ot->ot_thread))
		goto failed_3;

il->il_reset(tab);
	if (!il->il_write_byte(ot, XT_DT_FREE_LIST))
		goto failed_2;
	if (!il->il_write_word4(ot, tab->tab_id))
		goto failed_2;
	if (!il->il_write_word4(ot, 0))
(3)		goto failed_2;

----------------------

previous_ilog:
	if (wrote_something) {
(4)		tab->tab_ind_unflushed_ilog = il;
		il = NULL;

----------------------
	if (!retry_old_ilog)
		xt_unlock_mutex_ns(&tab->tab_ind_flush_lock);

#ifdef DEBUG_CHECK_IND_CACHE
	xt_ind_check_cache((XTIndex *) 1);
#endif
#ifdef TRACE_FLUSH
	printf("FLUSH --end-- %s\n", tab->tab_name->ps_path);
	fflush(stdout);
#endif
	if (!xt_end_checkpoint(tab->tab_db, ot->ot_thread, NULL))
		return FAILED;
	
(5)	if (retry_old_ilog) {
		tab->tab_ind_unflushed_ilog = NULL;
		retry_old_ilog = FALSE;
		goto restart;
	}
	
	return OK;

failed:
	indp = tab->tab_dic.dic_keys;
	for (i=0; i<tab->tab_dic.dic_key_count; i++, indp++) {
		ind = *indp;
		XT_INDEX_UNLOCK(ind, ot);
	}

/* we failed with a partially written ilog. keep it and try to write  
it next time this function is called */
	failed_2:
	ASSERT_NS(il);
	/* either there was no unflushed ilog, or our current ilog is the  
unflushed one */
	ASSERT_NS(tab->tab_ind_unflushed_ilog == NULL || tab- 
 >tab_ind_unflushed_ilog == il);
	tab->tab_ind_unflushed_ilog = il;

/* this label is for the case when there's no [yet] ilog, otherwise  
must preserve ilog to be flushed later
	 * (see failed_2)
	 */
	failed_3:
(2)	if (!retry_old_ilog)
		xt_unlock_mutex_ns(&tab->tab_ind_flush_lock);
#ifdef DEBUG_CHECK_IND_CACHE
	xt_ind_check_cache(NULL);
#endif
	return FAILED;
---------------------------

On Aug 18, 2009, at 10:40 PM, Vladimir Kolesnikov wrote:

> Hi Paul,
>
> I pushed fix update. Please check the latest rev.
> -- 
> https://code.launchpad.net/~vkolesnikov/pbxt/pbxt-07-low-disk-index- 
> flush/+merge/10141
> Your team PBXT Core is subscribed to branch lp:pbxt/1.0.07-rc.

--
Paul McCullagh
PrimeBase Technologies
www.primebase.org
www.blobstreaming.org
pbxt.blogspot.com

Revision history for this message

Paul McCullagh (paul-mccullagh) wrote on 2009-08-19:

#

And one other thing:

tab_ind_unflushed_ilog must be freed when the table object is freed.

On Aug 18, 2009, at 10:40 PM, Vladimir Kolesnikov wrote:

> Hi Paul,
>
> I pushed fix update. Please check the latest rev.
> --
> https://code.launchpad.net/~vkolesnikov/pbxt/pbxt-07-low-disk-index-
> flush/+merge/10141
> Your team PBXT Core is subscribed to branch lp:pbxt/1.0.07-rc.

--
Paul McCullagh
PrimeBase Technologies
www.primebase.org
www.blobstreaming.org
pbxt.blogspot.com

lp:~vkolesnikov/pbxt/pbxt-07-low-disk-index-flush updated on 2009-08-26

559. By Vladimir Kolesnikov on 2009-08-26: more improvements for the index flush fix

Revision history for this message

Paul McCullagh (paul-mccullagh) wrote on 2009-09-08:

#

Hi Vlad,

The patch is looking a lot better. Some more comments:

xt_xlog_flush_log() should not return FALSE unless it raises an error.

So I think we just have to return OK, even though the flush is not done. I have a better solution for this in 1.0.08 now: I pass the db pointer in to the function.

xtPublic xtBool xt_xlog_flush_log(XTThreadPtr thread)
{
if (thread->st_database)
return thread->st_database->db_xlog.xlog_flush(thread);
else
return FALSE;
}

"il_flush_seq = tab->tab_ind_flush_seq" cannot be done here. It must rather be done where the old assignment ("curr_flush_seq = tab->tab_ind_flush_seq") took place. This is after all indexes have been locked:

void XTIndexLog::il_reset(XTTable *tab)
{
il_tab_id = tab->tab_id;
il_log_eof = 0;
il_buffer_len = 0;
il_buffer_offset = 0;
il_flush_seq = tab->tab_ind_flush_seq;
}

I don't like "ilp_db = NULL". Could we rather move the ilp_exit() call to after xt_tab_exit_db()? If that works, then add a comment to ensure that we know that xt_tab_exit_db() is dependent on db->db_indlogs.

void XTIndexLogPool::ilp_exit(struct XTThread *self)
{
ilp_close(self, FALSE);
ASSERT_NS(il_pool_count == 0);
xt_free_mutex(&ilp_lock);
ilp_db = NULL; /* reset backpointer to flag the "exit" state */
}

lock_xt.h: Something is wrong with the line endings.

review: Needs Fixing

Revision history for this message

Paul McCullagh (paul-mccullagh) wrote on 2010-03-17:

#

This fix has been superseded by lp:~vkolesnikov/pbxt/pbxt-ilog-out-of-disk.

review: Abstain

PBXT

Merge lp:~vkolesnikov/pbxt/pbxt-07-low-disk-index-flush into lp:pbxt/1.0.07-rc

Commit message

Description of the change

Unmerged revisions

Preview Diff

Subscribers

 === modified file 'ChangeLog'
 --- ChangeLog	2009-08-11 09:17:53 +0000
 +++ ChangeLog	2009-08-14 09:23:20 +0000
@@ -1,6 +1,10 @@
  PBXT Release Notes
  ==================
++------- 1.0.07r RC - 2009-08-14
++
++RN267: Fixed an assertion failure: if checkpointer failed to successully flush indices (e.g. due to low disk state) then next time xt_flush_indices is called it would generate an assertion failure
++
  RN266: Fixed a crash: when initialization failed with an exception THD structure was released twice
  ------- 1.0.07q RC - 2009-08-09
 === modified file 'src/index_xt.cc'
 --- src/index_xt.cc	2009-07-07 14:21:07 +0000
 +++ src/index_xt.cc	2009-08-13 13:49:21 +0000
@@ -2785,7 +2785,6 @@
  		*bytes_flushed += (dirty_blocks * XT_INDEX_PAGE_SIZE);
  	curr_flush_seq = tab->tab_ind_flush_seq;
--	tab->tab_ind_flush_seq++;
  	/* Write the dirty pages: */
  	indp = tab->tab_dic.dic_keys;
@@ -2981,6 +2980,13 @@
+ 			}
+ 		}
++		/* At this point all dirty blocks should have been successully flushed to disk,
++		 * otherwise we must not increment this value as an assertion above in this
++		 * function ASSERT_NS(block->cp_flush_seq == curr_flush_seq)
++		 * will fail.
++		 */
++		tab->tab_ind_flush_seq++;
++
  		indp = tab->tab_dic.dic_keys;
  		for (i=0; i<tab->tab_dic.dic_key_count; i++, indp++) {
  			ind = *indp;
 === modified file 'src/lock_xt.h'
 --- src/lock_xt.h	2008-11-17 10:14:17 +0000
 +++ src/lock_xt.h	2009-08-13 13:49:21 +0000
@@ -234,6 +234,38 @@
  	return val;
+ }
++inline void xt_atomic_inc4(volatile xtWord4 *mptr)
++{
++#ifdef XT_ATOMIC_WIN32_X86
++	__asm MOV  ECX, mptr
++	__asm LOCK INC	DWORD PTR [ECX]
++#elif defined(XT_ATOMIC_GNUC_X86)
++	asm volatile ("lock; incl %0" : : "m" (*mptr) : "memory");
++#elif defined(XT_ATOMIC_GCC_OPS)
++	__sync_fetch_and_add(mptr, 1);
++#elif defined(XT_ATOMIC_SOLARIS_LIB)
++	atomic_inc_32_nv(mptr);
++#else
++	++(*mptr);
++#endif
++}
++
++inline void xt_atomic_dec4(volatile xtWord4 *mptr)
++{
++#ifdef XT_ATOMIC_WIN32_X86
++	__asm MOV  ECX, mptr
++	__asm LOCK DEC	DWORD PTR [ECX]
++#elif defined(XT_ATOMIC_GNUC_X86)
++	asm volatile ("lock; decl %0" : : "m" (*mptr) : "memory");
++#elif defined(XT_ATOMIC_GCC_OPS)
++	__sync_fetch_and_sub(mptr, 1);
++#elif defined(XT_ATOMIC_SOLARIS_LIB)
++	atomic_dec_32_nv(mptr);
++#else
++	--(*mptr);
++#endif
++}
++
  inline void xt_atomic_set4(volatile xtWord4 *mptr, xtWord4 val)
+ {
  #ifdef XT_SPL_WIN32_ASM
 === modified file 'src/strutil_xt.cc'
 --- src/strutil_xt.cc	2009-08-09 15:46:45 +0000
 +++ src/strutil_xt.cc	2009-08-14 09:23:20 +0000
@@ -367,7 +367,7 @@
  xtPublic c_char *xt_get_version(void)
+ {
--	return "1.0.07q RC";
++	return "1.0.07r RC";
+ }
  /* Copy and URL decode! */
 === modified file 'src/tabcache_xt.cc'
 --- src/tabcache_xt.cc	2009-01-30 10:23:54 +0000
 +++ src/tabcache_xt.cc	2009-08-13 13:49:21 +0000
@@ -345,7 +345,7 @@
  	if (!tc_fetch(file, ref_id, &seg, &page, offset, thread))
  		return FAILED;
  #endif
--	page->tcp_lock_count++;
++	xt_atomic_inc4(&page->tcp_lock_count);
  	xt_rwmutex_unlock(&seg->tcs_lock, thread->t_id);
  	*ret_page = page;
  	return OK;
@@ -376,7 +376,7 @@
  #endif
  	if (page->tcp_lock_count > 0)
--		page->tcp_lock_count--;
++		xt_atomic_dec4(&page->tcp_lock_count);
  	xt_rwmutex_unlock(&seg->tcs_lock, thread->t_id);
+ }