/* * remote_rwlock.c - kernel remote rwlock implementation. * * Authors Alain Greiner (2016,2017,2018) * * Copyright (c) UPMC Sorbonne Universites * * This file is part of ALMOS-MKH. * * ALMOS-MKH is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License as published by * the Free Software Foundation; version 2.0 of the License. * * ALMOS-MKH is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * General Public License for more details. * * You should have received a copy of the GNU General Public License * along with ALMOS-MKH; if not, write to the Free Software Foundation, * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */ #include #include #include #include #include #include #include #include ////////////////////////////////////////////////////////////////////////////// // Extern global variables ////////////////////////////////////////////////////////////////////////////// extern char * lock_type_str[]; // allocated in kernel_init.c ////////////////////////////////////////// void remote_rwlock_init( xptr_t lock_xp, uint32_t type ) { remote_rwlock_t * lock_ptr = GET_PTR( lock_xp ); cxy_t lock_cxy = GET_CXY( lock_xp ); hal_remote_s32 ( XPTR( lock_cxy , &lock_ptr->taken ) , 0 ); hal_remote_s32 ( XPTR( lock_cxy , &lock_ptr->count ) , 0 ); xlist_root_init( XPTR( lock_cxy , &lock_ptr->rd_xroot ) ); xlist_root_init( XPTR( lock_cxy , &lock_ptr->wr_xroot ) ); remote_busylock_init( XPTR( lock_cxy , &lock_ptr->lock ) , type ); } /////////////////////////////////////////////// void remote_rwlock_rd_acquire( xptr_t lock_xp ) { thread_t * this = CURRENT_THREAD; // check calling thread can yield thread_assert_can_yield( this , __FUNCTION__ ); // get cluster and local pointer on remote_rwlock remote_rwlock_t * lock_ptr = GET_PTR( lock_xp ); cxy_t lock_cxy = GET_CXY( lock_xp ); // build useful extended pointers xptr_t busylock_xp = XPTR( lock_cxy , &lock_ptr->lock ); xptr_t taken_xp = XPTR( lock_cxy , &lock_ptr->taken ); xptr_t count_xp = XPTR( lock_cxy , &lock_ptr->count ); xptr_t rd_root_xp = XPTR( lock_cxy , &lock_ptr->rd_xroot ); // get busylock remote_busylock_acquire( busylock_xp ); // block and deschedule if lock taken while( hal_remote_l32( taken_xp ) ) { #if DEBUG_RWLOCK if( DEBUG_RWLOCK < (uint32_t)hal_get_cycles() ) { uint32_t type = hal_remote_l32( XPTR( lock_cxy , &lock_ptr->lock.type ) ); printk("\n[DBG] %s : thread %x (%s) READ BLOCK on rwlock %s [%x,%x] / cycle %d\n", __FUNCTION__, this->trdid, thread_type_str(this->type), lock_type_str[type], lock_cxy, lock_ptr, (uint32_t)hal_get_cycles() ); } #endif // get pointer on calling thread thread_t * this = CURRENT_THREAD; // register reader thread in waiting queue xlist_add_last( rd_root_xp , XPTR( local_cxy , &this->wait_xlist ) ); // block reader thread thread_block( XPTR( local_cxy , this ) , THREAD_BLOCKED_LOCK ); // release busylock remote_busylock_release( busylock_xp ); // deschedule sched_yield("reader wait remote_rwlock"); // get busylock remote_busylock_acquire( busylock_xp ); } #if DEBUG_RWLOCK if( DEBUG_RWLOCK < (uint32_t)hal_get_cycles() ) { uint32_t type = hal_remote_l32( XPTR( lock_cxy , &lock_ptr->lock.type ) ); printk("\n[DBG] %s : thread %x (%s) READ ACQUIRE on rwlock %s [%x,%x] / cycle %d\n", __FUNCTION__, this->trdid, thread_type_str(this->type), lock_type_str[type], lock_cxy, lock_ptr, (uint32_t)hal_get_cycles() ); } #endif // increment number of readers hal_remote_atomic_add( count_xp , 1 ); // release busylock remote_busylock_release( busylock_xp ); } // end remote_rwlock_rd_acquire() /////////////////////////////////////////////// void remote_rwlock_wr_acquire( xptr_t lock_xp ) { thread_t * this = CURRENT_THREAD; // check calling thread can yield thread_assert_can_yield( this , __FUNCTION__ ); // get cluster and local pointer on remote_rwlock remote_rwlock_t * lock_ptr = GET_PTR( lock_xp ); cxy_t lock_cxy = GET_CXY( lock_xp ); // build useful extended pointers xptr_t busylock_xp = XPTR( lock_cxy , &lock_ptr->lock ); xptr_t taken_xp = XPTR( lock_cxy , &lock_ptr->taken ); xptr_t count_xp = XPTR( lock_cxy , &lock_ptr->count ); xptr_t wr_root_xp = XPTR( lock_cxy , &lock_ptr->wr_xroot ); // get busylock remote_busylock_acquire( busylock_xp ); // block and deschedule if lock already taken or current readers while( hal_remote_l32( taken_xp ) || hal_remote_l32( count_xp ) ) { #if DEBUG_RWLOCK if( DEBUG_RWLOCK < (uint32_t)hal_get_cycles() ) { uint32_t type = hal_remote_l32( XPTR( lock_cxy , &lock_ptr->lock.type ) ); printk("\n[DBG] %s : thread %x (%s) WRITE BLOCK on rwlock %s [%x,%x] / cycle %d\n", __FUNCTION__, this->trdid, thread_type_str(this->type), lock_type_str[type], lock_cxy, lock_ptr, (uint32_t)hal_get_cycles() ); } #endif // get local pointer on calling thread thread_t * this = CURRENT_THREAD; // register writer thread in waiting queue xlist_add_last( wr_root_xp , XPTR( local_cxy , &this->wait_xlist ) ); // block writer thread thread_block( XPTR( local_cxy , this ) , THREAD_BLOCKED_LOCK ); // release busylock remote_busylock_release( busylock_xp ); // deschedule sched_yield("writer wait remote_rwlock"); // get busylock remote_busylock_acquire( busylock_xp ); } #if DEBUG_RWLOCK if( DEBUG_RWLOCK < (uint32_t)hal_get_cycles() ) { uint32_t type = hal_remote_l32( XPTR( lock_cxy , &lock_ptr->lock.type ) ); printk("\n[DBG] %s : thread %x (%s) WRITE ACQUIRE on rwlock %s [%x,%x] / cycle %d\n", __FUNCTION__, this->trdid, thread_type_str(this->type), lock_type_str[type], lock_cxy, lock_ptr, (uint32_t)hal_get_cycles() ); } #endif // take rwlock hal_remote_s32( taken_xp , 1 ); // release busylock remote_busylock_release( busylock_xp ); } // end remote_rwlock_wr_acquire() /////////////////////////////////////////////// void remote_rwlock_rd_release( xptr_t lock_xp ) { // memory barrier before lock release hal_fence(); // get cluster and local pointer on remote_rwlock remote_rwlock_t * lock_ptr = GET_PTR( lock_xp ); cxy_t lock_cxy = GET_CXY( lock_xp ); // build useful extended pointers xptr_t busylock_xp = XPTR( lock_cxy , &lock_ptr->lock ); xptr_t count_xp = XPTR( lock_cxy , &lock_ptr->count ); xptr_t rd_root_xp = XPTR( lock_cxy , &lock_ptr->rd_xroot ); xptr_t wr_root_xp = XPTR( lock_cxy , &lock_ptr->wr_xroot ); // get busylock remote_busylock_acquire( busylock_xp ); #if DEBUG_RWLOCK if( DEBUG_RWLOCK < (uint32_t)hal_get_cycles() ) { thread_t * this = CURRENT_THREAD; uint32_t type = hal_remote_l32( XPTR( lock_cxy , &lock_ptr->lock.type ) ); printk("\n[DBG] %s : thread %x (%s) READ RELEASE on rwlock %s [%x,%x] / cycle %d\n", __FUNCTION__, this->trdid, thread_type_str(this->type), lock_type_str[type], lock_cxy, lock_ptr, (uint32_t)hal_get_cycles() ); } #endif // decrement number of readers hal_remote_atomic_add( count_xp , -1 ); // release first writer in waiting queue if no current readers // and writers waiting queue non empty if( (hal_remote_l32( count_xp ) == 0) && (xlist_is_empty( wr_root_xp ) == false) ) { // get first writer thread xptr_t thread_xp = XLIST_FIRST( wr_root_xp , thread_t, wait_xlist ); cxy_t thread_cxy = GET_CXY( thread_xp ); thread_t * thread_ptr = GET_PTR( thread_xp ); // remove this waiting thread from waiting list xlist_unlink( XPTR( thread_cxy , &thread_ptr->wait_xlist ) ); // unblock this waiting thread thread_unblock( thread_xp , THREAD_BLOCKED_LOCK ); #if DEBUG_RWLOCK if( (uint32_t)hal_get_cycles() > DEBUG_RWLOCK ) { thread_t * this = CURRENT_THREAD; uint32_t lock_type = hal_remote_l32( XPTR( lock_cxy , &lock_ptr->lock.type ) ); trdid_t trdid = hal_remote_l32( XPTR( thread_cxy , &thread_ptr->trdid ) ); uint32_t thread_type = hal_remote_lpt( XPTR( thread_cxy , &thread_ptr->type ) ); printk("\n[DBG] %s : thread %x (%s) UNBLOCK thread %x (%s)" " / rwlock %s [%x,%x] / cycle %d\n", __FUNCTION__, this->trdid, thread_type_str(this->type), trdid, thread_type_str(thread_type), lock_type_str[lock_type], lock_cxy, lock_ptr, (uint32_t)hal_get_cycles() ); } #endif } // release all readers in waiting queue if writers waiting queue empty // and readers waiting queue non empty else if( xlist_is_empty( wr_root_xp ) && (xlist_is_empty( rd_root_xp ) == false) ) { while( xlist_is_empty( rd_root_xp ) == false ) { // get first writer thread xptr_t thread_xp = XLIST_FIRST( wr_root_xp , thread_t, wait_xlist ); cxy_t thread_cxy = GET_CXY( thread_xp ); thread_t * thread_ptr = GET_PTR( thread_xp ); // remove this waiting thread from waiting list xlist_unlink( XPTR( thread_cxy , &thread_ptr->wait_xlist ) ); // unblock this waiting thread thread_unblock( thread_xp , THREAD_BLOCKED_LOCK ); #if DEBUG_RWLOCK if( (uint32_t)hal_get_cycles() > DEBUG_RWLOCK ) { thread_t * this = CURRENT_THREAD; uint32_t lock_type = hal_remote_l32( XPTR( lock_cxy , &lock_ptr->lock.type ) ); trdid_t trdid = hal_remote_l32( XPTR( thread_cxy , &thread_ptr->trdid ) ); uint32_t thread_type = hal_remote_lpt( XPTR( thread_cxy , &thread_ptr->type ) ); printk("\n[DBG] %s : thread %x (%s) UNBLOCK thread %x (%s)" " / rwlock %s [%x,%x] / cycle %d\n", __FUNCTION__, this->trdid, thread_type_str(this->type), trdid, thread_type_str(thread_type), lock_type_str[lock_type], lock_cxy, lock_ptr, (uint32_t)hal_get_cycles() ); } #endif } } // release busylock remote_busylock_release( busylock_xp ); } // end remote_rwlock_rd_release() /////////////////////////////////////////////// void remote_rwlock_wr_release( xptr_t lock_xp ) { // memory barrier before lock release hal_fence(); // get cluster and local pointer on remote_rwlock remote_rwlock_t * lock_ptr = GET_PTR( lock_xp ); cxy_t lock_cxy = GET_CXY( lock_xp ); // build useful extended pointers xptr_t busylock_xp = XPTR( lock_cxy , &lock_ptr->lock ); xptr_t taken_xp = XPTR( lock_cxy , &lock_ptr->taken ); xptr_t rd_root_xp = XPTR( lock_cxy , &lock_ptr->rd_xroot ); xptr_t wr_root_xp = XPTR( lock_cxy , &lock_ptr->wr_xroot ); // get busylock remote_busylock_acquire( busylock_xp ); #if DEBUG_RWLOCK if( DEBUG_RWLOCK < (uint32_t)hal_get_cycles() ) { thread_t * this = CURRENT_THREAD; uint32_t type = hal_remote_l32( XPTR( lock_cxy , &lock_ptr->lock.type ) ); printk("\n[DBG] %s : thread %x (%s) WRITE RELEASE on rwlock %s [%x,%x] / cycle %d\n", __FUNCTION__, this->trdid, thread_type_str(this->type), lock_type_str[type], lock_cxy, lock_ptr, (uint32_t)hal_get_cycles() ); } #endif // release rwlock hal_remote_s32( taken_xp , 0 ); // unblock first waiting writer thread if writers waiting queue non empty if( xlist_is_empty( wr_root_xp ) == false ) { // get first writer thread xptr_t thread_xp = XLIST_FIRST( wr_root_xp , thread_t, wait_xlist ); cxy_t thread_cxy = GET_CXY( thread_xp ); thread_t * thread_ptr = GET_PTR( thread_xp ); // remove this waiting thread from waiting list xlist_unlink( XPTR( thread_cxy , &thread_ptr->wait_xlist ) ); // unblock this waiting thread thread_unblock( thread_xp , THREAD_BLOCKED_LOCK ); #if DEBUG_RWLOCK if( (uint32_t)hal_get_cycles() > DEBUG_RWLOCK ) { thread_t * this = CURRENT_THREAD; uint32_t lock_type = hal_remote_l32( XPTR( lock_cxy , &lock_ptr->lock.type ) ); trdid_t trdid = hal_remote_l32( XPTR( thread_cxy , &thread_ptr->trdid ) ); uint32_t thread_type = hal_remote_lpt( XPTR( thread_cxy , &thread_ptr->type ) ); printk("\n[DBG] %s : thread %x (%s) UNBLOCK thread %x (%s)" " / rwlock %s [%x,%x] / cycle %d\n", __FUNCTION__, this->trdid, thread_type_str(this->type), trdid, thread_type_str(thread_type), lock_type_str[lock_type], lock_cxy, lock_ptr, (uint32_t)hal_get_cycles() ); } #endif } // check readers waiting queue and unblock all if writers waiting queue empty else { while( xlist_is_empty( rd_root_xp ) == false ) { // get first writer thread xptr_t thread_xp = XLIST_FIRST( rd_root_xp , thread_t, wait_xlist ); cxy_t thread_cxy = GET_CXY( thread_xp ); thread_t * thread_ptr = GET_PTR( thread_xp ); // remove this waiting thread from waiting list xlist_unlink( XPTR( thread_cxy , &thread_ptr->wait_xlist ) ); // unblock this waiting thread thread_unblock( thread_xp , THREAD_BLOCKED_LOCK ); #if DEBUG_RWLOCK if( (uint32_t)hal_get_cycles() > DEBUG_RWLOCK ) { thread_t * this = CURRENT_THREAD; uint32_t lock_type = hal_remote_l32( XPTR( lock_cxy , &lock_ptr->lock.type ) ); trdid_t trdid = hal_remote_l32( XPTR( thread_cxy , &thread_ptr->trdid ) ); uint32_t thread_type = hal_remote_lpt( XPTR( thread_cxy , &thread_ptr->type ) ); printk("\n[DBG] %s : thread %x (%s) UNBLOCK thread %x (%s)" " / rwlock %s [%x,%x] / cycle %d\n", __FUNCTION__, this->trdid, thread_type_str(this->type), trdid, thread_type_str(thread_type), lock_type_str[lock_type], lock_cxy, lock_ptr, (uint32_t)hal_get_cycles() ); } #endif } } // release busylock remote_busylock_release( busylock_xp ); } // end remote_rwlock_wr_release()