source: trunk/kernel/kern/thread.c @ 471

Last change on this file since 471 was 469, checked in by alain, 6 years ago

1) Introduce the libsemaphore library.
2) Introduce a small libmath library, required by the "fft" application.
3) Introduce the multithreaded "fft" application.
4) Fix a bad synchronisation bug in the Copy-On-Write mechanism.

File size: 41.5 KB
Line 
1/*
2 * thread.c -  implementation of thread operations (user & kernel)
3 *
4 * Author  Ghassan Almaless (2008,2009,2010,2011,2012)
5 *         Alain Greiner (2016,2017)
6 *
7 * Copyright (c) UPMC Sorbonne Universites
8 *
9 * This file is part of ALMOS-MKH.
10 *
11 * ALMOS-MKH is free software; you can redistribute it and/or modify it
12 * under the terms of the GNU General Public License as published by
13 * the Free Software Foundation; version 2.0 of the License.
14 *
15 * ALMOS-MKH is distributed in the hope that it will be useful, but
16 * WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
18 * General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with ALMOS-MKH; if not, write to the Free Software Foundation,
22 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
23 */
24
25#include <kernel_config.h>
26#include <hal_kernel_types.h>
27#include <hal_context.h>
28#include <hal_irqmask.h>
29#include <hal_special.h>
30#include <hal_remote.h>
31#include <memcpy.h>
32#include <printk.h>
33#include <cluster.h>
34#include <process.h>
35#include <scheduler.h>
36#include <dev_pic.h>
37#include <core.h>
38#include <list.h>
39#include <xlist.h>
40#include <page.h>
41#include <kmem.h>
42#include <ppm.h>
43#include <thread.h>
44#include <rpc.h>
45
46//////////////////////////////////////////////////////////////////////////////////////
47// Extern global variables
48//////////////////////////////////////////////////////////////////////////////////////
49
50extern process_t      process_zero;
51
52//////////////////////////////////////////////////////////////////////////////////////
53// This function returns a printable string for the thread type.
54//////////////////////////////////////////////////////////////////////////////////////
55char * thread_type_str( uint32_t type )
56{
57    if     ( type == THREAD_USER   ) return "USR";
58    else if( type == THREAD_RPC    ) return "RPC";
59    else if( type == THREAD_DEV    ) return "DEV";
60    else if( type == THREAD_IDLE   ) return "IDL";
61    else                             return "undefined";
62}
63
64/////////////////////////////////////////////////////////////////////////////////////
65// This static function allocates physical memory for a thread descriptor.
66// It can be called by the three functions:
67// - thread_user_create()
68// - thread_user_fork()
69// - thread_kernel_create()
70/////////////////////////////////////////////////////////////////////////////////////
71// @ return pointer on thread descriptor if success / return NULL if failure.
72/////////////////////////////////////////////////////////////////////////////////////
73static thread_t * thread_alloc()
74{
75        page_t       * page;   // pointer on page descriptor containing thread descriptor
76        kmem_req_t     req;    // kmem request
77
78        // allocates memory for thread descriptor + kernel stack
79        req.type  = KMEM_PAGE;
80        req.size  = CONFIG_THREAD_DESC_ORDER;
81        req.flags = AF_KERNEL | AF_ZERO;
82        page      = kmem_alloc( &req );
83
84        if( page == NULL ) return NULL;
85
86    // return pointer on new thread descriptor
87    xptr_t base_xp = ppm_page2base( XPTR(local_cxy , page ) );
88    return GET_PTR( base_xp );
89
90}  // end thread_alloc()
91 
92
93/////////////////////////////////////////////////////////////////////////////////////
94// This static function releases the physical memory for a thread descriptor.
95// It is called by the three functions:
96// - thread_user_create()
97// - thread_user_fork()
98// - thread_kernel_create()
99/////////////////////////////////////////////////////////////////////////////////////
100// @ thread  : pointer on thread descriptor.
101/////////////////////////////////////////////////////////////////////////////////////
102static void thread_release( thread_t * thread )
103{
104    kmem_req_t   req;
105
106    xptr_t base_xp = ppm_base2page( XPTR(local_cxy , thread ) );
107
108    req.type  = KMEM_PAGE;
109    req.ptr   = GET_PTR( base_xp );
110    kmem_free( &req );
111}
112
113/////////////////////////////////////////////////////////////////////////////////////
114// This static function initializes a thread descriptor (kernel or user).
115// It can be called by the four functions:
116// - thread_user_create()
117// - thread_user_fork()
118// - thread_kernel_create()
119// - thread_idle_init()
120// It updates the local DQDT.
121/////////////////////////////////////////////////////////////////////////////////////
122// @ thread       : pointer on thread descriptor
123// @ process      : pointer on process descriptor.
124// @ type         : thread type.
125// @ func         : pointer on thread entry function.
126// @ args         : pointer on thread entry function arguments.
127// @ core_lid     : target core local index.
128// @ u_stack_base : stack base (user thread only)
129// @ u_stack_size : stack base (user thread only)
130/////////////////////////////////////////////////////////////////////////////////////
131static error_t thread_init( thread_t      * thread,
132                            process_t     * process,
133                            thread_type_t   type,
134                            void          * func,
135                            void          * args,
136                            lid_t           core_lid,
137                            intptr_t        u_stack_base,
138                            uint32_t        u_stack_size )
139{
140    error_t        error;
141    trdid_t        trdid;      // allocated thread identifier
142
143        cluster_t    * local_cluster = LOCAL_CLUSTER;
144
145#if DEBUG_THREAD_USER_INIT
146uint32_t cycle = (uint32_t)hal_get_cycles();
147if( DEBUG_THREAD_USER_INIT < cycle )
148printk("\n[DBG] %s : thread %x enter to init thread %x in process %x / cycle %d\n",
149__FUNCTION__, CURRENT_THREAD, thread, process->pid , cycle );
150#endif
151
152    // register new thread in process descriptor, and get a TRDID
153    error = process_register_thread( process, thread , &trdid );
154
155    if( error )
156    {
157        printk("\n[ERROR] in %s : cannot get TRDID\n", __FUNCTION__ );
158        return EINVAL;
159    }
160
161    // compute thread descriptor size without kernel stack
162    uint32_t desc_size = (intptr_t)(&thread->signature) - (intptr_t)thread + 4; 
163
164        // Initialize new thread descriptor
165    thread->trdid           = trdid;
166        thread->type            = type;
167    thread->quantum         = 0;            // TODO
168    thread->ticks_nr        = 0;            // TODO
169    thread->time_last_check = 0;            // TODO
170        thread->core            = &local_cluster->core_tbl[core_lid];
171        thread->process         = process;
172
173    thread->local_locks     = 0;
174    thread->remote_locks    = 0;
175
176#if CONFIG_LOCKS_DEBUG
177    list_root_init( &thread->locks_root ); 
178    xlist_root_init( XPTR( local_cxy , &thread->xlocks_root ) );
179#endif
180
181    thread->u_stack_base    = u_stack_base;
182    thread->u_stack_size    = u_stack_size;
183    thread->k_stack_base    = (intptr_t)thread + desc_size;
184    thread->k_stack_size    = CONFIG_THREAD_DESC_SIZE - desc_size;
185
186    thread->entry_func      = func;         // thread entry point
187    thread->entry_args      = args;         // thread function arguments
188    thread->flags           = 0;            // all flags reset
189    thread->errno           = 0;            // no error detected
190    thread->fork_user       = 0;            // no user defined placement for fork
191    thread->fork_cxy        = 0;            // user defined target cluster for fork
192    thread->blocked         = THREAD_BLOCKED_GLOBAL;
193
194    // reset sched list
195    list_entry_init( &thread->sched_list );
196
197    // reset thread info
198    memset( &thread->info , 0 , sizeof(thread_info_t) );
199
200    // initializes join_lock
201    remote_spinlock_init( XPTR( local_cxy , &thread->join_lock ) );
202
203    // initialise signature
204        thread->signature = THREAD_SIGNATURE;
205
206    // FIXME define and call an architecture specific hal_thread_init()
207    // function to initialise the save_sr field
208    thread->save_sr = 0xFF13;
209
210    // register new thread in core scheduler
211    sched_register_thread( thread->core , thread );
212
213        // update DQDT
214    dqdt_update_threads( 1 );
215
216#if DEBUG_THREAD_USER_INIT
217cycle = (uint32_t)hal_get_cycles();
218if( DEBUG_THREAD_USER_INIT < cycle )
219printk("\n[DBG] %s : thread %x exit  after init of thread %x in process %x / cycle %d\n",
220__FUNCTION__, CURRENT_THREAD, thread, process->pid , cycle );
221#endif
222
223        return 0;
224
225} // end thread_init()
226
227/////////////////////////////////////////////////////////
228error_t thread_user_create( pid_t             pid,
229                            void            * start_func,
230                            void            * start_arg,
231                            pthread_attr_t  * attr,
232                            thread_t       ** new_thread )
233{
234    error_t        error;
235        thread_t     * thread;       // pointer on created thread descriptor
236    process_t    * process;      // pointer to local process descriptor
237    lid_t          core_lid;     // selected core local index
238    vseg_t       * vseg;         // stack vseg
239
240    assert( (attr != NULL) , __FUNCTION__, "pthread attributes must be defined" );
241
242#if DEBUG_THREAD_USER_CREATE
243uint32_t cycle = (uint32_t)hal_get_cycles();
244if( DEBUG_THREAD_USER_CREATE < cycle )
245printk("\n[DBG] %s : thread %x in process %x enter in cluster %x / cycle %d\n",
246__FUNCTION__, CURRENT_THREAD->trdid, pid , local_cxy , cycle );
247#endif
248
249    // get process descriptor local copy
250    process = process_get_local_copy( pid );
251
252    if( process == NULL )
253    {
254                printk("\n[ERROR] in %s : cannot get process descriptor %x\n",
255               __FUNCTION__ , pid );
256        return ENOMEM;
257    }
258
259#if( DEBUG_THREAD_USER_CREATE & 1)
260if( DEBUG_THREAD_USER_CREATE < cycle )
261printk("\n[DBG] %s : process descriptor = %x for process %x in cluster %x\n",
262__FUNCTION__, process , pid , local_cxy );
263#endif
264
265    // select a target core in local cluster
266    if( attr->attributes & PT_ATTR_CORE_DEFINED )
267    {
268        core_lid = attr->lid;
269        if( core_lid >= LOCAL_CLUSTER->cores_nr )
270        {
271                printk("\n[ERROR] in %s : illegal core index attribute = %d\n",
272            __FUNCTION__ , core_lid );
273            return EINVAL;
274        }
275    }
276    else
277    {
278        core_lid = cluster_select_local_core();
279    }
280
281#if( DEBUG_THREAD_USER_CREATE & 1)
282if( DEBUG_THREAD_USER_CREATE < cycle )
283printk("\n[DBG] %s : core[%x,%d] selected\n",
284__FUNCTION__, local_cxy , core_lid );
285#endif
286
287    // allocate a stack from local VMM
288    vseg = vmm_create_vseg( process,
289                            VSEG_TYPE_STACK,
290                            0,                 // size unused
291                            0,                 // length unused
292                            0,                 // file_offset unused
293                            0,                 // file_size unused
294                            XPTR_NULL,         // mapper_xp unused
295                            local_cxy );
296
297    if( vseg == NULL )
298    {
299            printk("\n[ERROR] in %s : cannot create stack vseg\n", __FUNCTION__ );
300                return ENOMEM;
301    }
302
303#if( DEBUG_THREAD_USER_CREATE & 1)
304if( DEBUG_THREAD_USER_CREATE < cycle )
305printk("\n[DBG] %s : stack vseg created / vpn_base %x / %d pages\n",
306__FUNCTION__, vseg->vpn_base, vseg->vpn_size );
307#endif
308
309    // allocate memory for thread descriptor
310    thread = thread_alloc();
311
312    if( thread == NULL )
313    {
314            printk("\n[ERROR] in %s : cannot create new thread\n", __FUNCTION__ );
315        vmm_remove_vseg( vseg );
316        return ENOMEM;
317    }
318
319#if( DEBUG_THREAD_USER_CREATE & 1)
320if( DEBUG_THREAD_USER_CREATE < cycle )
321printk("\n[DBG] %s : new thread descriptor %x allocated\n",
322__FUNCTION__, thread );
323#endif
324
325    // initialize thread descriptor
326    error = thread_init( thread,
327                         process,
328                         THREAD_USER,
329                         start_func,
330                         start_arg,
331                         core_lid,
332                         vseg->min,
333                         vseg->max - vseg->min );
334    if( error )
335    {
336            printk("\n[ERROR] in %s : cannot initialize new thread\n", __FUNCTION__ );
337        vmm_remove_vseg( vseg );
338        thread_release( thread );
339        return EINVAL;
340    }
341
342#if( DEBUG_THREAD_USER_CREATE & 1)
343if( DEBUG_THREAD_USER_CREATE < cycle )
344printk("\n[DBG] %s : new thread descriptor initialised / trdid %x\n",
345__FUNCTION__, thread->trdid );
346#endif
347
348    // set DETACHED flag if required
349    if( attr->attributes & PT_ATTR_DETACH ) 
350    {
351        thread->flags |= THREAD_FLAG_DETACHED;
352    }
353
354    // allocate & initialize CPU context
355        if( hal_cpu_context_alloc( thread ) )
356    {
357            printk("\n[ERROR] in %s : cannot create CPU context\n", __FUNCTION__ );
358        vmm_remove_vseg( vseg );
359        thread_release( thread );
360        return ENOMEM;
361    }
362    hal_cpu_context_init( thread );
363
364    // allocate & initialize FPU context
365    if( hal_fpu_context_alloc( thread ) )
366    {
367            printk("\n[ERROR] in %s : cannot create FPU context\n", __FUNCTION__ );
368        vmm_remove_vseg( vseg );
369        thread_release( thread );
370        return ENOMEM;
371    }
372    hal_fpu_context_init( thread );
373
374#if( DEBUG_THREAD_USER_CREATE & 1)
375if( DEBUG_THREAD_USER_CREATE < cycle )
376printk("\n[DBG] %s : CPU & FPU contexts created\n",
377__FUNCTION__, thread->trdid );
378vmm_display( process , true );
379#endif
380
381#if DEBUG_THREAD_USER_CREATE
382cycle = (uint32_t)hal_get_cycles();
383if( DEBUG_THREAD_USER_CREATE < cycle )
384printk("\n[DBG] %s : thread %x in process %x exit / new_thread %x / core %d / cycle %d\n",
385__FUNCTION__, CURRENT_THREAD->trdid , pid, thread->trdid, core_lid, cycle );
386#endif
387
388    *new_thread = thread;
389        return 0;
390
391}  // end thread_user_create()
392
393///////////////////////////////////////////////////////
394error_t thread_user_fork( xptr_t      parent_thread_xp,
395                          process_t * child_process,
396                          thread_t ** child_thread )
397{
398    error_t        error;
399        thread_t     * child_ptr;        // local pointer on local child thread
400    lid_t          core_lid;         // selected core local index
401
402    thread_t     * parent_ptr;       // local pointer on remote parent thread
403    cxy_t          parent_cxy;       // parent thread cluster
404    process_t    * parent_process;   // local pointer on parent process
405    xptr_t         parent_gpt_xp;    // extended pointer on parent thread GPT
406
407    void         * func;             // parent thread entry_func
408    void         * args;             // parent thread entry_args
409    intptr_t       base;             // parent thread u_stack_base
410    uint32_t       size;             // parent thread u_stack_size
411    uint32_t       flags;            // parent_thread flags
412    vpn_t          vpn_base;         // parent thread stack vpn_base
413    vpn_t          vpn_size;         // parent thread stack vpn_size
414    reg_t        * uzone;            // parent thread pointer on uzone 
415
416    vseg_t       * vseg;             // child thread STACK vseg
417
418#if DEBUG_THREAD_USER_FORK
419uint32_t cycle = (uint32_t)hal_get_cycles();
420if( DEBUG_THREAD_USER_FORK < cycle )
421printk("\n[DBG] %s : thread %x in process %x enter / child_process %x / cycle %d\n",
422__FUNCTION__, CURRENT_THREAD->trdid, CURRENT_THREAD->process->pid, child_process->pid, cycle );
423#endif
424
425    // select a target core in local cluster
426    core_lid = cluster_select_local_core();
427
428    // get cluster and local pointer on parent thread descriptor
429    parent_cxy = GET_CXY( parent_thread_xp );
430    parent_ptr = GET_PTR( parent_thread_xp );
431
432    // get relevant fields from parent thread
433    func  = (void *)  hal_remote_lpt( XPTR( parent_cxy , &parent_ptr->entry_func    ));
434    args  = (void *)  hal_remote_lpt( XPTR( parent_cxy , &parent_ptr->entry_args    ));
435    base  = (intptr_t)hal_remote_lpt( XPTR( parent_cxy , &parent_ptr->u_stack_base  ));
436    size  = (uint32_t)hal_remote_lw ( XPTR( parent_cxy , &parent_ptr->u_stack_size  ));
437    flags =           hal_remote_lw ( XPTR( parent_cxy , &parent_ptr->flags         ));
438    uzone = (reg_t *) hal_remote_lpt( XPTR( parent_cxy , &parent_ptr->uzone_current ));
439
440    vpn_base = base >> CONFIG_PPM_PAGE_SHIFT;
441    vpn_size = size >> CONFIG_PPM_PAGE_SHIFT;
442
443    // get pointer on parent process in parent thread cluster
444    parent_process = (process_t *)hal_remote_lpt( XPTR( parent_cxy,
445                                                        &parent_ptr->process ) );
446 
447    // get extended pointer on parent GPT in parent thread cluster
448    parent_gpt_xp = XPTR( parent_cxy , &parent_process->vmm.gpt );
449
450    // allocate memory for child thread descriptor
451    child_ptr = thread_alloc();
452    if( child_ptr == NULL )
453    {
454        printk("\n[ERROR] in %s : cannot allocate new thread\n", __FUNCTION__ );
455        return -1;
456    }
457
458    // initialize thread descriptor
459    error = thread_init( child_ptr,
460                         child_process,
461                         THREAD_USER,
462                         func,
463                         args,
464                         core_lid,
465                         base,
466                         size );
467    if( error )
468    {
469            printk("\n[ERROR] in %s : cannot initialize child thread\n", __FUNCTION__ );
470        thread_release( child_ptr );
471        return EINVAL;
472    }
473
474    // return child pointer
475    *child_thread = child_ptr;
476
477    // set detached flag if required
478    if( flags & THREAD_FLAG_DETACHED ) child_ptr->flags = THREAD_FLAG_DETACHED;
479
480    // update uzone pointer in child thread descriptor
481    child_ptr->uzone_current = (char *)((intptr_t)uzone +
482                                        (intptr_t)child_ptr - 
483                                        (intptr_t)parent_ptr );
484 
485
486    // allocate CPU context for child thread
487        if( hal_cpu_context_alloc( child_ptr ) )
488    {
489            printk("\n[ERROR] in %s : cannot allocate CPU context\n", __FUNCTION__ );
490        thread_release( child_ptr );
491        return -1;
492    }
493
494    // allocate FPU context for child thread
495        if( hal_fpu_context_alloc( child_ptr ) )
496    {
497            printk("\n[ERROR] in %s : cannot allocate FPU context\n", __FUNCTION__ );
498        thread_release( child_ptr );
499        return -1;
500    }
501
502    // create and initialize STACK vseg
503    vseg = vseg_alloc();
504    vseg_init( vseg,
505               VSEG_TYPE_STACK,
506               base,
507               size,
508               vpn_base,
509               vpn_size,
510               0, 0, XPTR_NULL,                         // not a file vseg
511               local_cxy );
512
513    // register STACK vseg in local child VSL
514    vseg_attach( &child_process->vmm , vseg );
515
516    // copy all valid STACK GPT entries   
517    vpn_t          vpn;
518    bool_t         mapped;
519    ppn_t          ppn;
520    for( vpn = vpn_base ; vpn < (vpn_base + vpn_size) ; vpn++ )
521    {
522        error = hal_gpt_pte_copy( &child_process->vmm.gpt,
523                                  parent_gpt_xp,
524                                  vpn,
525                                  true,                 // set cow
526                                  &ppn,
527                                  &mapped );
528        if( error )
529        {
530            vseg_detach( &child_process->vmm , vseg );
531            vseg_free( vseg );
532            thread_release( child_ptr );
533            printk("\n[ERROR] in %s : cannot update child GPT\n", __FUNCTION__ );
534            return -1;
535        }
536
537        // increment pending forks counter for the page if mapped
538        if( mapped )
539        {
540            // get pointers on the page descriptor
541            xptr_t   page_xp  = ppm_ppn2page( ppn );
542            cxy_t    page_cxy = GET_CXY( page_xp );
543            page_t * page_ptr = GET_PTR( page_xp );
544
545            // get extended pointers on forks and lock fields
546            xptr_t forks_xp = XPTR( page_cxy , &page_ptr->forks );
547            xptr_t lock_xp  = XPTR( page_cxy , &page_ptr->lock );
548
549            // increment the forks counter
550            remote_spinlock_lock( lock_xp ); 
551            hal_remote_atomic_add( XPTR( page_cxy , &page_ptr->forks ) , 1 );
552            remote_spinlock_unlock( lock_xp ); 
553
554#if (DEBUG_THREAD_USER_FORK & 1)
555cycle = (uint32_t)hal_get_cycles();
556if( DEBUG_THREAD_USER_FORK < cycle )
557printk("\n[DBG] %s : thread %x in process %x copied one PTE to child GPT : vpn %x / forks %d\n",
558__FUNCTION__, CURRENT_THREAD->trdid, CURRENT_THREAD->process->pid, vpn,
559hal_remote_lw( XPTR( page_cxy , &page_ptr->forks) ) );
560#endif
561
562        }
563    }
564
565    // set COW flag for all mapped entries of STAK vseg in parent thread GPT
566    hal_gpt_set_cow( parent_gpt_xp,
567                     vpn_base,
568                     vpn_size );
569 
570#if DEBUG_THREAD_USER_FORK
571cycle = (uint32_t)hal_get_cycles();
572if( DEBUG_THREAD_USER_FORK < cycle )
573printk("\n[DBG] %s : thread %x in process %x exit / child_thread %x / cycle %d\n",
574__FUNCTION__, CURRENT_THREAD->trdid, CURRENT_THREAD->process->pid, child_ptr, cycle );
575#endif
576
577        return 0;
578
579}  // end thread_user_fork()
580
581////////////////////////////////////////////////
582error_t thread_user_exec( void     * entry_func,
583                          uint32_t   argc,
584                          char    ** argv )
585{
586    thread_t  * thread  = CURRENT_THREAD;
587    process_t * process = thread->process;
588
589#if DEBUG_THREAD_USER_EXEC
590uint32_t cycle = (uint32_t)hal_get_cycles();
591if( DEBUG_THREAD_USER_EXEC < cycle )
592printk("\n[DBG] %s : thread %x in process %x enter / cycle %d\n",
593__FUNCTION__, thread->trdid, process->pid, cycle );
594#endif
595
596        assert( (thread->type == THREAD_USER )          , __FUNCTION__, "bad type" );
597        assert( (thread->signature == THREAD_SIGNATURE) , __FUNCTION__, "bad signature" );
598        assert( (thread->local_locks == 0)              , __FUNCTION__, "bad local locks" );
599        assert( (thread->remote_locks == 0)             , __FUNCTION__, "bad remote locks" );
600
601        // re-initialize various thread descriptor fields
602    thread->quantum         = 0;            // TODO
603    thread->ticks_nr        = 0;            // TODO
604    thread->time_last_check = 0;            // TODO
605
606#if CONFIG_LOCKS_DEBUG
607    list_root_init( &thread->locks_root ); 
608    xlist_root_init( XPTR( local_cxy , &thread->xlocks_root ) );
609#endif
610
611    thread->entry_func      = entry_func;
612    thread->main_argc       = argc; 
613    thread->main_argv       = argv;
614
615    // the main thread is always detached
616    thread->flags           = THREAD_FLAG_DETACHED;
617    thread->blocked         = 0;
618    thread->errno           = 0;
619    thread->fork_user       = 0;    // not inherited
620    thread->fork_cxy        = 0;    // not inherited
621
622    // reset thread info
623    memset( &thread->info , 0 , sizeof(thread_info_t) );
624
625    // initialize join_lock
626    remote_spinlock_init( XPTR( local_cxy , &thread->join_lock ) );
627
628    // allocate an user stack vseg for main thread
629    vseg_t * vseg = vmm_create_vseg( process,
630                                     VSEG_TYPE_STACK,
631                                     0,                 // size unused
632                                     0,                 // length unused
633                                     0,                 // file_offset unused
634                                     0,                 // file_size unused
635                                     XPTR_NULL,         // mapper_xp unused
636                                     local_cxy );
637    if( vseg == NULL )
638    {
639            printk("\n[ERROR] in %s : cannot create stack vseg for main thread\n", __FUNCTION__ );
640                return -1;
641    }
642
643    // update user stack in thread descriptor
644    thread->u_stack_base = vseg->min;
645    thread->u_stack_size = vseg->max - vseg->min;
646   
647    // release FPU ownership if required
648    if( thread->core->fpu_owner == thread ) thread->core->fpu_owner = NULL;
649
650    // re-initialize  FPU context
651    hal_fpu_context_init( thread );
652
653#if DEBUG_THREAD_USER_EXEC
654cycle = (uint32_t)hal_get_cycles();
655if( DEBUG_THREAD_USER_EXEC < cycle )
656printk("\n[DBG] %s : thread %x in process %x set CPU context & jump to user code / cycle %d\n",
657__FUNCTION__, thread->trdid, process->pid, cycle );
658vmm_display( process , true );
659#endif
660
661    // re-initialize CPU context... and jump to user code
662        hal_cpu_context_exec( thread );
663
664    assert( false, __FUNCTION__, "we should execute this code");
665 
666    return 0;
667
668}  // end thread_user_exec()
669
670/////////////////////////////////////////////////////////
671error_t thread_kernel_create( thread_t     ** new_thread,
672                              thread_type_t   type,
673                              void          * func,
674                              void          * args,
675                                              lid_t           core_lid )
676{
677    error_t        error;
678        thread_t     * thread;       // pointer on new thread descriptor
679
680    assert( ( (type == THREAD_IDLE) || (type == THREAD_RPC) || (type == THREAD_DEV) ) ,
681    __FUNCTION__ , "illegal thread type" );
682
683    assert( (core_lid < LOCAL_CLUSTER->cores_nr) ,
684            __FUNCTION__ , "illegal core_lid" );
685
686#if DEBUG_THREAD_KERNEL_CREATE
687uint32_t cycle = (uint32_t)hal_get_cycles();
688if( DEBUG_THREAD_KERNEL_CREATE < cycle )
689printk("\n[DBG] %s : thread %x enter / requested_type %s / cycle %d\n",
690__FUNCTION__, CURRENT_THREAD, thread, thread_type_str(type), cycle );
691#endif
692
693    // allocate memory for new thread descriptor
694    thread = thread_alloc();
695
696    if( thread == NULL ) return ENOMEM;
697
698    // initialize thread descriptor
699    error = thread_init( thread,
700                         &process_zero,
701                         type,
702                         func,
703                         args,
704                         core_lid,
705                         0 , 0 );  // no user stack for a kernel thread
706
707    if( error ) // release allocated memory for thread descriptor
708    {
709        thread_release( thread );
710        return ENOMEM;
711    }
712
713    // allocate & initialize CPU context
714        error = hal_cpu_context_alloc( thread );
715    if( error )
716    {
717        thread_release( thread );
718        return EINVAL;
719    }
720    hal_cpu_context_init( thread );
721
722
723#if DEBUG_THREAD_KERNEL_CREATE
724cycle = (uint32_t)hal_get_cycles();
725if( DEBUG_THREAD_KERNEL_CREATE < cycle )
726printk("\n[DBG] %s : thread %x exit / new_thread %x / type %s / cycle %d\n",
727__FUNCTION__, CURRENT_THREAD, thread, thread_type_str(type), cycle );
728#endif
729
730    *new_thread = thread;
731        return 0;
732
733} // end thread_kernel_create()
734
735//////////////////////////////////////////////
736void thread_idle_init( thread_t      * thread,
737                       thread_type_t   type,
738                       void          * func,
739                       void          * args,
740                           lid_t           core_lid )
741{
742    assert( (type == THREAD_IDLE) , __FUNCTION__ , "illegal thread type" );
743    assert( (core_lid < LOCAL_CLUSTER->cores_nr) , __FUNCTION__ , "illegal core index" );
744
745    // initialize thread descriptor
746    error_t  error = thread_init( thread,
747                                  &process_zero,
748                                  type,
749                                  func,
750                                  args,
751                                  core_lid,
752                                  0 , 0 );   // no user stack for a kernel thread
753
754    assert( (error == 0), __FUNCTION__, "cannot create thread idle" );
755
756    // allocate & initialize CPU context if success
757    error = hal_cpu_context_alloc( thread );
758
759    assert( (error == 0), __FUNCTION__, "cannot allocate CPU context" );
760
761    hal_cpu_context_init( thread );
762
763}  // end thread_idle_init()
764
765///////////////////////////////////////////////////////////////////////////////////////
766// TODO: check that all memory dynamically allocated during thread execution
767// has been released, using a cache of mmap requests. [AG]
768///////////////////////////////////////////////////////////////////////////////////////
769bool_t thread_destroy( thread_t * thread )
770{
771    reg_t        save_sr;
772    bool_t       last_thread;
773
774    process_t  * process    = thread->process;
775    core_t     * core       = thread->core;
776
777#if DEBUG_THREAD_DESTROY
778uint32_t cycle = (uint32_t)hal_get_cycles();
779if( DEBUG_THREAD_DESTROY < cycle )
780printk("\n[DBG] %s : thread %x enter to destroy thread %x in process %x / cycle %d\n",
781__FUNCTION__, CURRENT_THREAD, thread->trdid, process->pid, cycle );
782#endif
783
784    assert( (thread->local_locks == 0) , __FUNCTION__ , 
785    "local lock not released for thread %x in process %x", thread->trdid, process->pid );
786
787    assert( (thread->remote_locks == 0) , __FUNCTION__ , 
788    "remote lock not released for thread %x in process %x", thread->trdid, process->pid );
789
790    // update intrumentation values
791        process->vmm.pgfault_nr += thread->info.pgfault_nr;
792
793    // release memory allocated for CPU context and FPU context
794        hal_cpu_context_destroy( thread );
795        if ( thread->type == THREAD_USER ) hal_fpu_context_destroy( thread );
796       
797    // release FPU ownership if required
798        hal_disable_irq( &save_sr );
799        if( core->fpu_owner == thread )
800        {
801                core->fpu_owner = NULL;
802                hal_fpu_disable();
803        }
804        hal_restore_irq( save_sr );
805
806    // remove thread from process th_tbl[]
807    last_thread = process_remove_thread( thread );
808       
809    // update DQDT
810    dqdt_update_threads( -1 );
811
812    // invalidate thread descriptor
813        thread->signature = 0;
814
815    // release memory for thread descriptor
816    thread_release( thread );
817
818#if DEBUG_THREAD_DESTROY
819cycle = (uint32_t)hal_get_cycles();
820if( DEBUG_THREAD_DESTROY < cycle )
821printk("\n[DBG] %s : thread %x exit / destroyed thread %x in process %x / last %d / cycle %d\n",
822__FUNCTION__, CURRENT_THREAD, thread->trdid, process->pid, last_thread / cycle );
823#endif
824
825    return last_thread;
826
827}   // end thread_destroy()
828
829//////////////////////////////////////////////////
830inline void thread_set_req_ack( thread_t * target,
831                                uint32_t * rsp_count )
832{
833    reg_t    save_sr;   // for critical section
834
835    // get pointer on target thread scheduler
836    scheduler_t * sched = &target->core->scheduler;
837
838    // wait scheduler ready to handle a new request
839    while( sched->req_ack_pending ) asm volatile( "nop" );
840   
841    // enter critical section
842    hal_disable_irq( &save_sr );
843     
844    // set request in target thread scheduler
845    sched->req_ack_pending = true;
846
847    // set ack request in target thread "flags"
848    hal_atomic_or( &target->flags , THREAD_FLAG_REQ_ACK );
849
850    // set pointer on responses counter in target thread
851    target->ack_rsp_count = rsp_count;
852   
853    // exit critical section
854    hal_restore_irq( save_sr );
855
856    hal_fence();
857
858}  // thread_set_req_ack()
859
860/////////////////////////////////////////////////////
861inline void thread_reset_req_ack( thread_t * target )
862{
863    reg_t    save_sr;   // for critical section
864
865    // get pointer on target thread scheduler
866    scheduler_t * sched = &target->core->scheduler;
867
868    // check signal pending in scheduler
869    assert( sched->req_ack_pending , __FUNCTION__ , "no pending signal" );
870   
871    // enter critical section
872    hal_disable_irq( &save_sr );
873     
874    // reset signal in scheduler
875    sched->req_ack_pending = false;
876
877    // reset signal in thread "flags"
878    hal_atomic_and( &target->flags , ~THREAD_FLAG_REQ_ACK );
879
880    // reset pointer on responses counter
881    target->ack_rsp_count = NULL;
882   
883    // exit critical section
884    hal_restore_irq( save_sr );
885
886    hal_fence();
887
888}  // thread_reset_req_ack()
889
890////////////////////////////////
891inline bool_t thread_can_yield()
892{
893    thread_t * this = CURRENT_THREAD;
894    return (this->local_locks == 0) && (this->remote_locks == 0);
895}
896
897/////////////////////////
898void thread_check_sched()
899{
900    thread_t * this = CURRENT_THREAD;
901
902        if( (this->local_locks == 0) && 
903        (this->remote_locks == 0) &&
904        (this->flags & THREAD_FLAG_SCHED) ) 
905    {
906        this->flags &= ~THREAD_FLAG_SCHED;
907        sched_yield( "delayed scheduling" );
908    }
909
910}  // end thread_check_sched()
911
912//////////////////////////////////////
913void thread_block( xptr_t   thread_xp,
914                   uint32_t cause )
915{
916    // get thread cluster and local pointer
917    cxy_t      cxy = GET_CXY( thread_xp );
918    thread_t * ptr = GET_PTR( thread_xp );
919
920    // set blocking cause
921    hal_remote_atomic_or( XPTR( cxy , &ptr->blocked ) , cause );
922    hal_fence();
923
924#if DEBUG_THREAD_BLOCK
925uint32_t    cycle   = (uint32_t)hal_get_cycles();
926process_t * process = hal_remote_lpt( XPTR( cxy , &ptr->process ) );
927if( DEBUG_THREAD_BLOCK < cycle )
928printk("\n[DBG] %s : thread %x in process %x blocked thread %x in process %x / cause %x\n",
929__FUNCTION__, CURRENT_THREAD->trdid, CURRENT_THREAD->process->pid,
930ptr->trdid, hal_remote_lw(XPTR( cxy , &process->pid )), cause );
931#endif
932
933} // end thread_block()
934
935////////////////////////////////////////////
936uint32_t thread_unblock( xptr_t   thread_xp,
937                         uint32_t cause )
938{
939    // get thread cluster and local pointer
940    cxy_t      cxy = GET_CXY( thread_xp );
941    thread_t * ptr = GET_PTR( thread_xp );
942
943    // reset blocking cause
944    uint32_t previous = hal_remote_atomic_and( XPTR( cxy , &ptr->blocked ) , ~cause );
945    hal_fence();
946
947#if DEBUG_THREAD_BLOCK
948uint32_t    cycle   = (uint32_t)hal_get_cycles();
949process_t * process = hal_remote_lpt( XPTR( cxy , &ptr->process ) );
950if( DEBUG_THREAD_BLOCK < cycle )
951printk("\n[DBG] %s : thread %x in process %x unblocked thread %x in process %x / cause %x\n",
952__FUNCTION__, CURRENT_THREAD->trdid, CURRENT_THREAD->process->pid,
953ptr->trdid, hal_remote_lw(XPTR( cxy , &process->pid )), cause );
954#endif
955
956    // return a non zero value if the cause bit is modified
957    return( previous & cause );
958
959}  // end thread_unblock()
960
961//////////////////////////////////////
962void thread_delete( xptr_t  target_xp,
963                    pid_t   pid,
964                    bool_t  is_forced )
965{
966    reg_t       save_sr;                // for critical section
967    bool_t      target_join_done;       // joining thread arrived first
968    bool_t      target_attached;        // target thread attached
969    xptr_t      killer_xp;              // extended pointer on killer thread (this)
970    thread_t  * killer_ptr;             // pointer on killer thread (this)
971    cxy_t       target_cxy;             // target thread cluster     
972    thread_t  * target_ptr;             // pointer on target thread
973    xptr_t      target_flags_xp;        // extended pointer on target thread <flags>
974    uint32_t    target_flags;           // target thread <flags> value
975    xptr_t      target_join_lock_xp;    // extended pointer on target thread <join_lock>
976    xptr_t      target_join_xp_xp;      // extended pointer on target thread <join_xp>
977    trdid_t     target_trdid;           // target thread identifier
978    ltid_t      target_ltid;            // target thread local index
979    xptr_t      joining_xp;             // extended pointer on joining thread
980    thread_t  * joining_ptr;            // pointer on joining thread
981    cxy_t       joining_cxy;            // joining thread cluster
982    cxy_t       owner_cxy;              // process owner cluster
983
984
985    // get target thread pointers, identifiers, and flags
986    target_cxy      = GET_CXY( target_xp );
987    target_ptr      = GET_PTR( target_xp );
988    target_trdid    = hal_remote_lw( XPTR( target_cxy , &target_ptr->trdid ) );
989    target_ltid     = LTID_FROM_TRDID( target_trdid );
990    target_flags_xp = XPTR( target_cxy , &target_ptr->flags ); 
991    target_flags    = hal_remote_lw( target_flags_xp );
992
993    // get killer thread pointers
994    killer_ptr = CURRENT_THREAD;
995    killer_xp  = XPTR( local_cxy , killer_ptr );
996
997#if DEBUG_THREAD_DELETE
998uint32_t cycle  = (uint32_t)hal_get_cycles;
999if( DEBUG_THREAD_DELETE < cycle )
1000printk("\n[DBG] %s : killer thread %x enter for target thread %x / cycle %d\n",
1001__FUNCTION__, killer_ptr, target_ptr, cycle );
1002#endif
1003
1004    // target thread cannot be the main thread, because the main thread
1005    // must be deleted by the parent process sys_wait() function
1006    owner_cxy = CXY_FROM_PID( pid );
1007    assert( ((owner_cxy != target_cxy) || (target_ltid != 0)), __FUNCTION__,
1008    "tharget thread cannot be the main thread\n" );
1009
1010    // block the target thread
1011    thread_block( target_xp , THREAD_BLOCKED_GLOBAL );
1012
1013    // get attached from target flag descriptor
1014    target_attached = ((hal_remote_lw( target_flags_xp ) & THREAD_FLAG_DETACHED) != 0);
1015
1016    // synchronize with the joining thread if the target thread is attached
1017    if( target_attached && (is_forced == false) )
1018    {
1019        // build extended pointers on target thread join fields
1020        target_join_lock_xp  = XPTR( target_cxy , &target_ptr->join_lock );
1021        target_join_xp_xp    = XPTR( target_cxy , &target_ptr->join_xp );
1022
1023        // enter critical section
1024        hal_disable_irq( &save_sr );
1025
1026        // take the join_lock in target thread descriptor
1027        remote_spinlock_lock( target_join_lock_xp );
1028
1029        // get join_done from target thread descriptor
1030        target_join_done = ((hal_remote_lw( target_flags_xp ) & THREAD_FLAG_JOIN_DONE) != 0);
1031   
1032        if( target_join_done )  // joining thread arrived first => unblock the joining thread
1033        {
1034            // get extended pointer on joining thread
1035            joining_xp  = (xptr_t)hal_remote_lwd( target_join_xp_xp );
1036            joining_ptr = GET_PTR( joining_xp );
1037            joining_cxy = GET_CXY( joining_xp );
1038           
1039            // reset the join_done flag in target thread
1040            hal_remote_atomic_and( target_flags_xp , ~THREAD_FLAG_JOIN_DONE );
1041
1042            // unblock the joining thread
1043            thread_unblock( joining_xp , THREAD_BLOCKED_JOIN );
1044
1045            // release the join_lock in target thread descriptor
1046            remote_spinlock_unlock( target_join_lock_xp );
1047
1048            // restore IRQs
1049            hal_restore_irq( save_sr );
1050        }
1051        else                // this thread arrived first => register flags and deschedule
1052        {
1053            // set the kill_done flag in target thread
1054            hal_remote_atomic_or( target_flags_xp , THREAD_FLAG_KILL_DONE );
1055
1056            // block this thread on BLOCKED_JOIN
1057            thread_block( killer_xp , THREAD_BLOCKED_JOIN );
1058
1059            // set extended pointer on killer thread in target thread
1060            hal_remote_swd( target_join_xp_xp , killer_xp );
1061
1062            // release the join_lock in target thread descriptor
1063            remote_spinlock_unlock( target_join_lock_xp );
1064
1065            // deschedule
1066            sched_yield( "killer thread wait joining thread" );
1067
1068            // restore IRQs
1069            hal_restore_irq( save_sr );
1070        }
1071    }  // end if attached
1072
1073    // set the REQ_DELETE flag in target thread descriptor
1074    hal_remote_atomic_or( target_flags_xp , THREAD_FLAG_REQ_DELETE );
1075
1076#if DEBUG_THREAD_DELETE
1077cycle  = (uint32_t)hal_get_cycles;
1078if( DEBUG_THREAD_DELETE < cycle )
1079printk("\n[DBG] %s : killer thread %x exit for target thread %x / cycle %d\n",
1080__FUNCTION__, killer_ptr, target_ptr, cycle );
1081#endif
1082
1083}  // end thread_delete()
1084
1085
1086
1087///////////////////////
1088void thread_idle_func()
1089{
1090
1091#if DEBUG_THREAD_IDLE
1092uint32_t cycle;
1093#endif
1094
1095    while( 1 )
1096    {
1097        // unmask IRQs
1098        hal_enable_irq( NULL );
1099
1100        // force core to low-power mode (optional)
1101        if( CONFIG_THREAD_IDLE_MODE_SLEEP ) 
1102        {
1103
1104#if (DEBUG_THREAD_IDLE & 1)
1105cycle  = (uint32_t)hal_get_cycles;
1106if( DEBUG_THREAD_IDLE < cycle )
1107printk("\n[DBG] %s : idle thread on core[%x,%d] goes to sleep / cycle %d\n",
1108__FUNCTION__, local_cxy, CURRENT_THREAD->core->lid, cycle );
1109#endif
1110
1111            hal_core_sleep();
1112
1113#if (DEBUG_THREAD_IDLE & 1)
1114cycle  = (uint32_t)hal_get_cycles;
1115if( DEBUG_THREAD_IDLE < cycle )
1116printk("\n[DBG] %s : idle thread on core[%x,%d] wake up / cycle %d\n",
1117__FUNCTION__, this, local_cxy, this->core->lid, cycle );
1118#endif
1119
1120        }
1121
1122#if DEBUG_THREAD_IDLE
1123sched_display( CURRENT_THREAD->core->lid );
1124#endif     
1125
1126        // search a runable thread
1127        sched_yield( "IDLE" );
1128    }
1129}  // end thread_idle()
1130
1131
1132/////////////////////////////////////////////////
1133void thread_user_time_update( thread_t * thread )
1134{
1135    // TODO
1136    // printk("\n[WARNING] function %s not implemented\n", __FUNCTION__ );
1137}
1138
1139///////////////////////////////////////////////////
1140void thread_kernel_time_update( thread_t * thread )
1141{
1142    // TODO
1143    // printk("\n[WARNING] function %s not implemented\n", __FUNCTION__ );
1144}
1145
1146/////////////////////////////////////
1147xptr_t thread_get_xptr( pid_t    pid,
1148                        trdid_t  trdid )
1149{
1150    cxy_t         target_cxy;          // target thread cluster identifier
1151    ltid_t        target_thread_ltid;  // target thread local index
1152    thread_t    * target_thread_ptr;   // target thread local pointer
1153    xptr_t        target_process_xp;   // extended pointer on target process descriptor
1154    process_t   * target_process_ptr;  // local pointer on target process descriptor
1155    pid_t         target_process_pid;  // target process identifier
1156    xlist_entry_t root;                // root of list of process in target cluster
1157    xptr_t        lock_xp;             // extended pointer on lock protecting  this list
1158
1159    // get target cluster identifier and local thread identifier
1160    target_cxy         = CXY_FROM_TRDID( trdid );
1161    target_thread_ltid = LTID_FROM_TRDID( trdid );
1162
1163    // check trdid argument
1164        if( (target_thread_ltid >= CONFIG_THREAD_MAX_PER_CLUSTER) || 
1165        cluster_is_undefined( target_cxy ) )         return XPTR_NULL;
1166
1167    // get root of list of process descriptors in target cluster
1168    hal_remote_memcpy( XPTR( local_cxy  , &root ),
1169                       XPTR( target_cxy , &LOCAL_CLUSTER->pmgr.local_root ),
1170                       sizeof(xlist_entry_t) );
1171
1172    // get extended pointer on lock protecting the list of processes
1173    lock_xp = XPTR( target_cxy , &LOCAL_CLUSTER->pmgr.local_lock );
1174
1175    // take the lock protecting the list of processes in target cluster
1176    remote_spinlock_lock( lock_xp );
1177
1178    // loop on list of process in target cluster to find the PID process
1179    xptr_t  iter;
1180    bool_t  found = false;
1181    XLIST_FOREACH( XPTR( target_cxy , &LOCAL_CLUSTER->pmgr.local_root ) , iter )
1182    {
1183        target_process_xp  = XLIST_ELEMENT( iter , process_t , local_list );
1184        target_process_ptr = GET_PTR( target_process_xp );
1185        target_process_pid = hal_remote_lw( XPTR( target_cxy , &target_process_ptr->pid ) );
1186        if( target_process_pid == pid )
1187        {
1188            found = true;
1189            break;
1190        }
1191    }
1192
1193    // release the lock protecting the list of processes in target cluster
1194    remote_spinlock_unlock( lock_xp );
1195
1196    // check PID found
1197    if( found == false ) return XPTR_NULL;
1198
1199    // get target thread local pointer
1200    xptr_t xp = XPTR( target_cxy , &target_process_ptr->th_tbl[target_thread_ltid] );
1201    target_thread_ptr = (thread_t *)hal_remote_lpt( xp );
1202
1203    if( target_thread_ptr == NULL )  return XPTR_NULL;
1204
1205    return XPTR( target_cxy , target_thread_ptr );
1206}
1207
Note: See TracBrowser for help on using the repository browser.