2009-04-23 19:23:13 +04:00
/*
* Unix SMB / CIFS implementation .
* thread pool implementation
* Copyright ( C ) Volker Lendecke 2009
*
* This program is free software ; you can redistribute it and / or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation ; either version 3 of the License , or
* ( at your option ) any later version .
*
* This program is distributed in the hope that it will be useful ,
* but WITHOUT ANY WARRANTY ; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
* GNU General Public License for more details .
*
* You should have received a copy of the GNU General Public License
* along with this program . If not , see < http : //www.gnu.org/licenses/>.
*/
2016-07-31 08:42:21 +03:00
# include "replace.h"
2011-09-21 05:19:58 +04:00
# include "system/time.h"
2016-08-12 13:15:46 +03:00
# include "system/wait.h"
# include "system/threads.h"
2018-07-25 13:03:52 +03:00
# include "system/filesys.h"
2009-04-23 19:23:13 +04:00
# include "pthreadpool.h"
2011-04-22 13:47:11 +04:00
# include "lib/util/dlinklist.h"
2016-08-29 12:35:20 +03:00
# ifdef NDEBUG
# undef NDEBUG
# endif
2016-07-31 08:42:21 +03:00
# include <assert.h>
2009-04-23 19:23:13 +04:00
struct pthreadpool_job {
int id ;
void ( * fn ) ( void * private_data ) ;
void * private_data ;
} ;
struct pthreadpool {
2011-04-22 13:47:11 +04:00
/*
* List pthreadpools for fork safety
*/
struct pthreadpool * prev , * next ;
2009-04-23 19:23:13 +04:00
/*
* Control access to this struct
*/
pthread_mutex_t mutex ;
/*
* Threads waiting for work do so here
*/
pthread_cond_t condvar ;
/*
2014-03-21 20:53:26 +04:00
* Array of jobs
2009-04-23 19:23:13 +04:00
*/
2014-03-21 20:53:26 +04:00
size_t jobs_array_len ;
struct pthreadpool_job * jobs ;
size_t head ;
size_t num_jobs ;
2009-04-23 19:23:13 +04:00
/*
2016-08-15 14:59:12 +03:00
* Indicate job completion
2009-04-23 19:23:13 +04:00
*/
2016-07-31 09:57:35 +03:00
int ( * signal_fn ) ( int jobid ,
void ( * job_fn ) ( void * private_data ) ,
void * job_fn_private_data ,
void * private_data ) ;
void * signal_fn_private_data ;
2009-04-23 19:23:13 +04:00
/*
2018-04-25 15:03:30 +03:00
* indicator to worker threads to stop processing further jobs
* and exit .
2009-04-23 19:23:13 +04:00
*/
2018-04-25 15:03:30 +03:00
bool stopped ;
/*
* indicator to the last worker thread to free the pool
* resources .
*/
bool destroyed ;
2009-04-23 19:23:13 +04:00
/*
* maximum number of threads
2018-06-22 01:29:53 +03:00
* 0 means no real thread , only strict sync processing .
2009-04-23 19:23:13 +04:00
*/
2018-06-22 01:04:48 +03:00
unsigned max_threads ;
2009-04-23 19:23:13 +04:00
/*
* Number of threads
*/
2018-06-22 01:04:48 +03:00
unsigned num_threads ;
2009-04-23 19:23:13 +04:00
/*
* Number of idle threads
*/
2018-06-22 01:04:48 +03:00
unsigned num_idle ;
2017-08-28 17:38:19 +03:00
/*
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
* Condition variable indicating that helper threads should
* quickly go away making way for fork ( ) without anybody
* waiting on pool - > condvar .
2017-08-28 17:38:19 +03:00
*/
pthread_cond_t * prefork_cond ;
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
/*
* Waiting position for helper threads while fork is
* running . The forking thread will have locked it , and all
* idle helper threads will sit here until after the fork ,
* where the forking thread will unlock it again .
*/
pthread_mutex_t fork_mutex ;
2009-04-23 19:23:13 +04:00
} ;
2011-04-22 13:47:11 +04:00
static pthread_mutex_t pthreadpools_mutex = PTHREAD_MUTEX_INITIALIZER ;
static struct pthreadpool * pthreadpools = NULL ;
static pthread_once_t pthreadpool_atfork_initialized = PTHREAD_ONCE_INIT ;
static void pthreadpool_prep_atfork ( void ) ;
2009-04-23 19:23:13 +04:00
/*
* Initialize a thread pool
*/
2016-08-15 14:59:12 +03:00
int pthreadpool_init ( unsigned max_threads , struct pthreadpool * * presult ,
2016-07-31 09:57:35 +03:00
int ( * signal_fn ) ( int jobid ,
void ( * job_fn ) ( void * private_data ) ,
void * job_fn_private_data ,
void * private_data ) ,
void * signal_fn_private_data )
2009-04-23 19:23:13 +04:00
{
struct pthreadpool * pool ;
int ret ;
2011-04-25 22:05:31 +04:00
pool = ( struct pthreadpool * ) malloc ( sizeof ( struct pthreadpool ) ) ;
2009-04-23 19:23:13 +04:00
if ( pool = = NULL ) {
return ENOMEM ;
}
2016-08-15 14:59:12 +03:00
pool - > signal_fn = signal_fn ;
2016-07-31 09:57:35 +03:00
pool - > signal_fn_private_data = signal_fn_private_data ;
2009-04-23 19:23:13 +04:00
2014-03-21 20:53:26 +04:00
pool - > jobs_array_len = 4 ;
pool - > jobs = calloc (
pool - > jobs_array_len , sizeof ( struct pthreadpool_job ) ) ;
if ( pool - > jobs = = NULL ) {
free ( pool ) ;
return ENOMEM ;
}
pool - > head = pool - > num_jobs = 0 ;
2009-04-23 19:23:13 +04:00
ret = pthread_mutex_init ( & pool - > mutex , NULL ) ;
if ( ret ! = 0 ) {
2014-03-21 20:53:26 +04:00
free ( pool - > jobs ) ;
2009-04-23 19:23:13 +04:00
free ( pool ) ;
return ret ;
}
ret = pthread_cond_init ( & pool - > condvar , NULL ) ;
if ( ret ! = 0 ) {
pthread_mutex_destroy ( & pool - > mutex ) ;
2014-03-21 20:53:26 +04:00
free ( pool - > jobs ) ;
2009-04-23 19:23:13 +04:00
free ( pool ) ;
return ret ;
}
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
ret = pthread_mutex_init ( & pool - > fork_mutex , NULL ) ;
if ( ret ! = 0 ) {
pthread_cond_destroy ( & pool - > condvar ) ;
pthread_mutex_destroy ( & pool - > mutex ) ;
free ( pool - > jobs ) ;
free ( pool ) ;
return ret ;
}
2018-04-25 15:03:30 +03:00
pool - > stopped = false ;
pool - > destroyed = false ;
2009-04-23 19:23:13 +04:00
pool - > num_threads = 0 ;
pool - > max_threads = max_threads ;
pool - > num_idle = 0 ;
2017-08-28 17:38:19 +03:00
pool - > prefork_cond = NULL ;
2011-04-22 13:47:11 +04:00
ret = pthread_mutex_lock ( & pthreadpools_mutex ) ;
if ( ret ! = 0 ) {
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
pthread_mutex_destroy ( & pool - > fork_mutex ) ;
2011-04-22 13:47:11 +04:00
pthread_cond_destroy ( & pool - > condvar ) ;
pthread_mutex_destroy ( & pool - > mutex ) ;
2014-03-21 20:53:26 +04:00
free ( pool - > jobs ) ;
2011-04-22 13:47:11 +04:00
free ( pool ) ;
return ret ;
}
DLIST_ADD ( pthreadpools , pool ) ;
ret = pthread_mutex_unlock ( & pthreadpools_mutex ) ;
assert ( ret = = 0 ) ;
pthread_once ( & pthreadpool_atfork_initialized , pthreadpool_prep_atfork ) ;
2009-04-23 19:23:13 +04:00
* presult = pool ;
2011-04-22 13:47:11 +04:00
2009-04-23 19:23:13 +04:00
return 0 ;
}
2018-06-22 01:49:33 +03:00
size_t pthreadpool_max_threads ( struct pthreadpool * pool )
{
2018-04-25 15:03:30 +03:00
if ( pool - > stopped ) {
return 0 ;
}
2018-06-22 01:49:33 +03:00
return pool - > max_threads ;
}
size_t pthreadpool_queued_jobs ( struct pthreadpool * pool )
{
int res ;
int unlock_res ;
size_t ret ;
2018-04-25 15:03:30 +03:00
if ( pool - > stopped ) {
return 0 ;
}
2018-06-22 01:49:33 +03:00
res = pthread_mutex_lock ( & pool - > mutex ) ;
if ( res ! = 0 ) {
2018-04-25 15:03:30 +03:00
return res ;
}
if ( pool - > stopped ) {
unlock_res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( unlock_res = = 0 ) ;
2018-06-22 01:49:33 +03:00
return 0 ;
}
ret = pool - > num_jobs ;
unlock_res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( unlock_res = = 0 ) ;
return ret ;
}
2017-08-28 17:38:19 +03:00
static void pthreadpool_prepare_pool ( struct pthreadpool * pool )
{
int ret ;
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
ret = pthread_mutex_lock ( & pool - > fork_mutex ) ;
assert ( ret = = 0 ) ;
2017-08-28 17:38:19 +03:00
ret = pthread_mutex_lock ( & pool - > mutex ) ;
assert ( ret = = 0 ) ;
while ( pool - > num_idle ! = 0 ) {
2018-06-22 01:04:48 +03:00
unsigned num_idle = pool - > num_idle ;
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
pthread_cond_t prefork_cond ;
ret = pthread_cond_init ( & prefork_cond , NULL ) ;
assert ( ret = = 0 ) ;
2017-08-28 17:38:19 +03:00
/*
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
* Push all idle threads off pool - > condvar . In the
* child we can destroy the pool , which would result
* in undefined behaviour in the
* pthread_cond_destroy ( pool - > condvar ) . glibc just
2017-08-28 17:38:19 +03:00
* blocks here .
*/
pool - > prefork_cond = & prefork_cond ;
ret = pthread_cond_signal ( & pool - > condvar ) ;
assert ( ret = = 0 ) ;
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
while ( pool - > num_idle = = num_idle ) {
ret = pthread_cond_wait ( & prefork_cond , & pool - > mutex ) ;
assert ( ret = = 0 ) ;
}
2017-08-28 17:38:19 +03:00
pool - > prefork_cond = NULL ;
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
ret = pthread_cond_destroy ( & prefork_cond ) ;
assert ( ret = = 0 ) ;
}
2017-08-28 17:38:19 +03:00
/*
* Probably it ' s well - defined somewhere : What happens to
* condvars after a fork ? The rationale of pthread_atfork only
* writes about mutexes . So better be safe than sorry and
* destroy / reinit pool - > condvar across a fork .
*/
ret = pthread_cond_destroy ( & pool - > condvar ) ;
assert ( ret = = 0 ) ;
}
2011-04-22 13:47:11 +04:00
static void pthreadpool_prepare ( void )
2009-04-23 19:23:13 +04:00
{
2011-04-22 13:47:11 +04:00
int ret ;
struct pthreadpool * pool ;
2009-04-23 19:23:13 +04:00
2011-04-22 13:47:11 +04:00
ret = pthread_mutex_lock ( & pthreadpools_mutex ) ;
assert ( ret = = 0 ) ;
pool = pthreadpools ;
while ( pool ! = NULL ) {
2017-08-28 17:38:19 +03:00
pthreadpool_prepare_pool ( pool ) ;
2011-04-22 13:47:11 +04:00
pool = pool - > next ;
2009-04-23 19:23:13 +04:00
}
2011-04-22 13:47:11 +04:00
}
static void pthreadpool_parent ( void )
{
int ret ;
struct pthreadpool * pool ;
2014-03-03 15:20:41 +04:00
for ( pool = DLIST_TAIL ( pthreadpools ) ;
pool ! = NULL ;
pool = DLIST_PREV ( pool ) ) {
2017-08-28 17:38:19 +03:00
ret = pthread_cond_init ( & pool - > condvar , NULL ) ;
assert ( ret = = 0 ) ;
2011-04-22 13:47:11 +04:00
ret = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( ret = = 0 ) ;
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
ret = pthread_mutex_unlock ( & pool - > fork_mutex ) ;
assert ( ret = = 0 ) ;
2009-04-23 19:23:13 +04:00
}
2011-04-22 13:47:11 +04:00
ret = pthread_mutex_unlock ( & pthreadpools_mutex ) ;
assert ( ret = = 0 ) ;
}
static void pthreadpool_child ( void )
{
int ret ;
struct pthreadpool * pool ;
2014-03-03 15:20:41 +04:00
for ( pool = DLIST_TAIL ( pthreadpools ) ;
pool ! = NULL ;
pool = DLIST_PREV ( pool ) ) {
2011-04-22 13:47:11 +04:00
pool - > num_threads = 0 ;
pool - > num_idle = 0 ;
2014-03-21 20:53:26 +04:00
pool - > head = 0 ;
pool - > num_jobs = 0 ;
2018-07-16 18:17:59 +03:00
pool - > stopped = true ;
2011-04-22 13:47:11 +04:00
2017-08-28 17:38:19 +03:00
ret = pthread_cond_init ( & pool - > condvar , NULL ) ;
assert ( ret = = 0 ) ;
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
2011-04-22 13:47:11 +04:00
ret = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( ret = = 0 ) ;
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
ret = pthread_mutex_unlock ( & pool - > fork_mutex ) ;
assert ( ret = = 0 ) ;
2009-04-23 19:23:13 +04:00
}
2011-04-22 13:47:11 +04:00
ret = pthread_mutex_unlock ( & pthreadpools_mutex ) ;
2009-04-23 19:23:13 +04:00
assert ( ret = = 0 ) ;
2011-04-22 13:47:11 +04:00
}
static void pthreadpool_prep_atfork ( void )
{
pthread_atfork ( pthreadpool_prepare , pthreadpool_parent ,
pthreadpool_child ) ;
}
2016-09-09 14:07:57 +03:00
static int pthreadpool_free ( struct pthreadpool * pool )
2009-04-23 19:23:13 +04:00
{
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
int ret , ret1 , ret2 ;
2009-04-23 19:23:13 +04:00
2016-10-17 18:09:01 +03:00
ret = pthread_mutex_lock ( & pthreadpools_mutex ) ;
if ( ret ! = 0 ) {
return ret ;
}
DLIST_REMOVE ( pthreadpools , pool ) ;
ret = pthread_mutex_unlock ( & pthreadpools_mutex ) ;
assert ( ret = = 0 ) ;
2018-06-21 13:40:30 +03:00
ret = pthread_mutex_lock ( & pool - > mutex ) ;
assert ( ret = = 0 ) ;
ret = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( ret = = 0 ) ;
2016-09-09 14:07:57 +03:00
ret = pthread_mutex_destroy ( & pool - > mutex ) ;
ret1 = pthread_cond_destroy ( & pool - > condvar ) ;
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
ret2 = pthread_mutex_destroy ( & pool - > fork_mutex ) ;
2016-09-09 14:07:57 +03:00
if ( ret ! = 0 ) {
return ret ;
}
if ( ret1 ! = 0 ) {
return ret1 ;
2009-04-23 19:23:13 +04:00
}
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
if ( ret2 ! = 0 ) {
return ret2 ;
}
2011-04-25 22:05:31 +04:00
2016-09-09 14:07:57 +03:00
free ( pool - > jobs ) ;
free ( pool ) ;
return 0 ;
2009-04-23 19:23:13 +04:00
}
/*
2018-04-25 15:03:30 +03:00
* Stop a thread pool . Wake up all idle threads for exit .
2009-04-23 19:23:13 +04:00
*/
2018-04-25 15:03:30 +03:00
static int pthreadpool_stop_locked ( struct pthreadpool * pool )
{
int ret ;
pool - > stopped = true ;
if ( pool - > num_threads = = 0 ) {
return 0 ;
}
/*
* We have active threads , tell them to finish .
*/
ret = pthread_cond_broadcast ( & pool - > condvar ) ;
return ret ;
}
/*
* Stop a thread pool . Wake up all idle threads for exit .
*/
int pthreadpool_stop ( struct pthreadpool * pool )
2009-04-23 19:23:13 +04:00
{
int ret , ret1 ;
ret = pthread_mutex_lock ( & pool - > mutex ) ;
if ( ret ! = 0 ) {
return ret ;
}
2018-04-25 15:03:30 +03:00
if ( ! pool - > stopped ) {
ret = pthreadpool_stop_locked ( pool ) ;
2011-04-22 13:47:11 +04:00
}
2018-04-25 15:03:30 +03:00
ret1 = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( ret1 = = 0 ) ;
2016-10-12 13:12:28 +03:00
2018-04-25 15:03:30 +03:00
return ret ;
}
/*
* Destroy a thread pool . Wake up all idle threads for exit . The last
* one will free the pool .
*/
int pthreadpool_destroy ( struct pthreadpool * pool )
{
int ret , ret1 ;
bool free_it ;
assert ( ! pool - > destroyed ) ;
2016-10-12 13:12:28 +03:00
2018-04-25 15:03:30 +03:00
ret = pthread_mutex_lock ( & pool - > mutex ) ;
if ( ret ! = 0 ) {
2016-10-12 13:12:28 +03:00
return ret ;
}
2018-04-25 15:03:30 +03:00
pool - > destroyed = true ;
2009-04-23 19:23:13 +04:00
2018-04-25 15:03:30 +03:00
if ( ! pool - > stopped ) {
ret = pthreadpool_stop_locked ( pool ) ;
}
free_it = ( pool - > num_threads = = 0 ) ;
2009-04-23 19:23:13 +04:00
2016-09-09 14:07:57 +03:00
ret1 = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( ret1 = = 0 ) ;
2011-04-22 13:47:11 +04:00
2018-04-25 15:03:30 +03:00
if ( free_it ) {
pthreadpool_free ( pool ) ;
}
2016-09-09 14:07:57 +03:00
return ret ;
2009-04-23 19:23:13 +04:00
}
/*
2016-09-09 14:07:57 +03:00
* Prepare for pthread_exit ( ) , pool - > mutex must be locked and will be
* unlocked here . This is a bit of a layering violation , but here we
* also take care of removing the pool if we ' re the last thread .
2009-04-23 19:23:13 +04:00
*/
static void pthreadpool_server_exit ( struct pthreadpool * pool )
{
2016-09-09 14:07:57 +03:00
int ret ;
2016-10-12 13:12:28 +03:00
bool free_it ;
2011-04-25 22:05:31 +04:00
2009-04-23 19:23:13 +04:00
pool - > num_threads - = 1 ;
2011-04-25 22:05:31 +04:00
2018-04-25 15:03:30 +03:00
free_it = ( pool - > destroyed & & ( pool - > num_threads = = 0 ) ) ;
2011-04-25 22:05:31 +04:00
2016-09-09 14:07:57 +03:00
ret = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( ret = = 0 ) ;
2016-10-12 13:12:28 +03:00
if ( free_it ) {
pthreadpool_free ( pool ) ;
}
2009-04-23 19:23:13 +04:00
}
2014-03-21 20:53:26 +04:00
static bool pthreadpool_get_job ( struct pthreadpool * p ,
struct pthreadpool_job * job )
{
2018-04-25 15:03:30 +03:00
if ( p - > stopped ) {
2018-04-20 18:12:07 +03:00
return false ;
}
2014-03-21 20:53:26 +04:00
if ( p - > num_jobs = = 0 ) {
return false ;
}
* job = p - > jobs [ p - > head ] ;
p - > head = ( p - > head + 1 ) % p - > jobs_array_len ;
p - > num_jobs - = 1 ;
return true ;
}
static bool pthreadpool_put_job ( struct pthreadpool * p ,
int id ,
void ( * fn ) ( void * private_data ) ,
void * private_data )
{
struct pthreadpool_job * job ;
if ( p - > num_jobs = = p - > jobs_array_len ) {
struct pthreadpool_job * tmp ;
size_t new_len = p - > jobs_array_len * 2 ;
tmp = realloc (
p - > jobs , sizeof ( struct pthreadpool_job ) * new_len ) ;
if ( tmp = = NULL ) {
return false ;
}
p - > jobs = tmp ;
/*
* We just doubled the jobs array . The array implements a FIFO
* queue with a modulo - based wraparound , so we have to memcpy
* the jobs that are logically at the queue end but physically
* before the queue head into the reallocated area . The new
* space starts at the current jobs_array_len , and we have to
* copy everything before the current head job into the new
* area .
*/
memcpy ( & p - > jobs [ p - > jobs_array_len ] , p - > jobs ,
sizeof ( struct pthreadpool_job ) * p - > head ) ;
p - > jobs_array_len = new_len ;
}
job = & p - > jobs [ ( p - > head + p - > num_jobs ) % p - > jobs_array_len ] ;
job - > id = id ;
job - > fn = fn ;
job - > private_data = private_data ;
p - > num_jobs + = 1 ;
return true ;
}
2017-11-28 20:59:06 +03:00
static void pthreadpool_undo_put_job ( struct pthreadpool * p )
{
p - > num_jobs - = 1 ;
}
2009-04-23 19:23:13 +04:00
static void * pthreadpool_server ( void * arg )
{
struct pthreadpool * pool = ( struct pthreadpool * ) arg ;
int res ;
res = pthread_mutex_lock ( & pool - > mutex ) ;
if ( res ! = 0 ) {
return NULL ;
}
while ( 1 ) {
2011-04-22 13:47:11 +04:00
struct timespec ts ;
2014-03-21 20:53:26 +04:00
struct pthreadpool_job job ;
2009-04-23 19:23:13 +04:00
/*
* idle - wait at most 1 second . If nothing happens in that
* time , exit this thread .
*/
2011-06-05 23:30:16 +04:00
clock_gettime ( CLOCK_REALTIME , & ts ) ;
ts . tv_sec + = 1 ;
2009-04-23 19:23:13 +04:00
2018-04-25 15:03:30 +03:00
while ( ( pool - > num_jobs = = 0 ) & & ! pool - > stopped ) {
2009-04-23 19:23:13 +04:00
pool - > num_idle + = 1 ;
res = pthread_cond_timedwait (
2011-04-22 13:47:11 +04:00
& pool - > condvar , & pool - > mutex , & ts ) ;
2009-04-23 19:23:13 +04:00
pool - > num_idle - = 1 ;
2017-08-28 17:38:19 +03:00
if ( pool - > prefork_cond ! = NULL ) {
/*
* Me must allow fork ( ) to continue
* without anybody waiting on
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
* & pool - > condvar . Tell
* pthreadpool_prepare_pool that we
* got that message .
*/
res = pthread_cond_signal ( pool - > prefork_cond ) ;
assert ( res = = 0 ) ;
res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( res = = 0 ) ;
/*
* pthreadpool_prepare_pool has
* already locked this mutex across
* the fork . This makes us wait
* without sitting in a condvar .
2017-08-28 17:38:19 +03:00
*/
pthreadpool: Fix starvation after fork
After the race is before the race:
1) Create an idle thread
2) Add a job: This won't create a thread anymore
3) Immediately fork
The idle thread will be woken twice before it's actually woken up: Both
pthreadpool_add_job and pthreadpool_prepare_pool call cond_signal, for
different reasons. We must look at pool->prefork_cond first because otherwise
we will end up in a blocking job deep within a fork call, the helper thread
must take its fingers off the condvar as quickly as possible. This means that
after the fork there's no idle thread around anymore that would pick up the job
submitted in 2). So we must keep the idle threads around across the fork.
The quick solution to re-create one helper thread in pthreadpool_parent has a
fatal flaw: What do we do if that pthread_create call fails? We're deep in an
application calling fork(), and doing fancy signalling from there is really
something we must avoid.
This has one potential performance issue: If we have hundreds of idle threads
(do we ever have that) during the fork, the call to pthread_mutex_lock on the
fork_mutex from pthreadpool_server (the helper thread) will probably cause a
thundering herd when the _parent call unlocks the fork_mutex. The solution for
this to just keep one idle thread around. But this adds code that is not
strictly required functionally for now.
More detailed explanation from Jeremy:
First, understanding the problem the test reproduces:
add a job (num_jobs = 1) -> creates thread to run it.
job finishes, thread sticks around (num_idle = 1).
num_jobs is now zero (initial job finished).
a) Idle thread is now waiting on pool->condvar inside
pthreadpool_server() in pthread_cond_timedwait().
Now, add another job ->
pthreadpool_add_job()
-> pthreadpool_put_job()
This adds the job to the queue.
Oh, there is an idle thread so don't
create one, do:
pthread_cond_signal(&pool->condvar);
and return.
Now call fork *before* idle thread in (a) wakes from
the signaling of pool->condvar.
In the parent (child is irrelevent):
Go into: pthreadpool_prepare() ->
pthreadpool_prepare_pool()
Set the variable to tell idle threads to exit:
pool->prefork_cond = &prefork_cond;
then wake them up with:
pthread_cond_signal(&pool->condvar);
This does nothing as the idle thread
is already awoken.
b) Idle thread wakes up and does:
Reduce idle thread count (num_idle = 0)
pool->num_idle -= 1;
Check if we're in the middle of a fork.
if (pool->prefork_cond != NULL) {
Yes we are, tell pthreadpool_prepare()
we are exiting.
pthread_cond_signal(pool->prefork_cond);
And exit.
pthreadpool_server_exit(pool);
return NULL;
}
So we come back from the fork in the parent with num_jobs = 1,
a job on the queue but no idle threads - and the code that
creates a new thread on job submission was skipped because
an idle thread existed at point (a).
OK, assuming that the previous explaination is correct, the
fix is to create a new pthreadpool context mutex:
pool->fork_mutex
and in pthreadpool_server(), when an idle thread wakes up and
notices we're in the prepare fork state, it puts itself to
sleep by waiting on the new pool->fork_mutex.
And in pthreadpool_prepare_pool(), instead of waiting for
the idle threads to exit, hold the pool->fork_mutex and
signal each idle thread in turn, and wait for the pool->num_idle
to go to zero - which means they're all blocked waiting on
pool->fork_mutex.
When the parent continues, pthreadpool_parent()
unlocks the pool->fork_mutex and all the previously
'idle' threads wake up (and you mention the thundering
herd problem, which is as you say vanishingly small :-)
and pick up any remaining job.
Bug: https://bugzilla.samba.org/show_bug.cgi?id=13179
Signed-off-by: Volker Lendecke <vl@samba.org>
Reviewed-by: Jeremy Allison <jra@samba.org>
2017-11-29 18:45:40 +03:00
res = pthread_mutex_lock ( & pool - > fork_mutex ) ;
assert ( res = = 0 ) ;
res = pthread_mutex_unlock ( & pool - > fork_mutex ) ;
assert ( res = = 0 ) ;
res = pthread_mutex_lock ( & pool - > mutex ) ;
assert ( res = = 0 ) ;
2017-08-28 17:38:19 +03:00
}
2009-04-23 19:23:13 +04:00
if ( res = = ETIMEDOUT ) {
2014-03-21 20:53:26 +04:00
if ( pool - > num_jobs = = 0 ) {
2009-04-23 19:23:13 +04:00
/*
* we timed out and still no work for
* us . Exit .
*/
pthreadpool_server_exit ( pool ) ;
return NULL ;
}
break ;
}
assert ( res = = 0 ) ;
}
2014-03-21 20:53:26 +04:00
if ( pthreadpool_get_job ( pool , & job ) ) {
2016-08-15 14:59:12 +03:00
int ret ;
2009-04-23 19:23:13 +04:00
/*
2011-04-22 13:47:11 +04:00
* Do the work with the mutex unlocked
2009-04-23 19:23:13 +04:00
*/
res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( res = = 0 ) ;
2014-03-21 20:53:26 +04:00
job . fn ( job . private_data ) ;
2009-04-23 19:23:13 +04:00
2016-08-15 14:59:12 +03:00
ret = pool - > signal_fn ( job . id ,
2016-07-31 09:57:35 +03:00
job . fn , job . private_data ,
pool - > signal_fn_private_data ) ;
2016-08-29 12:35:39 +03:00
res = pthread_mutex_lock ( & pool - > mutex ) ;
assert ( res = = 0 ) ;
2016-08-15 14:59:12 +03:00
if ( ret ! = 0 ) {
2009-04-23 19:23:13 +04:00
pthreadpool_server_exit ( pool ) ;
return NULL ;
}
}
2018-04-25 15:03:30 +03:00
if ( pool - > stopped ) {
2009-04-23 19:23:13 +04:00
/*
2018-04-25 15:03:30 +03:00
* we ' re asked to stop processing jobs , so exit
2009-04-23 19:23:13 +04:00
*/
pthreadpool_server_exit ( pool ) ;
return NULL ;
}
}
}
2017-11-28 20:49:36 +03:00
static int pthreadpool_create_thread ( struct pthreadpool * pool )
2009-04-23 19:23:13 +04:00
{
2016-09-09 14:07:57 +03:00
pthread_attr_t thread_attr ;
2009-04-23 19:23:13 +04:00
pthread_t thread_id ;
int res ;
sigset_t mask , omask ;
2017-11-28 20:49:36 +03:00
/*
* Create a new worker thread . It should not receive any signals .
*/
sigfillset ( & mask ) ;
res = pthread_attr_init ( & thread_attr ) ;
if ( res ! = 0 ) {
return res ;
}
res = pthread_attr_setdetachstate (
& thread_attr , PTHREAD_CREATE_DETACHED ) ;
if ( res ! = 0 ) {
pthread_attr_destroy ( & thread_attr ) ;
return res ;
}
res = pthread_sigmask ( SIG_BLOCK , & mask , & omask ) ;
if ( res ! = 0 ) {
pthread_attr_destroy ( & thread_attr ) ;
return res ;
}
res = pthread_create ( & thread_id , & thread_attr , pthreadpool_server ,
( void * ) pool ) ;
assert ( pthread_sigmask ( SIG_SETMASK , & omask , NULL ) = = 0 ) ;
pthread_attr_destroy ( & thread_attr ) ;
if ( res = = 0 ) {
pool - > num_threads + = 1 ;
}
return res ;
}
int pthreadpool_add_job ( struct pthreadpool * pool , int job_id ,
void ( * fn ) ( void * private_data ) , void * private_data )
{
int res ;
2018-06-22 01:27:39 +03:00
int unlock_res ;
2017-11-28 20:49:36 +03:00
2018-04-25 15:03:30 +03:00
assert ( ! pool - > destroyed ) ;
2009-04-23 19:23:13 +04:00
res = pthread_mutex_lock ( & pool - > mutex ) ;
if ( res ! = 0 ) {
return res ;
}
2018-04-25 15:03:30 +03:00
if ( pool - > stopped ) {
2011-04-22 13:47:11 +04:00
/*
* Protect against the pool being shut down while
* trying to add a job
*/
2018-06-22 01:27:39 +03:00
unlock_res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( unlock_res = = 0 ) ;
2011-04-22 13:47:11 +04:00
return EINVAL ;
}
2018-06-22 01:29:53 +03:00
if ( pool - > max_threads = = 0 ) {
unlock_res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( unlock_res = = 0 ) ;
/*
* If no thread are allowed we do strict sync processing .
*/
fn ( private_data ) ;
res = pool - > signal_fn ( job_id , fn , private_data ,
pool - > signal_fn_private_data ) ;
return res ;
}
2009-04-23 19:23:13 +04:00
/*
* Add job to the end of the queue
*/
2014-03-21 20:53:26 +04:00
if ( ! pthreadpool_put_job ( pool , job_id , fn , private_data ) ) {
2018-06-22 01:27:39 +03:00
unlock_res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( unlock_res = = 0 ) ;
2014-03-21 20:53:26 +04:00
return ENOMEM ;
2009-04-23 19:23:13 +04:00
}
if ( pool - > num_idle > 0 ) {
/*
* We have idle threads , wake one .
*/
res = pthread_cond_signal ( & pool - > condvar ) ;
2017-11-28 20:59:06 +03:00
if ( res ! = 0 ) {
pthreadpool_undo_put_job ( pool ) ;
}
2017-12-12 15:58:48 +03:00
unlock_res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( unlock_res = = 0 ) ;
2009-04-23 19:23:13 +04:00
return res ;
}
2018-06-22 01:29:53 +03:00
if ( pool - > num_threads > = pool - > max_threads ) {
2009-04-23 19:23:13 +04:00
/*
* No more new threads , we just queue the request
*/
2018-06-22 01:27:39 +03:00
unlock_res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( unlock_res = = 0 ) ;
2009-04-23 19:23:13 +04:00
return 0 ;
}
2017-11-28 20:49:36 +03:00
res = pthreadpool_create_thread ( pool ) ;
2017-12-12 15:52:56 +03:00
if ( res = = 0 ) {
2018-06-22 01:27:39 +03:00
unlock_res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( unlock_res = = 0 ) ;
2017-12-12 15:52:56 +03:00
return 0 ;
}
2017-11-28 20:59:06 +03:00
2017-12-12 15:52:56 +03:00
if ( pool - > num_threads ! = 0 ) {
2017-11-28 20:59:06 +03:00
/*
* At least one thread is still available , let
* that one run the queued job .
*/
2018-06-22 01:27:39 +03:00
unlock_res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( unlock_res = = 0 ) ;
2017-12-12 15:52:56 +03:00
return 0 ;
2009-04-23 19:23:13 +04:00
}
2017-12-12 15:52:56 +03:00
pthreadpool_undo_put_job ( pool ) ;
2018-06-22 01:27:39 +03:00
unlock_res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( unlock_res = = 0 ) ;
2017-12-12 15:52:56 +03:00
2009-04-23 19:23:13 +04:00
return res ;
}
2018-04-20 16:00:31 +03:00
size_t pthreadpool_cancel_job ( struct pthreadpool * pool , int job_id ,
void ( * fn ) ( void * private_data ) , void * private_data )
{
int res ;
size_t i , j ;
size_t num = 0 ;
2018-04-25 15:03:30 +03:00
assert ( ! pool - > destroyed ) ;
2018-04-20 16:00:31 +03:00
res = pthread_mutex_lock ( & pool - > mutex ) ;
if ( res ! = 0 ) {
return res ;
}
for ( i = 0 , j = 0 ; i < pool - > num_jobs ; i + + ) {
size_t idx = ( pool - > head + i ) % pool - > jobs_array_len ;
size_t new_idx = ( pool - > head + j ) % pool - > jobs_array_len ;
struct pthreadpool_job * job = & pool - > jobs [ idx ] ;
if ( ( job - > private_data = = private_data ) & &
( job - > id = = job_id ) & &
( job - > fn = = fn ) )
{
/*
* Just skip the entry .
*/
num + + ;
continue ;
}
/*
* If we already removed one or more jobs ( so j will be smaller
* then i ) , we need to fill possible gaps in the logical list .
*/
if ( j < i ) {
pool - > jobs [ new_idx ] = * job ;
}
j + + ;
}
pool - > num_jobs - = num ;
res = pthread_mutex_unlock ( & pool - > mutex ) ;
assert ( res = = 0 ) ;
return num ;
}