From: Juergen Gross <juergen.gross@ts.fujitsu.com>
To: Andre Przywara <andre.przywara@amd.com>
Cc: George Dunlap <George.Dunlap@eu.citrix.com>,
"xen-devel@lists.xensource.com" <xen-devel@lists.xensource.com>,
"Diestelhorst, Stephan" <Stephan.Diestelhorst@amd.com>
Subject: Re: Hypervisor crash(!) on xl cpupool-numa-split
Date: Thu, 10 Feb 2011 07:42:39 +0100 [thread overview]
Message-ID: <4D5388DF.8040900@ts.fujitsu.com> (raw)
In-Reply-To: <4D52A2CD.9090507@ts.fujitsu.com>
[-- Attachment #1: Type: text/plain, Size: 1428 bytes --]
On 02/09/11 15:21, Juergen Gross wrote:
> Andre, George,
>
>
> What seems interesting: I think the problem always occurred when
> a new cpupool was created and the first cpu was moved to it.
>
> I think my previous assumption regarding the master_ticker was not too bad.
> I think somehow the master_ticker of the new cpupool is becoming active
> before the scheduler is really initialized properly. This could happen if
> enough time passes between alloc_pdata for the cpu being moved and the
> critical section in schedule_cpu_switch().
>
> The solution should be to activate the timers only if the scheduler is
> ready for them.
>
> George, do you think the master_ticker should be stopped in suspend_ticker
> as well? I still see potential problems for entering deep C-States. I think
> I'll prepare a patch which will keep the master_ticker active for the
> C-State case and migrate it for the schedule_cpu_switch() case.
Okay, here is a patch for this. It ran on my 4-core machine without any
problems.
Andre, could you give it a try?
Juergen
--
Juergen Gross Principal Developer Operating Systems
TSP ES&S SWE OS6 Telephone: +49 (0) 89 3222 2967
Fujitsu Technology Solutions e-mail: juergen.gross@ts.fujitsu.com
Domagkstr. 28 Internet: ts.fujitsu.com
D-80807 Muenchen Company details: ts.fujitsu.com/imprint.html
[-- Attachment #2: ticker.patch --]
[-- Type: text/x-patch, Size: 5447 bytes --]
diff -r 1967c7c290eb xen/common/sched_credit.c
--- a/xen/common/sched_credit.c Wed Feb 09 12:03:09 2011 +0000
+++ b/xen/common/sched_credit.c Thu Feb 10 07:39:27 2011 +0100
@@ -50,6 +50,8 @@
(CSCHED_CREDITS_PER_MSEC * CSCHED_MSECS_PER_TSLICE)
#define CSCHED_CREDITS_PER_ACCT \
(CSCHED_CREDITS_PER_MSEC * CSCHED_MSECS_PER_TICK * CSCHED_TICKS_PER_ACCT)
+#define CSCHED_ACCT_TSLICE \
+ (MILLISECS(CSCHED_MSECS_PER_TICK) * CSCHED_TICKS_PER_ACCT)
/*
@@ -170,6 +172,7 @@ struct csched_private {
uint32_t ncpus;
struct timer master_ticker;
unsigned int master;
+ int master_active;
cpumask_t idlers;
cpumask_t cpus;
uint32_t weight;
@@ -320,6 +323,7 @@ csched_free_pdata(const struct scheduler
struct csched_private *prv = CSCHED_PRIV(ops);
struct csched_pcpu *spc = pcpu;
unsigned long flags;
+ uint64_t now = NOW();
if ( spc == NULL )
return;
@@ -334,10 +338,16 @@ csched_free_pdata(const struct scheduler
{
prv->master = first_cpu(prv->cpus);
migrate_timer(&prv->master_ticker, prv->master);
+ if ( prv->master_active )
+ set_timer(&prv->master_ticker, now + CSCHED_ACCT_TSLICE
+ - now % CSCHED_ACCT_TSLICE);
}
kill_timer(&spc->ticker);
if ( prv->ncpus == 0 )
+ {
kill_timer(&prv->master_ticker);
+ prv->master_active = 0;
+ }
spin_unlock_irqrestore(&prv->lock, flags);
@@ -367,12 +377,10 @@ csched_alloc_pdata(const struct schedule
{
prv->master = cpu;
init_timer(&prv->master_ticker, csched_acct, prv, cpu);
- set_timer(&prv->master_ticker, NOW() +
- MILLISECS(CSCHED_MSECS_PER_TICK) * CSCHED_TICKS_PER_ACCT);
+ prv->master_active = 0;
}
init_timer(&spc->ticker, csched_tick, (void *)(unsigned long)cpu, cpu);
- set_timer(&spc->ticker, NOW() + MILLISECS(CSCHED_MSECS_PER_TICK));
INIT_LIST_HEAD(&spc->runq);
spc->runq_sort_last = prv->runq_sort;
@@ -1138,8 +1146,7 @@ csched_acct(void* dummy)
prv->runq_sort++;
out:
- set_timer( &prv->master_ticker, NOW() +
- MILLISECS(CSCHED_MSECS_PER_TICK) * CSCHED_TICKS_PER_ACCT );
+ set_timer( &prv->master_ticker, NOW() + CSCHED_ACCT_TSLICE );
}
static void
@@ -1529,24 +1536,39 @@ csched_deinit(const struct scheduler *op
xfree(prv);
}
-static void csched_tick_suspend(const struct scheduler *ops, unsigned int cpu)
+static void csched_tick_suspend(const struct scheduler *ops, unsigned int cpu, int temp)
{
+ struct csched_private *prv;
struct csched_pcpu *spc;
+ prv = CSCHED_PRIV(ops);
spc = CSCHED_PCPU(cpu);
stop_timer(&spc->ticker);
+ if ( (prv->master == cpu) && !temp )
+ {
+ prv->master = cycle_cpu(prv->master, prv->cpus);
+ migrate_timer(&prv->master_ticker, prv->master);
+ }
}
static void csched_tick_resume(const struct scheduler *ops, unsigned int cpu)
{
+ struct csched_private *prv;
struct csched_pcpu *spc;
uint64_t now = NOW();
+ prv = CSCHED_PRIV(ops);
spc = CSCHED_PCPU(cpu);
set_timer(&spc->ticker, now + MILLISECS(CSCHED_MSECS_PER_TICK)
- now % MILLISECS(CSCHED_MSECS_PER_TICK) );
+ if ( (prv->master == cpu) && !prv->master_active )
+ {
+ set_timer(&prv->master_ticker, now + CSCHED_ACCT_TSLICE
+ - now % CSCHED_ACCT_TSLICE);
+ prv->master_active = 1;
+ }
}
static struct csched_private _csched_priv;
diff -r 1967c7c290eb xen/common/schedule.c
--- a/xen/common/schedule.c Wed Feb 09 12:03:09 2011 +0000
+++ b/xen/common/schedule.c Thu Feb 10 07:39:27 2011 +0100
@@ -1208,6 +1208,8 @@ static int cpu_schedule_up(unsigned int
if ( (ops.alloc_pdata != NULL) &&
((sd->sched_priv = ops.alloc_pdata(&ops, cpu)) == NULL) )
return -ENOMEM;
+ if ( ops.tick_resume != NULL )
+ ops.tick_resume(&ops, cpu);
return 0;
}
@@ -1286,6 +1288,8 @@ void __init scheduler_init(void)
if ( ops.alloc_pdata &&
!(this_cpu(schedule_data).sched_priv = ops.alloc_pdata(&ops, 0)) )
BUG();
+ if ( ops.tick_resume != NULL )
+ ops.tick_resume(&ops, 0);
}
int schedule_cpu_switch(unsigned int cpu, struct cpupool *c)
@@ -1312,7 +1316,7 @@ int schedule_cpu_switch(unsigned int cpu
pcpu_schedule_lock_irqsave(cpu, flags);
- SCHED_OP(old_ops, tick_suspend, cpu);
+ SCHED_OP(old_ops, tick_suspend, cpu, 0);
vpriv_old = idle->sched_priv;
idle->sched_priv = vpriv;
per_cpu(scheduler, cpu) = new_ops;
@@ -1392,7 +1396,7 @@ void sched_tick_suspend(void)
unsigned int cpu = smp_processor_id();
sched = per_cpu(scheduler, cpu);
- SCHED_OP(sched, tick_suspend, cpu);
+ SCHED_OP(sched, tick_suspend, cpu, 1);
}
void sched_tick_resume(void)
diff -r 1967c7c290eb xen/include/xen/sched-if.h
--- a/xen/include/xen/sched-if.h Wed Feb 09 12:03:09 2011 +0000
+++ b/xen/include/xen/sched-if.h Thu Feb 10 07:39:27 2011 +0100
@@ -175,7 +175,7 @@ struct scheduler {
void (*dump_settings) (const struct scheduler *);
void (*dump_cpu_state) (const struct scheduler *, int);
- void (*tick_suspend) (const struct scheduler *, unsigned int);
+ void (*tick_suspend) (const struct scheduler *, unsigned int, int);
void (*tick_resume) (const struct scheduler *, unsigned int);
};
[-- Attachment #3: Type: text/plain, Size: 138 bytes --]
_______________________________________________
Xen-devel mailing list
Xen-devel@lists.xensource.com
http://lists.xensource.com/xen-devel
next prev parent reply other threads:[~2011-02-10 6:42 UTC|newest]
Thread overview: 53+ messages / expand[flat|nested] mbox.gz Atom feed top
2011-01-27 23:18 Hypervisor crash(!) on xl cpupool-numa-split Andre Przywara
2011-01-28 6:47 ` Juergen Gross
2011-01-28 11:07 ` Andre Przywara
2011-01-28 11:44 ` Juergen Gross
2011-01-28 13:14 ` Andre Przywara
2011-01-31 7:04 ` Juergen Gross
2011-01-31 14:59 ` Andre Przywara
2011-01-31 15:28 ` George Dunlap
2011-02-01 16:32 ` Andre Przywara
2011-02-02 6:27 ` Juergen Gross
2011-02-02 8:49 ` Juergen Gross
2011-02-02 10:05 ` Juergen Gross
2011-02-02 10:59 ` Andre Przywara
2011-02-02 14:39 ` Stephan Diestelhorst
2011-02-02 15:14 ` Juergen Gross
2011-02-02 16:01 ` Stephan Diestelhorst
2011-02-03 5:57 ` Juergen Gross
2011-02-03 9:18 ` Juergen Gross
2011-02-04 14:09 ` Andre Przywara
2011-02-07 12:38 ` Andre Przywara
2011-02-07 13:32 ` Juergen Gross
2011-02-07 15:55 ` George Dunlap
2011-02-08 5:43 ` Juergen Gross
2011-02-08 12:08 ` George Dunlap
2011-02-08 12:14 ` George Dunlap
2011-02-08 16:33 ` Andre Przywara
2011-02-09 12:27 ` George Dunlap
2011-02-09 12:27 ` George Dunlap
2011-02-09 13:04 ` Juergen Gross
2011-02-09 13:39 ` Andre Przywara
2011-02-09 13:51 ` Andre Przywara
2011-02-09 14:21 ` Juergen Gross
2011-02-10 6:42 ` Juergen Gross [this message]
2011-02-10 9:25 ` Andre Przywara
2011-02-10 14:18 ` Andre Przywara
2011-02-11 6:17 ` Juergen Gross
2011-02-11 7:39 ` Andre Przywara
2011-02-14 17:57 ` George Dunlap
2011-02-15 7:22 ` Juergen Gross
2011-02-16 9:47 ` Juergen Gross
2011-02-16 13:54 ` George Dunlap
[not found] ` <4D6237C6.1050206@amd.com>
2011-02-16 14:11 ` Juergen Gross
2011-02-16 14:28 ` Juergen Gross
2011-02-17 0:05 ` André Przywara
2011-02-17 7:05 ` Juergen Gross
2011-02-17 9:11 ` Juergen Gross
2011-02-21 10:00 ` Andre Przywara
2011-02-21 13:19 ` Juergen Gross
2011-02-21 14:45 ` Andre Przywara
2011-02-21 14:50 ` Juergen Gross
2011-02-08 12:23 ` Juergen Gross
2011-01-28 11:13 ` George Dunlap
2011-01-28 13:05 ` Andre Przywara
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=4D5388DF.8040900@ts.fujitsu.com \
--to=juergen.gross@ts.fujitsu.com \
--cc=George.Dunlap@eu.citrix.com \
--cc=Stephan.Diestelhorst@amd.com \
--cc=andre.przywara@amd.com \
--cc=xen-devel@lists.xensource.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.