[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index] [Xen-changelog] [xen staging] x86: optimize loading of GDT at context switch
commit 1464c4cdd719fa5ab08b710218a866780a694dca Author: Juergen Gross <jgross@xxxxxxxx> AuthorDate: Fri Jul 26 10:43:42 2019 +0200 Commit: Jan Beulich <jbeulich@xxxxxxxx> CommitDate: Fri Jul 26 10:43:42 2019 +0200 x86: optimize loading of GDT at context switch Instead of dynamically deciding whether the previous vcpu was using full or default GDT, just add a percpu variable for that purpose. This at once removes the need for testing vcpu_ids to differ twice. This change improves performance by 0.5% - 1% on my test machine when doing parallel compilation. Signed-off-by: Juergen Gross <jgross@xxxxxxxx> Reviewed-by: Jan Beulich <jbeulich@xxxxxxxx> --- xen/arch/x86/cpu/common.c | 3 +++ xen/arch/x86/domain.c | 13 ++++++++----- xen/include/asm-x86/desc.h | 1 + 3 files changed, 12 insertions(+), 5 deletions(-) diff --git a/xen/arch/x86/cpu/common.c b/xen/arch/x86/cpu/common.c index 1db96d959c..7478e21177 100644 --- a/xen/arch/x86/cpu/common.c +++ b/xen/arch/x86/cpu/common.c @@ -49,6 +49,8 @@ unsigned int vaddr_bits __read_mostly = VADDR_BITS; static unsigned int cleared_caps[NCAPINTS]; static unsigned int forced_caps[NCAPINTS]; +DEFINE_PER_CPU(bool, full_gdt_loaded); + void __init setup_clear_cpu_cap(unsigned int cap) { const uint32_t *dfs; @@ -756,6 +758,7 @@ void load_system_tables(void) offsetof(struct tss_struct, __cacheline_filler) - 1, SYS_DESC_tss_busy); + per_cpu(full_gdt_loaded, cpu) = false; lgdt(&gdtr); lidt(&idtr); ltr(TSS_ENTRY << 3); diff --git a/xen/arch/x86/domain.c b/xen/arch/x86/domain.c index ea55160887..5933b3f51b 100644 --- a/xen/arch/x86/domain.c +++ b/xen/arch/x86/domain.c @@ -1670,7 +1670,7 @@ static void update_xen_slot_in_full_gdt(const struct vcpu *v, unsigned int cpu) : per_cpu(compat_gdt_table_l1e, cpu)); } -static void load_full_gdt(const struct vcpu *v) +static void load_full_gdt(const struct vcpu *v, unsigned int cpu) { struct desc_ptr gdt_desc = { .limit = LAST_RESERVED_GDT_BYTE, @@ -1678,6 +1678,8 @@ static void load_full_gdt(const struct 
vcpu *v) }; lgdt(&gdt_desc); + + per_cpu(full_gdt_loaded, cpu) = true; } static void load_default_gdt(unsigned int cpu) @@ -1689,6 +1691,8 @@ static void load_default_gdt(unsigned int cpu) }; lgdt(&gdt_desc); + + per_cpu(full_gdt_loaded, cpu) = false; } static void __context_switch(void) @@ -1740,7 +1744,7 @@ static void __context_switch(void) if ( need_full_gdt(nd) ) update_xen_slot_in_full_gdt(n, cpu); - if ( need_full_gdt(pd) && + if ( per_cpu(full_gdt_loaded, cpu) && ((p->vcpu_id != n->vcpu_id) || !need_full_gdt(nd)) ) load_default_gdt(cpu); @@ -1753,9 +1757,8 @@ static void __context_switch(void) svm_load_segs(0, 0, 0, 0, 0, 0, 0); #endif - if ( need_full_gdt(nd) && - ((p->vcpu_id != n->vcpu_id) || !need_full_gdt(pd)) ) - load_full_gdt(n); + if ( need_full_gdt(nd) && !per_cpu(full_gdt_loaded, cpu) ) + load_full_gdt(n, cpu); if ( pd != nd ) cpumask_clear_cpu(cpu, pd->dirty_cpumask); diff --git a/xen/include/asm-x86/desc.h b/xen/include/asm-x86/desc.h index e565727dc0..c011c03ae2 100644 --- a/xen/include/asm-x86/desc.h +++ b/xen/include/asm-x86/desc.h @@ -210,6 +210,7 @@ DECLARE_PER_CPU(l1_pgentry_t, gdt_table_l1e); extern seg_desc_t boot_cpu_compat_gdt_table[]; DECLARE_PER_CPU(seg_desc_t *, compat_gdt_table); DECLARE_PER_CPU(l1_pgentry_t, compat_gdt_table_l1e); +DECLARE_PER_CPU(bool, full_gdt_loaded); extern void load_TR(void); -- generated by git-patchbot for /home/xen/git/xen.git#staging _______________________________________________ Xen-changelog mailing list Xen-changelog@xxxxxxxxxxxxxxxxxxxx https://lists.xenproject.org/xen-changelog
|
Lists.xenproject.org is hosted with RackSpace, monitoring our |