|
[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index] [Xen-devel] [RFC PATCH] xen: comment opaque expression in __page_to_virt
mm.h's __page_to_virt has a rather opaque expression. Comment it.
The diff below shows the effect that the extra division and
multiplication have on gcc's output; the "+" lines are the result of
compiling
return (void *)(DIRECTMAP_VIRT_START +
((unsigned long)pg - FRAMETABLE_VIRT_START) /
(sizeof(*pg) ) *
(PAGE_SIZE )
);
instead.
NB that this patch is an RFC because I don't actually know whether
what I wrote in the comment about x86 performance, and about the
purpose of the code, is correct. Jan, please confirm/deny/correct as
appropriate.
Reported-By: Ian Campbell <ian.campbell@xxxxxxxxxx>
Cc: Jan Beulich <jbeulich@xxxxxxxxxx>
Signed-off-by: Ian Jackson <ian.jackson@xxxxxxxxxxxxx>
--- page_alloc.tmp.mariner.31972.s 2012-08-29 16:32:44.000000000 +0100
+++ page_alloc.tmp.mariner.31960.s 2012-08-29 16:32:09.000000000 +0100
@@ -5338,15 +5338,15 @@
# 325 "/u/iwj/work/xen-unstable-tools.hg/xen/include/asm/mm.h" 1
ud2 ; ret $1303; movl $.LC31, %esp; movl $.LC41, %esp
# 0 "" 2
- .loc 10 327 0
+ .loc 10 333 0
#NO_APP
- movl $3, %ebx
+ movl $24, %ebx
.LVL543:
movl $0, %edx
divl %ebx
- addl $8355840, %eax
+ addl $1044480, %eax
movl %eax, %ebx
- sall $9, %ebx
+ sall $12, %ebx
.LBE737:
.LBE736:
.loc 1 1179 0
@@ -5368,13 +5368,13 @@
.LBE739:
.LBB741:
.LBB738:
- .loc 10 327 0
+ .loc 10 333 0
movl $-1431655765, %edx
mull %edx
- shrl %edx
- leal 8355840(%edx), %ebx
+ shrl $4, %edx
+ leal 1044480(%edx), %ebx
.LVL545:
- sall $9, %ebx
+ sall $12, %ebx
.LBE738:
.LBE741:
.loc 1 1179 0
diff -r a0b5f8102a00 xen/include/asm-x86/mm.h
--- a/xen/include/asm-x86/mm.h Tue Aug 28 22:40:45 2012 +0100
+++ b/xen/include/asm-x86/mm.h Wed Aug 29 16:44:58 2012 +0100
@@ -323,6 +323,13 @@ static inline struct page_info *__virt_t
static inline void *__page_to_virt(const struct page_info *pg)
{
ASSERT((unsigned long)pg - FRAMETABLE_VIRT_START < FRAMETABLE_VIRT_END);
+ /* (sizeof(*pg) & -sizeof(*pg)) isolates the lowest set bit of
+ * sizeof(*pg), i.e. its largest power-of-2 factor. Dividing both
+ * the divisor and the multiplier by that factor does the easy part
+ * of the division as a shift, and folds the shifted-out power of 2
+ * back in via the multiplication. This is beneficial because gcc
+ * (at least 4.4.5) then generates a division by 3 instead of a
+ * division by 24, and the division by 3 is faster.
+ */
return (void *)(DIRECTMAP_VIRT_START +
((unsigned long)pg - FRAMETABLE_VIRT_START) /
(sizeof(*pg) / (sizeof(*pg) & -sizeof(*pg))) *
_______________________________________________
Xen-devel mailing list
Xen-devel@xxxxxxxxxxxxx
http://lists.xen.org/xen-devel
|
![]() |
Lists.xenproject.org is hosted with RackSpace, monitoring our |