Re: [PATCH v8 11/28] x86/asm/head: annotate data appropriatelly

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



> Subject: Re: [PATCH v8 11/28] x86/asm/head: annotate data appropriatelly

appropriately

On Thu, Aug 08, 2019 at 12:38:37PM +0200, Jiri Slaby wrote:
> Use the new SYM_DATA, SYM_DATA_START, and SYM_DATA_END in both 32 and 64
> bit heads.  In the 64-bit version, define also
> SYM_DATA_START_PAGE_ALIGNED locally using the new SYM_START. It is used
> in the code instead of NEXT_PAGE() which was defined in this file and
> has been using the obsolete macro GLOBAL().
> 
> Now, the data in the 64-bit object file look sane:
> Value   Size Type    Bind   Vis      Ndx Name
>   0000  4096 OBJECT  GLOBAL DEFAULT   15 init_level4_pgt
>   1000  4096 OBJECT  GLOBAL DEFAULT   15 level3_kernel_pgt
>   2000  2048 OBJECT  GLOBAL DEFAULT   15 level2_kernel_pgt
>   3000  4096 OBJECT  GLOBAL DEFAULT   15 level2_fixmap_pgt
>   4000  4096 OBJECT  GLOBAL DEFAULT   15 level1_fixmap_pgt
>   5000     2 OBJECT  GLOBAL DEFAULT   15 early_gdt_descr
>   5002     8 OBJECT  LOCAL  DEFAULT   15 early_gdt_descr_base
>   500a     8 OBJECT  GLOBAL DEFAULT   15 phys_base
>   0000     8 OBJECT  GLOBAL DEFAULT   17 initial_code
>   0008     8 OBJECT  GLOBAL DEFAULT   17 initial_gs
>   0010     8 OBJECT  GLOBAL DEFAULT   17 initial_stack
>   0000     4 OBJECT  GLOBAL DEFAULT   19 early_recursion_flag
>   1000  4096 OBJECT  GLOBAL DEFAULT   19 early_level4_pgt
>   2000 0x40000 OBJECT  GLOBAL DEFAULT   19 early_dynamic_pgts
>   0000  4096 OBJECT  GLOBAL DEFAULT   22 empty_zero_page
> 
> All have correct size and type.

Nice.

> 
> Note, that we can now see that it might be worth pushing
> early_recursion_flag after early_dynamic_pgts -- we are wasting almost
> 4K of .init.data.

Yes, please do in a separate patch which can even go separately. I get
here:

---
Disassembly of section .init.data:

ffffffff82684000 <early_recursion_flag>:
        ...

ffffffff82685000 <early_top_pgt>:
        ...

ffffffff82686000 <early_dynamic_pgts>:
        ...

ffffffff826c6000 <next_early_pgt>:
        ...

ffffffff826c6020 <initcall_level_names>:
---


vs


---
Disassembly of section .init.data:

ffffffff82684000 <early_top_pgt>:
        ...

ffffffff82685000 <early_dynamic_pgts>:
        ...

ffffffff826c5000 <early_recursion_flag>:
ffffffff826c5000:       00 00                   add    %al,(%rax)
        ...

ffffffff826c5004 <next_early_pgt>:
        ...

ffffffff826c5020 <initcall_level_names>:
---

That's exactly 4K saved.


> Signed-off-by: Jiri Slaby <jslaby@xxxxxxx>
> Cc: Thomas Gleixner <tglx@xxxxxxxxxxxxx>
> Cc: Ingo Molnar <mingo@xxxxxxxxxx>
> Cc: "H. Peter Anvin" <hpa@xxxxxxxxx>
> Cc: x86@xxxxxxxxxx
> ---
>  arch/x86/kernel/head_32.S | 29 ++++++++-------
>  arch/x86/kernel/head_64.S | 78 +++++++++++++++++++++------------------
>  2 files changed, 58 insertions(+), 49 deletions(-)
> 
> diff --git a/arch/x86/kernel/head_32.S b/arch/x86/kernel/head_32.S
> index 0bae769b7b59..2d5390d84467 100644
> --- a/arch/x86/kernel/head_32.S
> +++ b/arch/x86/kernel/head_32.S
> @@ -502,8 +502,7 @@ ENDPROC(early_ignore_irq)
>  
>  __INITDATA
>  	.align 4
> -GLOBAL(early_recursion_flag)
> -	.long 0
> +SYM_DATA(early_recursion_flag, .long 0)
>  
>  __REFDATA
>  	.align 4
> @@ -551,7 +550,7 @@ EXPORT_SYMBOL(empty_zero_page)
>  __PAGE_ALIGNED_DATA
>  	/* Page-aligned for the benefit of paravirt? */
>  	.align PGD_ALIGN
> -ENTRY(initial_page_table)
> +SYM_DATA_START(initial_page_table)
>  	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR),0	/* low identity map */
>  # if KPMDS == 3
>  	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR),0
> @@ -569,17 +568,18 @@ ENTRY(initial_page_table)
>  #  error "Kernel PMDs should be 1, 2 or 3"
>  # endif
>  	.align PAGE_SIZE		/* needs to be page-sized too */
> +SYM_DATA_END(initial_page_table)
>  #endif
>  
>  .data
>  .balign 4
> -ENTRY(initial_stack)
> -	/*
> -	 * The SIZEOF_PTREGS gap is a convention which helps the in-kernel
> -	 * unwinder reliably detect the end of the stack.
> -	 */
> -	.long init_thread_union + THREAD_SIZE - SIZEOF_PTREGS - \
> -	      TOP_OF_KERNEL_STACK_PADDING;
> +/*
> + * The SIZEOF_PTREGS gap is a convention which helps the in-kernel unwinder
> + * reliably detect the end of the stack.
> + */
> +SYM_DATA(initial_stack,
> +		.long init_thread_union + THREAD_SIZE -
> +		SIZEOF_PTREGS - TOP_OF_KERNEL_STACK_PADDING)
>  
>  __INITRODATA
>  int_msg:
> @@ -600,22 +600,25 @@ int_msg:
>  	ALIGN
>  # early boot GDT descriptor (must use 1:1 address mapping)
>  	.word 0				# 32 bit align gdt_desc.address
> -boot_gdt_descr:
> +SYM_DATA_START(boot_gdt_descr)
>  	.word __BOOT_DS+7
>  	.long boot_gdt - __PAGE_OFFSET
> +SYM_DATA_END(boot_gdt_descr)

So there's one "globl boot_gdt_descr" above already and this turns into:

 .data
.globl boot_gdt_descr
^^^^^^^^^^^^^^^^^^^^^

 .align 4,0x90
 # early boot GDT descriptor (must use 1:1 address mapping)
 .word 0 # 32 bit align gdt_desc.address
.globl boot_gdt_descr ; ; boot_gdt_descr:
^^^^^^^^^^^^^^^^^^^^^

I guess you can remove the above one.

Also, this can be made a local symbol too.

>  # boot GDT descriptor (later on used by CPU#0):
>  	.word 0				# 32 bit align gdt_desc.address
> -ENTRY(early_gdt_descr)
> +SYM_DATA_START(early_gdt_descr)
>  	.word GDT_ENTRIES*8-1
>  	.long gdt_page			/* Overwritten for secondary CPUs */
> +SYM_DATA_END(early_gdt_descr)
>  
>  /*
>   * The boot_gdt must mirror the equivalent in setup.S and is
>   * used only for booting.
>   */
>  	.align L1_CACHE_BYTES
> -ENTRY(boot_gdt)
> +SYM_DATA_START(boot_gdt)
>  	.fill GDT_ENTRY_BOOT_CS,8,0
>  	.quad 0x00cf9a000000ffff	/* kernel 4GB code at 0x00000000 */
>  	.quad 0x00cf92000000ffff	/* kernel 4GB data at 0x00000000 */
> +SYM_DATA_END(boot_gdt)
> diff --git a/arch/x86/kernel/head_64.S b/arch/x86/kernel/head_64.S
> index 6fedcda37634..6661c76a2049 100644
> --- a/arch/x86/kernel/head_64.S
> +++ b/arch/x86/kernel/head_64.S
> @@ -260,16 +260,14 @@ END(start_cpu0)
>  	/* Both SMP bootup and ACPI suspend change these variables */
>  	__REFDATA
>  	.balign	8
> -	GLOBAL(initial_code)
> -	.quad	x86_64_start_kernel
> -	GLOBAL(initial_gs)
> -	.quad	INIT_PER_CPU_VAR(fixed_percpu_data)
> -	GLOBAL(initial_stack)
> -	/*
> -	 * The SIZEOF_PTREGS gap is a convention which helps the in-kernel
> -	 * unwinder reliably detect the end of the stack.
> -	 */
> -	.quad  init_thread_union + THREAD_SIZE - SIZEOF_PTREGS
> +SYM_DATA(initial_code,	.quad x86_64_start_kernel)
> +SYM_DATA(initial_gs,	.quad INIT_PER_CPU_VAR(fixed_percpu_data))

<---- newline here.

> +/*
> + * The SIZEOF_PTREGS gap is a convention which helps the in-kernel unwinder
> + * reliably detect the end of the stack.
> + */
> +SYM_DATA(initial_stack,
> +		.quad init_thread_union + THREAD_SIZE - SIZEOF_PTREGS)

No need to break that line.

...

-- 
Regards/Gruss,
    Boris.

Good mailing practices for 400: avoid top-posting and trim the reply.



[Index of Archives]     [Linux Kernel]     [Kernel Newbies]     [x86 Platform Driver]     [Netdev]     [Linux Wireless]     [Netfilter]     [Bugtraq]     [Linux Filesystems]     [Yosemite Discussion]     [MIPS Linux]     [ARM Linux]     [Linux Security]     [Linux RAID]     [Samba]     [Device Mapper]

  Powered by Linux