RE: [PATCH V2] Implement the -a option to pad dtb aligned

Wang Tim（王艇艇） <timwang@xxxxxxxxxxxx> · Fri, 1 Jul 2016 02:26:20 +0000

Hi David,
Thanks again for your careful review!
-------------------------------------------------------------------------------------------------

Your example is much better than my current solution!
I've used a similar method in my current solution.
Here is my code in the Makefile:

diff --git a/AndroidKernel.mk b/AndroidKernel.mk
index 3390949..c5d616b 100644
--- a/AndroidKernel.mk
+++ b/AndroidKernel.mk
@@ -3,6 +3,7 @@ KERNEL_OUT := $(TARGET_OUT_INTERMEDIATES)/KERNEL
 KERNEL_IMG_BUILT := $(KERNEL_OUT)/arch/$(KERNEL_ARCH)/boot/Image
 KERNEL_IMG_DTBS := $(KERNEL_OUT)/arch/$(KERNEL_ARCH)/boot/dts/asr
 KERNEL_MODULES_OUT := $(TARGET_ROOT_OUT)/lib/modules
+KERNEL_DTB_ALIGN_SIZE := 64
 
 JOBS := $(shell echo `cat /proc/cpuinfo | grep processor | wc -l` / 2 + 1 | bc)
 
@@ -15,4 +16,10 @@ linuxkernel:
        @-mkdir -p $(KERNEL_MODULES_OUT)
        @-find $(TARGET_OUT_INTERMEDIATES) -name *.ko | xargs -I{} cp {} $(KERNEL_MODULES_OUT)
 
-       cat $(KERNEL_IMG_DTBS)/* $(KERNEL_IMG_BUILT) > $(KERNEL_IMG)
+       # align dtb files based on 64 bytes for uboot load and parse
+       for orig_dtb_file in $(KERNEL_IMG_DTBS)/*.dtb; \
+       do \
+               cat $${orig_dtb_file} /dev/zero | head -c `expr \`ls -l $${orig_dtb_file} | awk -F' ' '{print $$5}'\` + $(KE
+       done
+
+       cat $(KERNEL_IMG_DTBS)/*.padded $(KERNEL_IMG_BUILT) > $(KERNEL_IMG)

But I still think that doing this in the Makefile is neither as good nor as simple as the "DTC -a align_base" approach.
If we use the -a option, we only need one line of code in the Makefile:
DTC_FLAGS ?= -a 64
Quite simple. What do you think? :)
----------------------------------------------------------------------------------------------------

I'm sorry for confusing you again.
Actually, I've done lots of tests since receiving your first mail.
Following your kind suggestion, I found that it was not only the -a + -p combination that was wrong.
The -a + -S combination was totally wrong as well: the previous patch would get a padlen < 0 if -S was given a size smaller than orig_size.

My current patch uses a new method to calculate the padlen after the -p operation, which does not add padsize twice.
I calculate the padlen_APPEND value with the expression:
padlen += ALIGN(tsize, align_size) - tsize;
/* padlen is the padsize from -p; padlen_APPEND is the padding added by -a */

------------------------
| orig_size     |
-----------------------
|padlen from -p |  /* at the end of this line, the offset is tsize after the -p operation, i.e. padlen = padsize and tsize = orig_size + padlen */
-----------------------
|padlen_APPEND|  /* this line comes from ALIGN(tsize, align_size), so it is only the size added by the -a option */
-------------------------
So we can get the final padlen += ALIGN(tsize, align_size) - tsize;

ALIGN(tsize, align_size) is the final size of the dtb file including both the -p and -a padding, since tsize already includes the -p padding.
Subtracting tsize from that final size gives the size added by the -a option, which is the padlen_APPEND size.
I'm not sure whether my explanation is clear enough.
Sorry for my poor English grammar.

Let's check the patch with debug logging added:
diff --git a/scripts/dtc/flattree.c b/scripts/dtc/flattree.c
index bd99fa2..52bce0c 100644
--- a/scripts/dtc/flattree.c
+++ b/scripts/dtc/flattree.c
@@ -396,22 +396,39 @@ void dt_to_blob(FILE *f, struct boot_info *bi, int version)
        /*
         * If the user asked for more space than is used, adjust the totalsize.
         */
+       fprintf(stderr, "orig_size: %d \n", fdt32_to_cpu(fdt.totalsize));
+
+       fprintf(stderr, "S: %d, p: %d, a: %d, padlen: %d \n", minsize, padsize, align_size, padlen);
        if (minsize > 0) {
                padlen = minsize - fdt32_to_cpu(fdt.totalsize);
-               if ((padlen < 0) && (quiet < 1))
+               if ((padlen < 0) && (quiet < 1)) {
                        fprintf(stderr,
                                "Warning: blob size %d >= minimum size %d\n",
                                fdt32_to_cpu(fdt.totalsize), minsize);
+                       padlen = 0;
+               }
        }
+       fprintf(stderr, "S: %d, p: %d, a: %d, padlen: %d \n", minsize, padsize, align_size, padlen);
 
        if (padsize > 0)
                padlen = padsize;
+       fprintf(stderr, "S: %d, p: %d, a: %d, padlen: %d \n", minsize, padsize, align_size, padlen);
 
        if (padlen > 0) {
                int tsize = fdt32_to_cpu(fdt.totalsize);
                tsize += padlen;
                fdt.totalsize = cpu_to_fdt32(tsize);
        }
+       fprintf(stderr, "S: %d, p: %d, a: %d, padlen: %d \n", minsize, padsize, align_size, padlen);
+
+       if (align_size > 0) {
+               int tsize = fdt32_to_cpu(fdt.totalsize);
+               padlen += ALIGN(tsize, align_size) - tsize;
+               tsize = ALIGN(tsize, align_size);
+               fdt.totalsize = cpu_to_fdt32(tsize);
+       }
+       fprintf(stderr, "S: %d, p: %d, a: %d, padlen: %d \n", minsize, padsize, align_size, padlen);
+       fprintf(stderr, "final_size: %d \n", fdt32_to_cpu(fdt.totalsize));
 
        /*
         * Assemble the blob: start with the header, add with alignment
Then, please check whether these test logs are right:
1. -p 1 -a 4
orig_size: 10171 
S: 0, p: 1, a: 4, padlen: 0 
S: 0, p: 1, a: 4, padlen: 0 
S: 0, p: 1, a: 4, padlen: 1 
S: 0, p: 1, a: 4, padlen: 1 
S: 0, p: 1, a: 4, padlen: 1 
final_size: 10172

2. -p 102 -a 4
orig_size: 10171 
S: 0, p: 102, a: 4, padlen: 0 
S: 0, p: 102, a: 4, padlen: 0 
S: 0, p: 102, a: 4, padlen: 102 
S: 0, p: 102, a: 4, padlen: 102 
S: 0, p: 102, a: 4, padlen: 105 
final_size: 10276

3. -S 10000 -a 4
orig_size: 10171 
S: 10000, p: 0, a: 4, padlen: 0 
Warning: blob size 10171 >= minimum size 10000
S: 10000, p: 0, a: 4, padlen: 0 
S: 10000, p: 0, a: 4, padlen: 0 
S: 10000, p: 0, a: 4, padlen: 0 
S: 10000, p: 0, a: 4, padlen: 1 
final_size: 10172

4. -S 99999 -a 4
orig_size: 10171 
S: 99999, p: 0, a: 4, padlen: 0 
S: 99999, p: 0, a: 4, padlen: 89828 
S: 99999, p: 0, a: 4, padlen: 89828 
S: 99999, p: 0, a: 4, padlen: 89828 
S: 99999, p: 0, a: 4, padlen: 89829 
final_size: 100000

5. -a 4
orig_size: 10171 
S: 0, p: 0, a: 4, padlen: 0 
S: 0, p: 0, a: 4, padlen: 0 
S: 0, p: 0, a: 4, padlen: 0 
S: 0, p: 0, a: 4, padlen: 0 
S: 0, p: 0, a: 4, padlen: 1 
final_size: 10172

-------------------------------------------------------------
About the dt_to_asm change:
The power of 2 means that if align_size is 64, the patch should look like this:
asm_emit_align(f, 6);

-------------------------------------------------------------------
Please check my latest patch (v3) for the -a option, and please help review it again.
Thanks in advance!

Best Regards
Tim Wang(王艇艇)


-----Original Message-----
From: David Gibson [mailto:david@xxxxxxxxxxxxxxxxxxxxx] 
Sent: Tuesday, June 28, 2016 1:29 PM
To: Wang Tim（王艇艇）
Cc: devicetree-compiler@xxxxxxxxxxxxxxx; wtt_usst@xxxxxxx
Subject: Re: [PATCH] Implement the -a option to pad dtb aligned

On Mon, Jun 27, 2016 at 08:49:37AM +0000, Wang Tim（王艇艇） wrote:
> Hi David,
> (It seems my previous mail was rejected by vger.kernel.org.)
> 
> Thanks for your kind review!
> About the usage of this patch: as far as I know, some Android phone and 
> Google TV SoC vendors or product vendors need such an option to cat 
> all dtb files together to support several products.
> For example, one SoC vendor may support two customers' products, each of 
> which uses a different screen panel and camera sensor, while most other 
> peripherals are the same as on the common board.
> We can use one kernel Image and several dtb files to support both of them.

Right, I see why you need the alignment in the output.  But it's pretty easy to introduce this as you produce the archive, without folding it into dtc.

For example:
	$ dd if=1.dtb bs=8 conv=sync of=dtbset
	$ dd if=2.dtb bs=8 conv=sync,notrunc oflag=append of=dtbset
	$ dd if=3.dtb bs=8 conv=sync,notrunc oflag=append of=dtbset
		.
		.
		.

Will create dtbset with all the dtbs aligned to 8 byte boundaries.

> The calculation for the -a option after -p/-S was totally wrong.
> I've fixed it in the attached patch file; please help review it again.
> 
> But I'm not sure whether my change to the dt_to_asm part is right.
> Please give me more details if my patch is wrong again.
> 
> Here is the updated patch:
> [PATCH] Implement the -a option to pad dtb aligned
> 
> There is a use case that requires concatenating the dtb files into one 
> dtb.img, which can support several boards that use the same SoC platform.
> 
> However, the original dtb file size is not aligned to any boundary.
> This may cause a "Synchronous Abort" when loading from an unaligned address 
> on some SoC machines, such as ARM.
> 
> So this patch implements the -a <aligned number> option to pad zeros at 
> the end of dtb files and make the dtb size aligned to <aligned 
> number>.
> 
> Then the aligned dtbs can be concatenated and loaded without a "Synchronous 
> Abort".
> 
> Signed-off-by: Tim Wang <timwang@xxxxxxxxxxxx>
> ---
>  dtc.c      |  9 ++++++++-
>  dtc.h      |  1 +
>  flattree.c | 13 ++++++++++++-
>  3 files changed, 21 insertions(+), 2 deletions(-)
> 
> diff --git a/dtc.c b/dtc.c
> index 5fa23c4..1749d26 100644
> --- a/dtc.c
> +++ b/dtc.c
> @@ -30,6 +30,7 @@ int quiet;		/* Level of quietness */
>  int reservenum;		/* Number of memory reservation slots */
>  int minsize;		/* Minimum blob size */
>  int padsize;		/* Additional padding to blob */
> +int align_size;		/* Additional padding to blob accroding to the align size */
>  int phandle_format = PHANDLE_BOTH;	/* Use linux,phandle or phandle properties */
>  
>  static void fill_fullpaths(struct node *tree, const char *prefix) @@ 
> -53,7 +54,7 @@ static void fill_fullpaths(struct node *tree, const char *prefix)
>  #define FDT_VERSION(version)	_FDT_VERSION(version)
>  #define _FDT_VERSION(version)	#version
>  static const char usage_synopsis[] = "dtc [options] <input file>"; 
> -static const char usage_short_opts[] = 
> "qI:O:o:V:d:R:S:p:fb:i:H:sW:E:hv";
> +static const char usage_short_opts[] = 
> +"qI:O:o:V:d:R:S:p:a:fb:i:H:sW:E:hv";
>  static struct option const usage_long_opts[] = {
>  	{"quiet",            no_argument, NULL, 'q'},
>  	{"in-format",         a_argument, NULL, 'I'},
> @@ -64,6 +65,7 @@ static struct option const usage_long_opts[] = {
>  	{"reserve",           a_argument, NULL, 'R'},
>  	{"space",             a_argument, NULL, 'S'},
>  	{"pad",               a_argument, NULL, 'p'},
> +	{"align",             a_argument, NULL, 'a'},
>  	{"boot-cpu",          a_argument, NULL, 'b'},
>  	{"force",            no_argument, NULL, 'f'},
>  	{"include",           a_argument, NULL, 'i'},
> @@ -91,6 +93,7 @@ static const char * const usage_opts_help[] = {
>  	"\n\tMake space for <number> reserve map entries (for dtb and asm output)",
>  	"\n\tMake the blob at least <bytes> long (extra space)",
>  	"\n\tAdd padding to the blob of <bytes> long (extra space)",
> +	"\n\tMake the blob align to the <bytes> (extra space)",
>  	"\n\tSet the physical boot cpu",
>  	"\n\tTry to produce output even if the input tree has errors",
>  	"\n\tAdd a path to search for include files", @@ -169,6 +172,7 @@ 
> int main(int argc, char *argv[])
>  	reservenum = 0;
>  	minsize    = 0;
>  	padsize    = 0;
> +	align_size = 0;
>  
>  	while ((opt = util_getopt_long()) != EOF) {
>  		switch (opt) {
> @@ -196,6 +200,9 @@ int main(int argc, char *argv[])
>  		case 'p':
>  			padsize = strtol(optarg, NULL, 0);
>  			break;
> +		case 'a':
> +			align_size = strtol(optarg, NULL, 0);
> +			break;
>  		case 'f':
>  			force = true;
>  			break;
> diff --git a/dtc.h b/dtc.h
> index 56212c8..b406d21 100644
> --- a/dtc.h
> +++ b/dtc.h
> @@ -53,6 +53,7 @@ extern int quiet;		/* Level of quietness */
>  extern int reservenum;		/* Number of memory reservation slots */
>  extern int minsize;		/* Minimum blob size */
>  extern int padsize;		/* Additional padding to blob */
> +extern int align_size;		/* Additional padding to blob accroding to the align size */
>  extern int phandle_format;	/* Use linux,phandle or phandle properties */
>  
>  #define PHANDLE_LEGACY	0x1
> diff --git a/flattree.c b/flattree.c
> index ec14954..29f0a54 100644
> --- a/flattree.c
> +++ b/flattree.c
> @@ -398,10 +398,12 @@ void dt_to_blob(FILE *f, struct boot_info *bi, int version)
>  	 */
>  	if (minsize > 0) {
>  		padlen = minsize - fdt32_to_cpu(fdt.totalsize);
> -		if ((padlen < 0) && (quiet < 1))
> +		if ((padlen < 0) && (quiet < 1)) {
>  			fprintf(stderr,
>  				"Warning: blob size %d >= minimum size %d\n",
>  				fdt32_to_cpu(fdt.totalsize), minsize);
> +			padlen = 0;
> +		}
>  	}
>  
>  	if (padsize > 0)
> @@ -413,6 +415,13 @@ void dt_to_blob(FILE *f, struct boot_info *bi, int version)
>  		fdt.totalsize = cpu_to_fdt32(tsize);
>  	}
>  
> +	if (align_size > 0) {
> +		int tsize = fdt32_to_cpu(fdt.totalsize);
> +		padlen += ALIGN(tsize, align_size) - tsize;
> +		tsize = ALIGN(tsize, align_size);
> +		fdt.totalsize = cpu_to_fdt32(tsize);
> +	}
> +

This is still wrong.  The previous if already increased totalsize by padlen.  Now you've adjusted padlen and added it to totalsize again.

Please, actually test this with both -p and -a options.

>  	/*
>  	 * Assemble the blob: start with the header, add with alignment
>  	 * the reserve buffer, add the reserve map terminating zeroes, @@ 
> -478,6 +487,8 @@ void dt_to_asm(FILE *f, struct boot_info *bi, int version)
>  	fprintf(f, "/* autogenerated by dtc, do not edit */\n\n");
>  
>  	emit_label(f, symprefix, "blob_start");
> +	if (align_size > 0)
> +		asm_emit_align(f, align_size);

This is correct, as long as align_size is a power of two - otherwise it will probably cause an assembler error.

>  	emit_label(f, symprefix, "header");
>  	fprintf(f, "\t/* magic */\n");
>  	asm_emit_cell(f, FDT_MAGIC);

-- 
David Gibson			| I'll have my music baroque, and my code
david AT gibson.dropbear.id.au	| minimalist, thank you.  NOT _the_ _other_
				| _way_ _around_!
http://www.ozlabs.org/~dgibson
��.n��������+%������w��{.n����z�{��z��^n�r������&��z�ޗ�zf���h���~����������_��+v���)ߣ�