get_native_u2 & friends

Edward Nevill ed at camswl.com
Thu Feb 26 07:45:24 PST 2009


Hi all,

I think the best thing to do with get_native_u2 and friends is to let the compiler decide
how to access unaligned data. Most modern compilers have some facility for doing this.
In gcc you can use __attribute__((packed)) as follows.

typedef union unaligned {
	unsigned	u;
	unsigned short	us;
	unsigned long long ul;
} __attribute__((packed)) unaligned;

unsigned short get_native_u2(unaligned *p)
{
	return p->us;
}

unsigned get_native_u4(unaligned *p)
{
	return p->u;
}

unsigned long long get_native_u8(unaligned *p)
{
	return p->ul;
}

Below is the code generated for ARM and X86. Note that in the X86 case it just does the access
since X86 allows unaligned accesses whereas for ARM it goes ahead and doesbyte loads.

If on some architechture it is better to test the alignment and then do word/halfword loads if
the pointer is aligned and byte loads otherwise then hopefully the compiler will know the
best code to generate rarther than us trying to second guess what is best on individual
architectures.

Also, in many case these functions are called when it is known that the data is aligned as in
this example from _tableswitch...

      CASE(_tableswitch): {
          jint* lpc  = (jint*)VMalignWordUp(pc+1);
          int32_t  key  = STACK_INT(-1);
          int32_t  low  = Bytes::get_Java_u4((address)&lpc[1]);
          int32_t  high = Bytes::get_Java_u4((address)&lpc[2]);

Maybe it is worth having get_Java_u4() and get_Java_u4_unaligned()?

Regards,
Ed.


--- x86.s --------------------------------------------------------
	.file	"test.c"
	.text
	.p2align 4,,15
.globl get_native_u2
	.type	get_native_u2, @function
get_native_u2:
	pushl	%ebp
	movl	%esp, %ebp
	movl	8(%ebp), %eax
	popl	%ebp
	movzwl	(%eax), %eax
	ret
	.size	get_native_u2, .-get_native_u2
	.p2align 4,,15
.globl get_native_u4
	.type	get_native_u4, @function
get_native_u4:
	pushl	%ebp
	movl	%esp, %ebp
	movl	8(%ebp), %eax
	popl	%ebp
	movl	(%eax), %eax
	ret
	.size	get_native_u4, .-get_native_u4
	.p2align 4,,15
.globl get_native_u8
	.type	get_native_u8, @function
get_native_u8:
	pushl	%ebp
	movl	%esp, %ebp
	movl	8(%ebp), %eax
	popl	%ebp
	movl	4(%eax), %edx
	movl	(%eax), %eax
	ret
	.size	get_native_u8, .-get_native_u8
	.ident	"GCC: (GNU) 4.2.4 (Ubuntu 4.2.4-1ubuntu3)"
	.section	.note.GNU-stack,"", at progbits
--- arm.s -------------------------------------------------------------
	.arch armv5t
	.fpu softvfp
	.eabi_attribute 20, 1
	.eabi_attribute 21, 1
	.eabi_attribute 23, 3
	.eabi_attribute 24, 1
	.eabi_attribute 25, 1
	.eabi_attribute 26, 2
	.eabi_attribute 30, 2
	.eabi_attribute 18, 4
	.file	"test.c"
	.text
	.align	2
	.global	get_native_u2
	.type	get_native_u2, %function
get_native_u2:
	@ args = 0, pretend = 0, frame = 0
	@ frame_needed = 0, uses_anonymous_args = 0
	@ link register save eliminated.
	ldrb	r3, [r0, #1]	@ zero_extendqisi2
	ldrb	r0, [r0, #0]	@ zero_extendqisi2
	orr	r0, r0, r3, asl #8
	bx	lr
	.size	get_native_u2, .-get_native_u2
	.align	2
	.global	get_native_u4
	.type	get_native_u4, %function
get_native_u4:
	@ args = 0, pretend = 0, frame = 0
	@ frame_needed = 0, uses_anonymous_args = 0
	@ link register save eliminated.
	ldrb	r1, [r0, #1]	@ zero_extendqisi2
	ldrb	r3, [r0, #0]	@ zero_extendqisi2
	ldrb	r2, [r0, #2]	@ zero_extendqisi2
	ldrb	r0, [r0, #3]	@ zero_extendqisi2
	orr	r3, r3, r1, asl #8
	orr	r3, r3, r2, asl #16
	orr	r0, r3, r0, asl #24
	bx	lr
	.size	get_native_u4, .-get_native_u4
	.align	2
	.global	get_native_u8
	.type	get_native_u8, %function
get_native_u8:
	@ args = 0, pretend = 0, frame = 0
	@ frame_needed = 0, uses_anonymous_args = 0
	@ link register save eliminated.
	stmfd	sp!, {r4, r5, r6}
	ldrb	r5, [r0, #1]	@ zero_extendqisi2
	ldrb	r6, [r0, #5]	@ zero_extendqisi2
	ldrb	r3, [r0, #0]	@ zero_extendqisi2
	ldrb	ip, [r0, #2]	@ zero_extendqisi2
	ldrb	r1, [r0, #4]	@ zero_extendqisi2
	ldrb	r2, [r0, #6]	@ zero_extendqisi2
	ldrb	r4, [r0, #7]	@ zero_extendqisi2
	ldrb	r0, [r0, #3]	@ zero_extendqisi2
	orr	r3, r3, r5, asl #8
	orr	r1, r1, r6, asl #8
	orr	r3, r3, ip, asl #16
	orr	r1, r1, r2, asl #16
	orr	r0, r3, r0, asl #24
	orr	r1, r1, r4, asl #24
	ldmfd	sp!, {r4, r5, r6}
	bx	lr
	.size	get_native_u8, .-get_native_u8
	.ident	"GCC: (Ubuntu 4.3.3-1ubuntu1) 4.3.3"
	.section	.note.GNU-stack,"",%progbits



More information about the zero-dev mailing list