Index: dyncall/dyncall_call_arm32_arm_armhf.S
--- dyncall/dyncall_call_arm32_arm_armhf.S.orig
+++ dyncall/dyncall_call_arm32_arm_armhf.S
@@ -59,7 +59,7 @@ ENTRY_C(dcCall_arm32_armhf)
 	add r5,  r1, #16 /* r5 = stack args (after intreg ones) */
 
 	/* Load 16 single-precision registers (= 8 double-precision registers). */
-	fldmiad r3, {d0-d7}
+	vldmia r3, {d0-d7}
 
 	/* prep stack parameter area (includes room for spill area, callee spills if needed) */
 	sub r13, r13, r2
@@ -77,7 +77,7 @@ armhf_pushArgs:
 
 armhf_call:
 	ldmia r1, {r0-r3}  /* Load first 4 arguments for new call into r0-r3. */
-	                   /* 'blx %r4' workaround for ARMv4t: */
+	                   /* 'blx r4' workaround for ARMv4t: */
 	mov r14, r15       /* Branch return address(r15) -> link register (r14) -- r15 always points to address of current + 2 instructions (= Epilog code). */ 
 	bx  r4             /* Call (ARM/THUMB), available for ARMv4t. */
 
