| /*************************************************************************** |
| * __________ __ ___. |
| * Open \______ \ ____ ____ | | _\_ |__ _______ ___ |
| * Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ / |
| * Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < < |
| * Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \ |
| * \/ \/ \/ \/ \/ |
| * $Id$ |
| * |
| * Copyright (C) 2004 by Jens Arnold |
| * |
| * This program is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU General Public License |
| * as published by the Free Software Foundation; either version 2 |
| * of the License, or (at your option) any later version. |
| * |
| * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY |
| * KIND, either express or implied. |
| * |
| ****************************************************************************/ |
| |
| .section .icode,"ax",@progbits |
| |
| .align 2 /* this aligns to 2^2=4 byte bounday */ |
| .global _descramble |
| .type _descramble,@function |
| |
| /* Descramble a block of byte data, from source to dest, processing len |
| * bytes. Size only limited by the len argument. Note that len must |
| * be an even multiple of 4 (something rolo_load() already assumes. |
| * (Does the Archos firmware loader also require that?). |
| * |
| * Returns the 16-bit "sum" checksum of the descrambled data. |
| * |
| * Arguments: |
| * r4 - source (unsigned char*) |
| * r5 - dest (unsigned char*) |
| * r6 - len (unsigned int) |
| * |
| * Register usage: |
| * r0 - data |
| * r1 - temp |
| * r2 - checksum |
| * r3 - current src address |
| * r4 - source |
| * r5 - dest |
| * r6 - len -> source_end |
| * r7 - dest_end |
| * r8 - len / 4 |
| */ |
| |
| _descramble: |
| mov.l r8,@-r15 |
| mov r6,r8 |
| shlr2 r8 /* r8 = len / 4 */ |
| mov r5,r7 |
| add r6,r7 /* dest_end = dest + len */ |
| add r4,r6 /* source_end = source + len */ |
| mov r4,r3 /* addr = source */ |
| mov #0,r2 /* checksum = 0 */ |
| |
| .loop: |
| mov.b @r3,r0 /* data = *addr */ |
| add r8,r3 /* addr += len / 4 */ |
| extu.b r0,r0 /* zero extend data byte */ |
| swap.b r0,r1 /* byte swap low word to temp */ |
| or r1,r0 /* r0's two lower bytes now identical */ |
| shlr r0 /* -> this equals "rotr.b r0" now */ |
| not r0,r0 /* negate */ |
| extu.b r0,r0 /* zero extend low byte (only needed for sum) */ |
| mov.b r0,@r5 /* *dest = data */ |
| add r0,r2 /* checksum += data */ |
| add #1,r5 /* dest++ */ |
| cmp/hi r3,r6 /* addr < source_end ? */ |
| bt .loop |
| |
| add #1,r4 /* source++ */ |
| mov r4,r3 /* addr = source */ |
| cmp/hi r5,r7 /* dest < dest_end */ |
| bt .loop |
| |
| /* 15 clock cycles if no reset of source address, 19 if reset, |
| * avg. 16 cycles per byte. Magnus' Version needed 17-22 cycles per byte |
| */ |
| |
| mov.l @r15+,r8 |
| rts |
| extu.w r2,r0 |
| |
| |
| /* Move len bytes from source to dest (which must be suitably aligned for |
| * long moves) and jump to dest + 0x200. |
| * |
| * Arguments: |
| * r4 - source |
| * r5 - dest |
| * r6 - len |
| */ |
| |
| .align 2 |
| .global _rolo_restart |
| .type _rolo_restart,@function |
| |
| _rolo_restart: |
| mov r5,r0 |
| sub r4,r0 /* r0 = dest - source */ |
| add #-4,r0 /* adjust for early increment */ |
| add r4,r6 /* r6 = source + len */ |
| |
| .copy: /* loop takes 6 cycles per longword */ |
| mov.l @r4+,r1 |
| cmp/hi r4,r6 |
| mov.l r1,@(r0,r4) |
| bt .copy |
| |
| mov.l @r5+,r0 /* start address from image */ |
| jmp @r0 |
| mov.l @r5+,r15 /* stack pointer from image */ |
| |
| .end: |
| .size _descramble,.end-_descramble |