New atari/tos version. Requires UCL 0.92.

committer: mfx <mfx> 973825927 +0000
This commit is contained in:
Markus F.X.J. Oberhumer 2000-11-10 03:12:07 +00:00
parent 6a4d9475f2
commit 30cd0816fd
3 changed files with 137 additions and 72 deletions

View File

@ -153,11 +153,6 @@ bool PackTos::checkFileHeader()
throwCantPack("I won't pack F_OS_SPECIAL programs"); throwCantPack("I won't pack F_OS_SPECIAL programs");
if ((f & F_PROTMODE) > F_PROT_I) if ((f & F_PROTMODE) > F_PROT_I)
throwCantPack("invalid protection mode"); throwCantPack("invalid protection mode");
if (f & F_MEMFLAGS)
{
if (opt->force < 1)
throwCantPack("invalid memory flags; use option `-f' to force packing");
}
if ((f & F_PROTMODE) != F_PROT_P) if ((f & F_PROTMODE) != F_PROT_P)
{ {
if (opt->force < 1) if (opt->force < 1)
@ -180,20 +175,62 @@ bool PackTos::checkFileHeader()
} }
void PackTos::patch_d0_subq(void *l, int llen, /*************************************************************************
const char *d0_old, const char *subq_old, //
unsigned d0_new) **************************************************************************/
unsigned PackTos::patch_d0_subq(void *l, int llen, unsigned d0,
const char *subq_marker)
{ {
void *p; // patch a "subq.l #1,d0" or "subq.w #1,d0".
// patch "subq.l #1,d0" or "subq.w #1,d0" // also convert into "dbra" if possible
p = find_be16(l, llen, get_be16(subq_old)); upx_byte *p;
checkPatch(l, p, 2);
set_be16(p, d0_new > 65535 ? 0x5380 : 0x5340); assert((int)d0 > 0);
// p = find_be16(l, llen, get_be16(subq_marker));
p = find_be32(l, llen, get_be32(d0_old));
if (p[2] == 0x66) // bne.b XXX
checkPatch(l, p, 4);
else
checkPatch(l, p, 2);
if (d0 > 65536)
{
set_be16(p, 0x5380); // subq.l #1,d0
}
else
{
if (p[2] == 0x66) // bne.b XXX
{
set_be16(p, 0x51c8); // dbra d0,XXX
// adjust and extend branch from 8 to 16 bits
int branch = (signed char) p[3];
set_be16(p+2, branch+2);
// adjust d0
d0 -= 1;
}
else
{
set_be16(p, 0x5340); // subq.w #1,d0
}
d0 &= 0xffff;
}
return d0;
}
unsigned PackTos::patch_d0_loop(void *l, int llen, unsigned d0,
const char *d0_marker, const char *subq_marker)
{
upx_byte *p;
d0 = patch_d0_subq(l, llen, d0, subq_marker);
p = find_be32(l, llen, get_be32(d0_marker));
assert(get_be16(p - 2) == 0x203c); // move.l #XXXXXXXX,d0
checkPatch(l, p, 4); checkPatch(l, p, 4);
set_be32(p, d0_new); set_be32(p, d0);
assert(get_be16(p, -2) == 0x203c); // move.l #XXXXXXXX,d0 return d0;
} }
@ -289,9 +326,10 @@ void PackTos::pack(OutputFile *fo)
unsigned overlay = 0; unsigned overlay = 0;
const unsigned lsize = getLoaderSize(); const unsigned lsize = getLoaderSize();
const unsigned e_len = get_be16(getLoader()+lsize-4); const unsigned e_len = get_be16(getLoader()+lsize-6);
const unsigned d_len = get_be16(getLoader()+lsize-2); const unsigned d_len = get_be16(getLoader()+lsize-4);
assert(e_len + d_len == lsize - 4); const unsigned decomp_offset = get_be16(getLoader()+lsize-2);
assert(e_len + d_len == lsize - 6);
assert((e_len & 3) == 0 && (d_len & 1) == 0); assert((e_len & 3) == 0 && (d_len & 1) == 0);
const unsigned i_text = ih.fh_text; const unsigned i_text = ih.fh_text;
@ -429,11 +467,11 @@ void PackTos::pack(OutputFile *fo)
if (!opt->small) if (!opt->small)
patchVersion(loader,o_text); patchVersion(loader,o_text);
// patch "subq.l #1,d0" or "subq.w #1,d0" - see "up41" below // patch "subq.l #1,d0" or "subq.w #1,d0" - see "up41" below
patch_be16(loader,o_text,"u4", const unsigned dirty_bss_d0 =
dirty_bss / dirty_bss_align > 65535 ? 0x5380 : 0x5340); patch_d0_subq(loader, o_text, dirty_bss / dirty_bss_align, "u4");
patch_be32(loader,o_text,"up31",d_off + offset); patch_be32(loader,o_text,"up31",d_off + offset + decomp_offset);
if (opt->small) if (opt->small)
patch_d0_subq(loader,o_text,"up22","u1", o_data/4); patch_d0_loop(loader,o_text,o_data/4,"up22","u1");
else else
{ {
if (o_data <= 160) if (o_data <= 160)
@ -446,7 +484,7 @@ void PackTos::pack(OutputFile *fo)
loop2 = 160; loop2 = 160;
} }
patch_be16(loader,o_text,"u2", 0x7000 + loop2/4-1); // moveq.l #X,d0 patch_be16(loader,o_text,"u2", 0x7000 + loop2/4-1); // moveq.l #X,d0
patch_d0_subq(loader,o_text,"up22","u1", loop1); patch_d0_loop(loader,o_text,loop1,"up22","u1");
} }
patch_be32(loader,o_text,"up21",o_data + offset); patch_be32(loader,o_text,"up21",o_data + offset);
patch_be32(loader,o_text,"up13",i_bss); // p_blen patch_be32(loader,o_text,"up13",i_bss); // p_blen
@ -459,7 +497,7 @@ void PackTos::pack(OutputFile *fo)
upx_byte *p = obuf + d_off; upx_byte *p = obuf + d_off;
// patch "moveq.l #1,d3" or "jmp (a5)" // patch "moveq.l #1,d3" or "jmp (a5)"
patch_be16(p,d_len,"u3", (relocsize > 4) ? 0x7601 : 0x4ed5); patch_be16(p,d_len,"u3", (relocsize > 4) ? 0x7601 : 0x4ed5);
patch_be32(p,d_len,"up41", dirty_bss / dirty_bss_align); patch_be32(p,d_len,"up41", dirty_bss_d0);
// set new file_hdr // set new file_hdr
memcpy(&oh, &ih, FH_SIZE); memcpy(&oh, &ih, FH_SIZE);
@ -474,8 +512,8 @@ void PackTos::pack(OutputFile *fo)
oh.fh_text = o_text + o_data; oh.fh_text = o_text + o_data;
oh.fh_data = 0; oh.fh_data = 0;
} }
oh.fh_bss = o_bss; oh.fh_bss = o_bss;
oh.fh_sym = 0; oh.fh_sym = 0;
oh.fh_reserved = 0; oh.fh_reserved = 0;
// only keep the following flags: // only keep the following flags:
oh.fh_flag = ih.fh_flag & (F_FASTLOAD | F_ALTALLOC | F_SMALLTPA | F_ALLOCZERO | F_KEEP); oh.fh_flag = ih.fh_flag & (F_FASTLOAD | F_ALTALLOC | F_SMALLTPA | F_ALLOCZERO | F_KEEP);

View File

@ -72,7 +72,8 @@ protected:
} ih, oh; } ih, oh;
protected: protected:
void patch_d0_subq(void *l, int llen, const char*, const char*, unsigned); unsigned patch_d0_subq(void *l, int llen, unsigned, const char*);
unsigned patch_d0_loop(void *l, int llen, unsigned, const char*, const char*);
}; };

View File

@ -43,11 +43,16 @@
; ;
#ifdef __A68K__ #if defined(__A68K__)
# define align4 align 0,4 # define align4 align 0,4
# define L(label) \/**/label # define L(label) \/**/label
# define macro(name) name macro # define macro(name) name macro
# define text section code # define text section code
#elif defined(__ASL__)
# define align4 align 4
# define L(label) $$/**/label
# define macro(name) name macro
# define text section code
#else #else
# define align4 align 4 # define align4 align 4
# define L(label) ./**/label # define L(label) ./**/label
@ -61,18 +66,22 @@
; basepage offsets ; basepage offsets
p_lowtpa equ $0 ; .l p_lowtpa equ $0 ; .l pointer to self (bottom of TPA)
p_hitpa equ $4 ; .l p_hitpa equ $4 ; .l pointer to top of TPA + 1
p_tbase equ $8 ; .l p_tbase equ $8 ; .l base of text segment
p_tlen equ $c ; .l p_tlen equ $c ; .l length of text segment
p_dbase equ $10 ; .l p_dbase equ $10 ; .l base of data segment
p_dlen equ $14 ; .l p_dlen equ $14 ; .l length of data segment
p_bbase equ $18 ; .l p_bbase equ $18 ; .l base of BSS segment
p_blen equ $1c ; .l p_blen equ $1c ; .l length of BSS segment
p_dta equ $20 ; .l pointer to current DTA
p_parent equ $24 ; .l pointer to parent's basepage
p_flags equ $28 ; .l memory usage flags
p_env equ $2c ; .l pointer to environment string
#if 0 #if 0
; file header offsets (NOT USED) ; file header offsets (NOT USED)
fh_magic equ $0 ; .w $601a fh_magic equ $0 ; .w $601a
fh_text equ $2 ; .l fh_text equ $2 ; .l
fh_data equ $6 ; .l fh_data equ $6 ; .l
fh_bss equ $a ; .l fh_bss equ $a ; .l
@ -80,7 +89,7 @@ fh_sym equ $e ; .l
fh_reserved equ $12 ; .l fh_reserved equ $12 ; .l
fh_flag equ $16 ; .l fh_flag equ $16 ; .l
fh_reloc equ $1a ; .w fh_reloc equ $1a ; .w
FH_SIZE equ $1c ; 28 bytes FH_SIZE equ $1c ; 28 bytes
#endif #endif
; ;
@ -88,8 +97,8 @@ FH_SIZE equ $1c ; 28 bytes
; d4 p_tbase - start of text segment ; d4 p_tbase - start of text segment
; a6 p_bbase - start of decompressed bss segment, this also is the ; a6 p_bbase - start of decompressed bss segment, this also is the
; - end of decompressed text+data ; - end of decompressed text+data
; - beginning of decompressed relocations ; - start of decompressed relocations
; - beginning of dirty bss ; - start of dirty bss
; a5 final startup code copied below stack ; a5 final startup code copied below stack
; ;
@ -102,13 +111,18 @@ FH_SIZE equ $1c ; 28 bytes
; // are contiguous in memory ; // are contiguous in memory
; **************************************************************************/ ; **************************************************************************/
#if defined(__ASL__)
padding off
#endif
text text
dc.b 'UPX1' ; marker for o2bin.pl dc.b 'UPX1' ; marker for o2bin.pl
start: start:
move.l a0,d0 ; a0 is basepage if accessory move.l a0,d0 ; a0 is basepage if accessory
beq L(l_app) beq L(l_app)
move.l 4(a0),sp ; accessory - get stack move.l 4(a0),sp ; accessory - get stack
bra L(start) bra L(start)
L(l_app): move.l 4(sp),d0 ; application - get basepage L(l_app): move.l 4(sp),d0 ; application - get basepage
L(start): movem.l d1-d7/a0-a6,-(sp) L(start): movem.l d1-d7/a0-a6,-(sp)
@ -187,54 +201,63 @@ L(loop2): move.l -(a1),-(a0)
copy_to_stack: copy_to_stack:
lea.l clear_bss_end(pc),a2 lea.l clear_bss_end(pc),a2
move.l sp,a5 move.l sp,a5
moveq.l #((clear_bss_end-clear_bss)/2),d0 moveq.l #((clear_bss_end-clear_bss)/2-1),d5
move.l d4,-(a5) ; entry point for final jmp move.l d4,-(a5) ; entry point for final jmp
L(loop): move.w -(a2),-(a5) L(loop): move.w -(a2),-(a5)
subq.w #1,d0 subq.l #1,d5
bne L(loop) bcc L(loop)
; note: now d0 is 0 ; note: d5.l is now -1 (needed for decompressor)
; ------------- prepare decompressor ; ------------- prepare decompressor
; a0 still points to the start of the compressed block ; a0 still points to the start of the compressed block
; note: the next statement can be moved below cutpoint
; if it helps for the align4
;;move.l d4,a1 ; dest. for decompressing
move.l d4,a1 ; dest. for decompressing move.l d4,a1 ; dest. for decompressing
#define NRV_NO_INIT
;;moveq.l #-1,d5 ; last_off = -1
moveq.l #-1,d7
moveq.l #-128,d0 ; d0.b = $80
#if defined(NRV2B)
moveq.l #-$68,d6 ; 0xffffff98
lsl.w #5,d6 ; 0xfffff300 == -0xd00
#elif defined(NRV2D)
moveq.l #-$50,d6 ; 0xffffffb0
lsl.w #4,d6 ; 0xfffffb00 == -0x500
#endif
; ------------- jump to copied decompressor ; ------------- jump to copied decompressor
move.l d4,a2 move.l d4,a2
add.l #'up31',a2 add.l #'up31',a2
jmp (a2) ; jmp cutpoint jmp (a2) ; jmp decompr_start
; /************************************************************************* ; /*************************************************************************
; // this is the final part of the startup code which runs in the stack ; // this is the final part of the startup code which runs in the stack
; **************************************************************************/ ; **************************************************************************/
; on entry d1 and d2 are 0
; ------------- clear dirty bss ; ------------- clear dirty bss
clear_bss: clear_bss:
; on entry d2 is 0
#if defined(SMALL) #if defined(SMALL)
L(loop): move.l d1,(a6)+ L(loop): move.l d2,(a6)+
;;subq.l #1,d0 ;;subq.l #1,d0
dc.b 'u4' ; subq.l #1,d0 / subq.w #1,d0 dc.b 'u4' ; subq.l #1,d0 / subq.w #1,d0
bne L(loop) bne L(loop)
#else #else
; the dirty bss is usually not too large, so we don't ; the dirty bss is usually not too large, so we don't
; bother making movem optimizations here ; bother making movem optimizations here
L(loop): move.l d1,(a6)+ L(loop): move.l d2,(a6)+
move.l d1,(a6)+ move.l d2,(a6)+
move.l d1,(a6)+ move.l d2,(a6)+
move.l d1,(a6)+ move.l d2,(a6)+
;;subq.l #1,d0 ;;subq.l #1,d0
dc.b 'u4' ; subq.l #1,d0 / subq.w #1,d0 dc.b 'u4' ; subq.l #1,d0 / subq.w #1,d0
bne L(loop) bne L(loop)
@ -243,13 +266,10 @@ L(loop): move.l d1,(a6)+
; ------------- start program ; ------------- start program
; note: d0.l is now 0
movem.l (sp)+,d1-d7/a0-a6 movem.l (sp)+,d1-d7/a0-a6
cmp.l d0,a0 move.l a0,d0
beq L(l_app) beq L(l_app)
;;suba.l sp,sp ; accessory: no stack sub.l sp,sp ; accessory: no stack
move.l d0,sp ; accessory: no stack
L(l_app): dc.w $4ef9 ; jmp $xxxxxxxx - jmp to text segment L(l_app): dc.w $4ef9 ; jmp $xxxxxxxx - jmp to text segment
clear_bss_end: clear_bss_end:
@ -264,12 +284,11 @@ clear_bss_end:
#else #else
# include "ident_n.ash" # include "ident_n.ash"
#endif #endif
even
align4 align4
dc.b 'UPX!' ; magic dc.b 'UPX!' ; magic
ds.b 28 ; #include "header.ash" dc.l 0,0,0,0,0,0,0 ; 28 bytes - #include "header.ash"
; end of text segment - size is a multiple of 4 ; end of text segment - size is a multiple of 4
@ -277,7 +296,8 @@ clear_bss_end:
; /************************************************************************* ; /*************************************************************************
; // This part is appended after the compressed data. ; // This part is appended after the compressed data.
; // It runs in the last part of the dirty bss (after the relocations). ; // It runs in the last part of the dirty bss (after the
; // relocations and the original fileheader).
; **************************************************************************/ ; **************************************************************************/
cutpoint: cutpoint:
@ -292,7 +312,7 @@ cutpoint:
# error # error
#endif #endif
; note: d1 and d2 are 0 from decompressor above ; note: d2 is 0 from decompressor above
; ------------- prepare d0 for clearing the dirty bss ; ------------- prepare d0 for clearing the dirty bss
@ -311,23 +331,25 @@ cutpoint:
; ------------- reloc ; ------------- reloc
reloc:
; The decompressed relocations now are just after the decompressed ; The decompressed relocations now are just after the decompressed
; data segment, i.e. at the beginning of the (dirty) bss. ; data segment, i.e. at the beginning of the (dirty) bss.
; note: d1 and d2 are still 0 ; note: d2 is still 0
move.l a6,a0 ; a0 = start of relocations move.l a6,a0 ; a0 = start of relocations
move.l d4,a1 move.l d4,a1
add.l (a0)+,a1 ; get initial fixup add.l (a0)+,a1 ; get initial fixup
L(loop1): add.l d1,a1 ; increase fixup L(loop1): add.l d2,a1 ; increase fixup
add.l d4,(a1) ; reloc one address add.l d4,(a1) ; reloc one address
L(loop2): move.b (a0)+,d1 L(loop2): move.b (a0)+,d2
beq reloc_end beq reloc_end
cmp.b d3,d1 ; note: d3.b is #1 cmp.b d3,d2 ; note: d3.b is #1
bne L(loop1) bne L(loop1)
lea 254(a1),a1 ; d1 == 1 -> add 254, don't reloc lea 254(a1),a1 ; d2 == 1 -> add 254, don't reloc
bra L(loop2) bra L(loop2)
reloc_end: reloc_end:
@ -338,7 +360,7 @@ reloc_end:
; We are currently running in the dirty bss. ; We are currently running in the dirty bss.
; Jump to the code we copied below the stack. ; Jump to the code we copied below the stack.
; note: d1 and d2 are still 0 ; note: d2 is still 0
jmp (a5) ; jmp clear_bss (on stack) jmp (a5) ; jmp clear_bss (on stack)
@ -347,8 +369,12 @@ reloc_end:
eof: eof:
dc.w cutpoint-start ; size of entry dc.w cutpoint-start ; size of entry
dc.w eof-cutpoint ; size of decompressor dc.w eof-cutpoint ; size of decompressor
dc.w decompr_start-cutpoint ; offset of decompressor start
dc.b 'UPX9' ; marker for o2bin.pl dc.b 'UPX9' ; marker for o2bin.pl
#if defined(__ASL__)
endsection code
#endif
end end