Fixed a crash when reading the DWARF information.
[clinton/Virtual-Jaguar-Rx.git] / src / blitter.cpp
CommitLineData
cf76e892
JPM
1//
2// Blitter core
3//
4// by James Hammons
5// (C) 2010 Underground Software
6//
7// JLH = James Hammons <jlhamm@acm.org>
8// JPM = Jean-Paul Mari <djipi.mari@gmail.com>
9//
10// Who When What
11// --- ---------- -----------------------------------------------------------
12// JLH 01/16/2010 Created this log ;-)
13// JPM 06/06/2016 Visual Studio support
14//
15
16//
17// I owe a debt of gratitude to Curt Vendel and to John Mathieson--to Curt
18// for supplying the Oberon ASIC nets and to John for making them available
19// to Curt. ;-) Without that excellent documentation which shows *exactly*
20// what's going on inside the TOM chip, we'd all still be guessing as to how
21// the wily blitter and other pieces of the Jaguar puzzle actually work.
22// Now how about those JERRY ASIC nets gentlemen...? [We have those now!] ;-)
23//
24
25#include "blitter.h"
26
27#include <stdlib.h>
28#include <stdio.h>
29#include <string.h>
30#include "jaguar.h"
31#include "log.h"
32//#include "memory.h"
33#include "settings.h"
34
35// Various conditional compilation goodies...
36
// Build-time switches for this file. USE_ORIGINAL_BLITTER guards the legacy
// pixel-at-a-time blitter code further down (the section opened by
// "#ifdef USE_ORIGINAL_BLITTER"). USE_BOTH_BLITTERS is derived: it is defined
// only when both USE_ORIGINAL_BLITTER and USE_MIDSUMMER_BLITTER_MKII are defined.
// NOTE(review): LOG_BLITS presumably enables per-blit logging; its users are
// not visible in this part of the file -- confirm before relying on it.
37//#define LOG_BLITS
38
39#define USE_ORIGINAL_BLITTER
40//#define USE_MIDSUMMER_BLITTER
41#define USE_MIDSUMMER_BLITTER_MKII
42
// Derive USE_BOTH_BLITTERS when both implementations are compiled in.
43#ifdef USE_ORIGINAL_BLITTER
44#ifdef USE_MIDSUMMER_BLITTER_MKII
45#define USE_BOTH_BLITTERS
46#endif
47#endif
48
49
50// External global variables
51
// Defined in another translation unit; not referenced in the visible part of
// this file.
52extern int jaguar_active_memory_dumps;
53
54// Local global variables
55
// NOTE(review): the four flags below have external linkage and are not used in
// the visible part of this file; they look like logging/status switches set or
// read elsewhere -- confirm against their users.
56int start_logging = 0;
57uint8_t blitter_working = 0;
58bool startConciseBlitLogging = false;
59bool logBlit = false;
60
61// Blitter register RAM (most of it is hidden from the user)
62
// 0x100 bytes of register backing store. The REG()/WREG() macros read and
// write it as big-endian 32-bit values at the byte offsets defined below.
63static uint8_t blitter_ram[0x100];
64
65// Other crapola
66
// When true, blitter_generic() and WRITE_PIXEL_16 emit extra WriteLog() traces.
67bool specialLog = false;
// Defined elsewhere; only referenced from commented-out code in the visible
// part of this file.
68extern int effect_start;
69extern int blit_start_log;
// Prototypes for the alternative blitter implementations (bodies not visible
// in this part of the file).
70void BlitterMidsummer(uint32_t cmd);
71void BlitterMidsummer2(void);
72
// REG(A): read the 32-bit value stored big-endian (most significant byte
// first) in blitter_ram[A..A+3].
// WREG(A,D): store D into blitter_ram[A..A+3] in the same big-endian layout.
// Both macros evaluate their arguments more than once, so do not pass
// expressions with side effects.
73#define REG(A) (((uint32_t)blitter_ram[(A)] << 24) | ((uint32_t)blitter_ram[(A)+1] << 16) \
74 | ((uint32_t)blitter_ram[(A)+2] << 8) | (uint32_t)blitter_ram[(A)+3])
75#define WREG(A,D) (blitter_ram[(A)] = ((D)>>24)&0xFF, blitter_ram[(A)+1] = ((D)>>16)&0xFF, \
76 blitter_ram[(A)+2] = ((D)>>8)&0xFF, blitter_ram[(A)+3] = (D)&0xFF)
77
78// Blitter registers (offsets from F02200)
79
// Byte offsets into blitter_ram, intended to be used with REG()/WREG().
// Offsets up to PIXLINECOUNTER are 4 bytes apart; SRCDATA through PATTERNDATA
// are 8 bytes apart, and the READ_RDATA_* macros read the second 32-bit half
// of those registers at offset + 4.
80#define A1_BASE ((uint32_t)0x00)
81#define A1_FLAGS ((uint32_t)0x04) // Bits 3-5: pixel depth code; bits 18-20: YADD1/XSIGNSUB/YSIGNSUB (see macros below)
82#define A1_CLIP ((uint32_t)0x08) // Height and width values for clipping
83#define A1_PIXEL ((uint32_t)0x0C) // Integer part of the pixel (Y.i and X.i)
84#define A1_STEP ((uint32_t)0x10) // Integer part of the step
85#define A1_FSTEP ((uint32_t)0x14) // Fractional part of the step
86#define A1_FPIXEL ((uint32_t)0x18) // Fractional part of the pixel (Y.f and X.f)
87#define A1_INC ((uint32_t)0x1C) // Integer part of the increment
88#define A1_FINC ((uint32_t)0x20) // Fractional part of the increment
89#define A2_BASE ((uint32_t)0x24)
90#define A2_FLAGS ((uint32_t)0x28) // Same bit layout as A1_FLAGS as far as the macros in this file use it
91#define A2_MASK ((uint32_t)0x2C) // Modulo values for x and y (M.y and M.x)
92#define A2_PIXEL ((uint32_t)0x30) // Integer part of the pixel (no fractional part for A2)
93#define A2_STEP ((uint32_t)0x34) // Integer part of the step (no fractional part for A2)
94#define COMMAND ((uint32_t)0x38)
95#define PIXLINECOUNTER ((uint32_t)0x3C) // Inner & outer loop values
96#define SRCDATA ((uint32_t)0x40)
97#define DSTDATA ((uint32_t)0x48)
98#define DSTZ ((uint32_t)0x50)
99#define SRCZINT ((uint32_t)0x58)
100#define SRCZFRAC ((uint32_t)0x60)
101#define PATTERNDATA ((uint32_t)0x68)
102#define INTENSITYINC ((uint32_t)0x70)
103#define ZINC ((uint32_t)0x74)
104#define COLLISIONCTRL ((uint32_t)0x78)
105#define PHRASEINT0 ((uint32_t)0x7C)
106#define PHRASEINT1 ((uint32_t)0x80)
107#define PHRASEINT2 ((uint32_t)0x84)
108#define PHRASEINT3 ((uint32_t)0x88)
109#define PHRASEZ0 ((uint32_t)0x8C)
110#define PHRASEZ1 ((uint32_t)0x90)
111#define PHRASEZ2 ((uint32_t)0x94)
112#define PHRASEZ3 ((uint32_t)0x98)
113
114// Blitter command bits
115
// Each macro tests one bit of a variable named `cmd` that must be in scope at
// the point of use (blitter_generic() takes it as its parameter). The result
// is the masked bit itself (zero or the bit value), not a normalised 0/1.
// The literal mask 0x0001C020 used in blitter_generic() is
// PATDSEL | TOPBEN | TOPNEN | DSTWRZ.
116#define SRCEN (cmd & 0x00000001)
117#define SRCENZ (cmd & 0x00000002)
118#define SRCENX (cmd & 0x00000004)
119#define DSTEN (cmd & 0x00000008)
120#define DSTENZ (cmd & 0x00000010)
121#define DSTWRZ (cmd & 0x00000020)
122#define CLIPA1 (cmd & 0x00000040)
123
// Address-update enables.
124#define UPDA1F (cmd & 0x00000100)
125#define UPDA1 (cmd & 0x00000200)
126#define UPDA2 (cmd & 0x00000400)
127
// Set when A2 is the destination (data moves A1 -> A2); clear for A1 <- A2.
128#define DSTA2 (cmd & 0x00000800)
129
// Z comparator: inhibit the write when source Z is <, ==, > destination Z.
130#define Z_OP_INF (cmd & 0x00040000)
131#define Z_OP_EQU (cmd & 0x00080000)
132#define Z_OP_SUP (cmd & 0x00100000)
133
// Logic function unit terms: ~s&~d, ~s&d, s&~d, s&d. The enabled terms are
// OR-ed together to form the write data.
134#define LFU_NAN (cmd & 0x00200000)
135#define LFU_NA (cmd & 0x00400000)
136#define LFU_AN (cmd & 0x00800000)
137#define LFU_A (cmd & 0x01000000)
138
// Comparator controls.
139#define CMPDST (cmd & 0x02000000)
140#define BCOMPEN (cmd & 0x04000000)
141#define DCOMPEN (cmd & 0x08000000)
142
// Write-data source selection and shading controls.
143#define PATDSEL (cmd & 0x00010000)
144#define ADDDSEL (cmd & 0x00020000)
145#define TOPBEN (cmd & 0x00004000)
146#define TOPNEN (cmd & 0x00008000)
147#define BKGWREN (cmd & 0x10000000)
148#define GOURD (cmd & 0x00001000)
149#define GOURZ (cmd & 0x00002000)
150#define SRCSHADE (cmd & 0x40000000)
151
152
// X add control codes.
// NOTE(review): presumably the values held in xadd_a1_control /
// xadd_a2_control; their decoding is not visible in this part of the file.
153#define XADDPHR 0
154#define XADDPIX 1
155#define XADD0 2
156#define XADDINC 3
157
// Bit 19 of the A1/A2 flags register (re-read from blitter_ram on every use).
158#define XSIGNSUB_A1 (REG(A1_FLAGS)&0x080000)
159#define XSIGNSUB_A2 (REG(A2_FLAGS)&0x080000)
160
// Bit 20 of the A1/A2 flags register.
161#define YSIGNSUB_A1 (REG(A1_FLAGS)&0x100000)
162#define YSIGNSUB_A2 (REG(A2_FLAGS)&0x100000)
163
// Bit 18 of the A1/A2 flags register.
164#define YADD1_A1 (REG(A1_FLAGS)&0x040000)
165#define YADD1_A2 (REG(A2_FLAGS)&0x040000)
166
167/*******************************************************************************
168********************** STUFF CUT BELOW THIS LINE! ******************************
169*******************************************************************************/
170#ifdef USE_ORIGINAL_BLITTER // We're ditching this crap for now...
171
172//Put 'em back, once we fix the problem!!! [KO]
// Pixel read macros.
//
// The argument `a` is a token prefix (a1 or a2); each macro pastes it onto
// _x, _y, _width, _pitch and _addr, so variables with those names must be in
// scope. a##_x and a##_y are shifted right by 16 to obtain the integer pixel
// coordinate. PIXEL_OFFSET_n yields an offset in units of the access size
// (bytes for 1-8 bpp; the 16 and 32 bpp readers shift it left by 1 or 2 to get
// a byte offset) and PIXEL_SHIFT_n yields the bit position of the pixel inside
// the byte that was read. All reads pass BLITTER as the last argument to the
// Jaguar memory accessors.
173// 1 bpp pixel read
174#define PIXEL_SHIFT_1(a) (((~a##_x) >> 16) & 7)
175#define PIXEL_OFFSET_1(a) (((((uint32_t)a##_y >> 16) * a##_width / 8) + (((uint32_t)a##_x >> 19) & ~7)) * (1 + a##_pitch) + (((uint32_t)a##_x >> 19) & 7))
176#define READ_PIXEL_1(a) ((JaguarReadByte(a##_addr+PIXEL_OFFSET_1(a), BLITTER) >> PIXEL_SHIFT_1(a)) & 0x01)
177//#define READ_PIXEL_1(a) ((JaguarReadByte(a##_addr+PIXEL_OFFSET_1(a)) >> PIXEL_SHIFT_1(a)) & 0x01)
178
179// 2 bpp pixel read
180#define PIXEL_SHIFT_2(a) (((~a##_x) >> 15) & 6)
181#define PIXEL_OFFSET_2(a) (((((uint32_t)a##_y >> 16) * a##_width / 4) + (((uint32_t)a##_x >> 18) & ~7)) * (1 + a##_pitch) + (((uint32_t)a##_x >> 18) & 7))
182#define READ_PIXEL_2(a) ((JaguarReadByte(a##_addr+PIXEL_OFFSET_2(a), BLITTER) >> PIXEL_SHIFT_2(a)) & 0x03)
183//#define READ_PIXEL_2(a) ((JaguarReadByte(a##_addr+PIXEL_OFFSET_2(a)) >> PIXEL_SHIFT_2(a)) & 0x03)
184
185// 4 bpp pixel read
186#define PIXEL_SHIFT_4(a) (((~a##_x) >> 14) & 4)
187#define PIXEL_OFFSET_4(a) (((((uint32_t)a##_y >> 16) * (a##_width/2)) + (((uint32_t)a##_x >> 17) & ~7)) * (1 + a##_pitch) + (((uint32_t)a##_x >> 17) & 7))
188#define READ_PIXEL_4(a) ((JaguarReadByte(a##_addr+PIXEL_OFFSET_4(a), BLITTER) >> PIXEL_SHIFT_4(a)) & 0x0f)
189//#define READ_PIXEL_4(a) ((JaguarReadByte(a##_addr+PIXEL_OFFSET_4(a)) >> PIXEL_SHIFT_4(a)) & 0x0f)
190
191// 8 bpp pixel read
192#define PIXEL_OFFSET_8(a) (((((uint32_t)a##_y >> 16) * a##_width) + (((uint32_t)a##_x >> 16) & ~7)) * (1 + a##_pitch) + (((uint32_t)a##_x >> 16) & 7))
193#define READ_PIXEL_8(a) (JaguarReadByte(a##_addr+PIXEL_OFFSET_8(a), BLITTER))
194//#define READ_PIXEL_8(a) (JaguarReadByte(a##_addr+PIXEL_OFFSET_8(a)))
195
196// 16 bpp pixel read
197#define PIXEL_OFFSET_16(a) (((((uint32_t)a##_y >> 16) * a##_width) + (((uint32_t)a##_x >> 16) & ~3)) * (1 + a##_pitch) + (((uint32_t)a##_x >> 16) & 3))
198#define READ_PIXEL_16(a) (JaguarReadWord(a##_addr+(PIXEL_OFFSET_16(a)<<1), BLITTER))
199//#define READ_PIXEL_16(a) (JaguarReadWord(a##_addr+(PIXEL_OFFSET_16(a)<<1)))
200
201// 32 bpp pixel read
202#define PIXEL_OFFSET_32(a) (((((uint32_t)a##_y >> 16) * a##_width) + (((uint32_t)a##_x >> 16) & ~1)) * (1 + a##_pitch) + (((uint32_t)a##_x >> 16) & 1))
203#define READ_PIXEL_32(a) (JaguarReadLong(a##_addr+(PIXEL_OFFSET_32(a)<<2), BLITTER))
204//#define READ_PIXEL_32(a) (JaguarReadLong(a##_addr+(PIXEL_OFFSET_32(a)<<2)))
205
206// pixel read
// Dispatches on the depth code in bits 3-5 of the flags value f:
// 0..5 select 1, 2, 4, 8, 16 and 32 bpp; codes 6 and 7 yield 0.
// f is expanded once per comparison and is not parenthesised, so pass a
// parenthesised expression such as REG(A1_FLAGS).
207#define READ_PIXEL(a,f) (\
208 (((f>>3)&0x07) == 0) ? (READ_PIXEL_1(a)) : \
209 (((f>>3)&0x07) == 1) ? (READ_PIXEL_2(a)) : \
210 (((f>>3)&0x07) == 2) ? (READ_PIXEL_4(a)) : \
211 (((f>>3)&0x07) == 3) ? (READ_PIXEL_8(a)) : \
212 (((f>>3)&0x07) == 4) ? (READ_PIXEL_16(a)) : \
213 (((f>>3)&0x07) == 5) ? (READ_PIXEL_32(a)) : 0)
214
// Z data access macros. Z values are always read and written as 16-bit words;
// the flags argument f of READ_ZDATA/WRITE_ZDATA is accepted but ignored.
// The Z word is located a##_zoffs * 4 words past the 16 bpp pixel offset.
215// 16 bpp z data read
216#define ZDATA_OFFSET_16(a) (PIXEL_OFFSET_16(a) + a##_zoffs * 4)
217#define READ_ZDATA_16(a) (JaguarReadWord(a##_addr+(ZDATA_OFFSET_16(a)<<1), BLITTER))
218//#define READ_ZDATA_16(a) (JaguarReadWord(a##_addr+(ZDATA_OFFSET_16(a)<<1)))
219
220// z data read
221#define READ_ZDATA(a,f) (READ_ZDATA_16(a))
222
223// 16 bpp z data write
224#define WRITE_ZDATA_16(a,d) { JaguarWriteWord(a##_addr+(ZDATA_OFFSET_16(a)<<1), d, BLITTER); }
225//#define WRITE_ZDATA_16(a,d) { JaguarWriteWord(a##_addr+(ZDATA_OFFSET_16(a)<<1), d); }
226
227// z data write
// Note: this expansion already ends in ';', so "WRITE_ZDATA(...);" produces an
// extra empty statement. That is harmless on its own but would break an
// unbraced if/else that used this macro as the if-body.
228#define WRITE_ZDATA(a,f,d) WRITE_ZDATA_16(a,d);
229
// Register data ("r data") reads.
//
// READ_RDATA_n(r,a,p) extracts one n-bit pixel from the 64-bit register stored
// at byte offset r in blitter_ram, where REG(r) is the first 32-bit half and
// REG(r + 4) the second.
//   r - byte offset of the register (e.g. SRCDATA, DSTDATA, PATTERNDATA)
//   a - token prefix (a1 or a2); a##_x must be in scope. Its integer part
//       (a##_x >> 16) is the pixel index.
//   p - phrase-mode flag. When zero, the low n bits of REG(r) are returned.
//       When non-zero, the pixel index selects the 32-bit half (adds 0 or 4 to
//       r) and the shift within that half, (index within the half) * n.
//
// The shift masks for 2 bpp and 4 bpp used to be 0x3E and 0x28. Both allowed
// shift counts of 32 or more on a 32-bit value (undefined behaviour in C), and
// 0x28 (decimal 28 written as hex) also ignored two of the three index bits.
// They are now 0x1E and 0x1C, matching the pattern of the other depths.
// Every macro is wrapped in parentheses so it can be used inside a larger
// expression without precedence surprises.

// 1 bpp r data read
#define READ_RDATA_1(r,a,p) ((p) ? ((REG((r)+(((uint32_t)a##_x >> 19) & 0x04))) >> (((uint32_t)a##_x >> 16) & 0x1F)) & 0x0001 : (REG(r) & 0x0001))

// 2 bpp r data read (16 pixels per 32-bit half: shift is 0, 2, ..., 30)
#define READ_RDATA_2(r,a,p) ((p) ? ((REG((r)+(((uint32_t)a##_x >> 18) & 0x04))) >> (((uint32_t)a##_x >> 15) & 0x1E)) & 0x0003 : (REG(r) & 0x0003))

// 4 bpp r data read (8 pixels per 32-bit half: shift is 0, 4, ..., 28)
#define READ_RDATA_4(r,a,p) ((p) ? ((REG((r)+(((uint32_t)a##_x >> 17) & 0x04))) >> (((uint32_t)a##_x >> 14) & 0x1C)) & 0x000F : (REG(r) & 0x000F))

// 8 bpp r data read
#define READ_RDATA_8(r,a,p) ((p) ? ((REG((r)+(((uint32_t)a##_x >> 16) & 0x04))) >> (((uint32_t)a##_x >> 13) & 0x18)) & 0x00FF : (REG(r) & 0x00FF))

// 16 bpp r data read
#define READ_RDATA_16(r,a,p) ((p) ? ((REG((r)+(((uint32_t)a##_x >> 15) & 0x04))) >> (((uint32_t)a##_x >> 12) & 0x10)) & 0xFFFF : (REG(r) & 0xFFFF))

// 32 bpp r data read
#define READ_RDATA_32(r,a,p) ((p) ? REG((r)+(((uint32_t)a##_x >> 14) & 0x04)) : REG(r))

// register data read
// Dispatches on the depth code in bits 3-5 of the flags value f:
// 0..5 select 1, 2, 4, 8, 16 and 32 bpp; codes 6 and 7 yield 0.
#define READ_RDATA(r,a,f,p) (\
	((((f)>>3)&0x07) == 0) ? (READ_RDATA_1(r,a,p)) : \
	((((f)>>3)&0x07) == 1) ? (READ_RDATA_2(r,a,p)) : \
	((((f)>>3)&0x07) == 2) ? (READ_RDATA_4(r,a,p)) : \
	((((f)>>3)&0x07) == 3) ? (READ_RDATA_8(r,a,p)) : \
	((((f)>>3)&0x07) == 4) ? (READ_RDATA_16(r,a,p)) : \
	((((f)>>3)&0x07) == 5) ? (READ_RDATA_32(r,a,p)) : 0)
256
// Pixel write macros.
//
// WRITE_PIXEL_n(a,d) stores pixel value d at the position described by the
// variables prefixed with `a` (a##_addr, a##_x, a##_y, a##_width, a##_pitch).
// All accesses pass BLITTER as the last argument to the Jaguar memory
// accessors.
//
// For the sub-byte depths (1, 2 and 4 bpp) the write is a read-modify-write of
// one byte. d is now masked to the pixel width before being shifted into
// place; previously any bits of d above the pixel width (for example from the
// inverted LFU terms) were OR-ed into the neighbouring pixels of that byte.

// 1 bpp pixel write
#define WRITE_PIXEL_1(a,d) { JaguarWriteByte(a##_addr+PIXEL_OFFSET_1(a), (JaguarReadByte(a##_addr+PIXEL_OFFSET_1(a), BLITTER)&(~(0x01 << PIXEL_SHIFT_1(a))))|(((d)&0x01)<<PIXEL_SHIFT_1(a)), BLITTER); }

// 2 bpp pixel write
#define WRITE_PIXEL_2(a,d) { JaguarWriteByte(a##_addr+PIXEL_OFFSET_2(a), (JaguarReadByte(a##_addr+PIXEL_OFFSET_2(a), BLITTER)&(~(0x03 << PIXEL_SHIFT_2(a))))|(((d)&0x03)<<PIXEL_SHIFT_2(a)), BLITTER); }

// 4 bpp pixel write
#define WRITE_PIXEL_4(a,d) { JaguarWriteByte(a##_addr+PIXEL_OFFSET_4(a), (JaguarReadByte(a##_addr+PIXEL_OFFSET_4(a), BLITTER)&(~(0x0f << PIXEL_SHIFT_4(a))))|(((d)&0x0f)<<PIXEL_SHIFT_4(a)), BLITTER); }

// 8 bpp pixel write
#define WRITE_PIXEL_8(a,d) { JaguarWriteByte(a##_addr+PIXEL_OFFSET_8(a), (d), BLITTER); }

// 16 bpp pixel write (also logs the target address when specialLog is set)
#define WRITE_PIXEL_16(a,d) { JaguarWriteWord(a##_addr+(PIXEL_OFFSET_16(a)<<1), (d), BLITTER); if (specialLog) WriteLog("Pixel write address: %08X\n", a##_addr+(PIXEL_OFFSET_16(a)<<1)); }

// 32 bpp pixel write
#define WRITE_PIXEL_32(a,d) { JaguarWriteLong(a##_addr+(PIXEL_OFFSET_32(a)<<2), (d), BLITTER); }

// pixel write
// Dispatches on the depth code in bits 3-5 of the flags value f:
// 0..5 select 1, 2, 4, 8, 16 and 32 bpp; codes 6 and 7 write nothing.
#define WRITE_PIXEL(a,f,d) {\
	switch (((f)>>3)&0x07) { \
	case 0: WRITE_PIXEL_1(a,d); break; \
	case 1: WRITE_PIXEL_2(a,d); break; \
	case 2: WRITE_PIXEL_4(a,d); break; \
	case 3: WRITE_PIXEL_8(a,d); break; \
	case 4: WRITE_PIXEL_16(a,d); break; \
	case 5: WRITE_PIXEL_32(a,d); break; \
	default: break; \
	}}
292
293// Width in Pixels of a Scanline
294// This is a pretranslation of the value found in the A1 & A2 flags: It's really a floating point value
295// of the form EEEEMM where MM is the mantissa with an implied "1." in front of it and the EEEE value is
296// the exponent. Valid values for the exponent range from 0 to 11 (decimal). It's easiest to think of it
297// as a floating point bit pattern being followed by a number of zeroes. So, e.g., 001101 translates to
298// 1.01 (the "1." being implied) x (2 ^ 3) or 1010 -> 10 in base 10 (i.e., 1.01 with the binary point
299// being shifted to the right 3 places).
300/*static uint32_t blitter_scanline_width[48] =
301{
302 0, 0, 0, 0, // Note: This would really translate to 1, 1, 1, 1
303 2, 0, 0, 0,
304 4, 0, 6, 0,
305 8, 10, 12, 14,
306 16, 20, 24, 28,
307 32, 40, 48, 56,
308 64, 80, 96, 112,
309 128, 160, 192, 224,
310 256, 320, 384, 448,
311 512, 640, 768, 896,
312 1024, 1280, 1536, 1792,
313 2048, 2560, 3072, 3584
314};//*/
315
316//static uint8_t * tom_ram_8;
317//static uint8_t * paletteRam;
// File-scope working state for the original blitter. The pixel macros above
// and blitter_generic() read these directly (the macros reach them by pasting
// an "a1"/"a2" prefix onto _addr, _x, _y, _width, _pitch and _zoffs). The code
// that loads them from the blitter registers is not visible in this part of
// the file.
// NOTE(review): src..ctrl are not referenced in the visible code; they look
// like decoded fields of the command word kept for logging -- confirm.
318static uint8_t src;
319static uint8_t dst;
320static uint8_t misc;
321static uint8_t a1ctl;
322static uint8_t mode;
323static uint8_t ity;
324static uint8_t zop;
325static uint8_t op;
326static uint8_t ctrl;
// Base addresses and Z offsets used by the pixel / Z data macros.
327static uint32_t a1_addr;
328static uint32_t a2_addr;
329static int32_t a1_zoffs;
330static int32_t a2_zoffs;
331static uint32_t xadd_a1_control;
332static uint32_t xadd_a2_control;
// Used as a (1 + pitch) multiplier in the PIXEL_OFFSET_* macros.
333static int32_t a1_pitch;
334static int32_t a2_pitch;
// n_pixels is copied into inner_loop at the start of every outer-loop pass.
335static uint32_t n_pixels;
336static uint32_t n_lines;
// Current pixel positions; the integer coordinate is the value shifted right
// by 16 (see the CLIPA1 test and the PIXEL_OFFSET_* macros).
337static int32_t a1_x;
338static int32_t a1_y;
339static int32_t a1_width;
340static int32_t a2_x;
341static int32_t a2_y;
342static int32_t a2_width;
343static int32_t a2_mask_x;
344static int32_t a2_mask_y;
345static int32_t a1_xadd;
346static int32_t a1_yadd;
347static int32_t a2_xadd;
348static int32_t a2_yadd;
// Passed as the phrase-mode flag `p` to the READ_RDATA macros.
349static uint8_t a1_phrase_mode;
350static uint8_t a2_phrase_mode;
351static int32_t a1_step_x = 0;
352static int32_t a1_step_y = 0;
353static int32_t a2_step_x = 0;
354static int32_t a2_step_y = 0;
// Loop counters counted down by blitter_generic().
355static uint32_t outer_loop;
356static uint32_t inner_loop;
357static uint32_t a2_psize;
358static uint32_t a1_psize;
359static uint32_t gouraud_add;
360//static uint32_t gouraud_data;
361//static uint16_t gint[4];
362//static uint16_t gfrac[4];
363//static uint8_t gcolour[4];
// Gouraud state: with GOURD set the written pixel is
// (gd_c[colour_index] << 8) | (gd_i[colour_index] >> 16); gd_ia >> 16 is the
// intensity adjustment applied by SRCSHADE.
364static int gd_i[4];
365static int gd_c[4];
366static int gd_ia, gd_ca;
367static int colour_index = 0;
368static int32_t zadd;
// With GOURZ set the source Z is z_i[colour_index] >> 16.
369static uint32_t z_i[4];
370
// Clip window for A1: with CLIPA1 set, a write is inhibited unless
// 0 <= (a1_x >> 16) < a1_clip_x and 0 <= (a1_y >> 16) < a1_clip_y.
371static int32_t a1_clip_x, a1_clip_y;
372
373// In the spirit of "get it right first, *then* optimize" I've taken the liberty
374// of removing all the unnecessary code caching. If it turns out to be a good way
375// to optimize the blitter, then we may revisit it in the future...
376
377//
378// Generic blit handler
379//
380void blitter_generic(uint32_t cmd)
381{
382/*
383Blit! (0018FA70 <- 008DDC40) count: 2 x 13, A1/2_FLAGS: 00014218/00013C18 [cmd: 1401060C]
384 CMD -> src: SRCENX dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl: BCOMPEN BKGWREN
385 A1 step values: -2 (X), 1 (Y)
386 A2 step values: -1 (X), 1 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
387 A1 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 320 (21), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
388 A2 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 192 (1E), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
389 A1 x/y: 100/12, A2 x/y: 106/0 Pattern: 000000F300000000
390*/
391//if (effect_start)
392// specialLog = true;
393/*if (cmd == 0x1401060C && blit_start_log)
394 specialLog = true;//*/
395//Testing only!
396//uint32_t logGo = ((cmd == 0x01800E01 && REG(A1_BASE) == 0x898000) ? 1 : 0);
397 uint32_t srcdata, srczdata, dstdata, dstzdata, writedata, inhibit;
398 uint32_t bppSrc = (DSTA2 ? 1 << ((REG(A1_FLAGS) >> 3) & 0x07) : 1 << ((REG(A2_FLAGS) >> 3) & 0x07));
399
400if (specialLog)
401{
402 WriteLog("About to do n x m blit (BM width is ? pixels)...\n");
403 WriteLog("A1_STEP_X/Y = %08X/%08X, A2_STEP_X/Y = %08X/%08X\n", a1_step_x, a1_step_y, a2_step_x, a2_step_y);
404}
405/* if (BCOMPEN)
406 {
407 if (DSTA2)
408 a1_xadd = 0;
409 else
410 a2_xadd = 0;
411 }//*/
412
413 while (outer_loop--)
414 {
415if (specialLog)
416{
417 WriteLog(" A1_X/Y = %08X/%08X, A2_X/Y = %08X/%08X\n", a1_x, a1_y, a2_x, a2_y);
418}
419 uint32_t a1_start = a1_x, a2_start = a2_x, bitPos = 0;
420
421 //Kludge for Hover Strike...
422 //I wonder if this kludge is in conjunction with the SRCENX down below...
423 // This isn't so much a kludge but the way things work in BCOMPEN mode...!
424 if (BCOMPEN && SRCENX)
425 {
426 if (n_pixels < bppSrc)
427 bitPos = bppSrc - n_pixels;
428 }
429
430 inner_loop = n_pixels;
431 while (inner_loop--)
432 {
433if (specialLog)
434{
435 WriteLog(" A1_X/Y = %08X/%08X, A2_X/Y = %08X/%08X\n", a1_x, a1_y, a2_x, a2_y);
436}
437 srcdata = srczdata = dstdata = dstzdata = writedata = inhibit = 0;
438
439 if (!DSTA2) // Data movement: A1 <- A2
440 {
441 // load src data and Z
442// if (SRCEN)
443 if (SRCEN || SRCENX) // Not sure if this is correct... (seems to be...!)
444 {
445 srcdata = READ_PIXEL(a2, REG(A2_FLAGS));
446
447 if (SRCENZ)
448 srczdata = READ_ZDATA(a2, REG(A2_FLAGS));
449 else if (cmd & 0x0001C020) // PATDSEL | TOPBEN | TOPNEN | DSTWRZ
450 srczdata = READ_RDATA(SRCZINT, a2, REG(A2_FLAGS), a2_phrase_mode);
451 }
452 else // Use SRCDATA register...
453 {
454 srcdata = READ_RDATA(SRCDATA, a2, REG(A2_FLAGS), a2_phrase_mode);
455
456 if (cmd & 0x0001C020) // PATDSEL | TOPBEN | TOPNEN | DSTWRZ
457 srczdata = READ_RDATA(SRCZINT, a2, REG(A2_FLAGS), a2_phrase_mode);
458 }
459
460 // load dst data and Z
461 if (DSTEN)
462 {
463 dstdata = READ_PIXEL(a1, REG(A1_FLAGS));
464
465 if (DSTENZ)
466 dstzdata = READ_ZDATA(a1, REG(A1_FLAGS));
467 else
468 dstzdata = READ_RDATA(DSTZ, a1, REG(A1_FLAGS), a1_phrase_mode);
469 }
470 else
471 {
472 dstdata = READ_RDATA(DSTDATA, a1, REG(A1_FLAGS), a1_phrase_mode);
473
474 if (DSTENZ)
475 dstzdata = READ_RDATA(DSTZ, a1, REG(A1_FLAGS), a1_phrase_mode);
476 }
477
478/*This wasn't working... // a1 clipping
479 if (cmd & 0x00000040)
480 {
481 if (a1_x < 0 || a1_y < 0 || (a1_x >> 16) >= (REG(A1_CLIP) & 0x7FFF)
482 || (a1_y >> 16) >= ((REG(A1_CLIP) >> 16) & 0x7FFF))
483 inhibit = 1;
484 }//*/
485
486 if (GOURZ)
487 srczdata = z_i[colour_index] >> 16;
488
489 // apply z comparator
490 if (Z_OP_INF && srczdata < dstzdata) inhibit = 1;
491 if (Z_OP_EQU && srczdata == dstzdata) inhibit = 1;
492 if (Z_OP_SUP && srczdata > dstzdata) inhibit = 1;
493
494 // apply data comparator
495// Note: DCOMPEN only works in 8/16 bpp modes! !!! FIX !!!
496// Does BCOMPEN only work in 1 bpp mode???
497// No, but it always does a 1 bit expansion no matter what the BPP of the channel is set to. !!! FIX !!!
498// This is bit tricky... We need to fix the XADD value so that it acts like a 1BPP value while inside
499// an 8BPP space.
500 if (DCOMPEN | BCOMPEN)
501 {
502//Temp, for testing Hover Strike
503//Doesn't seem to do it... Why?
504//What needs to happen here is twofold. First, the address generator in the outer loop has
505//to honor the BPP when calculating the start address (which it kinda does already). Second,
506//it has to step bit by bit when using BCOMPEN. How to do this???
507 if (BCOMPEN)
508//small problem with this approach: it's not accurate... We need a proper address to begin with
509//and *then* we can do the bit stepping from there the way it's *supposed* to be done... !!! FIX !!!
510//[DONE]
511 {
512 uint32_t pixShift = (~bitPos) & (bppSrc - 1);
513 srcdata = (srcdata >> pixShift) & 0x01;
514
515 bitPos++;
516// if (bitPos % bppSrc == 0)
517// a2_x += 0x00010000;
518 }
519/*
520Interesting (Hover Strike--large letter):
521
522Blit! (0018FA70 <- 008DDC40) count: 2 x 13, A1/2_FLAGS: 00014218/00013C18 [cmd: 1401060C]
523 CMD -> src: SRCENX dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl: BCOMPEN BKGWREN
524 A1 step values: -2 (X), 1 (Y)
525 A2 step values: -1 (X), 1 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
526 A1 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 320 (21), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
527 A2 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 192 (1E), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
528 A1 x/y: 100/12, A2 x/y: 106/0 Pattern: 000000F300000000
529
530Blit! (0018FA70 <- 008DDC40) count: 8 x 13, A1/2_FLAGS: 00014218/00013C18 [cmd: 1401060C]
531 CMD -> src: SRCENX dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl: BCOMPEN BKGWREN
532 A1 step values: -8 (X), 1 (Y)
533 A2 step values: -1 (X), 1 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
534 A1 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 320 (21), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
535 A2 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 192 (1E), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
536 A1 x/y: 102/12, A2 x/y: 107/0 Pattern: 000000F300000000
537
538Blit! (0018FA70 <- 008DDC40) count: 1 x 13, A1/2_FLAGS: 00014218/00013C18 [cmd: 1401060C]
539 CMD -> src: SRCENX dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl: BCOMPEN BKGWREN
540 A1 step values: -1 (X), 1 (Y)
541 A2 step values: -1 (X), 1 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
542 A1 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 320 (21), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
543 A2 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 192 (1E), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
544 A1 x/y: 118/12, A2 x/y: 70/0 Pattern: 000000F300000000
545
546Blit! (0018FA70 <- 008DDC40) count: 8 x 13, A1/2_FLAGS: 00014218/00013C18 [cmd: 1401060C]
547 CMD -> src: SRCENX dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl: BCOMPEN BKGWREN
548 A1 step values: -8 (X), 1 (Y)
549 A2 step values: -1 (X), 1 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
550 A1 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 320 (21), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
551 A2 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 192 (1E), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
552 A1 x/y: 119/12, A2 x/y: 71/0 Pattern: 000000F300000000
553
554Blit! (0018FA70 <- 008DDC40) count: 1 x 13, A1/2_FLAGS: 00014218/00013C18 [cmd: 1401060C]
555 CMD -> src: SRCENX dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl: BCOMPEN BKGWREN
556 A1 step values: -1 (X), 1 (Y)
557 A2 step values: -1 (X), 1 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
558 A1 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 320 (21), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
559 A2 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 192 (1E), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
560 A1 x/y: 127/12, A2 x/y: 66/0 Pattern: 000000F300000000
561
562Blit! (0018FA70 <- 008DDC40) count: 8 x 13, A1/2_FLAGS: 00014218/00013C18 [cmd: 1401060C]
563 CMD -> src: SRCENX dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl: BCOMPEN BKGWREN
564 A1 step values: -8 (X), 1 (Y)
565 A2 step values: -1 (X), 1 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
566 A1 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 320 (21), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
567 A2 -> pitch: 1 phrases, depth: 8bpp, z-off: 0, width: 192 (1E), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
568 A1 x/y: 128/12, A2 x/y: 67/0 Pattern: 000000F300000000
569*/
570
571
572 if (!CMPDST)
573 {
574//WriteLog("Blitter: BCOMPEN set on command %08X inhibit prev:%u, now:", cmd, inhibit);
575 // compare source pixel with pattern pixel
576/*
577Blit! (000B8250 <- 0012C3A0) count: 16 x 1, A1/2_FLAGS: 00014420/00012000 [cmd: 05810001]
578 CMD -> src: SRCEN dst: misc: a1ctl: mode: ity: PATDSEL z-op: op: LFU_REPLACE ctrl: BCOMPEN
579 A1 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 384 (22), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
580 A2 -> pitch: 1 phrases, depth: 1bpp, z-off: 0, width: 16 (10), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
581 x/y: 0/20
582...
583*/
584// AvP is still wrong, could be cuz it's doing A1 -> A2...
585
586// Src is the 1bpp bitmap... DST is the PATTERN!!!
587// This seems to solve at least ONE of the problems with MC3D...
588// Why should this be inverted???
589// Bcuz it is. This is supposed to be used only for a bit -> pixel expansion...
590/* if (srcdata == READ_RDATA(PATTERNDATA, a2, REG(A2_FLAGS), a2_phrase_mode))
591// if (srcdata != READ_RDATA(PATTERNDATA, a2, REG(A2_FLAGS), a2_phrase_mode))
592 inhibit = 1;//*/
593/* uint32_t A2bpp = 1 << ((REG(A2_FLAGS) >> 3) & 0x07);
594 if (A2bpp == 1 || A2bpp == 16 || A2bpp == 8)
595 inhibit = (srcdata == 0 ? 1: 0);
596// inhibit = !srcdata;
597 else
598 WriteLog("Blitter: Bad BPP (%u) selected for BCOMPEN mode!\n", A2bpp);//*/
599// What it boils down to is this:
600
601 if (srcdata == 0)
602 inhibit = 1;//*/
603 }
604 else
605 {
606 // compare destination pixel with pattern pixel
607 if (dstdata == READ_RDATA(PATTERNDATA, a1, REG(A1_FLAGS), a1_phrase_mode))
608// if (dstdata != READ_RDATA(PATTERNDATA, a1, REG(A1_FLAGS), a1_phrase_mode))
609 inhibit = 1;
610 }
611
612// This is DEFINITELY WRONG
613// if (a1_phrase_mode || a2_phrase_mode)
614// inhibit = !inhibit;
615 }
616
617 if (CLIPA1)
618 {
619 inhibit |= (((a1_x >> 16) < a1_clip_x && (a1_x >> 16) >= 0
620 && (a1_y >> 16) < a1_clip_y && (a1_y >> 16) >= 0) ? 0 : 1);
621 }
622
623 // compute the write data and store
624 if (!inhibit)
625 {
626// Houston, we have a problem...
627// Look here, at PATDSEL and GOURD. If both are active (as they are on the BIOS intro), then there's
628// a conflict! E.g.:
629//Blit! (00100000 <- 000095D0) count: 3 x 1, A1/2_FLAGS: 00014220/00004020 [cmd: 00011008]
630// CMD -> src: dst: DSTEN misc: a1ctl: mode: GOURD ity: PATDSEL z-op: op: LFU_CLEAR ctrl:
631// A1 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 320 (21), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
632// A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 256 (20), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
633// A1 x/y: 90/171, A2 x/y: 808/0 Pattern: 776D770077007700
634
635 if (PATDSEL)
636 {
637 // use pattern data for write data
638 writedata = READ_RDATA(PATTERNDATA, a1, REG(A1_FLAGS), a1_phrase_mode);
639 }
640 else if (ADDDSEL)
641 {
642/*if (blit_start_log)
643 WriteLog("BLIT: ADDDSEL srcdata: %08X\, dstdata: %08X, ", srcdata, dstdata);//*/
644
645 // intensity addition
646//Ok, this is wrong... Or is it? Yes, it's wrong! !!! FIX !!!
647/* writedata = (srcdata & 0xFF) + (dstdata & 0xFF);
648 if (!(TOPBEN) && writedata > 0xFF)
649// writedata = 0xFF;
650 writedata &= 0xFF;
651 writedata |= (srcdata & 0xF00) + (dstdata & 0xF00);
652 if (!(TOPNEN) && writedata > 0xFFF)
653// writedata = 0xFFF;
654 writedata &= 0xFFF;
655 writedata |= (srcdata & 0xF000) + (dstdata & 0xF000);//*/
656//notneeded--writedata &= 0xFFFF;
657/*if (blit_start_log)
658 WriteLog("writedata: %08X\n", writedata);//*/
659/*
660Hover Strike ADDDSEL blit:
661
662Blit! (00098D90 <- 0081DDC0) count: 320 x 287, A1/2_FLAGS: 00004220/00004020 [cmd: 00020208]
663 CMD -> src: dst: DSTEN misc: a1ctl: UPDA1 mode: ity: ADDDSEL z-op: op: LFU_CLEAR ctrl:
664 A1 step values: -320 (X), 1 (Y)
665 A1 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
666 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 256 (20), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
667 A1 x/y: 0/0, A2 x/y: 3288/0 Pattern: 0000000000000000 SRCDATA: 00FD00FD00FD00FD
668*/
669 writedata = (srcdata & 0xFF) + (dstdata & 0xFF);
670
671 if (!TOPBEN)
672 {
673//This is correct now, but slow...
674 int16_t s = (srcdata & 0xFF) | (srcdata & 0x80 ? 0xFF00 : 0x0000),
675 d = dstdata & 0xFF;
676 int16_t sum = s + d;
677
678 if (sum < 0)
679 writedata = 0x00;
680 else if (sum > 0xFF)
681 writedata = 0xFF;
682 else
683 writedata = (uint32_t)sum;
684 }
685
686//This doesn't seem right... Looks like it would muck up the low byte... !!! FIX !!!
687 writedata |= (srcdata & 0xF00) + (dstdata & 0xF00);
688
689 if (!TOPNEN && writedata > 0xFFF)
690 {
691 writedata &= 0xFFF;
692 }
693
694 writedata |= (srcdata & 0xF000) + (dstdata & 0xF000);
695 }
696 else
697 {
698 if (LFU_NAN) writedata |= ~srcdata & ~dstdata;
699 if (LFU_NA) writedata |= ~srcdata & dstdata;
700 if (LFU_AN) writedata |= srcdata & ~dstdata;
701 if (LFU_A) writedata |= srcdata & dstdata;
702 }
703
704//Although, this looks like it's OK... (even if it is shitty!)
705//According to JTRM, this is part of the four things the blitter does with the write data (the other
706//three being PATDSEL, ADDDSEL, and LFU (default). I'm not sure which gets precedence, this or PATDSEL
707//(see above blit example)...
708 if (GOURD)
709 writedata = ((gd_c[colour_index]) << 8) | (gd_i[colour_index] >> 16);
710
711 if (SRCSHADE)
712 {
713 int intensity = srcdata & 0xFF;
714 int ia = gd_ia >> 16;
715 if (ia & 0x80)
716 ia = 0xFFFFFF00 | ia;
717 intensity += ia;
718 if (intensity < 0)
719 intensity = 0;
720 if (intensity > 0xFF)
721 intensity = 0xFF;
722 writedata = (srcdata & 0xFF00) | intensity;
723 }
724 }
725 else
726 {
727 writedata = dstdata;
728 srczdata = dstzdata;
729 }
730
731//Tried 2nd below for Hover Strike: No dice.
732 if (/*a1_phrase_mode || */BKGWREN || !inhibit)
733// if (/*a1_phrase_mode || BKGWREN ||*/ !inhibit)
734 {
735/*if (((REG(A1_FLAGS) >> 3) & 0x07) == 5)
736{
737 uint32_t offset = a1_addr+(PIXEL_OFFSET_32(a1)<<2);
738// (((((uint32_t)a##_y >> 16) * a##_width) + (((uint32_t)a##_x >> 16) & ~1)) * (1 + a##_pitch) + (((uint32_t)a##_x >> 16) & 1))
739 if ((offset >= 0x1FF020 && offset <= 0x1FF03F) || (offset >= 0x1FF820 && offset <= 0x1FF83F))
740 WriteLog("32bpp pixel write: A1 Phrase mode --> ");
741}//*/
742 // write to the destination
743 WRITE_PIXEL(a1, REG(A1_FLAGS), writedata);
744 if (DSTWRZ)
745 WRITE_ZDATA(a1, REG(A1_FLAGS), srczdata);
746 }
747 }
748 else // if (DSTA2) // Data movement: A1 -> A2
749 {
750 // load src data and Z
751 if (SRCEN)
752 {
753 srcdata = READ_PIXEL(a1, REG(A1_FLAGS));
754 if (SRCENZ)
755 srczdata = READ_ZDATA(a1, REG(A1_FLAGS));
756 else if (cmd & 0x0001C020) // PATDSEL | TOPBEN | TOPNEN | DSTWRZ
757 srczdata = READ_RDATA(SRCZINT, a1, REG(A1_FLAGS), a1_phrase_mode);
758 }
759 else
760 {
761 srcdata = READ_RDATA(SRCDATA, a1, REG(A1_FLAGS), a1_phrase_mode);
762 if (cmd & 0x001C020) // PATDSEL | TOPBEN | TOPNEN | DSTWRZ
763 srczdata = READ_RDATA(SRCZINT, a1, REG(A1_FLAGS), a1_phrase_mode);
764 }
765
766 // load dst data and Z
767 if (DSTEN)
768 {
769 dstdata = READ_PIXEL(a2, REG(A2_FLAGS));
770 if (DSTENZ)
771 dstzdata = READ_ZDATA(a2, REG(A2_FLAGS));
772 else
773 dstzdata = READ_RDATA(DSTZ, a2, REG(A2_FLAGS), a2_phrase_mode);
774 }
775 else
776 {
777 dstdata = READ_RDATA(DSTDATA, a2, REG(A2_FLAGS), a2_phrase_mode);
778 if (DSTENZ)
779 dstzdata = READ_RDATA(DSTZ, a2, REG(A2_FLAGS), a2_phrase_mode);
780 }
781
782 if (GOURZ)
783 srczdata = z_i[colour_index] >> 16;
784
785 // apply z comparator
786 if (Z_OP_INF && srczdata < dstzdata) inhibit = 1;
787 if (Z_OP_EQU && srczdata == dstzdata) inhibit = 1;
788 if (Z_OP_SUP && srczdata > dstzdata) inhibit = 1;
789
790 // apply data comparator
791//NOTE: The bit comparator (BCOMPEN) is NOT the same at the data comparator!
792 if (DCOMPEN | BCOMPEN)
793 {
794 if (!CMPDST)
795 {
796 // compare source pixel with pattern pixel
797// AvP: Numbers are correct, but sprites are not!
798//This doesn't seem to be a problem... But could still be wrong...
799/* if (srcdata == READ_RDATA(PATTERNDATA, a1, REG(A1_FLAGS), a1_phrase_mode))
800// if (srcdata != READ_RDATA(PATTERNDATA, a1, REG(A1_FLAGS), a1_phrase_mode))
801 inhibit = 1;//*/
802// This is probably not 100% correct... It works in the 1bpp case
803// (in A1 <- A2 mode, that is...)
804// AvP: This is causing blocks to be written instead of bit patterns...
805// Works now...
806// NOTE: We really should separate out the BCOMPEN & DCOMPEN stuff!
807/* uint32_t A1bpp = 1 << ((REG(A1_FLAGS) >> 3) & 0x07);
808 if (A1bpp == 1 || A1bpp == 16 || A1bpp == 8)
809 inhibit = (srcdata == 0 ? 1: 0);
810 else
811 WriteLog("Blitter: Bad BPP (%u) selected for BCOMPEN mode!\n", A1bpp);//*/
812// What it boils down to is this:
813 if (srcdata == 0)
814 inhibit = 1;//*/
815 }
816 else
817 {
818 // compare destination pixel with pattern pixel
819 if (dstdata == READ_RDATA(PATTERNDATA, a2, REG(A2_FLAGS), a2_phrase_mode))
820// if (dstdata != READ_RDATA(PATTERNDATA, a2, REG(A2_FLAGS), a2_phrase_mode))
821 inhibit = 1;
822 }
823
824// This is DEFINITELY WRONG
825// if (a1_phrase_mode || a2_phrase_mode)
826// inhibit = !inhibit;
827 }
828
829 if (CLIPA1)
830 {
831 inhibit |= (((a1_x >> 16) < a1_clip_x && (a1_x >> 16) >= 0
832 && (a1_y >> 16) < a1_clip_y && (a1_y >> 16) >= 0) ? 0 : 1);
833 }
834
835 // compute the write data and store
836 if (!inhibit)
837 {
838 if (PATDSEL)
839 {
840 // use pattern data for write data
841 writedata = READ_RDATA(PATTERNDATA, a2, REG(A2_FLAGS), a2_phrase_mode);
842 }
843 else if (ADDDSEL)
844 {
845 // intensity addition
846 writedata = (srcdata & 0xFF) + (dstdata & 0xFF);
847 if (!(TOPBEN) && writedata > 0xFF)
848 writedata = 0xFF;
849 writedata |= (srcdata & 0xF00) + (dstdata & 0xF00);
850 if (!(TOPNEN) && writedata > 0xFFF)
851 writedata = 0xFFF;
852 writedata |= (srcdata & 0xF000) + (dstdata & 0xF000);
853 }
854 else
855 {
856 if (LFU_NAN)
857 writedata |= ~srcdata & ~dstdata;
858 if (LFU_NA)
859 writedata |= ~srcdata & dstdata;
860 if (LFU_AN)
861 writedata |= srcdata & ~dstdata;
862 if (LFU_A)
863 writedata |= srcdata & dstdata;
864 }
865
866 if (GOURD)
867 writedata = ((gd_c[colour_index]) << 8) | (gd_i[colour_index] >> 16);
868
869 if (SRCSHADE)
870 {
871 int intensity = srcdata & 0xFF;
872 int ia = gd_ia >> 16;
873 if (ia & 0x80)
874 ia = 0xFFFFFF00 | ia;
875 intensity += ia;
876 if (intensity < 0)
877 intensity = 0;
878 if (intensity > 0xFF)
879 intensity = 0xFF;
880 writedata = (srcdata & 0xFF00) | intensity;
881 }
882 }
883 else
884 {
885 writedata = dstdata;
886 srczdata = dstzdata;
887 }
888
889 if (/*a2_phrase_mode || */BKGWREN || !inhibit)
890 {
891/*if (logGo)
892{
893 uint32_t offset = a2_addr+(PIXEL_OFFSET_16(a2)<<1);
894// (((((uint32_t)a##_y >> 16) * a##_width) + (((uint32_t)a##_x >> 16) & ~1)) * (1 + a##_pitch) + (((uint32_t)a##_x >> 16) & 1))
895 WriteLog("[%08X:%04X] ", offset, writedata);
896}//*/
897 // write to the destination
898 WRITE_PIXEL(a2, REG(A2_FLAGS), writedata);
899
900 if (DSTWRZ)
901 WRITE_ZDATA(a2, REG(A2_FLAGS), srczdata);
902 }
903 }
904
905 // Update x and y (inner loop)
906//Now it does! But crappy, crappy, crappy! !!! FIX !!! [DONE]
907//This is less than ideal, but it works...
908 if (!BCOMPEN)
909 {//*/
910 a1_x += a1_xadd, a1_y += a1_yadd;
911 a2_x = (a2_x + a2_xadd) & a2_mask_x, a2_y = (a2_y + a2_yadd) & a2_mask_y;
912 }
913 else
914 {
915 a1_y += a1_yadd, a2_y = (a2_y + a2_yadd) & a2_mask_y;
916 if (!DSTA2)
917 {
918 a1_x += a1_xadd;
919 if (bitPos % bppSrc == 0)
920 a2_x = (a2_x + a2_xadd) & a2_mask_x;
921 }
922 else
923 {
924 a2_x = (a2_x + a2_xadd) & a2_mask_x;
925 if (bitPos % bppSrc == 0)
926 a1_x += a1_xadd;
927 }
928 }//*/
929
930 if (GOURZ)
931 z_i[colour_index] += zadd;
932
933 if (GOURD || SRCSHADE)
934 {
935 gd_i[colour_index] += gd_ia;
936//Hmm, this doesn't seem to do anything...
937//But it is correct according to the JTRM...!
938if ((int32_t)gd_i[colour_index] < 0)
939 gd_i[colour_index] = 0;
940if (gd_i[colour_index] > 0x00FFFFFF)
941 gd_i[colour_index] = 0x00FFFFFF;//*/
942
943 gd_c[colour_index] += gd_ca;
944if ((int32_t)gd_c[colour_index] < 0)
945 gd_c[colour_index] = 0;
946if (gd_c[colour_index] > 0x000000FF)
947 gd_c[colour_index] = 0x000000FF;//*/
948 }
949
950 if (GOURD || SRCSHADE || GOURZ)
951 {
952 if (a1_phrase_mode)
953//This screws things up WORSE (for the BIOS opening screen)
954// if (a1_phrase_mode || a2_phrase_mode)
955 colour_index = (colour_index + 1) & 0x03;
956 }
957 }
958
959/*
960Here's the problem... The phrase mode code!
961Blit! (00100000 -> 00148000) count: 327 x 267, A1/2_FLAGS: 00004420/00004420 [cmd: 41802E01]
962 CMD -> src: SRCEN dst: misc: a1ctl: UPDA1 UPDA2 mode: DSTA2 GOURZ ity: z-op: op: LFU_REPLACE ctrl: SRCSHADE
963 A1 step values: -327 (X), 1 (Y)
964 A2 step values: -327 (X), 1 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
965 A1 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 384 (22), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
966 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 384 (22), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
967 A1 x/y: 28/58, A2 x/y: 28/58 Pattern: 00EA7BEA77EA77EA SRCDATA: 7BFF7BFF7BFF7BFF
968
969Below fixes it, but then borks:
970; O
971
972Blit! (00110000 <- 0010B2A8) count: 12 x 12, A1/2_FLAGS: 000042E2/00000020 [cmd: 09800609]
973 CMD -> src: SRCEN dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: z-op: op: LFU_REPLACE ctrl: DCOMPEN
974 A1 step values: -15 (X), 1 (Y)
975 A2 step values: -4 (X), 0 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
976 A1 -> pitch: 4 phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
977 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
978 A1 x/y: 173/144, A2 x/y: 4052/0
979
980Lesse, with pre-add we'd have:
981
982 oooooooooooo
98300001111222233334444555566667777
984 ^ ^starts here...
985 | ^ends here.
986 |rolls back to here. Hmm.
987
988*/
989//NOTE: The way to fix the CD BIOS is to uncomment below and comment the stuff after
990// the phrase mode mucking around. But it fucks up everything else...
991//#define SCREWY_CD_DEPENDENT
992#ifdef SCREWY_CD_DEPENDENT
993 a1_x += a1_step_x;
994 a1_y += a1_step_y;
995 a2_x += a2_step_x;
996 a2_y += a2_step_y;//*/
997#endif
998
999 //New: Phrase mode taken into account! :-p
1000/* if (a1_phrase_mode) // v1
1001 {
1002 // Bump the pointer to the next phrase boundary
1003 // Even though it works, this is crappy... Clean it up!
1004 uint32_t size = 64 / a1_psize;
1005
1006 // Crappy kludge... ('aligning' source to destination)
1007 if (a2_phrase_mode && DSTA2)
1008 {
1009 uint32_t extra = (a2_start >> 16) % size;
1010 a1_x += extra << 16;
1011 }
1012
1013 uint32_t newx = (a1_x >> 16) / size;
1014 uint32_t newxrem = (a1_x >> 16) % size;
1015 a1_x &= 0x0000FFFF;
1016 a1_x |= (((newx + (newxrem == 0 ? 0 : 1)) * size) & 0xFFFF) << 16;
1017 }//*/
1018 if (a1_phrase_mode) // v2
1019 {
1020 // Bump the pointer to the next phrase boundary
1021 // Even though it works, this is crappy... Clean it up!
1022 uint32_t size = 64 / a1_psize;
1023
1024 // Crappy kludge... ('aligning' source to destination)
1025 if (a2_phrase_mode && DSTA2)
1026 {
1027 uint32_t extra = (a2_start >> 16) % size;
1028 a1_x += extra << 16;
1029 }
1030
1031 uint32_t pixelSize = (size - 1) << 16;
1032 a1_x = (a1_x + pixelSize) & ~pixelSize;
1033 }
1034
1035/* if (a2_phrase_mode) // v1
1036 {
1037 // Bump the pointer to the next phrase boundary
1038 // Even though it works, this is crappy... Clean it up!
1039 uint32_t size = 64 / a2_psize;
1040
1041 // Crappy kludge... ('aligning' source to destination)
1042 // Prolly should do this for A1 channel as well... [DONE]
1043 if (a1_phrase_mode && !DSTA2)
1044 {
1045 uint32_t extra = (a1_start >> 16) % size;
1046 a2_x += extra << 16;
1047 }
1048
1049 uint32_t newx = (a2_x >> 16) / size;
1050 uint32_t newxrem = (a2_x >> 16) % size;
1051 a2_x &= 0x0000FFFF;
1052 a2_x |= (((newx + (newxrem == 0 ? 0 : 1)) * size) & 0xFFFF) << 16;
1053 }//*/
1054 if (a2_phrase_mode) // v1
1055 {
1056 // Bump the pointer to the next phrase boundary
1057 // Even though it works, this is crappy... Clean it up!
1058 uint32_t size = 64 / a2_psize;
1059
1060 // Crappy kludge... ('aligning' source to destination)
1061 // Prolly should do this for A1 channel as well... [DONE]
1062 if (a1_phrase_mode && !DSTA2)
1063 {
1064 uint32_t extra = (a1_start >> 16) % size;
1065 a2_x += extra << 16;
1066 }
1067
1068 uint32_t pixelSize = (size - 1) << 16;
1069 a2_x = (a2_x + pixelSize) & ~pixelSize;
1070 }
1071
1072 //Not entirely: This still mucks things up... !!! FIX !!!
1073 //Should this go before or after the phrase mode mucking around?
1074#ifndef SCREWY_CD_DEPENDENT
1075 a1_x += a1_step_x;
1076 a1_y += a1_step_y;
1077 a2_x += a2_step_x;
1078 a2_y += a2_step_y;//*/
1079#endif
1080 }
1081
1082 // write values back to registers
1083 WREG(A1_PIXEL, (a1_y & 0xFFFF0000) | ((a1_x >> 16) & 0xFFFF));
1084 WREG(A1_FPIXEL, (a1_y << 16) | (a1_x & 0xFFFF));
1085 WREG(A2_PIXEL, (a2_y & 0xFFFF0000) | ((a2_x >> 16) & 0xFFFF));
1086specialLog = false;
1087}
1088
//
// Sets up and runs a single blit described by the command word 'cmd'.
//
// The function decodes 'cmd' into the src/dst/misc/a1ctl/mode/ity/zop/op/ctrl
// variables, then loads the A1 and A2 window state (base address, Z offset,
// pitch, width, X/Y position, per-pixel add values, per-line step values,
// clip size and pixel size) from the blitter register RAM through REG().
// When the command requests Z or Gouraud/shade processing it also loads the
// interpolator start values and increments. After optional logging it calls
// blitter_generic(cmd), with blitter_working set to 1 for the duration of
// that call and cleared to 0 afterwards.
//
// All of the decoded state is written to variables that are not declared
// inside this function; nothing is returned.
//
// NOTE(review): the "#endif // of the #if 0 near the top..." line that follows
// this function suggests it is currently compiled out -- confirm before
// relying on any of this being live.
//
1089void blitter_blit(uint32_t cmd)
1090{
1091//Apparently this is doing *something*, just not sure exactly what...
1092/*if (cmd == 0x41802E01)
1093{
1094 WriteLog("BLIT: Found our blit. Was: %08X ", cmd);
1095 cmd = 0x01800E01;
1096 WriteLog("Is: %08X\n", cmd);
1097}//*/
1098
 // Translation table for the 2-bit pitch field of A1_FLAGS/A2_FLAGS (used for a1_pitch/a2_pitch below)
1099 uint32_t pitchValue[4] = { 0, 1, 3, 2 };
1100 colour_index = 0;
 // Break the command word up into its bit fields
1101 src = cmd & 0x07;
1102 dst = (cmd >> 3) & 0x07;
1103 misc = (cmd >> 6) & 0x03;
1104 a1ctl = (cmd >> 8) & 0x7;
1105 mode = (cmd >> 11) & 0x07;
1106 ity = (cmd >> 14) & 0x0F;
1107 zop = (cmd >> 18) & 0x07;
1108 op = (cmd >> 21) & 0x0F;
1109 ctrl = (cmd >> 25) & 0x3F;
1110
1111 // Addresses in A1/2_BASE are *phrase* aligned, i.e., bottom three bits are ignored!
1112 // NOTE: This fixes Rayman's bad collision detection AND keeps T2K working!
1113 a1_addr = REG(A1_BASE) & 0xFFFFFFF8;
1114 a2_addr = REG(A2_BASE) & 0xFFFFFFF8;
1115
 // Z offset: bits 6-8 of each FLAGS register
1116 a1_zoffs = (REG(A1_FLAGS) >> 6) & 7;
1117 a2_zoffs = (REG(A2_FLAGS) >> 6) & 7;
1118
 // X add control: bits 16-17 of each FLAGS register (switched on further down)
1119 xadd_a1_control = (REG(A1_FLAGS) >> 16) & 0x03;
1120 xadd_a2_control = (REG(A2_FLAGS) >> 16) & 0x03;
1121
1122 a1_pitch = pitchValue[(REG(A1_FLAGS) & 0x03)];
1123 a2_pitch = pitchValue[(REG(A2_FLAGS) & 0x03)];
1124
 // Low word of PIXLINECOUNTER is the pixel count, high word is the line count
1125 n_pixels = REG(PIXLINECOUNTER) & 0xFFFF;
1126 n_lines = (REG(PIXLINECOUNTER) >> 16) & 0xFFFF;
1127
 // A1 position, integer part in the upper 16 bits and fraction in the lower 16:
 // integer halves come from A1_PIXEL, fractional halves from A1_FPIXEL
 // (X is the low word and Y the high word of each register)
1128 a1_x = (REG(A1_PIXEL) << 16) | (REG(A1_FPIXEL) & 0xFFFF);
1129 a1_y = (REG(A1_PIXEL) & 0xFFFF0000) | (REG(A1_FPIXEL) >> 16);
1130//According to the JTRM, X is restricted to 15 bits and Y is restricted to 12.
1131//But it seems to fuck up T2K! !!! FIX !!!
1132//Could it be sign extended??? Doesn't seem to be so according to JTRM
1133// a1_x &= 0x7FFFFFFF, a1_y &= 0x0FFFFFFF;
1134//Actually, it says that the X is 16 bits. But it still seems to mess with the Y when restricted to 12...
1135// a1_y &= 0x0FFFFFFF;
1136
1137// a1_width = blitter_scanline_width[((REG(A1_FLAGS) & 0x00007E00) >> 9)];
1138// According to JTRM, this must give a *whole number* of phrases in the current
1139// pixel size (this means the lookup above is WRONG)... !!! FIX !!!
 // Width field: 2-bit mantissa m (bits 9-10) and 4-bit exponent e (bits 11-14),
 // decoded as ((4 | m) << e) >> 2
1140 uint32_t m = (REG(A1_FLAGS) >> 9) & 0x03, e = (REG(A1_FLAGS) >> 11) & 0x0F;
1141 a1_width = ((0x04 | m) << e) >> 2;//*/
1142
 // A2 position in the same layout as A1; only A2_PIXEL is read, so the
 // fractional bits start out as zero
1143 a2_x = (REG(A2_PIXEL) & 0x0000FFFF) << 16;
1144 a2_y = (REG(A2_PIXEL) & 0xFFFF0000);
1145//According to the JTRM, X is restricted to 15 bits and Y is restricted to 12.
1146//But it seems to fuck up T2K! !!! FIX !!!
1147// a2_x &= 0x7FFFFFFF, a2_y &= 0x0FFFFFFF;
1148//Actually, it says that the X is 16 bits. But it still seems to mess with the Y when restricted to 12...
1149// a2_y &= 0x0FFFFFFF;
1150
1151// a2_width = blitter_scanline_width[((REG(A2_FLAGS) & 0x00007E00) >> 9)];
1152// According to JTRM, this must give a *whole number* of phrases in the current
1153// pixel size (this means the lookup above is WRONG)... !!! FIX !!!
1154 m = (REG(A2_FLAGS) >> 9) & 0x03, e = (REG(A2_FLAGS) >> 11) & 0x0F;
1155 a2_width = ((0x04 | m) << e) >> 2;//*/
 // A2 masks: register halves go in the upper 16 bits, the lower 16 bits are always set
1156 a2_mask_x = ((REG(A2_MASK) & 0x0000FFFF) << 16) | 0xFFFF;
1157 a2_mask_y = (REG(A2_MASK) & 0xFFFF0000) | 0xFFFF;
1158
1159 // Check for "use mask" flag
1160 if (!(REG(A2_FLAGS) & 0x8000))
1161 {
1162 a2_mask_x = 0xFFFFFFFF; // must be 16.16
1163 a2_mask_y = 0xFFFFFFFF; // must be 16.16
1164 }
1165
1166 a1_phrase_mode = 0;
1167
1168 // According to the official documentation, a hardware bug ties A2's yadd bit to A1's...
1169 a2_yadd = a1_yadd = (YADD1_A1 ? 1 << 16 : 0);
1170
1171 if (YSIGNSUB_A1)
1172 a1_yadd = -a1_yadd;
1173
1174 // determine a1_xadd
1175 switch (xadd_a1_control)
1176 {
1177 case XADDPHR:
1178// This is a documented Jaguar bug relating to phrase mode and truncation... Look into it!
1179 // add phrase offset to X and truncate
1180 a1_xadd = 1 << 16;
1181 a1_phrase_mode = 1;
1182 break;
1183 case XADDPIX:
1184 // add pixelsize (1) to X
1185 a1_xadd = 1 << 16;
1186 break;
1187 case XADD0:
1188 // add zero (for those nice vertical lines)
1189 a1_xadd = 0;
1190 break;
1191 case XADDINC:
1192 // add the contents of the increment register
 // NOTE: a1_yadd is replaced here as well, which discards the value (and any
 // YSIGNSUB_A1 negation) computed just above the switch
1193 a1_xadd = (REG(A1_INC) << 16) | (REG(A1_FINC) & 0x0000FFFF);
1194 a1_yadd = (REG(A1_INC) & 0xFFFF0000) | (REG(A1_FINC) >> 16);
1195 break;
1196 }
1197
1198
1199//Blit! (0011D000 -> 000B9600) count: 228 x 1, A1/2_FLAGS: 00073820/00064220 [cmd: 41802801]
1200// A1 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 128 (1C), addctl: XADDINC YADD1 XSIGNADD YSIGNADD
1201// A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 320 (21), addctl: XADD0 YADD1 XSIGNADD YSIGNADD
1202//if (YADD1_A1 && YADD1_A2 && xadd_a2_control == XADD0 && xadd_a1_control == XADDINC)// &&
1203// uint32_t a1f = REG(A1_FLAGS), a2f = REG(A2_FLAGS);
1204//Ok, so this ISN'T it... Prolly the XADDPHR code above that's doing it...
1205//if (REG(A1_FLAGS) == 0x00073820 && REG(A2_FLAGS) == 0x00064220 && cmd == 0x41802801)
1206// A1 x/y: 14368/7, A2 x/y: 150/36
1207//This is it... The problem...
1208//if ((a1_x >> 16) == 14368) // 14368 = $3820
1209// return; //Lesse what we got...
1210
1211 if (XSIGNSUB_A1)
1212 a1_xadd = -a1_xadd;
1213
1214 if (YSIGNSUB_A2)
1215 a2_yadd = -a2_yadd;
1216
1217 a2_phrase_mode = 0;
1218
1219 // determine a2_xadd
1220 switch (xadd_a2_control)
1221 {
1222 case XADDPHR:
1223 // add phrase offset to X and truncate
1224 a2_xadd = 1 << 16;
1225 a2_phrase_mode = 1;
1226 break;
1227 case XADDPIX:
1228 // add pixelsize (1) to X
1229 a2_xadd = 1 << 16;
1230 break;
1231 case XADD0:
1232 // add zero (for those nice vertical lines)
1233 a2_xadd = 0;
1234 break;
1235//This really isn't a valid bit combo for A2... Shouldn't this cause the blitter to just say no?
1236 case XADDINC:
 // a2_xadd is not assigned on this path, so it keeps whatever value it held
 // before this call (and may still be negated by XSIGNSUB_A2 below)
1237WriteLog("BLIT: Asked to use invalid bit combo (XADDINC) for A2...\n");
1238 // add the contents of the increment register
1239 // since there is no register for a2 we just add 1
1240//Let's do nothing, since it's not listed as a valid bit combo...
1241// a2_xadd = 1 << 16;
1242 break;
1243 }
1244
1245 if (XSIGNSUB_A2)
1246 a2_xadd = -a2_xadd;
1247
1248 // Modify outer loop steps based on blitter command
1249
1250 a1_step_x = 0;
1251 a1_step_y = 0;
1252 a2_step_x = 0;
1253 a2_step_y = 0;
1254
 // UPDA1F supplies the fractional halves of the A1 step; UPDA1 ORs in the integer halves
1255 if (UPDA1F)
1256 a1_step_x = (REG(A1_FSTEP) & 0xFFFF),
1257 a1_step_y = (REG(A1_FSTEP) >> 16);
1258
1259 if (UPDA1)
1260 a1_step_x |= ((REG(A1_STEP) & 0x0000FFFF) << 16),
1261 a1_step_y |= ((REG(A1_STEP) & 0xFFFF0000));
1262
 // The A2 step is loaded with an integer part only
1263 if (UPDA2)
1264 a2_step_x = (REG(A2_STEP) & 0x0000FFFF) << 16,
1265 a2_step_y = (REG(A2_STEP) & 0xFFFF0000);
1266
1267 outer_loop = n_lines;
1268
1269 // Clipping...
1270
 // The clip size is only loaded when CLIPA1 is set; each dimension is masked to 15 bits
1271 if (CLIPA1)
1272 a1_clip_x = REG(A1_CLIP) & 0x7FFF,
1273 a1_clip_y = (REG(A1_CLIP) >> 16) & 0x7FFF;
1274
1275// This phrase sizing is incorrect as well... !!! FIX !!! [NOTHING TO FIX]
1276// Err, this is pixel size... (and it's OK)
1277 a2_psize = 1 << ((REG(A2_FLAGS) >> 3) & 0x07);
1278 a1_psize = 1 << ((REG(A1_FLAGS) >> 3) & 0x07);
1279
1280 // Z-buffering
1281 if (GOURZ)
1282 {
 // Load the Z increment and four Z start values (the four longs starting at PHRASEZ0)
1283 zadd = REG(ZINC);
1284
1285 for(int v=0; v<4; v++)
1286 z_i[v] = REG(PHRASEZ0 + v*4);
1287 }
1288
1289 // Gouraud shading
1290 if (GOURD || GOURZ || SRCSHADE)
1291 {
 // For each of the four entries: gd_c[n] is a single PATTERNDATA byte, and
 // gd_i[n] is a 24-bit value built from the following PATTERNDATA byte
 // (bits 16-23) and two SRCDATA bytes (bits 0-15). Entry 0 uses the highest
 // byte offsets (6/7), entry 3 the lowest (0/1).
1292 gd_c[0] = blitter_ram[PATTERNDATA + 6];
1293 gd_i[0] = ((uint32_t)blitter_ram[PATTERNDATA + 7] << 16)
1294 | ((uint32_t)blitter_ram[SRCDATA + 6] << 8) | blitter_ram[SRCDATA + 7];
1295
1296 gd_c[1] = blitter_ram[PATTERNDATA + 4];
1297 gd_i[1] = ((uint32_t)blitter_ram[PATTERNDATA + 5] << 16)
1298 | ((uint32_t)blitter_ram[SRCDATA + 4] << 8) | blitter_ram[SRCDATA + 5];
1299
1300 gd_c[2] = blitter_ram[PATTERNDATA + 2];
1301 gd_i[2] = ((uint32_t)blitter_ram[PATTERNDATA + 3] << 16)
1302 | ((uint32_t)blitter_ram[SRCDATA + 2] << 8) | blitter_ram[SRCDATA + 3];
1303
1304 gd_c[3] = blitter_ram[PATTERNDATA + 0];
1305 gd_i[3] = ((uint32_t)blitter_ram[PATTERNDATA + 1] << 16)
1306 | ((uint32_t)blitter_ram[SRCDATA + 0] << 8) | blitter_ram[SRCDATA + 1];
1307
1308 gouraud_add = REG(INTENSITYINC);
1309
 // Low 24 bits of INTENSITYINC, sign-extended from bit 23
1310 gd_ia = gouraud_add & 0x00FFFFFF;
1311 if (gd_ia & 0x00800000)
1312 gd_ia = 0xFF000000 | gd_ia;
1313
 // Top 8 bits of INTENSITYINC, sign-extended from bit 7
1314 gd_ca = (gouraud_add >> 24) & 0xFF;
1315 if (gd_ca & 0x00000080)
1316 gd_ca = 0xFFFFFF00 | gd_ca;
1317 }
1318
1319 // Bit comparitor fixing...
1320/* if (BCOMPEN)
1321 {
1322 // Determine the data flow direction...
1323 if (!DSTA2)
1324 a2_step_x /= (1 << ((REG(A2_FLAGS) >> 3) & 0x07));
1325 else
1326 ;//add this later
1327 }//*/
1328/* if (BCOMPEN)//Kludge for Hover Strike... !!! FIX !!!
1329 {
1330 // Determine the data flow direction...
1331 if (!DSTA2)
1332 a2_x <<= 3;
1333 }//*/
1334
1335#ifdef LOG_BLITS
1336 if (start_logging)
1337 {
1338 WriteLog("Blit!\n");
1339 WriteLog(" cmd = 0x%.8x\n",cmd);
1340 WriteLog(" a1_base = %08X\n", a1_addr);
1341 WriteLog(" a1_pitch = %d\n", a1_pitch);
1342 WriteLog(" a1_psize = %d\n", a1_psize);
1343 WriteLog(" a1_width = %d\n", a1_width);
1344 WriteLog(" a1_xadd = %f (phrase=%d)\n", (float)a1_xadd / 65536.0, a1_phrase_mode);
1345 WriteLog(" a1_yadd = %f\n", (float)a1_yadd / 65536.0);
1346 WriteLog(" a1_xstep = %f\n", (float)a1_step_x / 65536.0);
1347 WriteLog(" a1_ystep = %f\n", (float)a1_step_y / 65536.0);
1348 WriteLog(" a1_x = %f\n", (float)a1_x / 65536.0);
1349 WriteLog(" a1_y = %f\n", (float)a1_y / 65536.0);
1350 WriteLog(" a1_zoffs = %i\n",a1_zoffs);
1351
1352 WriteLog(" a2_base = %08X\n", a2_addr);
1353 WriteLog(" a2_pitch = %d\n", a2_pitch);
1354 WriteLog(" a2_psize = %d\n", a2_psize);
1355 WriteLog(" a2_width = %d\n", a2_width);
1356 WriteLog(" a2_xadd = %f (phrase=%d)\n", (float)a2_xadd / 65536.0, a2_phrase_mode);
1357 WriteLog(" a2_yadd = %f\n", (float)a2_yadd / 65536.0);
1358 WriteLog(" a2_xstep = %f\n", (float)a2_step_x / 65536.0);
1359 WriteLog(" a2_ystep = %f\n", (float)a2_step_y / 65536.0);
1360 WriteLog(" a2_x = %f\n", (float)a2_x / 65536.0);
1361 WriteLog(" a2_y = %f\n", (float)a2_y / 65536.0);
1362 WriteLog(" a2_mask_x= 0x%.4x\n",a2_mask_x);
1363 WriteLog(" a2_mask_y= 0x%.4x\n",a2_mask_y);
1364 WriteLog(" a2_zoffs = %i\n",a2_zoffs);
1365
1366 WriteLog(" count = %d x %d\n", n_pixels, n_lines);
1367
1368 WriteLog(" command = %08X\n", cmd);
1369 WriteLog(" dsten = %i\n",DSTEN);
1370 WriteLog(" srcen = %i\n",SRCEN);
1371 WriteLog(" patdsel = %i\n",PATDSEL);
1372 WriteLog(" color = 0x%.8x\n",REG(PATTERNDATA));
1373 WriteLog(" dcompen = %i\n",DCOMPEN);
1374 WriteLog(" bcompen = %i\n",BCOMPEN);
1375 WriteLog(" cmpdst = %i\n",CMPDST);
1376 WriteLog(" GOURZ = %i\n",GOURZ);
1377 WriteLog(" GOURD = %i\n",GOURD);
1378 WriteLog(" SRCSHADE= %i\n",SRCSHADE);
1379 }
1380#endif
1381
1382//NOTE: Pitch is ignored!
1383
1384//This *might* be the altimeter blits (they are)...
1385//On captured screen, x-pos for black (inner) is 259, for pink is 257
1386//Black is short by 3, pink is short by 1...
1387/*
1388Blit! (00110000 <- 000BF010) count: 9 x 31, A1/2_FLAGS: 000042E2/00010020 [cmd: 00010200]
1389 CMD -> src: dst: misc: a1ctl: UPDA1 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl:
1390 A1 -> pitch: 4 phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1391 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
1392 A1 x/y: 262/124, A2 x/y: 128/0
1393Blit! (00110000 <- 000BF010) count: 5 x 38, A1/2_FLAGS: 000042E2/00010020 [cmd: 00010200]
1394 CMD -> src: dst: misc: a1ctl: UPDA1 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl:
1395 A1 -> pitch: 4 phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1396 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
1397 A1 x/y: 264/117, A2 x/y: 407/0
1398
1399Blit! (00110000 <- 000BF010) count: 9 x 23, A1/2_FLAGS: 000042E2/00010020 [cmd: 00010200]
1400 CMD -> src: dst: misc: a1ctl: UPDA1 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl:
1401 A1 step values: -10 (X), 1 (Y)
1402 A1 -> pitch: 4(2) phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1403 A2 -> pitch: 1(0) phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
1404 A1 x/y: 262/132, A2 x/y: 129/0
1405Blit! (00110000 <- 000BF010) count: 5 x 27, A1/2_FLAGS: 000042E2/00010020 [cmd: 00010200]
1406 CMD -> src: dst: misc: a1ctl: UPDA1 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl:
1407 A1 step values: -8 (X), 1 (Y)
1408 A1 -> pitch: 4(2) phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1409 A2 -> pitch: 1(0) phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
1410 A1 x/y: 264/128, A2 x/y: 336/0
1411
1412 264v vCursor ends up here...
1413 xxxxx...`
1414 111122223333
1415
1416262v vCursor ends up here...
1417 xxxxxxxxx.'
1418 1111222233334444
1419
1420Fixed! Now for more:
1421
1422; This looks like the ship icon in the upper left corner...
1423
1424Blit! (00110000 <- 0010B2A8) count: 11 x 12, A1/2_FLAGS: 000042E2/00000020 [cmd: 09800609]
1425 CMD -> src: SRCEN dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: z-op: op: LFU_REPLACE ctrl: DCOMPEN
1426 A1 step values: -12 (X), 1 (Y)
1427 A2 step values: 0 (X), 0 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
1428 A1 -> pitch: 4 phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1429 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1430 A1 x/y: 20/24, A2 x/y: 5780/0
1431
1432Also fixed!
1433
1434More (not sure this is a blitter problem as much as it's a GPU problem):
1435All but the "M" are trashed...
1436This does *NOT* look like a blitter problem, as it's rendering properly...
1437Actually, if you look at the A1 step values, there IS a discrepancy!
1438
1439; D
1440
1441Blit! (00110000 <- 0010B2A8) count: 12 x 12, A1/2_FLAGS: 000042E2/00000020 [cmd: 09800609]
1442 CMD -> src: SRCEN dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: z-op: op: LFU_REPLACE ctrl: DCOMPEN
1443 A1 step values: -14 (X), 1 (Y)
1444 A2 step values: -4 (X), 0 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
1445 A1 -> pitch: 4 phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1446 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1447 A1 x/y: 134/144, A2 x/y: 2516/0
1448;129,146: +5,-2
1449
1450; E
1451
1452Blit! (00110000 <- 0010B2A8) count: 12 x 12, A1/2_FLAGS: 000042E2/00000020 [cmd: 09800609]
1453 CMD -> src: SRCEN dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: z-op: op: LFU_REPLACE ctrl: DCOMPEN
1454 A1 step values: -13 (X), 1 (Y)
1455 A2 step values: -4 (X), 0 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
1456 A1 -> pitch: 4 phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1457 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1458 A1 x/y: 147/144, A2 x/y: 2660/0
1459
1460; M
1461
1462Blit! (00110000 <- 0010B2A8) count: 12 x 12, A1/2_FLAGS: 000042E2/00000020 [cmd: 09800609]
1463 CMD -> src: SRCEN dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: z-op: op: LFU_REPLACE ctrl: DCOMPEN
1464 A1 step values: -12 (X), 1 (Y)
1465 A2 step values: 0 (X), 0 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
1466 A1 -> pitch: 4 phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1467 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1468 A1 x/y: 160/144, A2 x/y: 3764/0
1469
1470; O
1471
1472Blit! (00110000 <- 0010B2A8) count: 12 x 12, A1/2_FLAGS: 000042E2/00000020 [cmd: 09800609]
1473 CMD -> src: SRCEN dst: DSTEN misc: a1ctl: UPDA1 UPDA2 mode: ity: z-op: op: LFU_REPLACE ctrl: DCOMPEN
1474 A1 step values: -15 (X), 1 (Y)
1475 A2 step values: -4 (X), 0 (Y) [mask (unused): 00000000 - FFFFFFFF/FFFFFFFF]
1476 A1 -> pitch: 4 phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1477 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
1478 A1 x/y: 173/144, A2 x/y: 4052/0
1479
1480*/
1481//extern int op_start_log;
// Human-readable dump of the decoded blit, emitted only while blit_start_log is non-zero
1482if (blit_start_log)
1483{
1484 const char * ctrlStr[4] = { "XADDPHR\0", "XADDPIX\0", "XADD0\0", "XADDINC\0" };
1485 const char * bppStr[8] = { "1bpp\0", "2bpp\0", "4bpp\0", "8bpp\0", "16bpp\0", "32bpp\0", "???\0", "!!!\0" };
1486 const char * opStr[16] = { "LFU_CLEAR", "LFU_NSAND", "LFU_NSAD", "LFU_NOTS", "LFU_SAND", "LFU_NOTD", "LFU_N_SXORD", "LFU_NSORND",
1487 "LFU_SAD", "LFU_XOR", "LFU_D", "LFU_NSORD", "LFU_REPLACE", "LFU_SORND", "LFU_SORD", "LFU_ONE" };
 // This local 'mode' hides the 'mode' assigned at the top of the function; both
 // are computed from cmd with the same expression
1488 uint32_t /*src = cmd & 0x07, dst = (cmd >> 3) & 0x07, misc = (cmd >> 6) & 0x03,
1489 a1ctl = (cmd >> 8) & 0x07,*/ mode = (cmd >> 11) & 0x07/*, ity = (cmd >> 14) & 0x0F,
1490 zop = (cmd >> 18) & 0x07, op = (cmd >> 21) & 0x0F, ctrl = (cmd >> 25) & 0x3F*/;
1491 uint32_t a1f = REG(A1_FLAGS), a2f = REG(A2_FLAGS);
 // p = pitch bits, d = depth, zo = Z offset, w = raw width field, ac = add control bits
1492 uint32_t p1 = a1f & 0x07, p2 = a2f & 0x07,
1493 d1 = (a1f >> 3) & 0x07, d2 = (a2f >> 3) & 0x07,
1494 zo1 = (a1f >> 6) & 0x07, zo2 = (a2f >> 6) & 0x07,
1495 w1 = (a1f >> 9) & 0x3F, w2 = (a2f >> 9) & 0x3F,
1496 ac1 = (a1f >> 16) & 0x1F, ac2 = (a2f >> 16) & 0x1F;
 // Same mantissa/exponent width decode as a1_width/a2_width above
1497 uint32_t iw1 = ((0x04 | (w1 & 0x03)) << ((w1 & 0x3C) >> 2)) >> 2;
1498 uint32_t iw2 = ((0x04 | (w2 & 0x03)) << ((w2 & 0x3C) >> 2)) >> 2;
1499 WriteLog("Blit! (%08X %s %08X) count: %d x %d, A1/2_FLAGS: %08X/%08X [cmd: %08X]\n", a1_addr, (mode&0x01 ? "->" : "<-"), a2_addr, n_pixels, n_lines, a1f, a2f, cmd);
1500// WriteLog(" CMD -> src: %d, dst: %d, misc: %d, a1ctl: %d, mode: %d, ity: %1X, z-op: %d, op: %1X, ctrl: %02X\n", src, dst, misc, a1ctl, mode, ity, zop, op, ctrl);
1501
1502 WriteLog(" CMD -> src: %s%s%s ", (cmd & 0x0001 ? "SRCEN " : ""), (cmd & 0x0002 ? "SRCENZ " : ""), (cmd & 0x0004 ? "SRCENX" : ""));
1503 WriteLog("dst: %s%s%s ", (cmd & 0x0008 ? "DSTEN " : ""), (cmd & 0x0010 ? "DSTENZ " : ""), (cmd & 0x0020 ? "DSTWRZ" : ""));
1504 WriteLog("misc: %s%s ", (cmd & 0x0040 ? "CLIP_A1 " : ""), (cmd & 0x0080 ? "???" : ""));
1505 WriteLog("a1ctl: %s%s%s ", (cmd & 0x0100 ? "UPDA1F " : ""), (cmd & 0x0200 ? "UPDA1 " : ""), (cmd & 0x0400 ? "UPDA2" : ""));
1506 WriteLog("mode: %s%s%s ", (cmd & 0x0800 ? "DSTA2 " : ""), (cmd & 0x1000 ? "GOURD " : ""), (cmd & 0x2000 ? "GOURZ" : ""));
1507 WriteLog("ity: %s%s%s%s ", (cmd & 0x4000 ? "TOPBEN " : ""), (cmd & 0x8000 ? "TOPNEN " : ""), (cmd & 0x00010000 ? "PATDSEL" : ""), (cmd & 0x00020000 ? "ADDDSEL" : ""));
1508 WriteLog("z-op: %s%s%s ", (cmd & 0x00040000 ? "ZMODELT " : ""), (cmd & 0x00080000 ? "ZMODEEQ " : ""), (cmd & 0x00100000 ? "ZMODEGT" : ""));
1509 WriteLog("op: %s ", opStr[(cmd >> 21) & 0x0F]);
1510 WriteLog("ctrl: %s%s%s%s%s%s\n", (cmd & 0x02000000 ? "CMPDST " : ""), (cmd & 0x04000000 ? "BCOMPEN " : ""), (cmd & 0x08000000 ? "DCOMPEN " : ""), (cmd & 0x10000000 ? "BKGWREN " : ""), (cmd & 0x20000000 ? "BUSHI " : ""), (cmd & 0x40000000 ? "SRCSHADE" : ""));
1511
1512 if (UPDA1)
1513 WriteLog(" A1 step values: %d (X), %d (Y)\n", a1_step_x >> 16, a1_step_y >> 16);
1514
1515 if (UPDA2)
1516 WriteLog(" A2 step values: %d (X), %d (Y) [mask (%sused): %08X - %08X/%08X]\n", a2_step_x >> 16, a2_step_y >> 16, (a2f & 0x8000 ? "" : "un"), REG(A2_MASK), a2_mask_x, a2_mask_y);
1517
1518 WriteLog(" A1 -> pitch: %d phrases, depth: %s, z-off: %d, width: %d (%02X), addctl: %s %s %s %s\n", 1 << p1, bppStr[d1], zo1, iw1, w1, ctrlStr[ac1&0x03], (ac1&0x04 ? "YADD1" : "YADD0"), (ac1&0x08 ? "XSIGNSUB" : "XSIGNADD"), (ac1&0x10 ? "YSIGNSUB" : "YSIGNADD"));
1519 WriteLog(" A2 -> pitch: %d phrases, depth: %s, z-off: %d, width: %d (%02X), addctl: %s %s %s %s\n", 1 << p2, bppStr[d2], zo2, iw2, w2, ctrlStr[ac2&0x03], (ac2&0x04 ? "YADD1" : "YADD0"), (ac2&0x08 ? "XSIGNSUB" : "XSIGNADD"), (ac2&0x10 ? "YSIGNSUB" : "YSIGNADD"));
1520 WriteLog(" A1 x/y: %d/%d, A2 x/y: %d/%d Pattern: %08X%08X SRCDATA: %08X%08X\n", a1_x >> 16, a1_y >> 16, a2_x >> 16, a2_y >> 16, REG(PATTERNDATA), REG(PATTERNDATA + 4), REG(SRCDATA), REG(SRCDATA + 4));
1521// blit_start_log = 0;
1522// op_start_log = 1;
1523}
1524
 // blitter_working is held at 1 for the duration of the blitter_generic() call
1525 blitter_working = 1;
1526//#ifndef USE_GENERIC_BLITTER
1527// if (!blitter_execute_cached_code(blitter_in_cache(cmd)))
1528//#endif
1529 blitter_generic(cmd);
1530
1531/*if (blit_start_log)
1532{
1533 if (a1_addr == 0xF03000 && a2_addr == 0x004D58)
1534 {
1535 WriteLog("\nBytes at 004D58:\n");
1536 for(int i=0x004D58; i<0x004D58+(10*127*4); i++)
1537 WriteLog("%02X ", JaguarReadByte(i));
1538 WriteLog("\nBytes at F03000:\n");
1539 for(int i=0xF03000; i<0xF03000+(6*127*4); i++)
1540 WriteLog("%02X ", JaguarReadByte(i));
1541 WriteLog("\n\n");
1542 }
1543}//*/
1544
1545 blitter_working = 0;
1546}
1547#endif // of the #if 0 near the top...
1548/*******************************************************************************
1549********************** STUFF CUT ABOVE THIS LINE! ******************************
1550*******************************************************************************/
1551
1552
1553void BlitterInit(void)
1554{
1555 BlitterReset();
1556}
1557
1558
1559void BlitterReset(void)
1560{
1561 memset(blitter_ram, 0x00, 0xA0);
1562}
1563
1564
1565void BlitterDone(void)
1566{
1567 WriteLog("BLIT: Done.\n");
1568}
1569
1570
1571uint8_t BlitterReadByte(uint32_t offset, uint32_t who/*=UNKNOWN*/)
1572{
1573 offset &= 0xFF;
1574
1575 // status register
1576//This isn't cycle accurate--how to fix? !!! FIX !!!
1577//Probably have to do some multi-threaded implementation or at least a reentrant safe implementation...
1578//Real hardware returns $00000805, just like the JTRM says.
1579 if (offset == (0x38 + 0))
1580 return 0x00;
1581 if (offset == (0x38 + 1))
1582 return 0x00;
1583 if (offset == (0x38 + 2))
1584 return 0x08;
1585 if (offset == (0x38 + 3))
1586 return 0x05; // always idle/never stopped (collision detection ignored!)
1587
1588// CHECK HERE ONCE THIS FIX HAS BEEN TESTED: [X]
1589//Fix for AvP:
1590 if (offset >= 0x04 && offset <= 0x07)
1591//This is it. I wonder if it just ignores the lower three bits?
1592//No, this is a documented Jaguar I bug. It also bites the read at $F02230 as well...
1593 return blitter_ram[offset + 0x08]; // A1_PIXEL ($F0220C) read at $F02204
1594
1595 if (offset >= 0x2C && offset <= 0x2F)
1596 return blitter_ram[offset + 0x04]; // A2_PIXEL ($F02230) read at $F0222C
1597
1598 return blitter_ram[offset];
1599}
1600
1601
1602//Crappy!
1603uint16_t BlitterReadWord(uint32_t offset, uint32_t who/*=UNKNOWN*/)
1604{
1605 return ((uint16_t)BlitterReadByte(offset, who) << 8) | (uint16_t)BlitterReadByte(offset+1, who);
1606}
1607
1608
1609//Crappy!
1610uint32_t BlitterReadLong(uint32_t offset, uint32_t who/*=UNKNOWN*/)
1611{
1612 return (BlitterReadWord(offset, who) << 16) | BlitterReadWord(offset+2, who);
1613}
1614
1615
1616void BlitterWriteByte(uint32_t offset, uint8_t data, uint32_t who/*=UNKNOWN*/)
1617{
1618/*if (offset & 0xFF == 0x7B)
1619 WriteLog("--> Wrote to B_STOP: value -> %02X\n", data);*/
1620 offset &= 0xFF;
1621/*if ((offset >= PATTERNDATA) && (offset < PATTERNDATA + 8))
1622{
1623 printf("--> %s wrote %02X to byte %u of PATTERNDATA...\n", whoName[who], data, offset - PATTERNDATA);
1624 fflush(stdout);
1625}//*/
1626
1627 // This handles writes to INTENSITY0-3 by also writing them to their proper places in
1628 // PATTERNDATA & SOURCEDATA (should do the same for the Z registers! !!! FIX !!! [DONE])
1629 if ((offset >= 0x7C) && (offset <= 0x9B))
1630 {
1631 switch (offset)
1632 {
1633 // INTENSITY registers 0-3
1634 case 0x7C: break;
1635 case 0x7D: blitter_ram[PATTERNDATA + 7] = data; break;
1636 case 0x7E: blitter_ram[SRCDATA + 6] = data; break;
1637 case 0x7F: blitter_ram[SRCDATA + 7] = data; break;
1638
1639 case 0x80: break;
1640 case 0x81: blitter_ram[PATTERNDATA + 5] = data; break;
1641 case 0x82: blitter_ram[SRCDATA + 4] = data; break;
1642 case 0x83: blitter_ram[SRCDATA + 5] = data; break;
1643
1644 case 0x84: break;
1645 case 0x85: blitter_ram[PATTERNDATA + 3] = data; break;
1646 case 0x86: blitter_ram[SRCDATA + 2] = data; break;
1647 case 0x87: blitter_ram[SRCDATA + 3] = data; break;
1648
1649 case 0x88: break;
1650 case 0x89: blitter_ram[PATTERNDATA + 1] = data; break;
1651 case 0x8A: blitter_ram[SRCDATA + 0] = data; break;
1652 case 0x8B: blitter_ram[SRCDATA + 1] = data; break;
1653
1654
1655 // Z registers 0-3
1656 case 0x8C: blitter_ram[SRCZINT + 6] = data; break;
1657 case 0x8D: blitter_ram[SRCZINT + 7] = data; break;
1658 case 0x8E: blitter_ram[SRCZFRAC + 6] = data; break;
1659 case 0x8F: blitter_ram[SRCZFRAC + 7] = data; break;
1660
1661 case 0x90: blitter_ram[SRCZINT + 4] = data; break;
1662 case 0x91: blitter_ram[SRCZINT + 5] = data; break;
1663 case 0x92: blitter_ram[SRCZFRAC + 4] = data; break;
1664 case 0x93: blitter_ram[SRCZFRAC + 5] = data; break;
1665
1666 case 0x94: blitter_ram[SRCZINT + 2] = data; break;
1667 case 0x95: blitter_ram[SRCZINT + 3] = data; break;
1668 case 0x96: blitter_ram[SRCZFRAC + 2] = data; break;
1669 case 0x97: blitter_ram[SRCZFRAC + 3] = data; break;
1670
1671 case 0x98: blitter_ram[SRCZINT + 0] = data; break;
1672 case 0x99: blitter_ram[SRCZINT + 1] = data; break;
1673 case 0x9A: blitter_ram[SRCZFRAC + 0] = data; break;
1674 case 0x9B: blitter_ram[SRCZFRAC + 1] = data; break;
1675 }
1676 }
1677
1678 // It looks weird, but this is how the 64 bit registers are actually handled...!
1679
1680 else if ((offset >= SRCDATA + 0) && (offset <= SRCDATA + 3)
1681 || (offset >= DSTDATA + 0) && (offset <= DSTDATA + 3)
1682 || (offset >= DSTZ + 0) && (offset <= DSTZ + 3)
1683 || (offset >= SRCZINT + 0) && (offset <= SRCZINT + 3)
1684 || (offset >= SRCZFRAC + 0) && (offset <= SRCZFRAC + 3)
1685 || (offset >= PATTERNDATA + 0) && (offset <= PATTERNDATA + 3))
1686 {
1687 blitter_ram[offset + 4] = data;
1688 }
1689 else if ((offset >= SRCDATA + 4) && (offset <= SRCDATA + 7)
1690 || (offset >= DSTDATA + 4) && (offset <= DSTDATA + 7)
1691 || (offset >= DSTZ + 4) && (offset <= DSTZ + 7)
1692 || (offset >= SRCZINT + 4) && (offset <= SRCZINT + 7)
1693 || (offset >= SRCZFRAC + 4) && (offset <= SRCZFRAC + 7)
1694 || (offset >= PATTERNDATA + 4) && (offset <= PATTERNDATA + 7))
1695 {
1696 blitter_ram[offset - 4] = data;
1697 }
1698 else
1699 blitter_ram[offset] = data;
1700}
1701
1702
1703void BlitterWriteWord(uint32_t offset, uint16_t data, uint32_t who/*=UNKNOWN*/)
1704{
1705/*if (((offset & 0xFF) >= PATTERNDATA) && ((offset & 0xFF) < PATTERNDATA + 8))
1706{
1707 printf("----> %s wrote %04X to byte %u of PATTERNDATA...\n", whoName[who], data, offset - (0xF02200 + PATTERNDATA));
1708 fflush(stdout);
1709}*/
1710//#if 1
1711/* if (offset & 0xFF == A1_PIXEL && data == 14368)
1712 {
1713 WriteLog("\n1\nA1_PIXEL written by %s (%u)...\n\n\n", whoName[who], data);
1714extern bool doGPUDis;
1715doGPUDis = true;
1716 }
1717 if ((offset & 0xFF) == (A1_PIXEL + 2) && data == 14368)
1718 {
1719 WriteLog("\n2\nA1_PIXEL written by %s (%u)...\n\n\n", whoName[who], data);
1720extern bool doGPUDis;
1721doGPUDis = true;
1722 }//*/
1723//#endif
1724
1725 BlitterWriteByte(offset + 0, data >> 8, who);
1726 BlitterWriteByte(offset + 1, data & 0xFF, who);
1727
1728 if ((offset & 0xFF) == 0x3A)
1729 // I.e., the second write of 32-bit value--not convinced this is the best way to do this!
1730 // But then again, according to the Jaguar docs, this is correct...!
1731/*extern int blit_start_log;
1732extern bool doGPUDis;
1733if (blit_start_log)
1734{
1735 WriteLog("BLIT: Blitter started by %s...\n", whoName[who]);
1736 doGPUDis = true;
1737}//*/
1738#ifndef USE_BOTH_BLITTERS
1739#ifdef USE_ORIGINAL_BLITTER
1740 blitter_blit(GET32(blitter_ram, 0x38));
1741#endif
1742#ifdef USE_MIDSUMMER_BLITTER
1743 BlitterMidsummer(GET32(blitter_ram, 0x38));
1744#endif
1745#ifdef USE_MIDSUMMER_BLITTER_MKII
1746 BlitterMidsummer2();
1747#endif
1748#else
1749 {
1750 if (vjs.useFastBlitter)
1751 blitter_blit(GET32(blitter_ram, 0x38));
1752 else
1753 BlitterMidsummer2();
1754 }
1755#endif
1756}
1757//F02278,9,A,B
1758
1759
1760void BlitterWriteLong(uint32_t offset, uint32_t data, uint32_t who/*=UNKNOWN*/)
1761{
1762/*if (((offset & 0xFF) >= PATTERNDATA) && ((offset & 0xFF) < PATTERNDATA + 8))
1763{
1764 printf("------> %s wrote %08X to byte %u of PATTERNDATA...\n", whoName[who], data, offset - (0xF02200 + PATTERNDATA));
1765 fflush(stdout);
1766}//*/
1767//#if 1
1768/* if ((offset & 0xFF) == A1_PIXEL && (data & 0xFFFF) == 14368)
1769 {
1770 WriteLog("\n3\nA1_PIXEL written by %s (%u)...\n\n\n", whoName[who], data);
1771extern bool doGPUDis;
1772doGPUDis = true;
1773 }//*/
1774//#endif
1775
1776 BlitterWriteWord(offset + 0, data >> 16, who);
1777 BlitterWriteWord(offset + 2, data & 0xFFFF, who);
1778}
1779
1780
1781void LogBlit(void)
1782{
1783 const char * opStr[16] = { "LFU_CLEAR", "LFU_NSAND", "LFU_NSAD", "LFU_NOTS", "LFU_SAND", "LFU_NOTD", "LFU_N_SXORD", "LFU_NSORND",
1784 "LFU_SAD", "LFU_XOR", "LFU_D", "LFU_NSORD", "LFU_REPLACE", "LFU_SORND", "LFU_SORD", "LFU_ONE" };
1785 uint32_t cmd = GET32(blitter_ram, 0x38);
1786 uint32_t m = (REG(A1_FLAGS) >> 9) & 0x03, e = (REG(A1_FLAGS) >> 11) & 0x0F;
1787 uint32_t a1_width = ((0x04 | m) << e) >> 2;
1788 m = (REG(A2_FLAGS) >> 9) & 0x03, e = (REG(A2_FLAGS) >> 11) & 0x0F;
1789 uint32_t a2_width = ((0x04 | m) << e) >> 2;
1790
1791 WriteLog("Blit!\n");
1792 WriteLog(" COMMAND = %08X\n", cmd);
1793 WriteLog(" a1_base = %08X\n", REG(A1_BASE));
1794 WriteLog(" a1_flags = %08X (%c %c %c %c%c . %c%c%c%c%c%c %c%c%c %c%c%c . %c%c)\n", REG(A1_FLAGS),
1795 (REG(A1_FLAGS) & 0x100000 ? '1' : '0'),
1796 (REG(A1_FLAGS) & 0x080000 ? '1' : '0'),
1797 (REG(A1_FLAGS) & 0x040000 ? '1' : '0'),
1798 (REG(A1_FLAGS) & 0x020000 ? '1' : '0'),
1799 (REG(A1_FLAGS) & 0x010000 ? '1' : '0'),
1800 (REG(A1_FLAGS) & 0x004000 ? '1' : '0'),
1801 (REG(A1_FLAGS) & 0x002000 ? '1' : '0'),
1802 (REG(A1_FLAGS) & 0x001000 ? '1' : '0'),
1803 (REG(A1_FLAGS) & 0x000800 ? '1' : '0'),
1804 (REG(A1_FLAGS) & 0x000400 ? '1' : '0'),
1805 (REG(A1_FLAGS) & 0x000200 ? '1' : '0'),
1806 (REG(A1_FLAGS) & 0x000100 ? '1' : '0'),
1807 (REG(A1_FLAGS) & 0x000080 ? '1' : '0'),
1808 (REG(A1_FLAGS) & 0x000040 ? '1' : '0'),
1809 (REG(A1_FLAGS) & 0x000020 ? '1' : '0'),
1810 (REG(A1_FLAGS) & 0x000010 ? '1' : '0'),
1811 (REG(A1_FLAGS) & 0x000008 ? '1' : '0'),
1812 (REG(A1_FLAGS) & 0x000002 ? '1' : '0'),
1813 (REG(A1_FLAGS) & 0x000001 ? '1' : '0'));
1814 WriteLog(" pitch=%u, pixSz=%u, zOff=%u, width=%u, xCtrl=%u\n",
1815 REG(A1_FLAGS) & 0x00003, (REG(A1_FLAGS) & 0x00038) >> 3,
1816 (REG(A1_FLAGS) & 0x001C0) >> 6, a1_width, (REG(A1_FLAGS) & 0x30000) >> 16);
1817 WriteLog(" a1_clip = %u, %u (%08X)\n", GET16(blitter_ram, A1_CLIP + 2), GET16(blitter_ram, A1_CLIP + 0), GET32(blitter_ram, A1_CLIP));
1818 WriteLog(" a1_pixel = %d, %d (%08X)\n", (int16_t)GET16(blitter_ram, A1_PIXEL + 2), (int16_t)GET16(blitter_ram, A1_PIXEL + 0), GET32(blitter_ram, A1_PIXEL));
1819 WriteLog(" a1_step = %d, %d (%08X)\n", (int16_t)GET16(blitter_ram, A1_STEP + 2), (int16_t)GET16(blitter_ram, A1_STEP + 0), GET32(blitter_ram, A1_STEP));
1820 WriteLog(" a1_fstep = %u, %u (%08X)\n", GET16(blitter_ram, A1_FSTEP + 2), GET16(blitter_ram, A1_FSTEP + 0), GET32(blitter_ram, A1_FSTEP));
1821 WriteLog(" a1_fpixel= %u, %u (%08X)\n", GET16(blitter_ram, A1_FPIXEL + 2), GET16(blitter_ram, A1_FPIXEL + 0), GET32(blitter_ram, A1_FPIXEL));
1822 WriteLog(" a1_inc = %d, %d (%08X)\n", (int16_t)GET16(blitter_ram, A1_INC + 2), (int16_t)GET16(blitter_ram, A1_INC + 0), GET32(blitter_ram, A1_INC));
1823 WriteLog(" a1_finc = %u, %u (%08X)\n", GET16(blitter_ram, A1_FINC + 2), GET16(blitter_ram, A1_FINC + 0), GET32(blitter_ram, A1_FINC));
1824
1825 WriteLog(" a2_base = %08X\n", REG(A2_BASE));
1826 WriteLog(" a2_flags = %08X (%c %c %c %c%c %c %c%c%c%c%c%c %c%c%c %c%c%c . %c%c)\n", REG(A2_FLAGS),
1827 (REG(A2_FLAGS) & 0x100000 ? '1' : '0'),
1828 (REG(A2_FLAGS) & 0x080000 ? '1' : '0'),
1829 (REG(A2_FLAGS) & 0x040000 ? '1' : '0'),
1830 (REG(A2_FLAGS) & 0x020000 ? '1' : '0'),
1831 (REG(A2_FLAGS) & 0x010000 ? '1' : '0'),
1832 (REG(A2_FLAGS) & 0x008000 ? '1' : '0'),
1833 (REG(A2_FLAGS) & 0x004000 ? '1' : '0'),
1834 (REG(A2_FLAGS) & 0x002000 ? '1' : '0'),
1835 (REG(A2_FLAGS) & 0x001000 ? '1' : '0'),
1836 (REG(A2_FLAGS) & 0x000800 ? '1' : '0'),
1837 (REG(A2_FLAGS) & 0x000400 ? '1' : '0'),
1838 (REG(A2_FLAGS) & 0x000200 ? '1' : '0'),
1839 (REG(A2_FLAGS) & 0x000100 ? '1' : '0'),
1840 (REG(A2_FLAGS) & 0x000080 ? '1' : '0'),
1841 (REG(A2_FLAGS) & 0x000040 ? '1' : '0'),
1842 (REG(A2_FLAGS) & 0x000020 ? '1' : '0'),
1843 (REG(A2_FLAGS) & 0x000010 ? '1' : '0'),
1844 (REG(A2_FLAGS) & 0x000008 ? '1' : '0'),
1845 (REG(A2_FLAGS) & 0x000002 ? '1' : '0'),
1846 (REG(A2_FLAGS) & 0x000001 ? '1' : '0'));
1847 WriteLog(" pitch=%u, pixSz=%u, zOff=%u, width=%u, xCtrl=%u\n",
1848 REG(A2_FLAGS) & 0x00003, (REG(A2_FLAGS) & 0x00038) >> 3,
1849 (REG(A2_FLAGS) & 0x001C0) >> 6, a2_width, (REG(A2_FLAGS) & 0x30000) >> 16);
1850 WriteLog(" a2_mask = %u, %u (%08X)\n", GET16(blitter_ram, A2_MASK + 2), GET16(blitter_ram, A2_MASK + 0), GET32(blitter_ram, A2_MASK));
1851 WriteLog(" a2_pixel = %d, %d (%08X)\n", (int16_t)GET16(blitter_ram, A2_PIXEL + 2), (int16_t)GET16(blitter_ram, A2_PIXEL + 0), GET32(blitter_ram, A2_PIXEL));
1852 WriteLog(" a2_step = %d, %d (%08X)\n", (int16_t)GET16(blitter_ram, A2_STEP + 2), (int16_t)GET16(blitter_ram, A2_STEP + 0), GET32(blitter_ram, A2_STEP));
1853
1854 WriteLog(" count = %d x %d\n", GET16(blitter_ram, PIXLINECOUNTER + 2), GET16(blitter_ram, PIXLINECOUNTER));
1855
1856 WriteLog(" SRCEN = %s\n", (SRCEN ? "1" : "0"));
1857 WriteLog(" SRCENZ = %s\n", (SRCENZ ? "1" : "0"));
1858 WriteLog(" SRCENX = %s\n", (SRCENX ? "1" : "0"));
1859 WriteLog(" DSTEN = %s\n", (DSTEN ? "1" : "0"));
1860 WriteLog(" DSTENZ = %s\n", (DSTENZ ? "1" : "0"));
1861 WriteLog(" DSTWRZ = %s\n", (DSTWRZ ? "1" : "0"));
1862 WriteLog(" CLIPA1 = %s\n", (CLIPA1 ? "1" : "0"));
1863 WriteLog(" UPDA1F = %s\n", (UPDA1F ? "1" : "0"));
1864 WriteLog(" UPDA1 = %s\n", (UPDA1 ? "1" : "0"));
1865 WriteLog(" UPDA2 = %s\n", (UPDA2 ? "1" : "0"));
1866 WriteLog(" DSTA2 = %s\n", (DSTA2 ? "1" : "0"));
1867 WriteLog(" ZOP = %s %s %s\n", (Z_OP_INF ? "<" : ""), (Z_OP_EQU ? "=" : ""), (Z_OP_SUP ? ">" : ""));
1868 WriteLog("+-LFUFUNC = %s\n", opStr[(cmd >> 21) & 0x0F]);
1869 WriteLog("| PATDSEL = %s (PD=%08X%08X)\n", (PATDSEL ? "1" : "0"), REG(PATTERNDATA), REG(PATTERNDATA + 4));
1870 WriteLog("+-ADDDSEL = %s\n", (ADDDSEL ? "1" : "0"));
1871 WriteLog(" CMPDST = %s\n", (CMPDST ? "1" : "0"));
1872 WriteLog(" BCOMPEN = %s\n", (BCOMPEN ? "1" : "0"));
1873 WriteLog(" DCOMPEN = %s\n", (DCOMPEN ? "1" : "0"));
1874 WriteLog(" TOPBEN = %s\n", (TOPBEN ? "1" : "0"));
1875 WriteLog(" TOPNEN = %s\n", (TOPNEN ? "1" : "0"));
1876 WriteLog(" BKGWREN = %s\n", (BKGWREN ? "1" : "0"));
1877 WriteLog(" GOURD = %s (II=%08X, SD=%08X%08X)\n", (GOURD ? "1" : "0"), REG(INTENSITYINC), REG(SRCDATA), REG(SRCDATA + 4));
1878 WriteLog(" GOURZ = %s (ZI=%08X, ZD=%08X%08X, SZ1=%08X%08X, SZ2=%08X%08X)\n", (GOURZ ? "1" : "0"), REG(ZINC), REG(DSTZ), REG(DSTZ + 4),
1879 REG(SRCZINT), REG(SRCZINT + 4), REG(SRCZFRAC), REG(SRCZFRAC + 4));
1880 WriteLog(" SRCSHADE = %s\n", (SRCSHADE ? "1" : "0"));
1881}
1882
1883
1884#ifdef USE_MIDSUMMER_BLITTER
1885//
1886// Here's an attempt to write a blitter that conforms to the Midsummer specs--since
1887// it's supposedly backwards compatible, it should work well...
1888//
1889//#define LOG_BLITTER_MEMORY_ACCESSES
1890
1891#define DATINIT (false)
1892#define TXTEXT (false)
1893#define POLYGON (false)
1894
1895void BlitterMidsummer(uint32_t cmd)
1896{
1897#ifdef LOG_BLITS
1898 LogBlit();
1899#endif
1900uint32_t outer_loop, inner_loop, a1_addr, a2_addr;
1901int32_t a1_x, a1_y, a2_x, a2_y, a1_width, a2_width;
1902uint8_t a1_phrase_mode, a2_phrase_mode;
1903
1904 a1_addr = REG(A1_BASE) & 0xFFFFFFF8;
1905 a2_addr = REG(A2_BASE) & 0xFFFFFFF8;
1906 a1_x = (REG(A1_PIXEL) << 16) | (REG(A1_FPIXEL) & 0xFFFF);
1907 a1_y = (REG(A1_PIXEL) & 0xFFFF0000) | (REG(A1_FPIXEL) >> 16);
1908 uint32_t m = (REG(A1_FLAGS) >> 9) & 0x03, e = (REG(A1_FLAGS) >> 11) & 0x0F;
1909 a1_width = ((0x04 | m) << e) >> 2;//*/
1910 a2_x = (REG(A2_PIXEL) & 0x0000FFFF) << 16;
1911 a2_y = (REG(A2_PIXEL) & 0xFFFF0000);
1912 m = (REG(A2_FLAGS) >> 9) & 0x03, e = (REG(A2_FLAGS) >> 11) & 0x0F;
1913 a2_width = ((0x04 | m) << e) >> 2;//*/
1914
1915 a1_phrase_mode = a2_phrase_mode = 0;
1916
1917 if ((blitter_ram[A1_FLAGS + 1] & 0x03) == 0)
1918 a1_phrase_mode = 1;
1919
1920 if ((blitter_ram[A2_FLAGS + 1] & 0x03) == 0)
1921 a2_phrase_mode = 1;
1922
1923#define INNER0 (inner_loop == 0)
1924#define OUTER0 (outer_loop == 0)
1925
1926// $01800005 has SRCENX, may have to investigate further...
1927// $00011008 has GOURD & DSTEN.
1928// $41802F41 has SRCSHADE, CLIPA1
1929/*bool logBlit = false;
1930if (cmd != 0x00010200 && cmd != 0x01800001 && cmd != 0x01800005
1931 && cmd != 0x00011008 && cmd !=0x41802F41)
1932{
1933 logBlit = true;
1934 LogBlit();
1935}//*/
1936
1937 uint64_t srcData = GET64(blitter_ram, SRCDATA), srcXtraData,
1938 dstData = GET64(blitter_ram, DSTDATA), writeData;
1939 uint32_t srcAddr, dstAddr;
1940 uint8_t bitCount, a1PixelSize, a2PixelSize;
1941
1942 // JTRM says phrase mode only works for 8BPP or higher, so let's try this...
1943 uint32_t phraseOffset[8] = { 8, 8, 8, 8, 4, 2, 0, 0 };
1944 uint8_t pixelShift[8] = { 3, 2, 1, 0, 1, 2, 0, 0 };
1945
1946 a1PixelSize = (blitter_ram[A1_FLAGS + 3] >> 3) & 0x07;
1947 a2PixelSize = (blitter_ram[A2_FLAGS + 3] >> 3) & 0x07;
1948
1949 outer_loop = GET16(blitter_ram, PIXLINECOUNTER + 0);
1950
1951 if (outer_loop == 0)
1952 outer_loop = 0x10000;
1953
1954 // We just list the states here and jump from state to state in order to
1955 // keep things somewhat clear. Optimization/cleanups later.
1956
1957//idle: // Blitter is idle, and will not perform any bus activity
1958/*
1959idle Blitter is off the bus, and no activity takes place.
1960if GO if DATINIT goto init_if
1961 else goto inner
1962*/
1963 if (DATINIT)
1964 goto init_if;
1965 else
1966 goto inner;
1967
1968/*
1969inner Inner loop is active, read and write cycles are performed
1970*/
1971inner: // Run inner loop state machine (asserts step from its idle state)
1972 inner_loop = GET16(blitter_ram, PIXLINECOUNTER + 2);
1973
1974 if (inner_loop == 0)
1975 inner_loop = 0x10000;
1976
1977/*
1978------------------------------
1979idle: Inactive, blitter is idle or passing round outer loop
1980idle Another state in the outer loop is active. No bus transfers are performed.
1981if STEP
1982 if SRCENX goto sreadx
1983 else if TXTEXT goto txtread
1984 else if SRCEN goto sread
1985 else if DSTEN goto dread
1986 else if DSTENZ goto dzread
1987 else goto dwrite
1988*/
1989 if (SRCENX)
1990 goto sreadx;
1991 else if (TXTEXT)
1992 goto txtread;
1993 else if (SRCEN)
1994 goto sread;
1995 else if (DSTEN)
1996 goto dread;
1997 else if (DSTENZ)
1998 goto dzread;
1999 else
2000 goto dwrite;
2001
2002/*
2003sreadx Extra source data read at the start of an inner loop pass.
2004if STEP
2005 if SRCENZ goto szreadx
2006 else if TXTEXT goto txtread
2007 else if SRCEN goto sread
2008 else if DSTEN goto dread
2009 else if DSTENZ goto dzread
2010 else goto dwrite
2011*/
2012sreadx: // Extra source data read
2013 if (SRCENZ)
2014 goto szreadx;
2015 else if (TXTEXT)
2016 goto txtread;
2017 else if (SRCEN)
2018 goto sread;
2019 else if (DSTEN)
2020 goto dread;
2021 else if (DSTENZ)
2022 goto dzread;
2023 else
2024 goto dwrite;
2025
2026/*
2027szreadx Extra source Z read as the start of an inner loop pass.
2028if STEP
2029 if TXTEXT goto txtread
2030 else goto sread
2031*/
2032szreadx: // Extra source Z read
2033 if (TXTEXT)
2034 goto txtread;
2035 else
2036 goto sread;
2037
2038/*
2039txtread Read texture data from external memory. This state is only used for external texture.
2040 TEXTEXT is the condition TEXTMODE=1.
2041if STEP
2042 if SRCEN goto sread
2043 else if DSTEN goto dread
2044 else if DSTENZ goto dzread
2045 else goto dwrite
2046*/
2047txtread: // Read external texture data
2048 if (SRCEN)
2049 goto sread;
2050 else if (DSTEN)
2051 goto dread;
2052 else if (DSTENZ)
2053 goto dzread;
2054 else
2055 goto dwrite;
2056
2057/*
2058sread Source data read.
2059if STEP
2060 if SRCENZ goto szread
2061 else if DSTEN goto dread
2062 else if DSTENZ goto dzread
2063 else goto dwrite
2064*/
2065sread: // Source data read
2066//The JTRM doesn't really specify the internal structure of the source data read, but I would
2067//imagine that if it's in phrase mode that it starts by reading the phrase that the window is
2068//pointing at. Likewise, the pixel (if in BPP 1, 2 & 4, chopped) otherwise. It probably still
2069//transfers an entire phrase even in pixel mode.
2070//Odd thought: Does it expand, e.g., 1 BPP pixels into 32 BPP internally? Hmm...
2071//No.
2072/*
2073 a1_addr = REG(A1_BASE) & 0xFFFFFFF8;
2074 a2_addr = REG(A2_BASE) & 0xFFFFFFF8;
2075 a1_zoffs = (REG(A1_FLAGS) >> 6) & 7;
2076 a2_zoffs = (REG(A2_FLAGS) >> 6) & 7;
2077 xadd_a1_control = (REG(A1_FLAGS) >> 16) & 0x03;
2078 xadd_a2_control = (REG(A2_FLAGS) >> 16) & 0x03;
2079 a1_pitch = pitchValue[(REG(A1_FLAGS) & 0x03)];
2080 a2_pitch = pitchValue[(REG(A2_FLAGS) & 0x03)];
2081 n_pixels = REG(PIXLINECOUNTER) & 0xFFFF;
2082 n_lines = (REG(PIXLINECOUNTER) >> 16) & 0xFFFF;
2083 a1_x = (REG(A1_PIXEL) << 16) | (REG(A1_FPIXEL) & 0xFFFF);
2084 a1_y = (REG(A1_PIXEL) & 0xFFFF0000) | (REG(A1_FPIXEL) >> 16);
2085 a2_psize = 1 << ((REG(A2_FLAGS) >> 3) & 0x07);
2086 a1_psize = 1 << ((REG(A1_FLAGS) >> 3) & 0x07);
2087 a1_phrase_mode = 0;
2088 a2_phrase_mode = 0;
2089 a1_width = ((0x04 | m) << e) >> 2;
2090 a2_width = ((0x04 | m) << e) >> 2;
2091
2092 // write values back to registers
2093 WREG(A1_PIXEL, (a1_y & 0xFFFF0000) | ((a1_x >> 16) & 0xFFFF));
2094 WREG(A1_FPIXEL, (a1_y << 16) | (a1_x & 0xFFFF));
2095 WREG(A2_PIXEL, (a2_y & 0xFFFF0000) | ((a2_x >> 16) & 0xFFFF));
2096*/
2097 // Calculate the address to be read...
2098
//Need to fix phrase mode calcs here, since they should *step* by eight, not multiply.
2100//Also, need to fix various differing BPP modes here, since offset won't be correct except
2101//for 8BPP. !!! FIX !!!
2102 srcAddr = (DSTA2 ? a1_addr : a2_addr);
2103
2104/* if ((DSTA2 ? a1_phrase_mode : a2_phrase_mode) == 1)
2105 {
2106 srcAddr += (((DSTA2 ? a1_x : a2_x) >> 16)
2107 + (((DSTA2 ? a1_y : a2_y) >> 16) * (DSTA2 ? a1_width : a2_width)));
2108 }
2109 else*/
2110 {
2111// uint32_t pixAddr = ((DSTA2 ? a1_x : a2_x) >> 16)
2112// + (((DSTA2 ? a1_y : a2_y) >> 16) * (DSTA2 ? a1_width : a2_width));
2113 int32_t pixAddr = (int16_t)((DSTA2 ? a1_x : a2_x) >> 16)
2114 + ((int16_t)((DSTA2 ? a1_y : a2_y) >> 16) * (DSTA2 ? a1_width : a2_width));
2115
2116 if ((DSTA2 ? a1PixelSize : a2PixelSize) < 3)
2117 pixAddr >>= pixelShift[(DSTA2 ? a1PixelSize : a2PixelSize)];
2118 else if ((DSTA2 ? a1PixelSize : a2PixelSize) > 3)
2119 pixAddr <<= pixelShift[(DSTA2 ? a1PixelSize : a2PixelSize)];
2120
2121 srcAddr += pixAddr;
2122 }
2123
2124 // And read it!
2125
2126 if ((DSTA2 ? a1_phrase_mode : a2_phrase_mode) == 1)
2127 {
2128 srcData = ((uint64_t)JaguarReadLong(srcAddr, BLITTER) << 32)
2129 | (uint64_t)JaguarReadLong(srcAddr + 4, BLITTER);
2130 }
2131 else
2132 {
2133//1,2,&4BPP are wrong here... !!! FIX !!!
2134 if ((DSTA2 ? a1PixelSize : a2PixelSize) == 0) // 1 BPP
2135 srcData = JaguarReadByte(srcAddr, BLITTER);
2136 if ((DSTA2 ? a1PixelSize : a2PixelSize) == 1) // 2 BPP
2137 srcData = JaguarReadByte(srcAddr, BLITTER);
2138 if ((DSTA2 ? a1PixelSize : a2PixelSize) == 2) // 4 BPP
2139 srcData = JaguarReadByte(srcAddr, BLITTER);
2140 if ((DSTA2 ? a1PixelSize : a2PixelSize) == 3) // 8 BPP
2141 srcData = JaguarReadByte(srcAddr, BLITTER);
2142 if ((DSTA2 ? a1PixelSize : a2PixelSize) == 4) // 16 BPP
2143 srcData = JaguarReadWord(srcAddr, BLITTER);
2144 if ((DSTA2 ? a1PixelSize : a2PixelSize) == 5) // 32 BPP
2145 srcData = JaguarReadLong(srcAddr, BLITTER);
2146 }
2147
2148#ifdef LOG_BLITTER_MEMORY_ACCESSES
2149if (logBlit)
2150 WriteLog("BLITTER: srcAddr=%08X, srcData=%08X %08X\n", srcAddr, (uint32_t)(srcData >> 32), (uint32_t)(srcData & 0xFFFFFFFF));
2151#endif
2152
2153 if (SRCENZ)
2154 goto szread;
2155 else if (DSTEN)
2156 goto dread;
2157 else if (DSTENZ)
2158 goto dzread;
2159 else
2160 goto dwrite;
2161
2162szread: // Source Z read
2163/*
2164szread Source Z read.
2165if STEP
2166 if DSTEN goto dread
2167 else if DSTENZ goto dzread
2168 else goto dwrite
2169*/
2170 if (DSTEN)
2171 goto dread;
2172 else if (DSTENZ)
2173 goto dzread;
2174 else
2175 goto dwrite;
2176
2177dread: // Destination data read
2178/*
2179dread Destination data read.
2180if STEP
2181 if DSTENZ goto dzread
2182 else goto dwrite
2183*/
2184 // Calculate the destination address to be read...
2185
//Need to fix phrase mode calcs here, since they should *step* by eight, not multiply.
2187//Also, need to fix various differing BPP modes here, since offset won't be correct except
2188//for 8BPP. !!! FIX !!!
2189 dstAddr = (DSTA2 ? a2_addr : a1_addr);
2190
2191 {
2192// uint32_t pixAddr = ((DSTA2 ? a2_x : a1_x) >> 16)
2193// + (((DSTA2 ? a2_y : a1_y) >> 16) * (DSTA2 ? a2_width : a1_width));
2194 int32_t pixAddr = (int16_t)((DSTA2 ? a2_x : a1_x) >> 16)
2195 + ((int16_t)((DSTA2 ? a2_y : a1_y) >> 16) * (DSTA2 ? a2_width : a1_width));
2196
2197 if ((DSTA2 ? a2PixelSize : a1PixelSize) < 3)
2198 pixAddr >>= pixelShift[(DSTA2 ? a2PixelSize : a1PixelSize)];
2199 else if ((DSTA2 ? a2PixelSize : a1PixelSize) > 3)
2200 pixAddr <<= pixelShift[(DSTA2 ? a2PixelSize : a1PixelSize)];
2201
2202 dstAddr += pixAddr;
2203 }
2204
2205 // And read it!
2206
2207 if ((DSTA2 ? a2_phrase_mode : a1_phrase_mode) == 1)
2208 {
2209 dstData = ((uint64_t)JaguarReadLong(srcAddr, BLITTER) << 32)
2210 | (uint64_t)JaguarReadLong(srcAddr + 4, BLITTER);
2211 }
2212 else
2213 {
2214//1,2,&4BPP are wrong here... !!! FIX !!!
2215 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 0) // 1 BPP
2216 dstData = JaguarReadByte(dstAddr, BLITTER);
2217 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 1) // 2 BPP
2218 dstData = JaguarReadByte(dstAddr, BLITTER);
2219 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 2) // 4 BPP
2220 dstData = JaguarReadByte(dstAddr, BLITTER);
2221 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 3) // 8 BPP
2222 dstData = JaguarReadByte(dstAddr, BLITTER);
2223 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 4) // 16 BPP
2224 dstData = JaguarReadWord(dstAddr, BLITTER);
2225 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 5) // 32 BPP
2226 dstData = JaguarReadLong(dstAddr, BLITTER);
2227 }
2228
2229#ifdef LOG_BLITTER_MEMORY_ACCESSES
2230if (logBlit)
2231 WriteLog("BLITTER (dread): dstAddr=%08X, dstData=%08X %08X\n", dstAddr, (uint32_t)(dstData >> 32), (uint32_t)(dstData & 0xFFFFFFFF));
2232#endif
2233
2234 if (DSTENZ)
2235 goto dzread;
2236 else
2237 goto dwrite;
2238
2239dzread: // Destination Z read
2240/*
2241dzread Destination Z read.
2242if STEP goto dwrite
2243*/
2244 goto dwrite;
2245
2246dwrite: // Destination data write
2247/*
2248dwrite Destination write. Every pass round the inner loop must go through this state..
2249if STEP
2250 if DSTWRZ goto dzwrite
2251 else if INNER0 goto idle
2252 else if TXTEXT goto txtread
2253 else if SRCEN goto sread
2254 else if DSTEN goto dread
2255 else if DSTENZ goto dzread
2256 else goto dwrite
2257*/
2258/*
2259Blit!
2260 a1_base = 00100000
2261 a1_pitch = 0
2262 a1_psize = 16
2263 a1_width = 320
2264 a1_xadd = 1.000000 (phrase=0)
2265 a1_yadd = 0.000000
2266 a1_x = 159.000000
2267 a1_y = 1.000000
2268 a1_zoffs = 0
2269 a2_base = 000095D0
2270 a2_pitch = 0
2271 a2_psize = 16
2272 a2_width = 256
2273 a2_xadd = 1.000000 (phrase=1)
2274 a2_yadd = 0.000000
2275 a2_x = 2.000000
2276 a2_y = 0.000000
2277 a2_mask_x= 0xFFFFFFFF
2278 a2_mask_y= 0xFFFFFFFF
2279 a2_zoffs = 0
2280 count = 2 x 1
2281 COMMAND = 00011008
2282 SRCEN = 0
2283 DSTEN = 1
2284 UPDA1F = 0
2285 UPDA1 = 0
2286 UPDA2 = 0
2287 DSTA2 = 0
2288--LFUFUNC = LFU_CLEAR
2289| PATDSEL = 1 (PD=77C7 7700 7700 7700)
2290--ADDDSEL = 0
2291 GOURD = 1 (II=00FC 1A00, SD=FF00 0000 0000 0000)
2292*/
2293
2294//Still need to do CLIPA1 and SRCSHADE and GOURD and GOURZ...
2295
2296 // Check clipping...
2297
2298 if (CLIPA1)
2299 {
2300 uint16_t x = a1_x >> 16, y = a1_y >> 16;
2301
2302 if (x >= GET16(blitter_ram, A1_CLIP + 2) || y >= GET16(blitter_ram, A1_CLIP))
2303 goto inhibitWrite;
2304 }
2305
2306 // Figure out what gets written...
2307
2308 if (PATDSEL)
2309 {
2310 writeData = GET64(blitter_ram, PATTERNDATA);
2311//GOURD works properly only in 16BPP mode...
2312//SRCDATA holds the intensity fractions...
2313//Does GOURD get calc'ed here or somewhere else???
2314//Temporary testing kludge...
2315//if (GOURD)
2316// writeData >>= 48;
2317// writeData = 0xFF88;
2318//OK, it's not writing an entire strip of pixels... Why?
2319//bad incrementing, that's why!
2320 }
2321 else if (ADDDSEL)
2322 {
2323 // Apparently this only works with 16-bit pixels. Not sure if it works in phrase mode either.
2324//Also, take TOPBEN & TOPNEN into account here as well...
2325 writeData = srcData + dstData;
2326 }
2327 else // LFUFUNC is the default...
2328 {
2329 writeData = 0;
2330
2331 if (LFU_NAN)
2332 writeData |= ~srcData & ~dstData;
2333 if (LFU_NA)
2334 writeData |= ~srcData & dstData;
2335 if (LFU_AN)
2336 writeData |= srcData & ~dstData;
2337 if (LFU_A)
2338 writeData |= srcData & dstData;
2339 }
2340
2341 // Calculate the address to be written...
2342
2343 dstAddr = (DSTA2 ? a2_addr : a1_addr);
2344
2345/* if ((DSTA2 ? a2_phrase_mode : a1_phrase_mode) == 1)
2346 {
2347//both of these calculate the wrong address because they don't take into account
2348//pixel sizes...
2349 dstAddr += ((DSTA2 ? a2_x : a1_x) >> 16)
2350 + (((DSTA2 ? a2_y : a1_y) >> 16) * (DSTA2 ? a2_width : a1_width));
2351 }
2352 else*/
2353 {
2354/* dstAddr += ((DSTA2 ? a2_x : a1_x) >> 16)
2355 + (((DSTA2 ? a2_y : a1_y) >> 16) * (DSTA2 ? a2_width : a1_width));*/
2356// uint32_t pixAddr = ((DSTA2 ? a2_x : a1_x) >> 16)
2357// + (((DSTA2 ? a2_y : a1_y) >> 16) * (DSTA2 ? a2_width : a1_width));
2358 int32_t pixAddr = (int16_t)((DSTA2 ? a2_x : a1_x) >> 16)
2359 + ((int16_t)((DSTA2 ? a2_y : a1_y) >> 16) * (DSTA2 ? a2_width : a1_width));
2360
2361 if ((DSTA2 ? a2PixelSize : a1PixelSize) < 3)
2362 pixAddr >>= pixelShift[(DSTA2 ? a2PixelSize : a1PixelSize)];
2363 else if ((DSTA2 ? a2PixelSize : a1PixelSize) > 3)
2364 pixAddr <<= pixelShift[(DSTA2 ? a2PixelSize : a1PixelSize)];
2365
2366 dstAddr += pixAddr;
2367 }
2368
2369 // And write it!
2370
2371 if ((DSTA2 ? a2_phrase_mode : a1_phrase_mode) == 1)
2372 {
2373 JaguarWriteLong(dstAddr, writeData >> 32, BLITTER);
2374 JaguarWriteLong(dstAddr + 4, writeData & 0xFFFFFFFF, BLITTER);
2375 }
2376 else
2377 {
2378//1,2,&4BPP are wrong here... !!! FIX !!!
2379 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 0) // 1 BPP
2380 JaguarWriteByte(dstAddr, writeData, BLITTER);
2381 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 1) // 2 BPP
2382 JaguarWriteByte(dstAddr, writeData, BLITTER);
2383 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 2) // 4 BPP
2384 JaguarWriteByte(dstAddr, writeData, BLITTER);
2385 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 3) // 8 BPP
2386 JaguarWriteByte(dstAddr, writeData, BLITTER);
2387 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 4) // 16 BPP
2388 JaguarWriteWord(dstAddr, writeData, BLITTER);
2389 if ((DSTA2 ? a2PixelSize : a1PixelSize) == 5) // 32 BPP
2390 JaguarWriteLong(dstAddr, writeData, BLITTER);
2391 }
2392
2393#ifdef LOG_BLITTER_MEMORY_ACCESSES
2394if (logBlit)
2395 WriteLog("BLITTER: dstAddr=%08X, writeData=%08X %08X\n", dstAddr, (uint32_t)(writeData >> 32), (uint32_t)(writeData & 0xFFFFFFFF));
2396#endif
2397
2398inhibitWrite://Should this go here? or on the other side of the X/Y incrementing?
2399//Seems OK here... for now.
2400
2401// Do funky X/Y incrementation here as well... !!! FIX !!!
2402
2403 // Handle A1 channel stepping
2404
2405 if ((blitter_ram[A1_FLAGS + 1] & 0x03) == 0)
2406 a1_x += phraseOffset[a1PixelSize] << 16;
2407 else if ((blitter_ram[A1_FLAGS + 1] & 0x03) == 1)
2408 a1_x += (blitter_ram[A1_FLAGS + 1] & 0x08 ? -1 << 16 : 1 << 16);
2409/* else if ((blitter_ram[A1_FLAGS + 1] & 0x03) == 2)
2410 a1_x += 0 << 16; */
2411 else if ((blitter_ram[A1_FLAGS + 1] & 0x03) == 3)
2412 {
2413//Always add the FINC here??? That was the problem with the BIOS screen... So perhaps.
2414 a1_x += GET16(blitter_ram, A1_FINC + 2);
2415 a1_y += GET16(blitter_ram, A1_FINC + 0);
2416
2417 a1_x += GET16(blitter_ram, A1_INC + 2) << 16;
2418 a1_y += GET16(blitter_ram, A1_INC + 0) << 16;
2419 }
2420
2421 if ((blitter_ram[A1_FLAGS + 1] & 0x04) && (blitter_ram[A1_FLAGS + 1] & 0x03 != 3))
2422 a1_y += (blitter_ram[A1_FLAGS + 1] & 0x10 ? -1 << 16 : 1 << 16);
2423
2424 // Handle A2 channel stepping
2425
2426 if ((blitter_ram[A2_FLAGS + 1] & 0x03) == 0)
2427 a2_x += phraseOffset[a2PixelSize] << 16;
2428 else if ((blitter_ram[A2_FLAGS + 1] & 0x03) == 1)
2429 a2_x += (blitter_ram[A2_FLAGS + 1] & 0x08 ? -1 << 16 : 1 << 16);
2430/* else if ((blitter_ram[A2_FLAGS + 1] & 0x03) == 2)
2431 a2_x += 0 << 16; */
2432
2433 if (blitter_ram[A2_FLAGS + 1] & 0x04)
2434 a2_y += (blitter_ram[A2_FLAGS + 1] & 0x10 ? -1 << 16 : 1 << 16);
2435
2436//Need to fix this so that it subtracts (saturating, of course) the correct number of pixels
2437//in phrase mode... !!! FIX !!! [DONE]
2438//Need to fix this so that it counts down the correct item. Does it count the
2439//source or the destination phrase mode???
2440//It shouldn't matter, because we *should* end up processing the same amount
2441//the same number of pixels... Not sure though.
2442 if ((DSTA2 ? a2_phrase_mode : a1_phrase_mode) == 1)
2443 {
2444 if (inner_loop < phraseOffset[DSTA2 ? a2PixelSize : a1PixelSize])
2445 inner_loop = 0;
2446 else
2447 inner_loop -= phraseOffset[DSTA2 ? a2PixelSize : a1PixelSize];
2448 }
2449 else
2450 inner_loop--;
2451
2452
2453 if (DSTWRZ)
2454 goto dzwrite;
2455 else if (INNER0)
2456 goto indone;
2457 else if (TXTEXT)
2458 goto txtread;
2459 else if (SRCEN)
2460 goto sread;
2461 else if (DSTEN)
2462 goto dread;
2463 else if (DSTENZ)
2464 goto dzread;
2465 else
2466 goto dwrite;
2467
2468dzwrite: // Destination Z write
2469/*
2470dzwrite Destination Z write.
2471if STEP
2472 if INNER0 goto idle
2473 else if TXTEXT goto txtread
2474 else if SRCEN goto sread
2475 else if DSTEN goto dread
2476 else if DSTENZ goto dzread
2477 else goto dwrite
2478*/
2479 if (INNER0)
2480 goto indone;
2481 else if (TXTEXT)
2482 goto txtread;
2483 else if (SRCEN)
2484 goto sread;
2485 else if (DSTEN)
2486 goto dread;
2487 else if (DSTENZ)
2488 goto dzread;
2489 else
2490 goto dwrite;
2491
2492/*
2493------------------------------
2494if INDONE if OUTER0 goto idle
2495else if UPDA1F goto a1fupdate
2496else if UPDA1 goto a1update
2497else if GOURZ.POLYGON goto zfupdate
2498else if UPDA2 goto a2update
2499else if DATINIT goto init_if
2500else restart inner
2501*/
2502indone:
2503 outer_loop--;
2504
2505
2506 if (OUTER0)
2507 goto blitter_done;
2508 else if (UPDA1F)
2509 goto a1fupdate;
2510 else if (UPDA1)
2511 goto a1update;
2512//kill this, for now...
2513// else if (GOURZ.POLYGON)
2514// goto zfupdate;
2515 else if (UPDA2)
2516 goto a2update;
2517 else if (DATINIT)
2518 goto init_if;
2519 else
2520 goto inner;
2521
2522a1fupdate: // Update A1 pointer fractions and more (see below)
2523/*
2524a1fupdate A1 step fraction is added to A1 pointer fraction
2525 POLYGON true: A1 step delta X and Y fraction parts are added to the A1
2526 step X and Y fraction parts (the value prior to this add is used for
2527 the step to pointer add).
2528 POLYGON true: inner count step fraction is added to the inner count
2529 fraction part
2530 POLYGON.GOURD true: the I fraction step is added to the computed
2531 intensity fraction parts +
2532 POLYGON.GOURD true: the I fraction step delta is added to the I
2533 fraction step
2534goto a1update
2535*/
2536/*
2537#define A1_PIXEL ((uint32_t)0x0C) // Integer part of the pixel (Y.i and X.i)
2538#define A1_STEP ((uint32_t)0x10) // Integer part of the step
2539#define A1_FSTEP ((uint32_t)0x14) // Fractional part of the step
2540#define A1_FPIXEL ((uint32_t)0x18) // Fractional part of the pixel (Y.f and X.f)
2541*/
2542
2543// This is all kinda murky. All we have are the Midsummer docs to give us any guidance,
2544// and they're incomplete or filled with errors (like above). Aarrrgggghhhhh!
2545
2546//This isn't right. Is it? I don't think the fractional parts are signed...
2547// a1_x += (int32_t)((int16_t)GET16(blitter_ram, A1_FSTEP + 2));
2548// a1_y += (int32_t)((int16_t)GET16(blitter_ram, A1_FSTEP + 0));
2549 a1_x += GET16(blitter_ram, A1_FSTEP + 2);
2550 a1_y += GET16(blitter_ram, A1_FSTEP + 0);
2551
2552 goto a1update;
2553
2554a1update: // Update A1 pointer integers
2555/*
2556a1update A1 step is added to A1 pointer, with carry from the fractional add
2557 POLYGON true: A1 step delta X and Y integer parts are added to the A1
2558 step X and Y integer parts, with carry from the corresponding
2559 fractional part add (again, the value prior to this add is used for
2560 the step to pointer add).
2561 POLYGON true: inner count step is added to the inner count, with carry
2562 POLYGON.GOURD true: the I step is added to the computed intensities,
2563 with carry +
2564 POLYGON.GOURD true: the I step delta is added to the I step, with
2565 carry the texture X and Y step delta values are added to the X and Y
2566 step values.
2567if GOURZ.POLYGON goto zfupdate
2568else if UPDA2 goto a2update
2569else if DATINIT goto init_if
2570else restart inner
2571*/
2572 a1_x += (int32_t)(GET16(blitter_ram, A1_STEP + 2) << 16);
2573 a1_y += (int32_t)(GET16(blitter_ram, A1_STEP + 0) << 16);
2574
2575
2576//kill this, for now...
2577// if (GOURZ.POLYGON)
2578 if (false)
2579 goto zfupdate;
2580 else if (UPDA2)
2581 goto a2update;
2582 else if (DATINIT)
2583 goto init_if;
2584 else
2585 goto inner;
2586
2587zfupdate: // Update computed Z step fractions
2588/*
2589zfupdate the Z fraction step is added to the computed Z fraction parts +
2590 the Z fraction step delta is added to the Z fraction step
2591goto zupdate
2592*/
2593 goto zupdate;
2594
2595zupdate: // Update computed Z step integers
2596/*
2597zupdate the Z step is added to the computed Zs, with carry +
2598 the Z step delta is added to the Z step, with carry
2599if UPDA2 goto a2update
2600else if DATINIT goto init_if
2601else restart inner
2602*/
2603 if (UPDA2)
2604 goto a2update;
2605 else if (DATINIT)
2606 goto init_if;
2607 else
2608 goto inner;
2609
2610a2update: // Update A2 pointer
2611/*
2612a2update A2 step is added to the A2 pointer
2613if DATINIT goto init_if
2614else restart inner
2615*/
2616 a2_x += (int32_t)(GET16(blitter_ram, A2_STEP + 2) << 16);
2617 a2_y += (int32_t)(GET16(blitter_ram, A2_STEP + 0) << 16);
2618
2619
2620 if (DATINIT)
2621 goto init_if;
2622 else
2623 goto inner;
2624
2625init_if: // Initialise intensity fractions and texture X
2626/*
2627init_if Initialise the fractional part of the computed intensity fields, from
2628 the increment and step registers. The texture X integer and fractional
2629 parts can also be initialised.
2630goto init_ii
2631*/
2632 goto init_ii;
2633
2634init_ii: // Initialise intensity integers and texture Y
2635/*
2636init_ii Initialise the integer part of the computed intensity, and texture Y
2637 integer and fractional parts
2638if GOURZ goto init_zf
2639else goto inner
2640*/
2641 if (GOURZ)
2642 goto init_zf;
2643 else
2644 goto inner;
2645
2646init_zf: // Initialise Z fractions
2647/*
2648init_zf Initialise the fractional part of the computed Z fields.
2649goto init_zi
2650*/
2651 goto init_zi;
2652
2653init_zi: // Initialise Z integers
2654/*
2655init_zi Initialise the integer part of the computed Z fields.
2656goto inner
2657*/
2658 goto inner;
2659
2660
2661/*
2662The outer loop state machine fires off the inner loop, and controls the updating
2663process between passes through the inner loop.
2664
2665+ -- these functions are irrelevant if the DATINIT function is enabled, which it
2666 will normally be.
2667
2668All these states will complete in one clock cycle, with the exception of the idle
2669state, which means the blitter is quiescent; and the inner state, which takes as
2670long as is required to complete one strip of pixels. It is therefore possible for
2671the blitter to spend a maximum of nine clock cycles of inactivity between passes
2672through the inner loop.
2673*/
2674
2675blitter_done:
2676 {}
2677}
2678#endif
2679
2680
2681//
2682// Here's attempt #2--taken from the Oberon chip specs!
2683//
2684
2685#ifdef USE_MIDSUMMER_BLITTER_MKII
2686
// Forward declarations of the helper routines for the MKII blitter (this whole
// section is compiled only when USE_MIDSUMMER_BLITTER_MKII is defined). Only the
// prototypes appear here; see each definition for the actual behaviour.
// NOTE(review): presumably these are called from BlitterMidsummer2() below and
// each one models a block of the Oberon netlist -- confirm against the definitions.
// Parameters taken by non-const reference ('&') can be written by the callee.

// ADDRGEN: parameter names are omitted in this prototype; the first two
// arguments are uint32_t references. See the definition for their meaning.
2687void ADDRGEN(uint32_t &, uint32_t &, bool, bool,
2688 uint16_t, uint16_t, uint32_t, uint8_t, uint8_t, uint8_t, uint8_t,
2689 uint16_t, uint16_t, uint32_t, uint8_t, uint8_t, uint8_t, uint8_t);
// ADDARRAY: addq is passed as a pointer and initcin as an array, so the callee
// can access the caller's storage through them.
2690void ADDARRAY(uint16_t * addq, uint8_t daddasel, uint8_t daddbsel, uint8_t daddmode,
2691 uint64_t dstd, uint32_t iinc, uint8_t initcin[], uint64_t initinc, uint16_t initpix,
2692 uint32_t istep, uint64_t patd, uint64_t srcd, uint64_t srcz1, uint64_t srcz2,
2693 uint32_t zinc, uint32_t zstep);
// ADD16SAT: r and co are passed by reference.
// NOTE(review): going by the name and the a/b/cin/sat parameters this looks like
// a 16-bit add with carry in/out and optional saturation -- confirm.
2694void ADD16SAT(uint16_t &r, uint8_t &co, uint16_t a, uint16_t b, uint8_t cin, bool sat, bool eightbit, bool hicinh);
// ADDAMUX: adda_x and adda_y are passed by reference; everything else is by value.
2695void ADDAMUX(int16_t &adda_x, int16_t &adda_y, uint8_t addasel, int16_t a1_step_x, int16_t a1_step_y,
2696 int16_t a1_stepf_x, int16_t a1_stepf_y, int16_t a2_step_x, int16_t a2_step_y,
2697 int16_t a1_inc_x, int16_t a1_inc_y, int16_t a1_incf_x, int16_t a1_incf_y, uint8_t adda_xconst,
2698 bool adda_yconst, bool addareg, bool suba_x, bool suba_y);
// ADDBMUX: addb_x and addb_y are passed by reference; everything else is by value.
2699void ADDBMUX(int16_t &addb_x, int16_t &addb_y, uint8_t addbsel, int16_t a1_x, int16_t a1_y,
2700 int16_t a2_x, int16_t a2_y, int16_t a1_frac_x, int16_t a1_frac_y);
// DATAMUX: data_x and data_y are passed by reference; everything else is by value.
2701void DATAMUX(int16_t &data_x, int16_t &data_y, uint32_t gpu_din, int16_t addq_x, int16_t addq_y, bool addqsel);
// ADDRADD: addq_x and addq_y are passed by reference; everything else is by value.
2702void ADDRADD(int16_t &addq_x, int16_t &addq_y, bool a1fracldi,
2703 uint16_t adda_x, uint16_t adda_y, uint16_t addb_x, uint16_t addb_y, uint8_t modx, bool suba_x, bool suba_y);
// DATA: wdata, dcomp, zcomp and nowrite are passed by reference, and so are
// patd and srcz further down the list; the remaining arguments are by value.
2704void DATA(uint64_t &wdata, uint8_t &dcomp, uint8_t &zcomp, bool &nowrite,
2705 bool big_pix, bool cmpdst, uint8_t daddasel, uint8_t daddbsel, uint8_t daddmode, bool daddq_sel, uint8_t data_sel,
2706 uint8_t dbinh, uint8_t dend, uint8_t dstart, uint64_t dstd, uint32_t iinc, uint8_t lfu_func, uint64_t &patd, bool patdadd,
2707 bool phrase_mode, uint64_t srcd, bool srcdread, bool srczread, bool srcz2add, uint8_t zmode,
2708 bool bcompen, bool bkgwren, bool dcompen, uint8_t icount, uint8_t pixsize,
2709 uint64_t &srcz, uint64_t dstz, uint32_t zinc);
// COMP_CTRL: dbinh and nowrite are passed by reference; everything else is by value.
2710void COMP_CTRL(uint8_t &dbinh, bool &nowrite,
2711 bool bcompen, bool big_pix, bool bkgwren, uint8_t dcomp, bool dcompen, uint8_t icount,
2712 uint8_t pixsize, bool phrase_mode, uint8_t srcd, uint8_t zcomp);
// Compiles in the WriteLog() tracing blocks wrapped in
// "#ifdef VERBOSE_BLITTER_LOGGING" inside BlitterMidsummer2(). Those blocks are
// additionally guarded by "if (logBlit)", so they only log when logBlit is true.
2713#define VERBOSE_BLITTER_LOGGING
2714
2715void BlitterMidsummer2(void)
2716{
2717#ifdef LOG_BLITS
2718 LogBlit();
2719#endif
2720 if (startConciseBlitLogging)
2721 LogBlit();
2722
2723 // Here's what the specs say the state machine does. Note that this can probably be
2724 // greatly simplified (also, it's different from what John has in his Oberon docs):
2725//Will remove stuff that isn't in Jaguar I once fully described (stuff like texture won't
2726//be described here at all)...
2727
2728 uint32_t cmd = GET32(blitter_ram, COMMAND);
2729
2730#if 0
2731logBlit = false;
2732if (
2733 cmd != 0x00010200 && // PATDSEL
2734 cmd != 0x01800001 // SRCEN LFUFUNC=C
2735 && cmd != 0x01800005
2736//Boot ROM ATARI letters:
2737 && cmd != 0x00011008 // DSTEN GOURD PATDSEL
2738//Boot ROM spinning cube:
2739 && cmd != 0x41802F41 // SRCEN CLIP_A1 UPDA1 UPDA1F UPDA2 DSTA2 GOURZ ZMODE=0 LFUFUNC=C SRCSHADE
2740//T2K intro screen:
2741 && cmd != 0x01800E01 // SRCEN UPDA1 UPDA2 DSTA2 LFUFUNC=C
2742//T2K TEMPEST letters:
2743 && cmd != 0x09800741 // SRCEN CLIP_A1 UPDA1 UPDA1F UPDA2 LFUFUNC=C DCOMPEN
2744//Static letters on Cybermorph intro screen:
2745 && cmd != 0x09800609 // SRCEN DSTEN UPDA1 UPDA2 LFUFUNC=C DCOMPEN
2746//Static pic on title screen:
2747 && cmd != 0x01800601 // SRCEN UPDA1 UPDA2 LFUFUNC=C
2748//Turning letters on Cybermorph intro screen:
2749// && cmd != 0x09800F41 // SRCEN CLIP_A1 UPDA1 UPDA1F UPDA2 DSTA2 LFUFUNC=C DCOMPEN
2750 && cmd != 0x00113078 // DSTEN DSTENZ DSTWRZ CLIP_A1 GOURD GOURZ PATDSEL ZMODE=4
2751 && cmd != 0x09900F39 // SRCEN DSTEN DSTENZ DSTWRZ UPDA1 UPDA1F UPDA2 DSTA2 ZMODE=4 LFUFUNC=C DCOMPEN
2752 && cmd != 0x09800209 // SRCEN DSTEN UPDA1 LFUFUNC=C DCOMPEN
2753 && cmd != 0x00011200 // UPDA1 GOURD PATDSEL
2754//Start of Hover Strike (clearing screen):
2755 && cmd != 0x00010000 // PATDSEL
2756//Hover Strike text:
2757 && cmd != 0x1401060C // SRCENX DSTEN UPDA1 UPDA2 PATDSEL BCOMPEN BKGWREN
2758//Hover Strike 3D stuff
2759 && cmd != 0x01902839 // SRCEN DSTEN DSTENZ DSTWRZ DSTA2 GOURZ ZMODE=4 LFUFUNC=C
2760//Hover Strike darkening on intro to play (briefing) screen
2761 && cmd != 0x00020208 // DSTEN UPDA1 ADDDSEL
2762//Trevor McFur stuff:
2763 && cmd != 0x05810601 // SRCEN UPDA1 UPDA2 PATDSEL BCOMPEN
2764 && cmd != 0x01800201 // SRCEN UPDA1 LFUFUNC=C
2765//T2K:
2766 && cmd != 0x00011000 // GOURD PATDSEL
2767 && cmd != 0x00011040 // CLIP_A1 GOURD PATDSEL
2768//Checkered flag:
2769 && cmd != 0x01800000 // LFUFUNC=C
2770 && cmd != 0x01800401 //
2771 && cmd != 0x01800040 //
2772 && cmd != 0x00020008 //
2773// && cmd != 0x09800F41 // SRCEN CLIP_A1 UPDA1 UPDA1F UPDA2 DSTA2 LFUFUNC=C DCOMPEN
2774 )
2775 logBlit = true;//*/
2776#else
2777logBlit = true;
2778#endif
2779if (blit_start_log == 0) // Wait for the signal...
2780 logBlit = false;//*/
2781//temp, for testing...
2782/*if (cmd != 0x49820609)
2783 logBlit = false;//*/
2784
2785/*
2786Some T2K unique blits:
2787logBlit = F, cmd = 00010200 *
2788logBlit = F, cmd = 00011000
2789logBlit = F, cmd = 00011040
2790logBlit = F, cmd = 01800005 *
2791logBlit = F, cmd = 09800741 *
2792
2793Hover Strike mission selection screen:
2794Blit! (CMD = 01902839) // SRCEN DSTEN DSTENZ DSTWRZ DSTA2 GOURZ ZMODE=4 LFUFUNC=C
2795
2796Checkered Flag blits in the screw up zone:
2797Blit! (CMD = 01800001) // SRCEN LFUFUNC=C
2798Blit! (CMD = 01800000) // LFUFUNC=C
2799Blit! (CMD = 00010000) // PATDSEL
2800
2801Wolfenstein 3D in the fuckup zone:
2802Blit! (CMD = 01800000) // LFUFUNC=C
2803*/
2804
2805//printf("logBlit = %s, cmd = %08X\n", (logBlit ? "T" : "F"), cmd);
2806//fflush(stdout);
2807//logBlit = true;
2808
2809/*
2810Blit! (CMD = 00011040)
2811Flags: CLIP_A1 GOURD PATDSEL
2812 count = 18 x 1
2813 a1_base = 00100000, a2_base = 0081F6A8
2814 a1_x = 00A7, a1_y = 0014, a1_frac_x = 0000, a1_frac_y = 0000, a2_x = 0001, a2_y = 0000
2815 a1_step_x = FE80, a1_step_y = 0001, a1_stepf_x = 0000, a1_stepf_y = 0000, a2_step_x = FFF8, a2_step_y = 0001
2816 a1_inc_x = 0001, a1_inc_y = 0000, a1_incf_x = 0000, a1_incf_y = 0000
2817 a1_win_x = 0180, a1_win_y = 0118, a2_mask_x = 0000, a2_mask_y = 0000
2818 a2_mask=F a1add=+phr/+0 a2add=+phr/+0
2819 a1_pixsize = 4, a2_pixsize = 4
2820*/
2821//Testing T2K...
2822/*logBlit = false;
2823if (cmd == 0x00011040
2824 && (GET16(blitter_ram, A1_PIXEL + 2) == 0x00A7) && (GET16(blitter_ram, A1_PIXEL + 0) == 0x0014)
2825 && (GET16(blitter_ram, A2_PIXEL + 2) == 0x0001) && (GET16(blitter_ram, A2_PIXEL + 0) == 0x0000)
2826 && (GET16(blitter_ram, PIXLINECOUNTER + 2) == 18))
2827 logBlit = true;*/
2828
2829 // Line states passed in via the command register
2830
2831 bool srcen = (SRCEN), srcenx = (SRCENX), srcenz = (SRCENZ),
2832 dsten = (DSTEN), dstenz = (DSTENZ), dstwrz = (DSTWRZ), clip_a1 = (CLIPA1),
2833 upda1 = (UPDA1), upda1f = (UPDA1F), upda2 = (UPDA2), dsta2 = (DSTA2),
2834 gourd = (GOURD), gourz = (GOURZ), topben = (TOPBEN), topnen = (TOPNEN),
2835 patdsel = (PATDSEL), adddsel = (ADDDSEL), cmpdst = (CMPDST), bcompen = (BCOMPEN),
2836 dcompen = (DCOMPEN), bkgwren = (BKGWREN), srcshade = (SRCSHADE);
2837
2838 uint8_t zmode = (cmd & 0x01C0000) >> 18, lfufunc = (cmd & 0x1E00000) >> 21;
2839//Missing: BUSHI
2840//Where to find various lines:
2841// clip_a1 -> inner
2842// gourd -> dcontrol, inner, outer, state
2843// gourz -> dcontrol, inner, outer, state
2844// cmpdst -> blit, data, datacomp, state
2845// bcompen -> acontrol, inner, mcontrol, state
2846// dcompen -> inner, state
2847// bkgwren -> inner, state
2848// srcshade -> dcontrol, inner, state
2849// adddsel -> dcontrol
2850//NOTE: ADDDSEL takes precedence over PATDSEL, PATDSEL over LFU_FUNC
2851#ifdef VERBOSE_BLITTER_LOGGING
2852if (logBlit)
2853{
2854 char zfs[512], lfus[512];
2855 zfs[0] = lfus[0] = 0;
2856 if (dstwrz || dstenz || gourz)
2857 sprintf(zfs, " ZMODE=%X", zmode);
2858 if (!(patdsel || adddsel))
2859 sprintf(lfus, " LFUFUNC=%X", lfufunc);
2860 WriteLog("\nBlit! (CMD = %08X)\nFlags:%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s\n", cmd,
2861 (srcen ? " SRCEN" : ""), (srcenx ? " SRCENX" : ""), (srcenz ? " SRCENZ" : ""),
2862 (dsten ? " DSTEN" : ""), (dstenz ? " DSTENZ" : ""), (dstwrz ? " DSTWRZ" : ""),
2863 (clip_a1 ? " CLIP_A1" : ""), (upda1 ? " UPDA1" : ""), (upda1f ? " UPDA1F" : ""),
2864 (upda2 ? " UPDA2" : ""), (dsta2 ? " DSTA2" : ""), (gourd ? " GOURD" : ""),
2865 (gourz ? " GOURZ" : ""), (topben ? " TOPBEN" : ""), (topnen ? " TOPNEN" : ""),
2866 (patdsel ? " PATDSEL" : ""), (adddsel ? " ADDDSEL" : ""), zfs, lfus, (cmpdst ? " CMPDST" : ""),
2867 (bcompen ? " BCOMPEN" : ""), (dcompen ? " DCOMPEN" : ""), (bkgwren ? " BKGWREN" : ""),
2868 (srcshade ? " SRCSHADE" : ""));
2869 WriteLog(" count = %d x %d\n", GET16(blitter_ram, PIXLINECOUNTER + 2), GET16(blitter_ram, PIXLINECOUNTER));
2870}
2871#endif
2872
2873 // Lines that don't exist in Jaguar I (and will never be asserted)
2874
2875 bool polygon = false, datinit = false, a1_stepld = false, a2_stepld = false, ext_int = false;
2876 bool istepadd = false, istepfadd = false, finneradd = false, inneradd = false;
2877 bool zstepfadd = false, zstepadd = false;
2878
2879 // Various state lines (initial state--basically the reset state of the FDSYNCs)
2880
2881 bool go = true, idle = true, inner = false, a1fupdate = false, a1update = false,
2882 zfupdate = false, zupdate = false, a2update = false, init_if = false, init_ii = false,
2883 init_zf = false, init_zi = false;
2884
2885 bool outer0 = false, indone = false;
2886
2887 bool idlei, inneri, a1fupdatei, a1updatei, zfupdatei, zupdatei, a2updatei, init_ifi, init_iii,
2888 init_zfi, init_zii;
2889
2890 bool notgzandp = !(gourz && polygon);
2891
2892 // Various registers set up by user
2893
2894 uint16_t ocount = GET16(blitter_ram, PIXLINECOUNTER);
2895 uint8_t a1_pitch = blitter_ram[A1_FLAGS + 3] & 0x03;
2896 uint8_t a2_pitch = blitter_ram[A2_FLAGS + 3] & 0x03;
2897 uint8_t a1_pixsize = (blitter_ram[A1_FLAGS + 3] & 0x38) >> 3;
2898 uint8_t a2_pixsize = (blitter_ram[A2_FLAGS + 3] & 0x38) >> 3;
2899 uint8_t a1_zoffset = (GET16(blitter_ram, A1_FLAGS + 2) >> 6) & 0x07;
2900 uint8_t a2_zoffset = (GET16(blitter_ram, A2_FLAGS + 2) >> 6) & 0x07;
2901 uint8_t a1_width = (blitter_ram[A1_FLAGS + 2] >> 1) & 0x3F;
2902 uint8_t a2_width = (blitter_ram[A2_FLAGS + 2] >> 1) & 0x3F;
2903 bool a2_mask = blitter_ram[A2_FLAGS + 2] & 0x80;
2904 uint8_t a1addx = blitter_ram[A1_FLAGS + 1] & 0x03, a2addx = blitter_ram[A2_FLAGS + 1] & 0x03;
2905 bool a1addy = blitter_ram[A1_FLAGS + 1] & 0x04, a2addy = blitter_ram[A2_FLAGS + 1] & 0x04;
2906 bool a1xsign = blitter_ram[A1_FLAGS + 1] & 0x08, a2xsign = blitter_ram[A2_FLAGS + 1] & 0x08;
2907 bool a1ysign = blitter_ram[A1_FLAGS + 1] & 0x10, a2ysign = blitter_ram[A2_FLAGS + 1] & 0x10;
2908 uint32_t a1_base = GET32(blitter_ram, A1_BASE) & 0xFFFFFFF8; // Phrase aligned by ignoring bottom 3 bits
2909 uint32_t a2_base = GET32(blitter_ram, A2_BASE) & 0xFFFFFFF8;
2910
2911 uint16_t a1_win_x = GET16(blitter_ram, A1_CLIP + 2) & 0x7FFF;
2912 uint16_t a1_win_y = GET16(blitter_ram, A1_CLIP + 0) & 0x7FFF;
2913 int16_t a1_x = (int16_t)GET16(blitter_ram, A1_PIXEL + 2);
2914 int16_t a1_y = (int16_t)GET16(blitter_ram, A1_PIXEL + 0);
2915 int16_t a1_step_x = (int16_t)GET16(blitter_ram, A1_STEP + 2);
2916 int16_t a1_step_y = (int16_t)GET16(blitter_ram, A1_STEP + 0);
2917 uint16_t a1_stepf_x = GET16(blitter_ram, A1_FSTEP + 2);
2918 uint16_t a1_stepf_y = GET16(blitter_ram, A1_FSTEP + 0);
2919 uint16_t a1_frac_x = GET16(blitter_ram, A1_FPIXEL + 2);
2920 uint16_t a1_frac_y = GET16(blitter_ram, A1_FPIXEL + 0);
2921 int16_t a1_inc_x = (int16_t)GET16(blitter_ram, A1_INC + 2);
2922 int16_t a1_inc_y = (int16_t)GET16(blitter_ram, A1_INC + 0);
2923 uint16_t a1_incf_x = GET16(blitter_ram, A1_FINC + 2);
2924 uint16_t a1_incf_y = GET16(blitter_ram, A1_FINC + 0);
2925
2926 int16_t a2_x = (int16_t)GET16(blitter_ram, A2_PIXEL + 2);
2927 int16_t a2_y = (int16_t)GET16(blitter_ram, A2_PIXEL + 0);
2928 uint16_t a2_mask_x = GET16(blitter_ram, A2_MASK + 2);
2929 uint16_t a2_mask_y = GET16(blitter_ram, A2_MASK + 0);
2930 int16_t a2_step_x = (int16_t)GET16(blitter_ram, A2_STEP + 2);
2931 int16_t a2_step_y = (int16_t)GET16(blitter_ram, A2_STEP + 0);
2932
2933 uint64_t srcd1 = GET64(blitter_ram, SRCDATA);
2934 uint64_t srcd2 = 0;
2935 uint64_t dstd = GET64(blitter_ram, DSTDATA);
2936 uint64_t patd = GET64(blitter_ram, PATTERNDATA);
2937 uint32_t iinc = GET32(blitter_ram, INTENSITYINC);
2938 uint64_t srcz1 = GET64(blitter_ram, SRCZINT);
2939 uint64_t srcz2 = GET64(blitter_ram, SRCZFRAC);
2940 uint64_t dstz = GET64(blitter_ram, DSTZ);
2941 uint32_t zinc = GET32(blitter_ram, ZINC);
2942 uint32_t collision = GET32(blitter_ram, COLLISIONCTRL);// 0=RESUME, 1=ABORT, 2=STOPEN
2943
2944 uint8_t pixsize = (dsta2 ? a2_pixsize : a1_pixsize); // From ACONTROL
2945
2946//Testing Trevor McFur--I *think* it's the circle on the lower RHS of the screen...
2947/*logBlit = false;
2948if (cmd == 0x05810601 && (GET16(blitter_ram, PIXLINECOUNTER + 2) == 96)
2949 && (GET16(blitter_ram, PIXLINECOUNTER + 0) == 72))
2950 logBlit = true;//*/
2951//Testing...
2952//if (cmd == 0x1401060C) patd = 0xFFFFFFFFFFFFFFFFLL;
2953//if (cmd == 0x1401060C) patd = 0x00000000000000FFLL;
2954//If it's still not working (bcompen-patd) then see who's writing what to patd and where...
2955//Still not OK. Check to see who's writing what to where in patd!
2956//It looks like M68K is writing to the top half of patd... Hmm...
2957/*
2958----> M68K wrote 0000 to byte 15737344 of PATTERNDATA...
2959--> M68K wrote 00 to byte 0 of PATTERNDATA...
2960--> M68K wrote 00 to byte 1 of PATTERNDATA...
2961----> M68K wrote 00FF to byte 15737346 of PATTERNDATA...
2962--> M68K wrote 00 to byte 2 of PATTERNDATA...
2963--> M68K wrote FF to byte 3 of PATTERNDATA...
2964logBlit = F, cmd = 1401060C
2965
2966Wren0 := ND6 (wren\[0], gpua\[5], gpua\[6..8], bliten, gpu_memw);
2967Wren1 := ND6 (wren\[1], gpua[5], gpua\[6..8], bliten, gpu_memw);
2968Wren2 := ND6 (wren\[2], gpua\[5], gpua[6], gpua\[7..8], bliten, gpu_memw);
2969Wren3 := ND6 (wren\[3], gpua[5], gpua[6], gpua\[7..8], bliten, gpu_memw);
2970
2971--> 0 000x xx00
2972Dec0 := D38GH (a1baseld, a1flagld, a1winld, a1ptrld, a1stepld, a1stepfld, a1fracld, a1incld, gpua[2..4], wren\[0]);
2973--> 0 001x xx00
2974Dec1 := D38GH (a1incfld, a2baseld, a2flagld, a2maskld, a2ptrldg, a2stepld, cmdldt, countldt, gpua[2..4], wren\[1]);
2975--> 0 010x xx00
2976Dec2 := D38GH (srcd1ldg[0..1], dstdldg[0..1], dstzldg[0..1], srcz1ldg[0..1], gpua[2..4], wren\[2]);
2977--> 0 011x xx00
2978Dec3 := D38GH (srcz2ld[0..1], patdld[0..1], iincld, zincld, stopld, intld[0], gpua[2..4], wren\[3]);
2979
2980wren[3] is asserted when gpu address bus = 0 011x xx00
2981patdld[0] -> 0 0110 1000 -> $F02268 (lo 32 bits)
2982patdld[1] -> 0 0110 1100 -> $F0226C (hi 32 bits)
2983
2984So... It's reversed! The data organization of the patd register is [low 32][high 32]! !!! FIX !!! [DONE]
2985And fix all the other 64 bit registers [DONE]
2986*/
2987/*if (cmd == 0x1401060C)
2988{
2989 printf("logBlit = %s, cmd = %08X\n", (logBlit ? "T" : "F"), cmd);
2990 fflush(stdout);
2991}*/
2992/*logBlit = false;
2993if ((cmd == 0x00010200) && (GET16(blitter_ram, PIXLINECOUNTER + 2) == 9))
2994 logBlit = true;
2995
2996; Pink altimeter bar
2997
2998Blit! (00110000 <- 000BF010) count: 9 x 23, A1/2_FLAGS: 000042E2/00010020 [cmd: 00010200]
2999 CMD -> src: dst: misc: a1ctl: UPDA1 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl:
3000 A1 step values: -10 (X), 1 (Y)
3001 A1 -> pitch: 4 phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
3002 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
3003 A1 x/y: 262/132, A2 x/y: 129/0
3004;x-coord is 257 in pic, so add 5
3005;20 for ship, 33 for #... Let's see if we can find 'em!
3006
3007; Black altimeter bar
3008
3009Blit! (00110000 <- 000BF010) count: 5 x 29, A1/2_FLAGS: 000042E2/00010020 [cmd: 00010200]
3010 CMD -> src: dst: misc: a1ctl: UPDA1 mode: ity: PATDSEL z-op: op: LFU_CLEAR ctrl:
3011 A1 step values: -8 (X), 1 (Y)
3012 A1 -> pitch: 4 phrases, depth: 16bpp, z-off: 3, width: 320 (21), addctl: XADDPHR YADD0 XSIGNADD YSIGNADD
3013 A2 -> pitch: 1 phrases, depth: 16bpp, z-off: 0, width: 1 (00), addctl: XADDPIX YADD0 XSIGNADD YSIGNADD
3014 A1 x/y: 264/126, A2 x/y: 336/0
3015
3016Here's the pink bar--note that it's phrase mode without dread, so how does this work???
3017Not sure, but I *think* that somehow it MUXes the data at the write site in on the left or right side
3018of the write data when masked in phrase mode. I'll have to do some tracing to see if this is the mechanism
3019it uses or not...
3020
3021Blit! (CMD = 00010200)
3022Flags: UPDA1 PATDSEL
3023 count = 9 x 11
3024 a1_base = 00110010, a2_base = 000BD7E0
3025 a1_x = 0106, a1_y = 0090, a1_frac_x = 0000, a1_frac_y = 8000, a2_x = 025A, a2_y = 0000
3026 a1_step_x = FFF6, a1_step_y = 0001, a1_stepf_x = 5E00, a1_stepf_y = D100, a2_step_x = FFF7, a2_step_y = 0001
3027 a1_inc_x = 0001, a1_inc_y = FFFF, a1_incf_x = 0000, a1_incf_y = E000
3028 a1_win_x = 0000, a1_win_y = 0000, a2_mask_x = 0000, a2_mask_y = 0000
3029 a2_mask=F a1add=+phr/+0 a2add=+1/+0
3030 a1_pixsize = 4, a2_pixsize = 4
3031 srcd=BAC673AC2C92E578 dstd=0000000000000000 patd=74C074C074C074C0 iinc=0002E398
3032 srcz1=7E127E12000088DA srcz2=DBE06DF000000000 dstz=0000000000000000 zinc=FFFE4840, coll=0
3033 Phrase mode is ON
3034 [in=T a1f=F a1=F zf=F z=F a2=F iif=F iii=F izf=F izi=F]
3035 Entering INNER state...
3036 Entering DWRITE state...
3037 Dest write address/pix address: 0016A830/0 [dstart=20 dend=40 pwidth=8 srcshift=0][daas=0 dabs=0 dam=7 ds=0 daq=F] [7400000074C074C0] (icount=0007, inc=2)
3038 Entering A1_ADD state [a1_x=0106, a1_y=0090, addasel=0, addbsel=0, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
3039 Entering DWRITE state...
3040 Dest write address/pix address: 0016A850/0 [dstart=0 dend=40 pwidth=8 srcshift=0][daas=0 dabs=0 dam=7 ds=0 daq=F] [74C074C074C074C0] (icount=0003, inc=4)
3041 Entering A1_ADD state [a1_x=0108, a1_y=0090, addasel=0, addbsel=0, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
3042 Entering DWRITE state...
3043 Dest write address/pix address: 0016A870/0 [dstart=0 dend=30 pwidth=8 srcshift=0][daas=0 dabs=0 dam=7 ds=0 daq=F] [74C074C074C00000] (icount=FFFF, inc=4)
3044 Entering A1_ADD state [a1_x=010C, a1_y=0090, addasel=0, addbsel=0, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
3045 Entering IDLE_INNER state...
3046 Leaving INNER state... (ocount=000A)
3047 [in=F a1f=F a1=T zf=F z=F a2=F iif=F iii=F izf=F izi=F]
3048 Entering A1UPDATE state... (272/144 -> 262/145)
3049 [in=T a1f=F a1=F zf=F z=F a2=F iif=F iii=F izf=F izi=F]
3050 Entering INNER state...
3051*/
3052
3053 // Bugs in Jaguar I
3054
3055 a2addy = a1addy; // A2 channel Y add bit is tied to A1's
3056
3057//if (logBlit && (ocount > 20)) logBlit = false;
3058#ifdef VERBOSE_BLITTER_LOGGING
3059if (logBlit)
3060{
3061 WriteLog(" a1_base = %08X, a2_base = %08X\n", a1_base, a2_base);
3062 WriteLog(" a1_x = %04X, a1_y = %04X, a1_frac_x = %04X, a1_frac_y = %04X, a2_x = %04X, a2_y = %04X\n", (uint16_t)a1_x, (uint16_t)a1_y, a1_frac_x, a1_frac_y, (uint16_t)a2_x, (uint16_t)a2_y);
3063 WriteLog(" a1_step_x = %04X, a1_step_y = %04X, a1_stepf_x = %04X, a1_stepf_y = %04X, a2_step_x = %04X, a2_step_y = %04X\n", (uint16_t)a1_step_x, (uint16_t)a1_step_y, a1_stepf_x, a1_stepf_y, (uint16_t)a2_step_x, (uint16_t)a2_step_y);
3064 WriteLog(" a1_inc_x = %04X, a1_inc_y = %04X, a1_incf_x = %04X, a1_incf_y = %04X\n", (uint16_t)a1_inc_x, (uint16_t)a1_inc_y, a1_incf_x, a1_incf_y);
3065 WriteLog(" a1_win_x = %04X, a1_win_y = %04X, a2_mask_x = %04X, a2_mask_y = %04X\n", a1_win_x, a1_win_y, a2_mask_x, a2_mask_y);
3066 char x_add_str[4][4] = { "phr", "1", "0", "inc" };
3067 WriteLog(" a2_mask=%s a1add=%s%s/%s%s a2add=%s%s/%s%s\n", (a2_mask ? "T" : "F"), (a1xsign ? "-" : "+"), x_add_str[a1addx],
3068 (a1ysign ? "-" : "+"), (a1addy ? "1" : "0"), (a2xsign ? "-" : "+"), x_add_str[a2addx],
3069 (a2ysign ? "-" : "+"), (a2addy ? "1" : "0"));
3070 WriteLog(" a1_pixsize = %u, a2_pixsize = %u\n", a1_pixsize, a2_pixsize);
3071 WriteLog(" srcd=%08X%08X dstd=%08X%08X patd=%08X%08X iinc=%08X\n",
3072 (uint32_t)(srcd1 >> 32), (uint32_t)(srcd1 & 0xFFFFFFFF),
3073 (uint32_t)(dstd >> 32), (uint32_t)(dstd & 0xFFFFFFFF),
3074 (uint32_t)(patd >> 32), (uint32_t)(patd & 0xFFFFFFFF), iinc);
3075 WriteLog(" srcz1=%08X%08X srcz2=%08X%08X dstz=%08X%08X zinc=%08X, coll=%X\n",
3076 (uint32_t)(srcz1 >> 32), (uint32_t)(srcz1 & 0xFFFFFFFF),
3077 (uint32_t)(srcz2 >> 32), (uint32_t)(srcz2 & 0xFFFFFFFF),
3078 (uint32_t)(dstz >> 32), (uint32_t)(dstz & 0xFFFFFFFF), zinc, collision);
3079}
3080#endif
3081
3082 // Various state lines set up by user
3083
3084 bool phrase_mode = ((!dsta2 && a1addx == 0) || (dsta2 && a2addx == 0) ? true : false); // From ACONTROL
3085#ifdef VERBOSE_BLITTER_LOGGING
3086if (logBlit)
3087 WriteLog(" Phrase mode is %s\n", (phrase_mode ? "ON" : "off"));
3088#endif
3089//logBlit = false;
3090
3091 // Stopgap vars to simulate various lines
3092
3093 uint16_t a1FracCInX = 0, a1FracCInY = 0;
3094
3095 while (true)
3096 {
3097 // IDLE
3098
3099 if ((idle && !go) || (inner && outer0 && indone))
3100 {
3101#ifdef VERBOSE_BLITTER_LOGGING
3102if (logBlit)
3103 WriteLog(" Entering IDLE state...\n");
3104#endif
3105 idlei = true;
3106
3107//Instead of a return, let's try breaking out of the loop...
3108break;
3109// return;
3110 }
3111 else
3112 idlei = false;
3113
3114 // INNER LOOP ACTIVE
3115/*
3116 Entering DWRITE state... (icount=0000, inc=4)
3117 Entering IDLE_INNER state...
3118 Leaving INNER state... (ocount=00EF)
3119 [in=T a1f=F a1=T zf=F z=F a2=F iif=F iii=F izf=F izi=F]
3120 Entering INNER state...
3121Now:
3122 [in=F a1f=F a1=F zf=F z=F a2=F iif=F iii=F izf=F izi=F]
3123*/
3124
3125 if ((idle && go && !datinit)
3126 || (inner && !indone)
3127 || (inner && indone && !outer0 && !upda1f && !upda1 && notgzandp && !upda2 && !datinit)
3128 || (a1update && !upda2 && notgzandp && !datinit)
3129 || (zupdate && !upda2 && !datinit)
3130 || (a2update && !datinit)
3131 || (init_ii && !gourz)
3132 || (init_zi))
3133 {
3134 inneri = true;
3135 }
3136 else
3137 inneri = false;
3138
3139 // A1 FRACTION UPDATE
3140
3141 if (inner && indone && !outer0 && upda1f)
3142 {
3143 a1fupdatei = true;
3144 }
3145 else
3146 a1fupdatei = false;
3147
3148 // A1 POINTER UPDATE
3149
3150 if ((a1fupdate)
3151 || (inner && indone && !outer0 && !upda1f && upda1))
3152 {
3153 a1updatei = true;
3154 }
3155 else
3156 a1updatei = false;
3157
3158 // Z FRACTION UPDATE
3159
3160 if ((a1update && gourz && polygon)
3161 || (inner && indone && !outer0 && !upda1f && !upda1 && gourz && polygon))
3162 {
3163 zfupdatei = true;
3164 }
3165 else
3166 zfupdatei = false;
3167
3168 // Z INTEGER UPDATE
3169
3170 if (zfupdate)
3171 {
3172 zupdatei = true;
3173 }
3174 else
3175 zupdatei = false;
3176
3177 // A2 POINTER UPDATE
3178
3179 if ((a1update && upda2 && notgzandp)
3180 || (zupdate && upda2)
3181 || (inner && indone && !outer0 && !upda1f && notgzandp && !upda1 && upda2))
3182 {
3183 a2updatei = true;
3184 }
3185 else
3186 a2updatei = false;
3187
3188 // INITIALIZE INTENSITY FRACTION
3189
3190 if ((zupdate && !upda2 && datinit)
3191 || (a1update && !upda2 && datinit && notgzandp)
3192 || (inner && indone && !outer0 && !upda1f && !upda1 && notgzandp && !upda2 && datinit)
3193 || (a2update && datinit)
3194 || (idle && go && datinit))
3195 {
3196 init_ifi = true;
3197 }
3198 else
3199 init_ifi = false;
3200
3201 // INITIALIZE INTENSITY INTEGER
3202
3203 if (init_if)
3204 {
3205 init_iii = true;
3206 }
3207 else
3208 init_iii = false;
3209
3210 // INITIALIZE Z FRACTION
3211
3212 if (init_ii && gourz)
3213 {
3214 init_zfi = true;
3215 }
3216 else
3217 init_zfi = false;
3218
3219 // INITIALIZE Z INTEGER
3220
3221 if (init_zf)
3222 {
3223 init_zii = true;
3224 }
3225 else
3226 init_zii = false;
3227
3228// Here we move the fooi into their foo counterparts in order to simulate the moving
3229// of data into the various FDSYNCs... Each time we loop we simulate one clock cycle...
3230
3231 idle = idlei;
3232 inner = inneri;
3233 a1fupdate = a1fupdatei;
3234 a1update = a1updatei;
3235 zfupdate = zfupdatei; // *
3236 zupdate = zupdatei; // *
3237 a2update = a2updatei;
3238 init_if = init_ifi; // *
3239 init_ii = init_iii; // *
3240 init_zf = init_zfi; // *
3241 init_zi = init_zii; // *
3242// * denotes states that will never assert for Jaguar I
3243#ifdef VERBOSE_BLITTER_LOGGING
3244if (logBlit)
3245 WriteLog(" [in=%c a1f=%c a1=%c zf=%c z=%c a2=%c iif=%c iii=%c izf=%c izi=%c]\n",
3246 (inner ? 'T' : 'F'), (a1fupdate ? 'T' : 'F'), (a1update ? 'T' : 'F'),
3247 (zfupdate ? 'T' : 'F'), (zupdate ? 'T' : 'F'), (a2update ? 'T' : 'F'),
3248 (init_if ? 'T' : 'F'), (init_ii ? 'T' : 'F'), (init_zf ? 'T' : 'F'),
3249 (init_zi ? 'T' : 'F'));
3250#endif
3251
3252// Now, depending on how we want to handle things, we could either put the implementation
3253// of the various pieces up above, or handle them down below here.
3254
3255// Let's try postprocessing for now...
3256
3257 if (inner)
3258 {
3259 indone = false;
3260#ifdef VERBOSE_BLITTER_LOGGING
3261if (logBlit)
3262 WriteLog(" Entering INNER state...\n");
3263#endif
3264 uint16_t icount = GET16(blitter_ram, PIXLINECOUNTER + 2);
3265 bool idle_inner = true, step = true, sreadx = false, szreadx = false, sread = false,
3266 szread = false, dread = false, dzread = false, dwrite = false, dzwrite = false;
3267 bool inner0 = false;
3268 bool idle_inneri, sreadxi, szreadxi, sreadi, szreadi, dreadi, dzreadi, dwritei, dzwritei;
3269
3270 // State lines that will never assert in Jaguar I
3271
3272 bool textext = false, txtread = false;
3273
3274//other stuff
3275uint8_t srcshift = 0;
3276bool sshftld = true; // D flipflop (D -> Q): instart -> sshftld
3277//NOTE: sshftld probably is only asserted at the beginning of the inner loop. !!! FIX !!!
3278/*
3279Blit! (CMD = 01800005)
3280Flags: SRCEN SRCENX LFUFUNC=C
3281 count = 626 x 1
3282 a1_base = 00037290, a2_base = 000095D0
3283 a1_x = 0000, a1_y = 0000, a2_x = 0002, a2_y = 0000
3284 a1_pixsize = 4, a2_pixsize = 4
3285 srcd=0000000000000000, dstd=0000000000000000, patd=0000000000000000
3286 Phrase mode is ON
3287 [in=T a1f=F a1=F zf=F z=F a2=F iif=F iii=F izf=F izi=F]
3288 Entering INNER state...
3289 Entering SREADX state... [dstart=0 dend=20 pwidth=8 srcshift=20]
3290 Source extra read address/pix address: 000095D4/0 [0000001C00540038]
3291 Entering A2_ADD state [a2_x=0002, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
3292 Entering SREAD state... [dstart=0 dend=20 pwidth=8 srcshift=0]
3293 Source read address/pix address: 000095D8/0 [0054003800009814]
3294 Entering A2_ADD state [a2_x=0004, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
3295 Entering DWRITE state...
3296 Dest write address/pix address: 00037290/0 [dstart=0 dend=20 pwidth=8 srcshift=0] (icount=026E, inc=4)
3297 Entering A1_ADD state [a1_x=0000, a1_y=0000, addasel=0, addbsel=0, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
3298 Entering SREAD state... [dstart=0 dend=20 pwidth=8 srcshift=0]
3299 Source read address/pix address: 000095E0/0 [00009968000377C7]
3300 Entering A2_ADD state [a2_x=0008, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
3301 Entering DWRITE state...
3302 Dest write address/pix address: 00037298/0 [dstart=0 dend=20 pwidth=8 srcshift=0] (icount=026A, inc=4)
3303 Entering A1_ADD state [a1_x=0004, a1_y=0000, addasel=0, addbsel=0, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
3304*/
3305
3306// while (!idle_inner)
3307 while (true)
3308 {
3309 // IDLE
3310
3311 if ((idle_inner && !step)
3312 || (dzwrite && step && inner0)
3313 || (dwrite && step && !dstwrz && inner0))
3314 {
3315#ifdef VERBOSE_BLITTER_LOGGING
3316if (logBlit)
3317 WriteLog(" Entering IDLE_INNER state...\n");
3318#endif
3319 idle_inneri = true;
3320break;
3321 }
3322 else
3323 idle_inneri = false;
3324
3325 // EXTRA SOURCE DATA READ
3326
3327 if ((idle_inner && step && srcenx)
3328 || (sreadx && !step))
3329 {
3330 sreadxi = true;
3331 }
3332 else
3333 sreadxi = false;
3334
3335 // EXTRA SOURCE ZED READ
3336
3337 if ((sreadx && step && srcenz)
3338 || (szreadx && !step))
3339 {
3340 szreadxi = true;
3341 }
3342 else
3343 szreadxi = false;
3344
3345 // TEXTURE DATA READ (not implemented because not in Jaguar I)
3346
3347 // SOURCE DATA READ
3348
3349 if ((szreadx && step && !textext)
3350 || (sreadx && step && !srcenz && srcen)
3351 || (idle_inner && step && !srcenx && !textext && srcen)
3352 || (dzwrite && step && !inner0 && !textext && srcen)
3353 || (dwrite && step && !dstwrz && !inner0 && !textext && srcen)
3354 || (txtread && step && srcen)
3355 || (sread && !step))
3356 {
3357 sreadi = true;
3358 }
3359 else
3360 sreadi = false;
3361
3362 // SOURCE ZED READ
3363
3364 if ((sread && step && srcenz)
3365 || (szread && !step))
3366 {
3367 szreadi = true;
3368 }
3369 else
3370 szreadi = false;
3371
3372 // DESTINATION DATA READ
3373
3374 if ((szread && step && dsten)
3375 || (sread && step && !srcenz && dsten)
3376 || (sreadx && step && !srcenz && !textext && !srcen && dsten)
3377 || (idle_inner && step && !srcenx && !textext && !srcen && dsten)
3378 || (dzwrite && step && !inner0 && !textext && !srcen && dsten)
3379 || (dwrite && step && !dstwrz && !inner0 && !textext && !srcen && dsten)
3380 || (txtread && step && !srcen && dsten)
3381 || (dread && !step))
3382 {
3383 dreadi = true;
3384 }
3385 else
3386 dreadi = false;
3387
3388 // DESTINATION ZED READ
3389
3390 if ((dread && step && dstenz)
3391 || (szread && step && !dsten && dstenz)
3392 || (sread && step && !srcenz && !dsten && dstenz)
3393 || (sreadx && step && !srcenz && !textext && !srcen && !dsten && dstenz)
3394 || (idle_inner && step && !srcenx && !textext && !srcen && !dsten && dstenz)
3395 || (dzwrite && step && !inner0 && !textext && !srcen && !dsten && dstenz)
3396 || (dwrite && step && !dstwrz && !inner0 && !textext && !srcen && !dsten && dstenz)
3397 || (txtread && step && !srcen && !dsten && dstenz)
3398 || (dzread && !step))
3399 {
3400 dzreadi = true;
3401 }
3402 else
3403 dzreadi = false;
3404
3405 // DESTINATION DATA WRITE
3406
3407 if ((dzread && step)
3408 || (dread && step && !dstenz)
3409 || (szread && step && !dsten && !dstenz)
3410 || (sread && step && !srcenz && !dsten && !dstenz)
3411 || (txtread && step && !srcen && !dsten && !dstenz)
3412 || (sreadx && step && !srcenz && !textext && !srcen && !dsten && !dstenz)
3413 || (idle_inner && step && !srcenx && !textext && !srcen && !dsten && !dstenz)
3414 || (dzwrite && step && !inner0 && !textext && !srcen && !dsten && !dstenz)
3415 || (dwrite && step && !dstwrz && !inner0 && !textext && !srcen && !dsten && !dstenz)
3416 || (dwrite && !step))
3417 {
3418 dwritei = true;
3419 }
3420 else
3421 dwritei = false;
3422
3423 // DESTINATION ZED WRITE
3424
3425 if ((dzwrite && !step)
3426 || (dwrite && step && dstwrz))
3427 {
3428 dzwritei = true;
3429 }
3430 else
3431 dzwritei = false;
3432
3433//Kludge: A QnD way to make sure that sshftld is asserted only for the first
3434// cycle of the inner loop...
3435sshftld = idle_inner;
3436
3437// Here we move the fooi into their foo counterparts in order to simulate the moving
3438// of data into the various FDSYNCs... Each time we loop we simulate one clock cycle...
3439
3440 idle_inner = idle_inneri;
3441 sreadx = sreadxi;
3442 szreadx = szreadxi;
3443 sread = sreadi;
3444 szread = szreadi;
3445 dread = dreadi;
3446 dzread = dzreadi;
3447 dwrite = dwritei;
3448 dzwrite = dzwritei;
3449
3450// Here's a few more decodes--not sure if they're supposed to go here or not...
3451
3452 bool srca_addi = (sreadxi && !srcenz) || (sreadi && !srcenz) || szreadxi || szreadi;
3453
3454 bool dsta_addi = (dwritei && !dstwrz) || dzwritei;
3455
3456 bool gensrc = sreadxi || szreadxi || sreadi || szreadi;
3457 bool gendst = dreadi || dzreadi || dwritei || dzwritei;
3458 bool gena2i = (gensrc && !dsta2) || (gendst && dsta2);
3459
3460 bool zaddr = szreadx || szread || dzread || dzwrite;
3461
3462// Some stuff from MCONTROL.NET--not sure if this is the correct use of this decode or not...
3463/*Fontread\ := OND1 (fontread\, sread[1], sreadx[1], bcompen);
3464Fontread := INV1 (fontread, fontread\);
3465Justt := NAN3 (justt, fontread\, phrase_mode, tactive\);
3466Justify := TS (justify, justt, busen);*/
3467bool fontread = (sread || sreadx) && bcompen;
3468bool justify = !(!fontread && phrase_mode /*&& tactive*/);
3469
3470/* Generate inner loop update enables */
3471/*
3472A1_addi := MX2 (a1_addi, dsta_addi, srca_addi, dsta2);
3473A2_addi := MX2 (a2_addi, srca_addi, dsta_addi, dsta2);
3474A1_add := FD1 (a1_add, a1_add\, a1_addi, clk);
3475A2_add := FD1 (a2_add, a2_add\, a2_addi, clk);
3476A2_addb := BUF1 (a2_addb, a2_add);
3477*/
3478 bool a1_add = (dsta2 ? srca_addi : dsta_addi);
3479 bool a2_add = (dsta2 ? dsta_addi : srca_addi);
3480
3481/* Address adder input A register selection
3482000 A1 step integer part
3483001 A1 step fraction part
3484010 A1 increment integer part
3485011 A1 increment fraction part
3486100 A2 step
3487
3488bit 2 = a2update
3489bit 1 = /a2update . (a1_add . a1addx[0..1])
3490bit 0 = /a2update . ( a1fupdate
3491 + a1_add . atick[0] . a1addx[0..1])
3492The /a2update term on bits 0 and 1 is redundant.
3493Now look-ahead based
3494*/
3495 uint8_t addasel = (a1fupdate || (a1_add && a1addx == 3) ? 0x01 : 0x00);
3496 addasel |= (a1_add && a1addx == 3 ? 0x02 : 0x00);
3497 addasel |= (a2update ? 0x04 : 0x00);
3498/* Address adder input A X constant selection
3499adda_xconst[0..2] generate a power of 2 in the range 1-64 or all
3500zeroes when they are all 1
3501Remember - these are pixels, so to add one phrase the pixel size
3502has to be taken into account to get the appropriate value.
3503for A1
3504 if a1addx[0..1] are 00 set 6 - pixel size
3505 if a1addx[0..1] are 01 set the value 000
3506 if a1addx[0..1] are 10 set the value 111
3507similarly for A2
3508JLH: Also, 11 will likewise set the value to 111
3509*/
3510 uint8_t a1_xconst = 6 - a1_pixsize, a2_xconst = 6 - a2_pixsize;
3511
3512 if (a1addx == 1)
3513 a1_xconst = 0;
3514 else if (a1addx & 0x02)
3515 a1_xconst = 7;
3516
3517 if (a2addx == 1)
3518 a2_xconst = 0;
3519 else if (a2addx & 0x02)
3520 a2_xconst = 7;
3521
3522 uint8_t adda_xconst = (a2_add ? a2_xconst : a1_xconst);
3523/* Address adder input A Y constant selection
352422 June 94 - This was erroneous, because only the a1addy bit was reflected here.
3525Therefore, the selection has to be controlled by a bug fix bit.
3526JLH: Bug fix bit in Jaguar II--not in Jaguar I!
3527*/
3528 bool adda_yconst = a1addy;
3529/* Address adder input A register versus constant selection
3530given by a1_add . a1addx[0..1]
3531 + a1update
3532 + a1fupdate
3533 + a2_add . a2addx[0..1]
3534 + a2update
3535*/
3536 bool addareg = ((a1_add && a1addx == 3) || a1update || a1fupdate
3537 || (a2_add && a2addx == 3) || a2update ? true : false);
3538/* The adders can be put into subtract mode in add pixel size
3539mode when the corresponding flags are set */
3540 bool suba_x = ((a1_add && a1xsign && a1addx == 1) || (a2_add && a2xsign && a2addx == 1) ? true : false);
3541 bool suba_y = ((a1_add && a1addy && a1ysign) || (a2_add && a2addy && a2ysign) ? true : false);
3542/* Address adder input B selection
354300 A1 pointer
354401 A2 pointer
354510 A1 fraction
354611 Zero
3547
3548Bit 1 = a1fupdate
3549 + (a1_add . atick[0] . a1addx[0..1])
3550 + a1fupdate . a1_stepld
3551 + a1update . a1_stepld
3552 + a2update . a2_stepld
3553Bit 0 = a2update + a2_add
3554 + a1fupdate . a1_stepld
3555 + a1update . a1_stepld
3556 + a2update . a2_stepld
3557*/
3558 uint8_t addbsel = (a2update || a2_add || (a1fupdate && a1_stepld)
3559 || (a1update && a1_stepld) || (a2update && a2_stepld) ? 0x01 : 0x00);
3560 addbsel |= (a1fupdate || (a1_add && a1addx == 3) || (a1fupdate && a1_stepld)
3561 || (a1update && a1_stepld) || (a2update && a2_stepld) ? 0x02 : 0x00);
3562
3563/* The modulo bits are used to align X onto a phrase boundary when
3564it is being updated by one phrase
3565000 no mask
3566001 mask bit 0
3567010 mask bits 1-0
3568..
3569110 mask bits 5-0
3570
3571Masking is enabled for a1 when a1addx[0..1] is 00, and the value
3572is 6 - the pixel size (again!)
3573*/
3574 uint8_t maska1 = (a1_add && a1addx == 0 ? 6 - a1_pixsize : 0);
3575 uint8_t maska2 = (a2_add && a2addx == 0 ? 6 - a2_pixsize : 0);
3576 uint8_t modx = (a2_add ? maska2 : maska1);
3577/* Generate load strobes for the increment updates */
3578
3579/*A1pldt := NAN2 (a1pldt, atick[1], a1_add);
3580A1ptrldi := NAN2 (a1ptrldi, a1update\, a1pldt);
3581
3582A1fldt := NAN4 (a1fldt, atick[0], a1_add, a1addx[0..1]);
3583A1fracldi := NAN2 (a1fracldi, a1fupdate\, a1fldt);
3584
3585A2pldt := NAN2 (a2pldt, atick[1], a2_add);
3586A2ptrldi := NAN2 (a2ptrldi, a2update\, a2pldt);*/
3587 bool a1fracldi = a1fupdate || (a1_add && a1addx == 3);
3588
3589// Some more from DCONTROL...
3590// atick[] just MAY be important here! We're assuming it's true and dropping the term...
3591// That will probably screw up some of the lower terms that seem to rely on the timing of it...
3592#ifdef _MSC_VER
3593#pragma message("Warning: srcdreadd is not properly initialized!")
3594#else
3595#warning "srcdreadd is not properly initialized!"
3596#endif // _MSC_VER
3597bool srcdreadd = false; // Set in INNER.NET
3598//Shadeadd\ := NAN2H (shadeadd\, dwrite, srcshade);
3599//Shadeadd := INV2 (shadeadd, shadeadd\);
3600bool shadeadd = dwrite && srcshade;
3601/* Data adder control, input A selection
3602000 Destination data
3603001 Initialiser pixel value
3604100 Source data - computed intensity fraction
3605101 Pattern data - computed intensity
3606110 Source zed 1 - computed zed
3607111 Source zed 2 - computed zed fraction
3608
3609Bit 0 = dwrite . gourd . atick[1]
3610 + dzwrite . gourz . atick[0]
3611 + istepadd
3612 + zstepfadd
3613 + init_if + init_ii + init_zf + init_zi
3614Bit 1 = dzwrite . gourz . (atick[0] + atick[1])
3615 + zstepadd
3616 + zstepfadd
3617Bit 2 = (gourd + gourz) . /(init_if + init_ii + init_zf + init_zi)
3618 + dwrite . srcshade
3619*/
3620uint8_t daddasel = ((dwrite && gourd) || (dzwrite && gourz) || istepadd || zstepfadd
3621 || init_if || init_ii || init_zf || init_zi ? 0x01 : 0x00);
3622daddasel |= ((dzwrite && gourz) || zstepadd || zstepfadd ? 0x02 : 0x00);
3623daddasel |= (((gourd || gourz) && !(init_if || init_ii || init_zf || init_zi))
3624 || (dwrite && srcshade) ? 0x04 : 0x00);
3625/* Data adder control, input B selection
36260000 Source data
36270001 Data initialiser increment
36280100 Bottom 16 bits of I increment repeated four times
36290101 Top 16 bits of I increment repeated four times
36300110 Bottom 16 bits of Z increment repeated four times
36310111 Top 16 bits of Z increment repeated four times
36321100 Bottom 16 bits of I step repeated four times
36331101 Top 16 bits of I step repeated four times
36341110 Bottom 16 bits of Z step repeated four times
36351111 Top 16 bits of Z step repeated four times
3636
3637Bit 0 = dwrite . gourd . atick[1]
3638 + dzwrite . gourz . atick[1]
3639 + dwrite . srcshade
3640 + istepadd
3641 + zstepadd
3642 + init_if + init_ii + init_zf + init_zi
3643Bit 1 = dzwrite . gourz . (atick[0] + atick[1])
3644 + zstepadd
3645 + zstepfadd
3646Bit 2 = dwrite . gourd . (atick[0] + atick[1])
3647 + dzwrite . gourz . (atick[0] + atick[1])
3648 + dwrite . srcshade
3649 + istepadd + istepfadd + zstepadd + zstepfadd
3650Bit 3 = istepadd + istepfadd + zstepadd + zstepfadd
3651*/
3652uint8_t daddbsel = ((dwrite && gourd) || (dzwrite && gourz) || (dwrite && srcshade)
3653 || istepadd || zstepadd || init_if || init_ii || init_zf || init_zi ? 0x01 : 0x00);
3654daddbsel |= ((dzwrite && gourz) || zstepadd || zstepfadd ? 0x02 : 0x00);
3655daddbsel |= ((dwrite && gourd) || (dzwrite && gourz) || (dwrite && srcshade)
3656 || istepadd || istepfadd || zstepadd || zstepfadd ? 0x04 : 0x00);
3657daddbsel |= (istepadd && istepfadd && zstepadd && zstepfadd ? 0x08 : 0x00);
3658/* Data adder mode control
3659000 16-bit normal add
3660001 16-bit saturating add with carry
3661010 8-bit saturating add with carry, carry into top byte is
3662 inhibited (YCrCb)
3663011 8-bit saturating add with carry, carry into top byte and
3664 between top nybbles is inhibited (CRY)
3665100 16-bit normal add with carry
3666101 16-bit saturating add
3667110 8-bit saturating add, carry into top byte is inhibited
3668111 8-bit saturating add, carry into top byte and between top
3669 nybbles is inhibited
3670
3671The first five are used for Gouraud calculations, the latter three
3672for adding source and destination data
3673
3674Bit 0 = dzwrite . gourz . atick[1]
3675 + dwrite . gourd . atick[1] . /topnen . /topben . /ext_int
3676 + dwrite . gourd . atick[1] . topnen . topben . /ext_int
3677 + zstepadd
3678 + istepadd . /topnen . /topben . /ext_int
3679 + istepadd . topnen . topben . /ext_int
3680 + /gourd . /gourz . /topnen . /topben
3681 + /gourd . /gourz . topnen . topben
3682 + shadeadd . /topnen . /topben
3683 + shadeadd . topnen . topben
3684 + init_ii . /topnen . /topben . /ext_int
3685 + init_ii . topnen . topben . /ext_int
3686 + init_zi
3687
3688Bit 1 = dwrite . gourd . atick[1] . /topben . /ext_int
3689 + istepadd . /topben . /ext_int
3690 + /gourd . /gourz . /topben
3691 + shadeadd . /topben
3692 + init_ii . /topben . /ext_int
3693
3694Bit 2 = /gourd . /gourz
3695 + shadeadd
3696 + dwrite . gourd . atick[1] . ext_int
3697 + istepadd . ext_int
3698 + init_ii . ext_int
3699*/
3700uint8_t daddmode = ((dzwrite && gourz) || (dwrite && gourd && !topnen && !topben && !ext_int)
3701 || (dwrite && gourd && topnen && topben && !ext_int) || zstepadd
3702 || (istepadd && !topnen && !topben && !ext_int)
3703 || (istepadd && topnen && topben && !ext_int) || (!gourd && !gourz && !topnen && !topben)
3704 || (!gourd && !gourz && topnen && topben) || (shadeadd && !topnen && !topben)
3705 || (shadeadd && topnen && topben) || (init_ii && !topnen && !topben && !ext_int)
3706 || (init_ii && topnen && topben && !ext_int) || init_zi ? 0x01 : 0x00);
3707daddmode |= ((dwrite && gourd && !topben && !ext_int) || (istepadd && !topben && !ext_int)
3708 || (!gourd && !gourz && !topben) || (shadeadd && !topben)
3709 || (init_ii && !topben && !ext_int) ? 0x02 : 0x00);
3710daddmode |= ((!gourd && !gourz) || shadeadd || (dwrite && gourd && ext_int)
3711 || (istepadd && ext_int) || (init_ii && ext_int) ? 0x04 : 0x00);
3712/* Data add load controls
3713Pattern fraction (dest data) is loaded on
3714 dwrite . gourd . atick[0]
3715 + istepfadd . /datinit
3716 + init_if
3717Pattern data is loaded on
3718 dwrite . gourd . atick[1]
3719 + istepadd . /datinit . /datinit
3720 + init_ii
3721Source z1 is loaded on
3722 dzwrite . gourz . atick[1]
3723 + zstepadd . /datinit . /datinit
3724 + init_zi
3725Source z2 is loaded on
3726 dzwrite . gourz . atick[0]
3727 + zstepfadd
3728 + init_zf
3729Texture map shaded data is loaded on
3730 srcdreadd . srcshade
3731*/
3732bool patfadd = (dwrite && gourd) || (istepfadd && !datinit) || init_if;
3733bool patdadd = (dwrite && gourd) || (istepadd && !datinit) || init_ii;
3734bool srcz1add = (dzwrite && gourz) || (zstepadd && !datinit) || init_zi;
3735bool srcz2add = (dzwrite && gourz) || zstepfadd || init_zf;
3736bool srcshadd = srcdreadd && srcshade;
3737bool daddq_sel = patfadd || patdadd || srcz1add || srcz2add || srcshadd;
3738/* Select write data
3739This has to be controlled from stage 1 of the pipe-line, delayed
3740by one tick, as the write occurs in the cycle after the ack.
3741
374200 pattern data
374301 lfu data
374410 adder output
374511 source zed
3746
3747Bit 0 = /patdsel . /adddsel
3748 + dzwrite1d
3749Bit 1 = adddsel
3750 + dzwrite1d
3751*/
3752uint8_t data_sel = ((!patdsel && !adddsel) || dzwrite ? 0x01 : 0x00)
3753 | (adddsel || dzwrite ? 0x02 : 0x00);
3754
3755uint32_t address, pixAddr;
3756ADDRGEN(address, pixAddr, gena2i, zaddr,
3757 a1_x, a1_y, a1_base, a1_pitch, a1_pixsize, a1_width, a1_zoffset,
3758 a2_x, a2_y, a2_base, a2_pitch, a2_pixsize, a2_width, a2_zoffset);
3759
3760//Here's my guess as to how the addresses get truncated to phrase boundaries in phrase mode...
3761if (!justify)
3762 address &= 0xFFFFF8;
3763
3764/* Generate source alignment shift
3765 -------------------------------
3766The source alignment shift for data move is the difference between
3767the source and destination X pointers, multiplied by the pixel
3768size. Only the low six bits of the pointers are of interest, as
3769pixel sizes are always a power of 2 and window rows are always
3770phrase aligned.
3771
3772When not in phrase mode, the top 3 bits of the shift value are
3773set to zero (2/26).
3774
3775Source shifting is also used to extract bits for bit-to-byte
3776expansion in phrase mode. This involves only the bottom three
3777bits of the shift value, and is based on the offset within the
3778phrase of the destination X pointer, in pixels.
3779
3780Source shifting is disabled when srcen is not set.
3781*/
3782uint8_t dstxp = (dsta2 ? a2_x : a1_x) & 0x3F;
3783uint8_t srcxp = (dsta2 ? a1_x : a2_x) & 0x3F;
3784uint8_t shftv = ((dstxp - srcxp) << pixsize) & 0x3F;
3785/* The phrase mode alignment count is given by the phrase offset
3786of the first pixel, for bit to byte expansion */
3787uint8_t pobb = 0;
3788
3789if (pixsize == 3)
3790 pobb = dstxp & 0x07;
3791if (pixsize == 4)
3792 pobb = dstxp & 0x03;
3793if (pixsize == 5)
3794 pobb = dstxp & 0x01;
3795
3796bool pobbsel = phrase_mode && bcompen;
3797uint8_t loshd = (pobbsel ? pobb : shftv) & 0x07;
3798uint8_t shfti = (srcen || pobbsel ? (sshftld ? loshd : srcshift & 0x07) : 0);
3799/* Enable for high bits is srcen . phrase_mode */
3800shfti |= (srcen && phrase_mode ? (sshftld ? shftv & 0x38 : srcshift & 0x38) : 0);
3801srcshift = shfti;
3802
3803 if (sreadx)
3804 {
3805#ifdef VERBOSE_BLITTER_LOGGING
3806if (logBlit)
3807 WriteLog(" Entering SREADX state...");
3808#endif
3809//uint32_t srcAddr, pixAddr;
3810//ADDRGEN(srcAddr, pixAddr, gena2i, zaddr,
3811// a1_x, a1_y, a1_base, a1_pitch, a1_pixsize, a1_width, a1_zoffset,
3812// a2_x, a2_y, a2_base, a2_pitch, a2_pixsize, a2_width, a2_zoffset);
3813 srcd2 = srcd1;
3814 srcd1 = ((uint64_t)JaguarReadLong(address + 0, BLITTER) << 32)
3815 | (uint64_t)JaguarReadLong(address + 4, BLITTER);
3816//Kludge to take pixel size into account...
3817//Hmm. If we're not in phrase mode, this is most likely NOT going to be used...
3818//Actually, it would be--because of BCOMPEN expansion, for example...
3819if (!phrase_mode)
3820{
3821 if (bcompen)
3822 srcd1 >>= 56;
3823 else
3824 {
3825 if (pixsize == 5)
3826 srcd1 >>= 32;
3827 else if (pixsize == 4)
3828 srcd1 >>= 48;
3829 else
3830 srcd1 >>= 56;
3831 }
3832}//*/
3833#ifdef VERBOSE_BLITTER_LOGGING
3834if (logBlit)
3835 WriteLog(" Source extra read address/pix address: %08X/%1X [%08X%08X]\n",
3836 address, pixAddr, (uint32_t)(srcd1 >> 32), (uint32_t)(srcd1 & 0xFFFFFFFF));
3837#endif
3838 }
3839
3840 if (szreadx)
3841 {
3842#ifdef VERBOSE_BLITTER_LOGGING
3843if (logBlit)
3844 WriteLog(" Entering SZREADX state...");
3845#endif
3846 srcz2 = srcz1;
3847 srcz1 = ((uint64_t)JaguarReadLong(address, BLITTER) << 32) | (uint64_t)JaguarReadLong(address + 4, BLITTER);
3848#ifdef VERBOSE_BLITTER_LOGGING
3849if (logBlit)
3850 WriteLog(" Src Z extra read address/pix address: %08X/%1X [%08X%08X]\n", address, pixAddr,
3851 (uint32_t)(dstz >> 32), (uint32_t)(dstz & 0xFFFFFFFF));
3852#endif
3853 }
3854
3855 if (sread)
3856 {
3857#ifdef VERBOSE_BLITTER_LOGGING
3858if (logBlit)
3859 WriteLog(" Entering SREAD state...");
3860#endif
3861//uint32_t srcAddr, pixAddr;
3862//ADDRGEN(srcAddr, pixAddr, gena2i, zaddr,
3863// a1_x, a1_y, a1_base, a1_pitch, a1_pixsize, a1_width, a1_zoffset,
3864// a2_x, a2_y, a2_base, a2_pitch, a2_pixsize, a2_width, a2_zoffset);
3865srcd2 = srcd1;
3866srcd1 = ((uint64_t)JaguarReadLong(address, BLITTER) << 32) | (uint64_t)JaguarReadLong(address + 4, BLITTER);
3867//Kludge to take pixel size into account...
3868if (!phrase_mode)
3869{
3870 if (bcompen)
3871 srcd1 >>= 56;
3872 else
3873 {
3874 if (pixsize == 5)
3875 srcd1 >>= 32;
3876 else if (pixsize == 4)
3877 srcd1 >>= 48;
3878 else
3879 srcd1 >>= 56;
3880 }
3881}
3882#ifdef VERBOSE_BLITTER_LOGGING
3883if (logBlit)
3884{
3885WriteLog(" Source read address/pix address: %08X/%1X [%08X%08X]\n", address, pixAddr,
3886 (uint32_t)(srcd1 >> 32), (uint32_t)(srcd1 & 0xFFFFFFFF));
3887//fflush(stdout);
3888}
3889#endif
3890 }
3891
3892 if (szread)
3893 {
3894#ifdef VERBOSE_BLITTER_LOGGING
3895if (logBlit)
3896{
3897WriteLog(" Entering SZREAD state...");
3898//fflush(stdout);
3899}
3900#endif
3901 srcz2 = srcz1;
3902 srcz1 = ((uint64_t)JaguarReadLong(address, BLITTER) << 32) | (uint64_t)JaguarReadLong(address + 4, BLITTER);
3903//Kludge to take pixel size into account... I believe that it only has to take 16BPP mode into account. Not sure tho.
3904if (!phrase_mode && pixsize == 4)
3905 srcz1 >>= 48;
3906
3907#ifdef VERBOSE_BLITTER_LOGGING
3908if (logBlit)
3909{
3910 WriteLog(" Src Z read address/pix address: %08X/%1X [%08X%08X]\n", address, pixAddr,
3911 (uint32_t)(dstz >> 32), (uint32_t)(dstz & 0xFFFFFFFF));
3912}
3913#endif
3914 }
3915
3916 if (dread)
3917 {
3918#ifdef VERBOSE_BLITTER_LOGGING
3919if (logBlit)
3920 WriteLog(" Entering DREAD state...");
3921#endif
3922//uint32_t dstAddr, pixAddr;
3923//ADDRGEN(dstAddr, pixAddr, gena2i, zaddr,
3924// a1_x, a1_y, a1_base, a1_pitch, a1_pixsize, a1_width, a1_zoffset,
3925// a2_x, a2_y, a2_base, a2_pitch, a2_pixsize, a2_width, a2_zoffset);
3926dstd = ((uint64_t)JaguarReadLong(address, BLITTER) << 32) | (uint64_t)JaguarReadLong(address + 4, BLITTER);
3927//Kludge to take pixel size into account...
3928if (!phrase_mode)
3929{
3930 if (pixsize == 5)
3931 dstd >>= 32;
3932 else if (pixsize == 4)
3933 dstd >>= 48;
3934 else
3935 dstd >>= 56;
3936}
3937#ifdef VERBOSE_BLITTER_LOGGING
3938if (logBlit)
3939 WriteLog(" Dest read address/pix address: %08X/%1X [%08X%08X]\n", address,
3940 pixAddr, (uint32_t)(dstd >> 32), (uint32_t)(dstd & 0xFFFFFFFF));
3941#endif
3942 }
3943
3944 if (dzread)
3945 {
3946// Is Z always 64 bit read? Or sometimes 16 bit (dependent on phrase_mode)?
3947#ifdef VERBOSE_BLITTER_LOGGING
3948if (logBlit)
3949 WriteLog(" Entering DZREAD state...");
3950#endif
3951 dstz = ((uint64_t)JaguarReadLong(address, BLITTER) << 32) | (uint64_t)JaguarReadLong(address + 4, BLITTER);
3952//Kludge to take pixel size into account... I believe that it only has to take 16BPP mode into account. Not sure tho.
3953if (!phrase_mode && pixsize == 4)
3954 dstz >>= 48;
3955
3956#ifdef VERBOSE_BLITTER_LOGGING
3957if (logBlit)
3958 WriteLog(" Dest Z read address/pix address: %08X/%1X [%08X%08X]\n", address,
3959 pixAddr, (uint32_t)(dstz >> 32), (uint32_t)(dstz & 0xFFFFFFFF));
3960#endif
3961 }
3962
3963// These vars should probably go further up in the code... !!! FIX !!!
3964// We can't preassign these unless they're static...
3965//uint64_t srcz = 0; // These are assigned to shut up stupid compiler warnings--dwrite is ALWAYS asserted
3966//bool winhibit = false;
3967uint64_t srcz;
3968bool winhibit;
3969//NOTE: SRCSHADE requires GOURZ to be set to work properly--another Jaguar I bug
3970 if (dwrite)
3971 {
3972#ifdef VERBOSE_BLITTER_LOGGING
3973if (logBlit)
3974 WriteLog(" Entering DWRITE state...");
3975#endif
3976//Counter is done on the dwrite state...! (We'll do it first, since it affects dstart/dend calculations.)
3977//Here's the voodoo for figuring the correct amount of pixels in phrase mode (or not):
3978 int8_t inct = -((dsta2 ? a2_x : a1_x) & 0x07); // From INNER_CNT
3979 uint8_t inc = 0;
3980 inc = (!phrase_mode || (phrase_mode && (inct & 0x01)) ? 0x01 : 0x00);
3981 inc |= (phrase_mode && (((pixsize == 3 || pixsize == 4) && (inct & 0x02)) || pixsize == 5 && !(inct & 0x01)) ? 0x02 : 0x00);
3982 inc |= (phrase_mode && ((pixsize == 3 && (inct & 0x04)) || (pixsize == 4 && !(inct & 0x03))) ? 0x04 : 0x00);
3983 inc |= (phrase_mode && pixsize == 3 && !(inct & 0x07) ? 0x08 : 0x00);
3984
3985 uint16_t oldicount = icount; // Save icount to detect underflow...
3986 icount -= inc;
3987
3988 if (icount == 0 || ((icount & 0x8000) && !(oldicount & 0x8000)))
3989 inner0 = true;
3990// X/Y stepping is also done here, I think...No. It's done when a1_add or a2_add is asserted...
3991
3992//*********************************************************************************
3993//Start & end write mask computations...
3994//*********************************************************************************
3995
3996uint8_t dstart = 0;
3997
3998if (pixsize == 3)
3999 dstart = (dstxp & 0x07) << 3;
4000if (pixsize == 4)
4001 dstart = (dstxp & 0x03) << 4;
4002if (pixsize == 5)
4003 dstart = (dstxp & 0x01) << 5;
4004
4005dstart = (phrase_mode ? dstart : pixAddr & 0x07);
4006
4007//This is the other Jaguar I bug... Normally, should ALWAYS select a1_x here.
4008uint16_t dstxwr = (dsta2 ? a2_x : a1_x) & 0x7FFE;
4009uint16_t pseq = dstxwr ^ (a1_win_x & 0x7FFE);
4010pseq = (pixsize == 5 ? pseq : pseq & 0x7FFC);
4011pseq = ((pixsize & 0x06) == 4 ? pseq : pseq & 0x7FF8);
4012bool penden = clip_a1 && (pseq == 0);
4013uint8_t window_mask = 0;
4014
4015if (pixsize == 3)
4016 window_mask = (a1_win_x & 0x07) << 3;
4017if (pixsize == 4)
4018 window_mask = (a1_win_x & 0x03) << 4;
4019if (pixsize == 5)
4020 window_mask = (a1_win_x & 0x01) << 5;
4021
4022window_mask = (penden ? window_mask : 0);
4023
4024/*
4025 Entering SREADX state... [dstart=0 dend=20 pwidth=8 srcshift=20]
4026 Source extra read address/pix address: 000095D0/0 [000004E40000001C]
4027 Entering A2_ADD state [a2_x=0002, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
4028 Entering SREAD state... [dstart=0 dend=20 pwidth=8 srcshift=20]
4029 Source read address/pix address: 000095D8/0 [0054003800009814]
4030 Entering A2_ADD state [a2_x=0004, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
4031 Entering DWRITE state...
4032 Dest write address/pix address: 00037290/0 [dstart=0 dend=20 pwidth=8 srcshift=20][daas=0 dabs=0 dam=7 ds=1 daq=F] [0000001C00000000] (icount=026E, inc=4)
4033 Entering A1_ADD state [a1_x=0000, a1_y=0000, addasel=0, addbsel=0, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
4034
4035(icount=026E, inc=4)
4036icount & 0x03 = 0x02
4037 << 4 = 0x20
4038
4039window_mask = 0x1000
4040
4041Therefore, it chooses the inner_mask over the window_mask every time! Argh!
4042This is because we did this wrong:
4043Innerm[3-5] := AN2 (inner_mask[3-5], imb[3-5], inner0);
4044NOTE! This doesn't fix the problem because inner0 is asserted too late to help here. !!! FIX !!! [Should be DONE]
4045*/
4046
4047/* The mask to be used if within one phrase of the end of the inner
4048loop, similarly */
4049uint8_t inner_mask = 0;
4050
4051if (pixsize == 3)
4052 inner_mask = (icount & 0x07) << 3;
4053if (pixsize == 4)
4054 inner_mask = (icount & 0x03) << 4;
4055if (pixsize == 5)
4056 inner_mask = (icount & 0x01) << 5;
4057if (!inner0)
4058 inner_mask = 0;
4059/* The actual mask used should be the lesser of the window masks and
4060the inner mask, where in all cases 000 means 1000. */
4061window_mask = (window_mask == 0 ? 0x40 : window_mask);
4062inner_mask = (inner_mask == 0 ? 0x40 : inner_mask);
4063uint8_t emask = (window_mask > inner_mask ? inner_mask : window_mask);
4064/* The mask to be used for the pixel size, to which must be added
4065the bit offset */
4066uint8_t pma = pixAddr + (1 << pixsize);
4067/* Select the mask */
4068uint8_t dend = (phrase_mode ? emask : pma);
4069
4070/* The cycle width in phrase mode is normally one phrase. However,
4071at the start and end it may be narrower. The start and end masks
4072are used to generate this. The width is given by:
4073
4074 8 - start mask - (8 - end mask)
4075= end mask - start mask
4076
4077This is only used for writes in phrase mode.
4078Start and end from the address level of the pipeline are used.
4079*/
4080uint8_t pwidth = (((dend | dstart) & 0x07) == 0 ? 0x08 : (dend - dstart) & 0x07);
4081
4082//uint32_t dstAddr, pixAddr;
4083//ADDRGEN(dstAddr, pixAddr, gena2i, zaddr,
4084// a1_x, a1_y, a1_base, a1_pitch, a1_pixsize, a1_width, a1_zoffset,
4085// a2_x, a2_y, a2_base, a2_pitch, a2_pixsize, a2_width, a2_zoffset);
4086#ifdef VERBOSE_BLITTER_LOGGING
4087if (logBlit)
4088 WriteLog(" Dest write address/pix address: %08X/%1X", address, pixAddr);
4089#endif
4090
4091//More testing... This is almost certainly wrong, but how else does this work???
4092//Seems to kinda work... But still, this doesn't seem to make any sense!
4093if (phrase_mode && !dsten)
4094 dstd = ((uint64_t)JaguarReadLong(address, BLITTER) << 32) | (uint64_t)JaguarReadLong(address + 4, BLITTER);
4095
4096//Testing only... for now...
4097//This is wrong because the write data is a combination of srcd and dstd--either run
4098//thru the LFU or in PATDSEL or ADDDSEL mode. [DONE now, thru DATA module]
4099// Precedence is ADDDSEL > PATDSEL > LFU.
4100//Also, doesn't take into account the start & end masks, or the phrase width...
4101//Now it does!
4102
4103// srcd2 = xxxx xxxx 0123 4567, srcd = 8901 2345 xxxx xxxx, srcshift = $20 (32)
4104uint64_t srcd = (srcd2 << (64 - srcshift)) | (srcd1 >> srcshift);
4105//bleh, ugly ugly ugly
4106if (srcshift == 0)
4107 srcd = srcd1;
4108
4109//NOTE: This only works with pixel sizes less than 8BPP...
4110//DOUBLE NOTE: Still need to do regression testing to ensure that this doesn't break other stuff... !!! CHECK !!!
4111if (!phrase_mode && srcshift != 0)
4112 srcd = ((srcd2 & 0xFF) << (8 - srcshift)) | ((srcd1 & 0xFF) >> srcshift);
4113
4114//Z DATA() stuff done here... And it has to be done before any Z shifting...
4115//Note that we need to have phrase mode start/end support here... (Not since we moved it from dzwrite...!)
4116/*
4117Here are a couple of Cybermorph blits with Z:
4118$00113078 // DSTEN DSTENZ DSTWRZ CLIP_A1 GOURD GOURZ PATDSEL ZMODE=4
4119$09900F39 // SRCEN DSTEN DSTENZ DSTWRZ UPDA1 UPDA1F UPDA2 DSTA2 ZMODE=4 LFUFUNC=C DCOMPEN
4120
4121We're having the same phrase mode overwrite problem we had with the pixels... !!! FIX !!!
4122Odd. It's equating 0 with 0... Even though ZMODE is $04 (less than)!
4123*/
4124if (gourz)
4125{
4126/*
4127void ADDARRAY(uint16_t * addq, uint8_t daddasel, uint8_t daddbsel, uint8_t daddmode,
4128 uint64_t dstd, uint32_t iinc, uint8_t initcin[], uint64_t initinc, uint16_t initpix,
4129 uint32_t istep, uint64_t patd, uint64_t srcd, uint64_t srcz1, uint64_t srcz2,
4130 uint32_t zinc, uint32_t zstep)
4131*/
4132 uint16_t addq[4];
4133 uint8_t initcin[4] = { 0, 0, 0, 0 };
4134 ADDARRAY(addq, 7/*daddasel*/, 6/*daddbsel*/, 0/*daddmode*/, 0, 0, initcin, 0, 0, 0, 0, 0, srcz1, srcz2, zinc, 0);
4135 srcz2 = ((uint64_t)addq[3] << 48) | ((uint64_t)addq[2] << 32) | ((uint64_t)addq[1] << 16) | (uint64_t)addq[0];
4136 ADDARRAY(addq, 6/*daddasel*/, 7/*daddbsel*/, 1/*daddmode*/, 0, 0, initcin, 0, 0, 0, 0, 0, srcz1, srcz2, zinc, 0);
4137 srcz1 = ((uint64_t)addq[3] << 48) | ((uint64_t)addq[2] << 32) | ((uint64_t)addq[1] << 16) | (uint64_t)addq[0];
4138
4139#if 0//def VERBOSE_BLITTER_LOGGING
4140if (logBlit)
4141 WriteLog("\n[srcz1=%08X%08X, srcz2=%08X%08X, zinc=%08X",
4142 (uint32_t)(srcz1 >> 32), (uint32_t)(srcz1 & 0xFFFFFFFF),
4143 (uint32_t)(srcz2 >> 32), (uint32_t)(srcz2 & 0xFFFFFFFF), zinc);
4144#endif
4145}
4146
4147uint8_t zSrcShift = srcshift & 0x30;
4148srcz = (srcz2 << (64 - zSrcShift)) | (srcz1 >> zSrcShift);
4149//bleh, ugly ugly ugly
4150if (zSrcShift == 0)
4151 srcz = srcz1;
4152
4153#if 0//def VERBOSE_BLITTER_LOGGING
4154if (logBlit)
4155 WriteLog(" srcz=%08X%08X]\n", (uint32_t)(srcz >> 32), (uint32_t)(srcz & 0xFFFFFFFF));
4156#endif
4157
4158//When in SRCSHADE mode, it adds the IINC to the read source (from LFU???)
4159//According to following line, it gets LFU mode. But does it feed the source into the LFU
4160//after the add?
4161//Dest write address/pix address: 0014E83E/0 [dstart=0 dend=10 pwidth=8 srcshift=0][daas=4 dabs=5 dam=7 ds=1 daq=F] [0000000000006505] (icount=003F, inc=1)
4162//Let's try this:
4163if (srcshade)
4164{
4165//NOTE: This is basically doubling the work done by DATA--since this is what
4166// ADDARRAY is loaded with when srcshade is enabled... !!! FIX !!!
4167// Also note that it doesn't work properly unless GOURZ is set--there's the clue!
4168 uint16_t addq[4];
4169 uint8_t initcin[4] = { 0, 0, 0, 0 };
4170 ADDARRAY(addq, 4/*daddasel*/, 5/*daddbsel*/, 7/*daddmode*/, dstd, iinc, initcin, 0, 0, 0, patd, srcd, 0, 0, 0, 0);
4171 srcd = ((uint64_t)addq[3] << 48) | ((uint64_t)addq[2] << 32) | ((uint64_t)addq[1] << 16) | (uint64_t)addq[0];
4172}
4173//Seems to work... Not 100% sure tho.
4174//end try this
4175
4176//Temporary kludge, to see if the fractional pattern does anything...
4177//This works, BTW
4178//But it seems to mess up in Cybermorph... the shading should be smooth but it isn't...
4179//Seems the carry out is lost again... !!! FIX !!! [DONE--see below]
4180if (patfadd)
4181{
4182 uint16_t addq[4];
4183 uint8_t initcin[4] = { 0, 0, 0, 0 };
4184 ADDARRAY(addq, 4/*daddasel*/, 4/*daddbsel*/, 0/*daddmode*/, dstd, iinc, initcin, 0, 0, 0, patd, srcd, 0, 0, 0, 0);
4185 srcd1 = ((uint64_t)addq[3] << 48) | ((uint64_t)addq[2] << 32) | ((uint64_t)addq[1] << 16) | (uint64_t)addq[0];
4186}
4187
4188//Note that we still don't take atick[0] & [1] into account here, so this will skip half of the data needed... !!! FIX !!!
4189//Not yet enumerated: dbinh, srcdread, srczread
4190//Also, should do srcshift on the z value in phrase mode... !!! FIX !!! [DONE]
4191//As well as add a srcz variable we can set external to this state... !!! FIX !!! [DONE]
4192
4193uint64_t wdata;
4194uint8_t dcomp, zcomp;
4195DATA(wdata, dcomp, zcomp, winhibit,
4196 true, cmpdst, daddasel, daddbsel, daddmode, daddq_sel, data_sel, 0/*dbinh*/,
4197 dend, dstart, dstd, iinc, lfufunc, patd, patdadd,
4198 phrase_mode, srcd, false/*srcdread*/, false/*srczread*/, srcz2add, zmode,
4199 bcompen, bkgwren, dcompen, icount & 0x07, pixsize,
4200 srcz, dstz, zinc);
4201/*
4202Seems that the phrase mode writes with DCOMPEN and DSTEN are corrupting inside of DATA: !!! FIX !!!
4203It's fairly random as well. 7CFE -> 7DFE, 7FCA -> 78CA, 7FA4 -> 78A4, 7F88 -> 8F88
4204It could be related to an uninitialized variable, like the zmode bug...
4205[DONE]
4206It was a bug in the dech38el data--it returned $FF for ungated instead of $00...
4207
4208Blit! (CMD = 09800609)
4209Flags: SRCEN DSTEN UPDA1 UPDA2 LFUFUNC=C DCOMPEN
4210 count = 10 x 12
4211 a1_base = 00110000, a2_base = 0010B2A8
4212 a1_x = 004B, a1_y = 00D8, a1_frac_x = 0000, a1_frac_y = 0000, a2_x = 0704, a2_y = 0000
4213 a1_step_x = FFF3, a1_step_y = 0001, a1_stepf_x = 0000, a1_stepf_y = 0000, a2_step_x = FFFC, a2_step_y = 0000
4214 a1_inc_x = 0000, a1_inc_y = 0000, a1_incf_x = 0000, a1_incf_y = 0000
4215 a1_win_x = 0000, a1_win_y = 0000, a2_mask_x = 0000, a2_mask_y = 0000
4216 a2_mask=F a1add=+phr/+0 a2add=+phr/+0
4217 a1_pixsize = 4, a2_pixsize = 4
4218 srcd=0000000000000000 dstd=0000000000000000 patd=0000000000000000 iinc=00000000
4219 srcz1=0000000000000000 srcz2=0000000000000000 dstz=0000000000000000 zinc=00000000, coll=0
4220 Phrase mode is ON
4221 [in=T a1f=F a1=F zf=F z=F a2=F iif=F iii=F izf=F izi=F]
4222 Entering INNER state...
4223 Entering SREAD state... Source read address/pix address: 0010C0B0/0 [0000000078047804]
4224 Entering A2_ADD state [a2_x=0704, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
4225 Entering DREAD state...
4226 Dest read address/pix address: 00197240/0 [0000000000000028]
4227 Entering DWRITE state...
4228 Dest write address/pix address: 00197240/0 [dstart=30 dend=40 pwidth=8 srcshift=30][daas=0 dabs=0 dam=7 ds=1 daq=F] [0000000000000028] (icount=0009, inc=1)
4229 Entering A1_ADD state [a1_x=004B, a1_y=00D8, addasel=0, addbsel=0, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
4230 Entering SREAD state... Source read address/pix address: 0010C0B8/0 [7804780478047804]
4231 Entering A2_ADD state [a2_x=0708, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
4232 Entering DREAD state...
4233 Dest read address/pix address: 00197260/0 [0028000000200008]
4234 Entering DWRITE state...
4235 Dest write address/pix address: 00197260/0 [dstart=0 dend=40 pwidth=8 srcshift=30][daas=0 dabs=0 dam=7 ds=1 daq=F] [0028780478047804] (icount=0005, inc=4)
4236 Entering A1_ADD state [a1_x=004C, a1_y=00D8, addasel=0, addbsel=0, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
4237 Entering SREAD state... Source read address/pix address: 0010C0C0/0 [0000000000000000]
4238 Entering A2_ADD state [a2_x=070C, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
4239 Entering DREAD state...
4240 Dest read address/pix address: 00197280/0 [0008001800180018]
4241 Entering DWRITE state...
4242 Dest write address/pix address: 00197280/0 [dstart=0 dend=40 pwidth=8 srcshift=30][daas=0 dabs=0 dam=7 ds=1 daq=F] [7804780478040018] (icount=0001, inc=4)
4243 Entering A1_ADD state [a1_x=0050, a1_y=00D8, addasel=0, addbsel=0, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
4244 Entering SREAD state... Source read address/pix address: 0010C0C8/0 [000078047BFE7BFE]
4245 Entering A2_ADD state [a2_x=0710, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
4246 Entering DREAD state...
4247 Dest read address/pix address: 001972A0/0 [0008002000000000]
4248 Entering DWRITE state...
4249 Dest write address/pix address: 001972A0/0 [dstart=0 dend=10 pwidth=8 srcshift=30][daas=0 dabs=0 dam=7 ds=1 daq=F] [0008002000000000] (icount=FFFD, inc=4)
4250 Entering A1_ADD state [a1_x=0054, a1_y=00D8, addasel=0, addbsel=0, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
4251 Entering IDLE_INNER state...
4252*/
4253
4254//Why isn't this taken care of in DATA? Because DATA is modifying its local copy instead of the one used here.
4255//!!! FIX !!! [DONE]
4256//if (patdadd)
4257// patd = wdata;
4258
4259//if (patfadd)
4260// srcd1 = wdata;
4261
4262/*
4263DEF ADDRCOMP (
4264 a1_outside // A1 pointer is outside window bounds
4265 :OUT;
4266INT16/ a1_x
4267INT16/ a1_y
4268INT15/ a1_win_x
4269INT15/ a1_win_y
4270 :IN);
4271BEGIN
4272
4273// The address is outside if negative, or if greater than or equal
4274// to the window size
4275
4276A1_xcomp := MAG_15 (a1xgr, a1xeq, a1xlt, a1_x{0..14}, a1_win_x{0..14});
4277A1_ycomp := MAG_15 (a1ygr, a1yeq, a1ylt, a1_y{0..14}, a1_win_y{0..14});
4278A1_outside := OR6 (a1_outside, a1_x{15}, a1xgr, a1xeq, a1_y{15}, a1ygr, a1yeq);
4279*/
4280//NOTE: There seems to be an off-by-one bug here in the clip_a1 section... !!! FIX !!!
4281// Actually, seems to be related to phrase mode writes...
4282// Or is it? Could be related to non-15-bit compares as above?
4283if (clip_a1 && ((a1_x & 0x8000) || (a1_y & 0x8000) || (a1_x >= a1_win_x) || (a1_y >= a1_win_y)))
4284 winhibit = true;
4285
4286if (!winhibit)
4287{
4288 if (phrase_mode)
4289 {
4290 JaguarWriteLong(address + 0, wdata >> 32, BLITTER);
4291 JaguarWriteLong(address + 4, wdata & 0xFFFFFFFF, BLITTER);
4292 }
4293 else
4294 {
4295 if (pixsize == 5)
4296 JaguarWriteLong(address, wdata & 0xFFFFFFFF, BLITTER);
4297 else if (pixsize == 4)
4298 JaguarWriteWord(address, wdata & 0x0000FFFF, BLITTER);
4299 else
4300 JaguarWriteByte(address, wdata & 0x000000FF, BLITTER);
4301 }
4302}
4303
4304#ifdef VERBOSE_BLITTER_LOGGING
4305if (logBlit)
4306{
4307 WriteLog(" [%08X%08X]%s", (uint32_t)(wdata >> 32), (uint32_t)(wdata & 0xFFFFFFFF), (winhibit ? "[X]" : ""));
4308 WriteLog(" (icount=%04X, inc=%u)\n", icount, (uint16_t)inc);
4309 WriteLog(" [dstart=%X dend=%X pwidth=%X srcshift=%X]", dstart, dend, pwidth, srcshift);
4310 WriteLog("[daas=%X dabs=%X dam=%X ds=%X daq=%s]\n", daddasel, daddbsel, daddmode, data_sel, (daddq_sel ? "T" : "F"));
4311}
4312#endif
4313 }
4314
4315 if (dzwrite)
4316 {
4317// OK, here's the big insight: When NOT in GOURZ mode, srcz1 & 2 function EXACTLY the same way that
4318// srcd1 & 2 work--there's an implicit shift from srcz1 to srcz2 whenever srcz1 is read.
4319// OTHERWISE, srcz1 is the integer for the computed Z and srcz2 is the fractional part.
4320// Writes to srcz1 & 2 follow the same pattern as the other 64-bit registers--low 32 at the low address,
4321// high 32 at the high address (little endian!).
4322// NOTE: GOURZ is still not properly supported. Check patd/patf handling...
4323// Phrase mode start/end masks are not properly supported either...
4324#ifdef VERBOSE_BLITTER_LOGGING
4325if (logBlit)
4326{
4327 WriteLog(" Entering DZWRITE state...");
4328 WriteLog(" Dest Z write address/pix address: %08X/%1X [%08X%08X]\n", address,
4329 pixAddr, (uint32_t)(srcz >> 32), (uint32_t)(srcz & 0xFFFFFFFF));
4330}
4331#endif
4332//This is not correct... !!! FIX !!!
4333//Should be OK now... We'll see...
4334//Nope. Having the same stairstep write problems in phrase mode as we had with pixels... !!! FIX !!!
4335//This is not causing the problem in Hover Strike... :-/
4336//The problem was with the SREADX not shifting. Still problems with Z comparisons & other text in pregame screen...
4337if (!winhibit)
4338{
4339 if (phrase_mode)
4340 {
4341 JaguarWriteLong(address + 0, srcz >> 32, BLITTER);
4342 JaguarWriteLong(address + 4, srcz & 0xFFFFFFFF, BLITTER);
4343 }
4344 else
4345 {
4346 if (pixsize == 4)
4347 JaguarWriteWord(address, srcz & 0x0000FFFF, BLITTER);
4348 }
4349}//*/
4350#ifdef VERBOSE_BLITTER_LOGGING
4351if (logBlit)
4352{
4353// printf(" [%08X%08X]\n", (uint32_t)(srcz >> 32), (uint32_t)(srcz & 0xFFFFFFFF));
4354// fflush(stdout);
4355//printf(" [dstart=%X dend=%X pwidth=%X srcshift=%X]", dstart, dend, pwidth, srcshift);
4356 WriteLog(" [dstart=? dend=? pwidth=? srcshift=%X]", srcshift);
4357 WriteLog("[daas=%X dabs=%X dam=%X ds=%X daq=%s]\n", daddasel, daddbsel, daddmode, data_sel, (daddq_sel ? "T" : "F"));
4358// fflush(stdout);
4359}
4360#endif
4361 }
4362
4363/*
4364This is because the address generator was using only 15 bits of the X when it should have
4365used 16!
4366
4367There's a slight problem here: The X pointer isn't wrapping like it should when it hits
4368the edge of the window... Notice how the X isn't reset at the edge of the window:
4369
4370Blit! (CMD = 00010000)
4371Flags: PATDSEL
4372 count = 160 x 261
4373 a1_base = 000E8008, a2_base = 0001FA68
4374 a1_x = 0000, a1_y = 0000, a1_frac_x = 0000, a1_frac_y = 0000, a2_x = 0000, a2_y = 0000
4375 a1_step_x = 0000, a1_step_y = 0000, a1_stepf_x = 0000, a1_stepf_y = 0000, a2_step_x = 0000, a2_step_y = 0000
4376 a1_inc_x = 0000, a1_inc_y = 0000, a1_incf_x = 0000, a1_incf_y = 0000
4377 a1_win_x = 0000, a1_win_y = 0000, a2_mask_x = 0000, a2_mask_y = 0000
4378 a2_mask=F a1add=+phr/+0 a2add=+phr/+0
4379 a1_pixsize = 5, a2_pixsize = 5
4380 srcd=7717771777177717 dstd=0000000000000000 patd=7730773077307730 iinc=00000000
4381 srcz1=0000000000000000 srcz2=0000000000000000 dstz=0000000000000000 zinc=00000000, coll=0
4382 Phrase mode is ON
4383 [in=T a1f=F a1=F zf=F z=F a2=F iif=F iii=F izf=F izi=F]
4384 Entering INNER state...
4385 Entering DWRITE state... Dest write address/pix address: 000E8008/0 [7730773077307730] (icount=009E, inc=2)
4386 srcz=0000000000000000][dcomp=AA zcomp=00 dbinh=00]
4387[srcz=0000000000000000 dstz=0000000000000000 zwdata=0000000000000000 mask=7FFF]
4388 [dstart=0 dend=40 pwidth=8 srcshift=0][daas=0 dabs=0 dam=7 ds=0 daq=F]
4389 Entering A1_ADD state [a1_x=0000, a1_y=0000, addasel=0, addbsel=0, modx=1, addareg=F, adda_xconst=1, adda_yconst=0]...
4390 Entering DWRITE state... Dest write address/pix address: 000E8018/0 [7730773077307730] (icount=009C, inc=2)
4391 srcz=0000000000000000][dcomp=AA zcomp=00 dbinh=00]
4392[srcz=0000000000000000 dstz=0000000000000000 zwdata=0000000000000000 mask=7FFF]
4393 [dstart=0 dend=40 pwidth=8 srcshift=0][daas=0 dabs=0 dam=7 ds=0 daq=F]
4394 Entering A1_ADD state [a1_x=0002, a1_y=0000, addasel=0, addbsel=0, modx=1, addareg=F, adda_xconst=1, adda_yconst=0]...
4395
4396...
4397
4398 Entering A1_ADD state [a1_x=009C, a1_y=0000, addasel=0, addbsel=0, modx=1, addareg=F, adda_xconst=1, adda_yconst=0]...
4399 Entering DWRITE state... Dest write address/pix address: 000E84F8/0 [7730773077307730] (icount=0000, inc=2)
4400 srcz=0000000000000000][dcomp=AA zcomp=00 dbinh=00]
4401[srcz=0000000000000000 dstz=0000000000000000 zwdata=0000000000000000 mask=7FFF]
4402 [dstart=0 dend=40 pwidth=8 srcshift=0][daas=0 dabs=0 dam=7 ds=0 daq=F]
4403 Entering A1_ADD state [a1_x=009E, a1_y=0000, addasel=0, addbsel=0, modx=1, addareg=F, adda_xconst=1, adda_yconst=0]...
4404 Entering IDLE_INNER state...
4405
4406 Leaving INNER state... (ocount=0104)
4407 [in=T a1f=F a1=F zf=F z=F a2=F iif=F iii=F izf=F izi=F]
4408
4409 Entering INNER state...
4410 Entering DWRITE state... Dest write address/pix address: 000E8508/0 [7730773077307730] (icount=009E, inc=2)
4411 srcz=0000000000000000][dcomp=AA zcomp=00 dbinh=00]
4412[srcz=0000000000000000 dstz=0000000000000000 zwdata=0000000000000000 mask=7FFF]
4413 [dstart=0 dend=40 pwidth=8 srcshift=0][daas=0 dabs=0 dam=7 ds=0 daq=F]
4414 Entering A1_ADD state [a1_x=00A0, a1_y=0000, addasel=0, addbsel=0, modx=1, addareg=F, adda_xconst=1, adda_yconst=0]...
4415 Entering DWRITE state... Dest write address/pix address: 000E8518/0 [7730773077307730] (icount=009C, inc=2)
4416 srcz=0000000000000000][dcomp=AA zcomp=00 dbinh=00]
4417[srcz=0000000000000000 dstz=0000000000000000 zwdata=0000000000000000 mask=7FFF]
4418 [dstart=0 dend=40 pwidth=8 srcshift=0][daas=0 dabs=0 dam=7 ds=0 daq=F]
4419 Entering A1_ADD state [a1_x=00A2, a1_y=0000, addasel=0, addbsel=0, modx=1, addareg=F, adda_xconst=1, adda_yconst=0]...
4420
4421*/
4422
4423 if (a1_add)
4424 {
4425#ifdef VERBOSE_BLITTER_LOGGING
4426if (logBlit)
4427{
4428//printf(" Entering A1_ADD state [addasel=%X, addbsel=%X, modx=%X, addareg=%s, adda_xconst=%u, adda_yconst=%s]...\n", addasel, addbsel, modx, (addareg ? "T" : "F"), adda_xconst, (adda_yconst ? "1" : "0"));
4429WriteLog(" Entering A1_ADD state [a1_x=%04X, a1_y=%04X, addasel=%X, addbsel=%X, modx=%X, addareg=%s, adda_xconst=%u, adda_yconst=%s]...\n", a1_x, a1_y, addasel, addbsel, modx, (addareg ? "T" : "F"), adda_xconst, (adda_yconst ? "1" : "0"));
4430//fflush(stdout);
4431}
4432#endif
4433int16_t adda_x, adda_y, addb_x, addb_y, data_x, data_y, addq_x, addq_y;
4434ADDAMUX(adda_x, adda_y, addasel, a1_step_x, a1_step_y, a1_stepf_x, a1_stepf_y, a2_step_x, a2_step_y,
4435 a1_inc_x, a1_inc_y, a1_incf_x, a1_incf_y, adda_xconst, adda_yconst, addareg, suba_x, suba_y);
4436ADDBMUX(addb_x, addb_y, addbsel, a1_x, a1_y, a2_x, a2_y, a1_frac_x, a1_frac_y);
4437ADDRADD(addq_x, addq_y, a1fracldi, adda_x, adda_y, addb_x, addb_y, modx, suba_x, suba_y);
4438
4439#if 0//def VERBOSE_BLITTER_LOGGING
4440if (logBlit)
4441{
4442WriteLog(" [adda_x=%d, adda_y=%d, addb_x=%d, addb_y=%d, addq_x=%d, addq_y=%d]\n", adda_x, adda_y, addb_x, addb_y, addq_x, addq_y);
4443//fflush(stdout);
4444}
4445#endif
4446//Now, write to what???
4447//a2ptrld comes from a2ptrldi...
4448//I believe it's addbsel that determines the writeback...
4449// This is where atick[0] & [1] come in, in determining which part (fractional, integer)
4450// gets written to...
4451//a1_x = addq_x;
4452//a1_y = addq_y;
4453//Kludge, to get A1 channel increment working...
4454if (a1addx == 3)
4455{
4456 a1_frac_x = addq_x, a1_frac_y = addq_y;
4457
4458addasel = 2, addbsel = 0, a1fracldi = false;
4459ADDAMUX(adda_x, adda_y, addasel, a1_step_x, a1_step_y, a1_stepf_x, a1_stepf_y, a2_step_x, a2_step_y,
4460 a1_inc_x, a1_inc_y, a1_incf_x, a1_incf_y, adda_xconst, adda_yconst, addareg, suba_x, suba_y);
4461ADDBMUX(addb_x, addb_y, addbsel, a1_x, a1_y, a2_x, a2_y, a1_frac_x, a1_frac_y);
4462ADDRADD(addq_x, addq_y, a1fracldi, adda_x, adda_y, addb_x, addb_y, modx, suba_x, suba_y);
4463
4464 a1_x = addq_x, a1_y = addq_y;
4465}
4466else
4467 a1_x = addq_x, a1_y = addq_y;
4468 }
4469
4470 if (a2_add)
4471 {
4472#ifdef VERBOSE_BLITTER_LOGGING
4473if (logBlit)
4474{
4475//printf(" Entering A2_ADD state [addasel=%X, addbsel=%X, modx=%X, addareg=%s, adda_xconst=%u, adda_yconst=%s]...\n", addasel, addbsel, modx, (addareg ? "T" : "F"), adda_xconst, (adda_yconst ? "1" : "0"));
4476WriteLog(" Entering A2_ADD state [a2_x=%04X, a2_y=%04X, addasel=%X, addbsel=%X, modx=%X, addareg=%s, adda_xconst=%u, adda_yconst=%s]...\n", a2_x, a2_y, addasel, addbsel, modx, (addareg ? "T" : "F"), adda_xconst, (adda_yconst ? "1" : "0"));
4477//fflush(stdout);
4478}
4479#endif
4480//void ADDAMUX(int16_t &adda_x, int16_t &adda_y, uint8_t addasel, int16_t a1_step_x, int16_t a1_step_y,
4481// int16_t a1_stepf_x, int16_t a1_stepf_y, int16_t a2_step_x, int16_t a2_step_y,
4482// int16_t a1_inc_x, int16_t a1_inc_y, int16_t a1_incf_x, int16_t a1_incf_y, uint8_t adda_xconst,
4483// bool adda_yconst, bool addareg, bool suba_x, bool suba_y)
4484//void ADDBMUX(int16_t &addb_x, int16_t &addb_y, uint8_t addbsel, int16_t a1_x, int16_t a1_y,
4485// int16_t a2_x, int16_t a2_y, int16_t a1_frac_x, int16_t a1_frac_y)
4486//void ADDRADD(int16_t &addq_x, int16_t &addq_y, bool a1fracldi,
4487// int16_t adda_x, int16_t adda_y, int16_t addb_x, int16_t addb_y, uint8_t modx, bool suba_x, bool suba_y)
4488//void DATAMUX(int16_t &data_x, int16_t &data_y, uint32_t gpu_din, int16_t addq_x, int16_t addq_y, bool addqsel)
4489int16_t adda_x, adda_y, addb_x, addb_y, data_x, data_y, addq_x, addq_y;
4490ADDAMUX(adda_x, adda_y, addasel, a1_step_x, a1_step_y, a1_stepf_x, a1_stepf_y, a2_step_x, a2_step_y,
4491 a1_inc_x, a1_inc_y, a1_incf_x, a1_incf_y, adda_xconst, adda_yconst, addareg, suba_x, suba_y);
4492ADDBMUX(addb_x, addb_y, addbsel, a1_x, a1_y, a2_x, a2_y, a1_frac_x, a1_frac_y);
4493ADDRADD(addq_x, addq_y, a1fracldi, adda_x, adda_y, addb_x, addb_y, modx, suba_x, suba_y);
4494
4495#if 0//def VERBOSE_BLITTER_LOGGING
4496if (logBlit)
4497{
4498WriteLog(" [adda_x=%d, adda_y=%d, addb_x=%d, addb_y=%d, addq_x=%d, addq_y=%d]\n", adda_x, adda_y, addb_x, addb_y, addq_x, addq_y);
4499//fflush(stdout);
4500}
4501#endif
4502//Now, write to what???
4503//a2ptrld comes from a2ptrldi...
4504//I believe it's addbsel that determines the writeback...
4505a2_x = addq_x;
4506a2_y = addq_y;
4507 }
4508 }
4509/*
4510Flags: SRCEN CLIP_A1 UPDA1 UPDA1F UPDA2 DSTA2 GOURZ ZMODE=0 LFUFUNC=C SRCSHADE
4511 count = 64 x 55
4512 a1_base = 0015B000, a2_base = 0014B000
4513 a1_x = 0000, a1_y = 0000, a1_frac_x = 8000, a1_frac_y = 8000, a2_x = 001F, a2_y = 0038
4514 a1_step_x = FFFFFFC0, a1_step_y = 0001, a1_stepf_x = 0000, a1_stepf_y = 2AAA, a2_step_x = FFFFFFC0, a2_step_y = 0001
4515 a1_inc_x = 0001, a1_inc_y = 0000, a1_incf_x = 0000, a1_incf_y = 0000
4516 a1_win_x = 0040, a1_win_y = 0040, a2_mask_x = 0000, a2_mask_y = 0000
4517 a2_mask=F a1add=+inc/+0 a2add=+1/+0
4518 a1_pixsize = 4, a2_pixsize = 4
4519 srcd=FF00FF00FF00FF00 dstd=0000000000000000 patd=0000000000000000 iinc=00000000
4520 srcz1=0000000000000000 srcz2=0000000000000000 dstz=0000000000000000 zinc=00000000, col=0
4521 Phrase mode is off
4522 [in=T a1f=F a1=F zf=F z=F a2=F iif=F iii=F izf=F izi=F]
4523 Entering INNER state...
4524 Entering SREAD state... Source read address/pix address: 0015B000/0 [6505650565056505]
4525 Entering A1_ADD state [a1_x=0000, a1_y=0000, addasel=3, addbsel=2, modx=0, addareg=T, adda_xconst=7, adda_yconst=0]...
4526 Entering DWRITE state...
4527 Dest write address/pix address: 0014E83E/0 [dstart=0 dend=10 pwidth=8 srcshift=0][daas=4 dabs=5 dam=7 ds=1 daq=F] [0000000000006505] (icount=003F, inc=1)
4528 Entering A2_ADD state [a2_x=001F, a2_y=0038, addasel=0, addbsel=1, modx=0, addareg=F, adda_xconst=0, adda_yconst=0]...
4529 Entering SREAD state... Source read address/pix address: 0015B000/0 [6505650565056505]
4530 Entering A1_ADD state [a1_x=FFFF8000, a1_y=FFFF8000, addasel=3, addbsel=2, modx=0, addareg=T, adda_xconst=7, adda_yconst=0]...
4531 Entering DWRITE state...
4532 Dest write address/pix address: 0014E942/0 [dstart=0 dend=10 pwidth=8 srcshift=0][daas=4 dabs=5 dam=7 ds=1 daq=F] [0000000000006505] (icount=003E, inc=1)
4533 Entering A2_ADD state [a2_x=0021, a2_y=0039, addasel=0, addbsel=1, modx=0, addareg=F, adda_xconst=0, adda_yconst=0]...
4534 Entering SREAD state... Source read address/pix address: 0015B000/0 [6505650565056505]
4535 Entering A1_ADD state [a1_x=FFFF8000, a1_y=FFFF8000, addasel=3, addbsel=2, modx=0, addareg=T, adda_xconst=7, adda_yconst=0]...
4536 Entering DWRITE state...
4537 Dest write address/pix address: 0014EA46/0 [dstart=0 dend=10 pwidth=8 srcshift=0][daas=4 dabs=5 dam=7 ds=1 daq=F] [0000000000006505] (icount=003D, inc=1)
4538 Entering A2_ADD state [a2_x=0023, a2_y=003A, addasel=0, addbsel=1, modx=0, addareg=F, adda_xconst=0, adda_yconst=0]...
4539 Entering SREAD state... Source read address/pix address: 0015B000/0 [6505650565056505]
4540 Entering A1_ADD state [a1_x=FFFF8000, a1_y=FFFF8000, addasel=3, addbsel=2, modx=0, addareg=T, adda_xconst=7, adda_yconst=0]...
4541 Entering DWRITE state...
4542 Dest write address/pix address: 0014EB4A/0 [dstart=0 dend=10 pwidth=8 srcshift=0][daas=4 dabs=5 dam=7 ds=1 daq=F] [0000000000006505] (icount=003C, inc=1)
4543 Entering A2_ADD state [a2_x=0025, a2_y=003B, addasel=0, addbsel=1, modx=0, addareg=F, adda_xconst=0, adda_yconst=0]...
4544 ...
4545 Entering SREAD state... Source read address/pix address: 0015B000/0 [6505650565056505]
4546 Entering A1_ADD state [a1_x=FFFF8000, a1_y=FFFF8000, addasel=3, addbsel=2, modx=0, addareg=T, adda_xconst=7, adda_yconst=0]...
4547 Entering DWRITE state...
4548 Dest write address/pix address: 0015283A/0 [dstart=0 dend=10 pwidth=8 srcshift=0][daas=4 dabs=5 dam=7 ds=1 daq=F] [0000000000006505] (icount=0000, inc=1)
4549 Entering A2_ADD state [a2_x=009D, a2_y=0077, addasel=0, addbsel=1, modx=0, addareg=F, adda_xconst=0, adda_yconst=0]...
4550 Entering IDLE_INNER state...
4551 Leaving INNER state... (ocount=0036)
4552 [in=F a1f=T a1=F zf=F z=F a2=F iif=F iii=F izf=F izi=F]
4553 Entering A1FUPDATE state...
4554 [in=F a1f=F a1=T zf=F z=F a2=F iif=F iii=F izf=F izi=F]
4555 Entering A1UPDATE state... (-32768/-32768 -> 32704/-32767)
4556 [in=F a1f=F a1=F zf=F z=F a2=T iif=F iii=F izf=F izi=F]
4557 Entering A2UPDATE state... (159/120 -> 95/121)
4558 [in=T a1f=F a1=F zf=F z=F a2=F iif=F iii=F izf=F izi=F]
4559 Entering INNER state...
4560*/
4561
4562#ifdef VERBOSE_BLITTER_LOGGING
4563if (logBlit)
4564{
4565WriteLog(" Leaving INNER state...");
4566//fflush(stdout);
4567}
4568#endif
4569 indone = true;
4570// The outer counter is updated here as well on the clock cycle...
4571
4572/* the inner loop is started whenever another state is about to
4573cause the inner state to go active */
4574//Instart := ND7 (instart, innert[0], innert[2..7]);
4575
4576//Actually, it's done only when inner gets asserted without the 2nd line of conditions
4577//(inner AND !indone)
4578//fixed now...
4579//Since we don't get here until the inner loop is finished (indone = true) we can get
4580//away with doing it here...!
4581 ocount--;
4582
4583 if (ocount == 0)
4584 outer0 = true;
4585#ifdef VERBOSE_BLITTER_LOGGING
4586if (logBlit)
4587{
4588WriteLog(" (ocount=%04X)\n", ocount);
4589//fflush(stdout);
4590}
4591#endif
4592 }
4593
4594 if (a1fupdate)
4595 {
4596#ifdef VERBOSE_BLITTER_LOGGING
4597if (logBlit)
4598{
4599WriteLog(" Entering A1FUPDATE state...\n");
4600//fflush(stdout);
4601}
4602#endif
4603 uint32_t a1_frac_xt = (uint32_t)a1_frac_x + (uint32_t)a1_stepf_x;
4604 uint32_t a1_frac_yt = (uint32_t)a1_frac_y + (uint32_t)a1_stepf_y;
4605 a1FracCInX = a1_frac_xt >> 16;
4606 a1FracCInY = a1_frac_yt >> 16;
4607 a1_frac_x = (uint16_t)(a1_frac_xt & 0xFFFF);
4608 a1_frac_y = (uint16_t)(a1_frac_yt & 0xFFFF);
4609 }
4610
4611 if (a1update)
4612 {
4613#ifdef VERBOSE_BLITTER_LOGGING
4614if (logBlit)
4615{
4616WriteLog(" Entering A1UPDATE state... (%d/%d -> ", a1_x, a1_y);
4617//fflush(stdout);
4618}
4619#endif
4620 a1_x += a1_step_x + a1FracCInX;
4621 a1_y += a1_step_y + a1FracCInY;
4622#ifdef VERBOSE_BLITTER_LOGGING
4623if (logBlit)
4624{
4625WriteLog("%d/%d)\n", a1_x, a1_y);
4626//fflush(stdout);
4627}
4628#endif
4629 }
4630
4631 if (a2update)
4632 {
4633#ifdef VERBOSE_BLITTER_LOGGING
4634if (logBlit)
4635{
4636WriteLog(" Entering A2UPDATE state... (%d/%d -> ", a2_x, a2_y);
4637//fflush(stdout);
4638}
4639#endif
4640 a2_x += a2_step_x;
4641 a2_y += a2_step_y;
4642#ifdef VERBOSE_BLITTER_LOGGING
4643if (logBlit)
4644{
4645WriteLog("%d/%d)\n", a2_x, a2_y);
4646//fflush(stdout);
4647}
4648#endif
4649 }
4650 }
4651
4652// We never get here! !!! FIX !!!
4653
4654#ifdef VERBOSE_BLITTER_LOGGING
4655if (logBlit)
4656{
4657 WriteLog("Done!\na1_x=%04X a1_y=%04X a1_frac_x=%04X a1_frac_y=%04X a2_x=%04X a2_y%04X\n",
4658 GET16(blitter_ram, A1_PIXEL + 2),
4659 GET16(blitter_ram, A1_PIXEL + 0),
4660 GET16(blitter_ram, A1_FPIXEL + 2),
4661 GET16(blitter_ram, A1_FPIXEL + 0),
4662 GET16(blitter_ram, A2_PIXEL + 2),
4663 GET16(blitter_ram, A2_PIXEL + 0));
4664// fflush(stdout);
4665}
4666#endif
4667
4668 // Write values back to registers (in real blitter, these are continuously updated)
4669 SET16(blitter_ram, A1_PIXEL + 2, a1_x);
4670 SET16(blitter_ram, A1_PIXEL + 0, a1_y);
4671 SET16(blitter_ram, A1_FPIXEL + 2, a1_frac_x);
4672 SET16(blitter_ram, A1_FPIXEL + 0, a1_frac_y);
4673 SET16(blitter_ram, A2_PIXEL + 2, a2_x);
4674 SET16(blitter_ram, A2_PIXEL + 0, a2_y);
4675
4676#ifdef VERBOSE_BLITTER_LOGGING
4677if (logBlit)
4678{
4679 WriteLog("Writeback!\na1_x=%04X a1_y=%04X a1_frac_x=%04X a1_frac_y=%04X a2_x=%04X a2_y%04X\n",
4680 GET16(blitter_ram, A1_PIXEL + 2),
4681 GET16(blitter_ram, A1_PIXEL + 0),
4682 GET16(blitter_ram, A1_FPIXEL + 2),
4683 GET16(blitter_ram, A1_FPIXEL + 0),
4684 GET16(blitter_ram, A2_PIXEL + 2),
4685 GET16(blitter_ram, A2_PIXEL + 0));
4686// fflush(stdout);
4687}
4688#endif
4689}
4690
4691
4692/*
4693 int16_t a1_x = (int16_t)GET16(blitter_ram, A1_PIXEL + 2);
4694 int16_t a1_y = (int16_t)GET16(blitter_ram, A1_PIXEL + 0);
4695 uint16_t a1_frac_x = GET16(blitter_ram, A1_FPIXEL + 2);
4696 uint16_t a1_frac_y = GET16(blitter_ram, A1_FPIXEL + 0);
4697 int16_t a2_x = (int16_t)GET16(blitter_ram, A2_PIXEL + 2);
4698 int16_t a2_y = (int16_t)GET16(blitter_ram, A2_PIXEL + 0);
4699
4700Seems that the ending a1_x should be written between blits, but it doesn't seem to be...
4701
4702Blit! (CMD = 01800000)
4703Flags: LFUFUNC=C
4704 count = 28672 x 1
4705 a1_base = 00050000, a2_base = 00070000
4706 a1_x = 0000, a1_y = 0000, a1_frac_x = 49CD, a1_frac_y = 0000, a2_x = 0033, a2_y = 0001
4707 a1_step_x = 0000, a1_step_y = 0000, a1_stepf_x = 939A, a1_stepf_y = 0000, a2_step_x = 0000, a2_step_y = 0000
4708 a1_inc_x = 0000, a1_inc_y = 0000, a1_incf_x = 0000, a1_incf_y = 0000
4709 a1_win_x = 0100, a1_win_y = 0020, a2_mask_x = 0000, a2_mask_y = 0000
4710 a2_mask=F a1add=+phr/+0 a2add=+phr/+0
4711 a1_pixsize = 4, a2_pixsize = 3
4712 srcd=DEDEDEDEDEDEDEDE dstd=0000000000000000 patd=0000000000000000 iinc=00000000
4713 srcz1=0000000000000000 srcz2=0000000000000000 dstz=0000000000000000 zinc=00000000, coll=0
4714 Phrase mode is ON
4715
4716Blit! (CMD = 01800000)
4717Flags: LFUFUNC=C
4718 count = 28672 x 1
4719 a1_base = 00050000, a2_base = 00070000
4720 a1_x = 0000, a1_y = 0000, a1_frac_x = 49CD, a1_frac_y = 0000, a2_x = 0033, a2_y = 0001
4721 a1_step_x = 0000, a1_step_y = 0000, a1_stepf_x = 939A, a1_stepf_y = 0000, a2_step_x = 0000, a2_step_y = 0000
4722 a1_inc_x = 0000, a1_inc_y = 0000, a1_incf_x = 0000, a1_incf_y = 0000
4723 a1_win_x = 0100, a1_win_y = 0020, a2_mask_x = 0000, a2_mask_y = 0000
4724 a2_mask=F a1add=+phr/+0 a2add=+phr/+0
4725 a1_pixsize = 4, a2_pixsize = 3
4726 srcd=D6D6D6D6D6D6D6D6 dstd=0000000000000000 patd=0000000000000000 iinc=00000000
4727 srcz1=0000000000000000 srcz2=0000000000000000 dstz=0000000000000000 zinc=00000000, coll=0
4728 Phrase mode is ON
4729*/
4730
4731
4732
4733// Various pieces of the blitter puzzle are teased out here...
4734
4735
4736
4737/*
4738DEF ADDRGEN (
4739INT24/ address // byte address
4740 pixa[0..2] // bit part of address, un-pipe-lined
4741 :OUT;
4742INT16/ a1_x
4743INT16/ a1_y
4744INT21/ a1_base
4745 a1_pitch[0..1]
4746 a1_pixsize[0..2]
4747 a1_width[0..5]
4748 a1_zoffset[0..1]
4749INT16/ a2_x
4750INT16/ a2_y
4751INT21/ a2_base
4752 a2_pitch[0..1]
4753 a2_pixsize[0..2]
4754 a2_width[0..5]
4755 a2_zoffset[0..1]
4756 apipe // load address pipe-line latch
4757 clk // co-processor clock
4758 gena2 // generate A2 as opposed to A1
4759 zaddr // generate Z address
4760 :IN);
4761*/
4762
//
// ADDRGEN - blitter address generator
//
// Converts the selected window pointer (A2 when gena2 is set, otherwise A1)
// into a memory address.
//
// Outputs:
//   address - bits 3 and up hold the 21-bit phrase address (pixel phrase
//             offset scaled by the pitch, plus Z offset when zaddr is set,
//             plus the window base); bits 0-2 hold the byte offset inside
//             the phrase (bits 3-5 of the pixel's bit address)
//   pixa    - bits 0-2 of the pixel's bit address (bit offset inside the byte)
//
void ADDRGEN(uint32_t &address, uint32_t &pixa, bool gena2, bool zaddr,
	uint16_t a1_x, uint16_t a1_y, uint32_t a1_base, uint8_t a1_pitch, uint8_t a1_pixsize, uint8_t a1_width, uint8_t a1_zoffset,
	uint16_t a2_x, uint16_t a2_y, uint32_t a2_base, uint8_t a2_pitch, uint8_t a2_pixsize, uint8_t a2_width, uint8_t a2_zoffset)
{
	// Latch the register set of whichever window is being addressed
	uint16_t x, y;
	uint32_t base;
	uint8_t width, pixsize, pitch, zoffset;

	if (gena2)
	{
		x = a2_x;
		y = a2_y;
		base = a2_base;
		width = a2_width;
		pixsize = a2_pixsize;
		pitch = a2_pitch;
		zoffset = a2_zoffset;
	}
	else
	{
		x = a1_x;
		y = a1_y;
		base = a1_base;
		width = a1_width;
		pixsize = a1_pixsize;
		pitch = a1_pitch;
		zoffset = a1_zoffset;
	}

	// X really does use all 16 bits to generate the address (an earlier
	// attempt masked it with 0x7FFF); Y is limited to 12 bits.
	y &= 0x0FFF;
	// Only the upper 21 bits of the base take part (phrase granularity)
	base >>= 3;

	// Row offset in pixels. The low two bits of width extend an implicit
	// leading one (4 + 0..3 = 4..7) and the upper four bits are a shift count.
	uint32_t ytm = (uint32_t)y * (4u + (width & 0x03));
	uint32_t ya = (ytm << (width >> 2)) >> 2;

	// Pixel number, then its bit address
	uint32_t pa = ya + x;
	pixa = pa << pixsize;

	// Pitch 1 and 2 shift the phrase offset left by that amount; pitch 3 is
	// done as (phrase offset) + 2 * (phrase offset); pitch 0 is a plain copy.
	uint8_t pt;

	switch (pitch & 0x03)
	{
	case 0x01:
		pt = 0x01;
		break;
	case 0x02:
		pt = 0x02;
		break;
	default:
		pt = 0x00;
		break;
	}

	uint32_t phradr = (pixa >> 6) << pt;
	uint32_t shup = 0;

	if (pitch == 0x03)
		shup = pixa >> 6;

	// Z data sits zoffset phrases beyond the pixel data
	uint8_t za = (zaddr ? zoffset : 0) & 0x03;
	uint32_t addr = za + phradr + (shup << 1) + base;

	// Reassemble: byte-in-phrase in bits 0-2, phrase address above
	address = ((pixa & 0x38) >> 3) | ((addr & 0x1FFFFF) << 3);
#if 0//def VERBOSE_BLITTER_LOGGING
if (logBlit)
{
WriteLog(" [gena2=%s, x=%04X, y=%04X, w=%1X, pxsz=%1X, ptch=%1X, b=%08X, zoff=%1X]\n", (gena2 ? "T" : "F"), x, y, width, pixsize, pitch, base, zoffset);
WriteLog(" [ytm=%X, ya=%X, pa=%X, pixa=%X, pt=%X, phradr=%X, shup=%X, za=%X, addr=%X, address=%X]\n", ytm, ya, pa, pixa, pt, phradr, shup, za, addr, address);
//fflush(stdout);
}
#endif
	// Caller only gets the bit-in-byte part of the pixel address
	pixa &= 0x07;
/*
Reference trace from the logging above:

 Entering INNER state...
 [gena2=T, x=0002, y=0000, w=20, pxsz=4, ptch=0, b=000012BA, zoff=0]
 [ytm=0, ya=0, pa=2, pixa=20, pt=0, phradr=0, shup=0, za=0, addr=12BA, address=95D4]
 Entering SREADX state... [dstart=0 dend=20 pwidth=8 srcshift=20]
 Source extra read address/pix address: 000095D4/0 [0000001C00540038]
 Entering A2_ADD state [a2_x=0002, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
 [gena2=T, x=0004, y=0000, w=20, pxsz=4, ptch=0, b=000012BA, zoff=0]
 [ytm=0, ya=0, pa=4, pixa=40, pt=0, phradr=1, shup=0, za=0, addr=12BB, address=95D8]
 Entering SREAD state... [dstart=0 dend=20 pwidth=8 srcshift=0]
 Source read address/pix address: 000095D8/0 [0054003800009814]
 Entering A2_ADD state [a2_x=0004, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
 [gena2=F, x=0000, y=0000, w=20, pxsz=4, ptch=0, b=00006E52, zoff=0]
 [ytm=0, ya=0, pa=0, pixa=0, pt=0, phradr=0, shup=0, za=0, addr=6E52, address=37290]
 Entering DWRITE state...
 Dest write address/pix address: 00037290/0 [dstart=0 dend=20 pwidth=8 srcshift=0] (icount=026E, inc=4)
 Entering A1_ADD state [a1_x=0000, a1_y=0000, addasel=0, addbsel=0, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
 [gena2=T, x=0008, y=0000, w=20, pxsz=4, ptch=0, b=000012BA, zoff=0]
 [ytm=0, ya=0, pa=8, pixa=80, pt=0, phradr=2, shup=0, za=0, addr=12BC, address=95E0]
*/
/*
History of getting phradr right:

Obviously wrong:
 Entering SREAD state...
 [gena2=T, x=0004, y=0000, w=20, pxsz=4, ptch=0, b=000010AC, zoff=0]
 [ytm=0, ya=0, pa=4, pixa=0, pt=0, phradr=40, shup=0, za=0, addr=10AC, address=8560]
 Source read address/pix address: 00008560/0 [8C27981B327E00F0]

2nd pass (still wrong):
 Entering SREAD state...
 [gena2=T, x=0004, y=0000, w=20, pxsz=4, ptch=0, b=000010AC, zoff=0]
 [ytm=0, ya=0, pa=4, pixa=0, pt=0, phradr=40, shup=0, za=0, addr=10EC, address=8760]
 Source read address/pix address: 00008760/0 [00E06DC04581880C]

Correct!:
 Entering SREAD state...
 [gena2=T, x=0004, y=0000, w=20, pxsz=4, ptch=0, b=000010AC, zoff=0]
 [ytm=0, ya=0, pa=4, pixa=0, pt=0, phradr=1, shup=0, za=0, addr=10AD, address=8568]
 Source read address/pix address: 00008568/0 [6267981A327C00F0]

OK, now we're back into incorrect (or is it?):
 Entering SREADX state... [dstart=0 dend=20 pwidth=8 srcshift=20]
 Source extra read address/pix address: 000095D4/0 [0000 001C 0054 0038]
 Entering A2_ADD state [a2_x=0002, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
 Entering SREAD state... [dstart=0 dend=20 pwidth=8 srcshift=0]
 Source read address/pix address: 000095D8/0 [0054 0038 0000 9814]
 Entering A2_ADD state [a2_x=0004, a2_y=0000, addasel=0, addbsel=1, modx=2, addareg=F, adda_xconst=2, adda_yconst=0]...
I think this may be correct...!
*/
}
4852
4853/*
4854// source and destination address update conditions
4855
4856Sraat0 := AN2 (sraat[0], sreadxi, srcenz\);
4857Sraat1 := AN2 (sraat[1], sreadi, srcenz\);
4858Srca_addi := OR4 (srca_addi, szreadxi, szreadi, sraat[0..1]);
4859Srca_add := FD1Q (srca_add, srca_addi, clk);
4860
4861Dstaat := AN2 (dstaat, dwritei, dstwrz\);
4862Dsta_addi := OR2 (dsta_addi, dzwritei, dstaat);
4863// Dsta_add := FD1Q (dsta_add, dsta_addi, clk);
4864
4865// source and destination address generate conditions
4866
4867Gensrc := OR4 (gensrc, sreadxi, szreadxi, sreadi, szreadi);
4868Gendst := OR4 (gendst, dreadi, dzreadi, dwritei, dzwritei);
4869Dsta2\ := INV1 (dsta2\, dsta2);
4870Gena2t0 := NAN2 (gena2t[0], gensrc, dsta2\);
4871Gena2t1 := NAN2 (gena2t[1], gendst, dsta2);
4872Gena2i := NAN2 (gena2i, gena2t[0..1]);
4873Gena2 := FD1QU (gena2, gena2i, clk);
4874
4875Zaddr := OR4 (zaddr, szreadx, szread, dzread, dzwrite);
4876*/
4877
4878/*void foo(void)
4879{
4880 // Basically, the above translates to:
4881 bool srca_addi = (sreadxi && !srcenz) || (sreadi && !srcenz) || szreadxi || szreadi;
4882
4883 bool dsta_addi = (dwritei && !dstwrz) || dzwritei;
4884
4885 bool gensrc = sreadxi || szreadxi || sreadi || szreadi;
	bool gendst = dreadi || dzreadi || dwritei || dzwritei;
4887 bool gena2i = (gensrc && !dsta2) || (gendst && dsta2);
4888
4889 bool zaddr = szreadx || szread || dzread || dzwrite;
4890}*/
4891
4892/*
4893// source data reads
4894
4895Srcdpset\ := NAN2 (srcdpset\, readreq, sread);
4896Srcdpt1 := NAN2 (srcdpt[1], srcdpend, srcdack\);
4897Srcdpt2 := NAN2 (srcdpt[2], srcdpset\, srcdpt[1]);
4898Srcdpend := FD2Q (srcdpend, srcdpt[2], clk, reset\);
4899
4900Srcdxpset\ := NAN2 (srcdxpset\, readreq, sreadx);
4901Srcdxpt1 := NAN2 (srcdxpt[1], srcdxpend, srcdxack\);
4902Srcdxpt2 := NAN2 (srcdxpt[2], srcdxpset\, srcdxpt[1]);
4903Srcdxpend := FD2Q (srcdxpend, srcdxpt[2], clk, reset\);
4904
4905Sdpend := OR2 (sdpend, srcdxpend, srcdpend);
4906Srcdreadt := AN2 (srcdreadt, sdpend, read_ack);
4907
4908//2/9/92 - enhancement?
4909//Load srcdread on the next tick as well to modify it in srcshade
4910
4911Srcdreadd := FD1Q (srcdreadd, srcdreadt, clk);
4912Srcdread := AOR1 (srcdread, srcshade, srcdreadd, srcdreadt);
4913
4914// source zed reads
4915
4916Srczpset\ := NAN2 (srczpset\, readreq, szread);
4917Srczpt1 := NAN2 (srczpt[1], srczpend, srczack\);
4918Srczpt2 := NAN2 (srczpt[2], srczpset\, srczpt[1]);
4919Srczpend := FD2Q (srczpend, srczpt[2], clk, reset\);
4920
4921Srczxpset\ := NAN2 (srczxpset\, readreq, szreadx);
4922Srczxpt1 := NAN2 (srczxpt[1], srczxpend, srczxack\);
4923Srczxpt2 := NAN2 (srczxpt[2], srczxpset\, srczxpt[1]);
4924Srczxpend := FD2Q (srczxpend, srczxpt[2], clk, reset\);
4925
4926Szpend := OR2 (szpend, srczpend, srczxpend);
4927Srczread := AN2 (srczread, szpend, read_ack);
4928
4929// destination data reads
4930
4931Dstdpset\ := NAN2 (dstdpset\, readreq, dread);
4932Dstdpt0 := NAN2 (dstdpt[0], dstdpend, dstdack\);
4933Dstdpt1 := NAN2 (dstdpt[1], dstdpset\, dstdpt[0]);
4934Dstdpend := FD2Q (dstdpend, dstdpt[1], clk, reset\);
4935Dstdread := AN2 (dstdread, dstdpend, read_ack);
4936
4937// destination zed reads
4938
4939Dstzpset\ := NAN2 (dstzpset\, readreq, dzread);
4940Dstzpt0 := NAN2 (dstzpt[0], dstzpend, dstzack\);
4941Dstzpt1 := NAN2 (dstzpt[1], dstzpset\, dstzpt[0]);
4942Dstzpend := FD2Q (dstzpend, dstzpt[1], clk, reset\);
4943Dstzread := AN2 (dstzread, dstzpend, read_ack);
4944*/
4945
4946/*void foo2(void)
4947{
4948 // Basically, the above translates to:
4949 bool srcdpend = (readreq && sread) || (srcdpend && !srcdack);
4950 bool srcdxpend = (readreq && sreadx) || (srcdxpend && !srcdxack);
	bool sdpend = srcdxpend || srcdpend;
4952 bool srcdread = ((sdpend && read_ack) && srcshade) || (sdpend && read_ack);//the latter term is lookahead
4953
4954}*/
4955
4956
4957////////////////////////////////////////////////////////////////////////////////////////////
4958////////////////////////////////////////////////////////////////////////////////////////////
4959// Here's an important bit: The source data adder logic. Need to track down the inputs!!! //
4960////////////////////////////////////////////////////////////////////////////////////////////
4961////////////////////////////////////////////////////////////////////////////////////////////
4962
4963/*
4964DEF ADDARRAY (
4965INT16/ addq[0..3]
4966 :OUT;
4967 clk
4968 daddasel[0..2] // data adder input A selection
4969 daddbsel[0..3]
4970 daddmode[0..2]
4971INT32/ dstd[0..1]
4972INT32/ iinc
4973 initcin[0..3] // carry into the adders from the initializers
4974 initinc[0..63] // the initialisation increment
4975 initpix[0..15] // Data initialiser pixel value
4976INT32/ istep
4977INT32/ patd[0..1]
4978INT32/ srcdlo
4979INT32/ srcdhi
4980INT32/ srcz1[0..1]
4981INT32/ srcz2[0..1]
4982 reset\
4983INT32/ zinc
4984INT32/ zstep
4985 :IN);
4986*/
4987void ADDARRAY(uint16_t * addq, uint8_t daddasel, uint8_t daddbsel, uint8_t daddmode,
4988 uint64_t dstd, uint32_t iinc, uint8_t initcin[], uint64_t initinc, uint16_t initpix,
4989 uint32_t istep, uint64_t patd, uint64_t srcd, uint64_t srcz1, uint64_t srcz2,
4990 uint32_t zinc, uint32_t zstep)
4991{
4992 uint32_t initpix2 = ((uint32_t)initpix << 16) | initpix;
4993 uint32_t addalo[8], addahi[8];
4994 addalo[0] = dstd & 0xFFFFFFFF;
4995 addalo[1] = initpix2;
4996 addalo[2] = 0;
4997 addalo[3] = 0;
4998 addalo[4] = srcd & 0xFFFFFFFF;
4999 addalo[5] = patd & 0xFFFFFFFF;
5000 addalo[6] = srcz1 & 0xFFFFFFFF;
5001 addalo[7] = srcz2 & 0xFFFFFFFF;
5002 addahi[0] = dstd >> 32;
5003 addahi[1] = initpix2;
5004 addahi[2] = 0;
5005 addahi[3] = 0;
5006 addahi[4] = srcd >> 32;
5007 addahi[5] = patd >> 32;
5008 addahi[6] = srcz1 >> 32;
5009 addahi[7] = srcz2 >> 32;
5010 uint16_t adda[4];
5011 adda[0] = addalo[daddasel] & 0xFFFF;
5012 adda[1] = addalo[daddasel] >> 16;
5013 adda[2] = addahi[daddasel] & 0xFFFF;
5014 adda[3] = addahi[daddasel] >> 16;
5015
5016 uint16_t wordmux[8];
5017 wordmux[0] = iinc & 0xFFFF;
5018 wordmux[1] = iinc >> 16;
5019 wordmux[2] = zinc & 0xFFFF;
5020 wordmux[3] = zinc >> 16;;
5021 wordmux[4] = istep & 0xFFFF;
5022 wordmux[5] = istep >> 16;;
5023 wordmux[6] = zstep & 0xFFFF;
5024 wordmux[7] = zstep >> 16;;
5025 uint16_t word = wordmux[((daddbsel & 0x08) >> 1) | (daddbsel & 0x03)];
5026 uint16_t addb[4];
5027 bool dbsel2 = daddbsel & 0x04;
5028 bool iincsel = (daddbsel & 0x01) && !(daddbsel & 0x04);
5029
5030 if (!dbsel2 && !iincsel)
5031 addb[0] = srcd & 0xFFFF,
5032 addb[1] = (srcd >> 16) & 0xFFFF,
5033 addb[2] = (srcd >> 32) & 0xFFFF,
5034 addb[3] = (srcd >> 48) & 0xFFFF;
5035 else if (dbsel2 && !iincsel)
5036 addb[0] = addb[1] = addb[2] = addb[3] = word;
5037 else if (!dbsel2 && iincsel)
5038 addb[0] = initinc & 0xFFFF,
5039 addb[1] = (initinc >> 16) & 0xFFFF,
5040 addb[2] = (initinc >> 32) & 0xFFFF,
5041 addb[3] = (initinc >> 48) & 0xFFFF;
5042 else
5043 addb[0] = addb[1] = addb[2] = addb[3] = 0;
5044
5045 uint8_t cinsel = (daddmode >= 1 && daddmode <= 4 ? 1 : 0);
5046
5047static uint8_t co[4];//These are preserved between calls...
5048 uint8_t cin[4];
5049
5050 for(int i=0; i<4; i++)
5051 cin[i] = initcin[i] | (co[i] & cinsel);
5052
5053 bool eightbit = daddmode & 0x02;
5054 bool sat = daddmode & 0x03;
5055 bool hicinh = ((daddmode & 0x03) == 0x03);
5056
5057//Note that the carry out is saved between calls to this function...
5058 for(int i=0; i<4; i++)
5059 ADD16SAT(addq[i], co[i], adda[i], addb[i], cin[i], sat, eightbit, hicinh);
5060}
5061
5062
5063/*
5064DEF ADD16SAT (
5065INT16/ r // result
5066 co // carry out
5067 :IO;
5068INT16/ a
5069INT16/ b
5070 cin
5071 sat
5072 eightbit
5073 hicinh
5074 :IN);
5075*/
//
// ADD16SAT - one 16-bit lane of the data adder, with optional saturation.
//
//   r        - result
//   co       - carry out of bit 15
//   a, b     - operands; b is treated as the signed increment when saturating
//   cin      - carry into bit 0
//   sat      - clamp the result when the sign of b and the carry disagree
//   eightbit - saturate on the low byte only and block the carry from the low
//              byte into bit 8
//   hicinh   - block the carry from bit 11 into bit 12
//
void ADD16SAT(uint16_t &r, uint8_t &co, uint16_t a, uint16_t b, uint8_t cin, bool sat, bool eightbit, bool hicinh)
{
	// The adder is built from three sections so that the carry chain can be
	// broken at bit 8 and at bit 12.

	// Bits 0-7
	const uint32_t sumLow = (a & 0x00FF) + (b & 0x00FF) + cin;
	const bool carryLow = (sumLow & 0x0100) != 0;

	// Bits 8-11
	const uint32_t cinMid = (carryLow && !eightbit ? 0x0100 : 0);
	const uint32_t sumMid = (a & 0x0F00) + (b & 0x0F00) + cinMid;
	const bool carryMid = (sumMid & 0x1000) != 0;

	// Bits 12-15
	const uint32_t cinTop = (carryMid && !hicinh ? 0x1000 : 0);
	const uint32_t sumTop = (a & 0xF000) + (b & 0xF000) + cinTop;
	const bool carryTop = (sumTop & 0x10000) != 0;

	co = (carryTop ? 1 : 0);

	const uint16_t q = (sumLow & 0x00FF) | (sumMid & 0x0F00) | (sumTop & 0xF000);

	// Saturation looks at the top bit of b and the carry out of whichever
	// width is in use; when they differ the result has gone out of range.
	const bool btop = (eightbit ? (b & 0x0080) != 0 : (b & 0x8000) != 0);
	const bool ctop = (eightbit ? carryLow : carryTop);

	const bool saturate = sat && (btop != ctop);
	const bool hisaturate = saturate && !eightbit;

	// Clamp to all ones after a carry, to all zeroes otherwise
	const uint16_t clamp = (ctop ? 0xFFFF : 0x0000);

	uint16_t lowByte = q & 0x00FF;
	uint16_t highByte = q & 0xFF00;

	if (saturate)
		lowByte = clamp & 0x00FF;

	if (hisaturate)
		highByte = clamp & 0xFF00;

	r = lowByte | highByte;
}
5115
5116
5117/** ADDAMUX - Address adder input A selection *******************
5118
5119This module generates the data loaded into the address adder input A. This is
5120the update value, and can be one of four registers : A1 step, A2 step, A1
5121increment and A1 fraction. It can complement these values to perform
5122subtraction, and it can generate constants to increment / decrement the window
5123pointers.
5124
5125addasel[0..2] select the register to add
5126
5127000 A1 step integer part
5128001 A1 step fraction part
5129010 A1 increment integer part
5130011 A1 increment fraction part
5131100 A2 step
5132
5133adda_xconst[0..2] generate a power of 2 in the range 1-64 or all zeroes when
5134they are all 1.
5135
5136addareg selects register value to be added as opposed to constant
5137value.
5138
5139suba_x, suba_y complement the X and Y values
5140
5141*/
5142
5143/*
5144DEF ADDAMUX (
5145INT16/ adda_x
5146INT16/ adda_y
5147 :OUT;
5148 addasel[0..2]
5149INT16/ a1_step_x
5150INT16/ a1_step_y
5151INT16/ a1_stepf_x
5152INT16/ a1_stepf_y
5153INT16/ a2_step_x
5154INT16/ a2_step_y
5155INT16/ a1_inc_x
5156INT16/ a1_inc_y
5157INT16/ a1_incf_x
5158INT16/ a1_incf_y
5159 adda_xconst[0..2]
5160 adda_yconst
5161 addareg
5162 suba_x
5163 suba_y :IN);
5164*/
//
// ADDAMUX - selects the update value fed to input A of the address adder:
// either one of the step/increment registers (addareg set) or a generated
// constant, optionally complemented for subtraction.
//
void ADDAMUX(int16_t &adda_x, int16_t &adda_y, uint8_t addasel, int16_t a1_step_x, int16_t a1_step_y,
	int16_t a1_stepf_x, int16_t a1_stepf_y, int16_t a2_step_x, int16_t a2_step_y,
	int16_t a1_inc_x, int16_t a1_inc_y, int16_t a1_incf_x, int16_t a1_incf_y, uint8_t adda_xconst,
	bool adda_yconst, bool addareg, bool suba_x, bool suba_y)
{

/*INT16/ addac_x, addac_y, addar_x, addar_y, addart_x, addart_y,
INT16/ addas_x, addas_y, suba_x16, suba_y16
:LOCAL;
BEGIN

Zero := TIE0 (zero);*/

/* Multiplex the register terms */

/*Addaselb[0-2] := BUF8 (addaselb[0-2], addasel[0-2]);
Addart_x := MX4 (addart_x, a1_step_x, a1_stepf_x, a1_inc_x, a1_incf_x, addaselb[0..1]);
Addar_x := MX2 (addar_x, addart_x, a2_step_x, addaselb[2]);
Addart_y := MX4 (addart_y, a1_step_y, a1_stepf_y, a1_inc_y, a1_incf_y, addaselb[0..1]);
Addar_y := MX2 (addar_y, addart_y, a2_step_y, addaselb[2]);*/

/* Generate a constant value - this is a power of 2 in the range
1-64, or zero. The control bits are adda_xconst[0..2], when they
are all 1 the result is 0.
Constants for Y can only be 0 or 1 */

/*Addac_xlo := D38H (addac_x[0..6], unused[0], adda_xconst[0..2]);
Unused[0] := DUMMY (unused[0]);

Addac_x := JOIN (addac_x, addac_x[0..6], zero, zero, zero, zero, zero, zero, zero, zero, zero);
Addac_y := JOIN (addac_y, adda_yconst, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero,
 zero, zero, zero, zero, zero);*/

/* Select between constant value and register value */

/*Addas_x := MX2 (addas_x, addac_x, addar_x, addareg);
Addas_y := MX2 (addas_y, addac_y, addar_y, addareg);*/

////////////////////////////////////// C++ CODE //////////////////////////////////////
	int16_t addas_x, addas_y;

	if (addareg)
	{
		// Register term: bit 2 of addasel picks the A2 step outright,
		// otherwise bits 0-1 pick among the four A1 registers
		if (addasel & 0x04)
		{
			addas_x = a2_step_x;
			addas_y = a2_step_y;
		}
		else
		{
			switch (addasel & 0x03)
			{
			case 0:
				addas_x = a1_step_x;
				addas_y = a1_step_y;
				break;
			case 1:
				addas_x = a1_stepf_x;
				addas_y = a1_stepf_y;
				break;
			case 2:
				addas_x = a1_inc_x;
				addas_y = a1_inc_y;
				break;
			default:
				addas_x = a1_incf_x;
				addas_y = a1_incf_y;
				break;
			}
		}
	}
	else
	{
		// Constant term: X is 1 << adda_xconst (all ones gives zero), Y is 0 or 1
		addas_x = (adda_xconst == 0x07 ? 0 : 1 << adda_xconst);
		addas_y = (adda_yconst ? 0x01 : 0);
	}
//////////////////////////////////////////////////////////////////////////////////////

/* Complement these values (complement flag gives adder carry in)*/

/*Suba_x16 := JOIN (suba_x16, suba_x, suba_x, suba_x, suba_x, suba_x, suba_x, suba_x, suba_x, suba_x,
 suba_x, suba_x, suba_x, suba_x, suba_x, suba_x, suba_x);
Suba_y16 := JOIN (suba_y16, suba_y, suba_y, suba_y, suba_y, suba_y, suba_y, suba_y, suba_y, suba_y,
 suba_y, suba_y, suba_y, suba_y, suba_y, suba_y, suba_y);
Adda_x := EO (adda_x, suba_x16, addas_x);
Adda_y := EO (adda_y, suba_y16, addas_y);*/

////////////////////////////////////// C++ CODE //////////////////////////////////////
	// One's complement only; the adder supplies the +1 through its carry in
	adda_x = (suba_x ? (int16_t)~addas_x : addas_x);
	adda_y = (suba_y ? (int16_t)~addas_y : addas_y);
//////////////////////////////////////////////////////////////////////////////////////

//END;
}
5234
5235
5236/** ADDBMUX - Address adder input B selection *******************
5237
5238This module selects the register to be updated by the address
5239adder. This can be one of three registers, the A1 and A2
5240pointers, or the A1 fractional part. It can also be zero, so that the step
5241registers load directly into the pointers.
5242*/
5243
5244/*DEF ADDBMUX (
5245INT16/ addb_x
5246INT16/ addb_y
5247 :OUT;
5248 addbsel[0..1]
5249INT16/ a1_x
5250INT16/ a1_y
5251INT16/ a2_x
5252INT16/ a2_y
5253INT16/ a1_frac_x
5254INT16/ a1_frac_y
5255 :IN);
5256INT16/ zero16 :LOCAL;
5257BEGIN*/
//
// ADDBMUX - selects the value on input B of the address adder, i.e. the
// register being updated: 0 = A1 pointer, 1 = A2 pointer, 2 = A1 fraction,
// 3 = zero (so the step value passes straight through the adder).
//
void ADDBMUX(int16_t &addb_x, int16_t &addb_y, uint8_t addbsel, int16_t a1_x, int16_t a1_y,
	int16_t a2_x, int16_t a2_y, int16_t a1_frac_x, int16_t a1_frac_y)
{

/*Zero := TIE0 (zero);
Zero16 := JOIN (zero16, zero, zero, zero, zero, zero, zero, zero,
 zero, zero, zero, zero, zero, zero, zero, zero, zero);
Addbselb[0-1] := BUF8 (addbselb[0-1], addbsel[0-1]);
Addb_x := MX4 (addb_x, a1_x, a2_x, a1_frac_x, zero16, addbselb[0..1]);
Addb_y := MX4 (addb_y, a1_y, a2_y, a1_frac_y, zero16, addbselb[0..1]);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
	// Only the low two bits of addbsel take part in the selection
	switch (addbsel & 0x03)
	{
	case 0:
		addb_x = a1_x;
		addb_y = a1_y;
		break;
	case 1:
		addb_x = a2_x;
		addb_y = a2_y;
		break;
	case 2:
		addb_x = a1_frac_x;
		addb_y = a1_frac_y;
		break;
	default:
		addb_x = 0;
		addb_y = 0;
		break;
	}
//////////////////////////////////////////////////////////////////////////////////////

//END;
}
5278
5279
5280/** DATAMUX - Address local data bus selection ******************
5281
5282Select between the adder output and the input data bus
5283*/
5284
5285/*DEF DATAMUX (
5286INT16/ data_x
5287INT16/ data_y
5288 :OUT;
5289INT32/ gpu_din
5290INT16/ addq_x
5291INT16/ addq_y
5292 addqsel
5293 :IN);
5294
5295INT16/ gpu_lo, gpu_hi
5296:LOCAL;
5297BEGIN*/
//
// DATAMUX - drives the address unit's local data bus from either the address
// adder output (addqsel set) or the GPU data bus (low word to X, high word
// to Y).
//
void DATAMUX(int16_t &data_x, int16_t &data_y, uint32_t gpu_din, int16_t addq_x, int16_t addq_y, bool addqsel)
{
/*Gpu_lo := JOIN (gpu_lo, gpu_din{0..15});
Gpu_hi := JOIN (gpu_hi, gpu_din{16..31});

Addqselb := BUF8 (addqselb, addqsel);
Data_x := MX2 (data_x, gpu_lo, addq_x, addqselb);
Data_y := MX2 (data_y, gpu_hi, addq_y, addqselb);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
	if (addqsel)
	{
		// Adder result goes straight through
		data_x = addq_x;
		data_y = addq_y;
		return;
	}

	// Otherwise split the 32-bit GPU word into its two halves
	const uint16_t gpu_lo = gpu_din & 0xFFFF;
	const uint16_t gpu_hi = gpu_din >> 16;

	data_x = (int16_t)gpu_lo;
	data_y = (int16_t)gpu_hi;
//////////////////////////////////////////////////////////////////////////////////////

//END;
}
5313
5314
5315/******************************************************************
5316addradd
531729/11/90
5318
5319Blitter Address Adder
5320---------------------
5321The blitter address adder is a pair of sixteen bit adders, one
5322each for X and Y. The multiplexing of the input terms is
5323performed elsewhere, but this adder can also perform modulo
5324arithmetic to align X-addresses onto phrase boundaries.
5325
5326modx[0..2] take values
5327000 no mask
5328001 mask bit 0
5329010 mask bits 1-0
5330..
5331110 mask bits 5-0
5332
5333******************************************************************/
5334
5335/*IMPORT duplo, tosh;
5336
5337DEF ADDRADD (
5338INT16/ addq_x
5339INT16/ addq_y
5340 :OUT;
5341 a1fracldi // propagate address adder carry
5342INT16/ adda_x
5343INT16/ adda_y
5344INT16/ addb_x
5345INT16/ addb_y
5346 clk[0] // co-processor clock
5347 modx[0..2]
5348 suba_x
5349 suba_y
5350 :IN);
5351
5352BEGIN
5353
5354Zero := TIE0 (zero);*/
//
// ADDRADD - the blitter address adder: a pair of 16-bit adders, one for X
// and one for Y.
//
//   addq_x, addq_y - sums; the low bits of X may be forced to zero by modx
//   a1fracldi      - when set, the carry out of this addition is latched and
//                    fed into the next call (fraction to integer carry)
//   adda_*, addb_* - adder inputs (adda is already complemented for subtract)
//   modx           - 0 = no mask, 1..6 = clear that many low bits of X;
//                    7 decodes to an unused output, so it masks nothing
//   suba_x, suba_y - subtract flags; they invert the carry in, supplying the
//                    +1 that turns the complemented adda into a negation
//
// The latched carries live in function statics, so successive calls are not
// independent of each other.
//
void ADDRADD(int16_t &addq_x, int16_t &addq_y, bool a1fracldi,
	uint16_t adda_x, uint16_t adda_y, uint16_t addb_x, uint16_t addb_y, uint8_t modx, bool suba_x, bool suba_y)
{

/* Perform the addition */

/*Adder_x := ADD16 (addqt_x[0..15], co_x, adda_x{0..15}, addb_x{0..15}, ci_x);
Adder_y := ADD16 (addq_y[0..15], co_y, adda_y{0..15}, addb_y{0..15}, ci_y);*/

/* latch carry and propagate if required */

/*Cxt0 := AN2 (cxt[0], co_x, a1fracldi);
Cxt1 := FD1Q (cxt[1], cxt[0], clk[0]);
Ci_x := EO (ci_x, cxt[1], suba_x);

Cyt0 := AN2 (cyt[0], co_y, a1fracldi);
Cyt1 := FD1Q (cyt[1], cyt[0], clk[0]);
Ci_y := EO (ci_y, cyt[1], suba_y);*/

////////////////////////////////////// C++ CODE //////////////////////////////////////
	// Latched carries (cxt[1] / cyt[1] in the netlist); they have to
	// propagate between function calls.
	static uint16_t co_x = 0, co_y = 0;

	const uint16_t ci_x = co_x ^ (suba_x ? 1 : 0);
	const uint16_t ci_y = co_y ^ (suba_y ? 1 : 0);
	const uint32_t addqt_x = (uint32_t)adda_x + addb_x + ci_x;
	const uint32_t addqt_y = (uint32_t)adda_y + addb_y + ci_y;

	// Keep the carry out of bit 15 only when a fraction add asks for it
	co_x = ((addqt_x & 0x10000) && a1fracldi ? 1 : 0);
	co_y = ((addqt_y & 0x10000) && a1fracldi ? 1 : 0);
//////////////////////////////////////////////////////////////////////////////////////

/* Mask low bits of X to 0 if required */

/*Masksel := D38H (unused[0], masksel[0..4], maskbit[5], unused[1], modx[0..2]);

Maskbit[0-4] := OR2 (maskbit[0-4], masksel[0-4], maskbit[1-5]);

Mask[0-5] := MX2 (addq_x[0-5], addqt_x[0-5], zero, maskbit[0-5]);

Addq_x := JOIN (addq_x, addq_x[0..5], addqt_x[6..15]);
Addq_y := JOIN (addq_y, addq_y[0..15]);*/

////////////////////////////////////// C++ CODE //////////////////////////////////////
	// Decoder outputs 0 and 7 are both unused, so modx = 7 raises no mask bit
	// and behaves like modx = 0. Bits 6-15 of X always come straight from the
	// adder, so no entry may clear them.
	static const uint16_t mask[8] = { 0xFFFF, 0xFFFE, 0xFFFC, 0xFFF8, 0xFFF0, 0xFFE0, 0xFFC0, 0xFFFF };

	// modx is a three bit field; ignore anything above it rather than
	// reading past the end of the table
	addq_x = (int16_t)(uint16_t)(addqt_x & mask[modx & 0x07]);
	addq_y = (int16_t)(uint16_t)(addqt_y & 0xFFFF);
//////////////////////////////////////////////////////////////////////////////////////

//Unused[0-1] := DUMMY (unused[0-1]);

//END;
}
5406
5407
5408/*
5409DEF DATA (
5410 wdata[0..63] // co-processor write data bus
5411 :BUS;
5412 dcomp[0..7] // data byte equal flags
5413 srcd[0..7] // bits to use for bit to byte expansion
5414 zcomp[0..3] // output from Z comparators
5415 :OUT;
5416 a1_x[0..1] // low two bits of A1 X pointer
5417 big_pix // pixel organisation is big-endian
5418 blitter_active // blitter is active
5419 clk // co-processor clock
5420 cmpdst // compare dest rather than source
5421 colorld // load the pattern color fields
5422 daddasel[0..2] // data adder input A selection
5423 daddbsel[0..3] // data adder input B selection
5424 daddmode[0..2] // data adder mode
5425 daddq_sel // select adder output vs. GPU data
5426 data[0..63] // co-processor read data bus
5427 data_ena // enable write data
5428 data_sel[0..1] // select data to write
5429 dbinh\[0..7] // byte oriented changed data inhibits
5430 dend[0..5] // end of changed write data zone
5431 dpipe[0..1] // load computed data pipe-line latch
5432 dstart[0..5] // start of changed write data zone
5433 dstdld[0..1] // dest data load (two halves)
5434 dstzld[0..1] // dest zed load (two halves)
5435 ext_int // enable extended precision intensity calculations
5436INT32/ gpu_din // GPU data bus
5437 iincld // I increment load
5438 iincldx // alternate I increment load
5439 init_if // initialise I fraction phase
5440 init_ii // initialise I integer phase
5441 init_zf // initialise Z fraction phase
5442 intld[0..3] // computed intensities load
5443 istepadd // intensity step integer add
5444 istepfadd // intensity step fraction add
5445 istepld // I step load
5446 istepdld // I step delta load
5447 lfu_func[0..3] // LFU function code
5448 patdadd // pattern data gouraud add
5449 patdld[0..1] // pattern data load (two halves)
5450 pdsel[0..1] // select pattern data type
5451 phrase_mode // phrase write mode
5452 reload // transfer contents of double buffers
5453 reset\ // system reset
5454 srcd1ld[0..1] // source register 1 load (two halves)
5455 srcdread // source data read load enable
5456 srczread // source zed read load enable
5457 srcshift[0..5] // source alignment shift
5458 srcz1ld[0..1] // source zed 1 load (two halves)
5459 srcz2add // zed fraction gouraud add
5460 srcz2ld[0..1] // source zed 2 load (two halves)
5461 textrgb // texture mapping in RGB mode
5462 txtd[0..63] // data from the texture unit
5463 zedld[0..3] // computed zeds load
5464 zincld // Z increment load
5465 zmode[0..2] // Z comparator mode
5466 zpipe[0..1] // load computed zed pipe-line latch
5467 zstepadd // zed step integer add
5468 zstepfadd // zed step fraction add
5469 zstepld // Z step load
5470 zstepdld // Z step delta load
5471 :IN);
5472*/
5473
5474void DATA(uint64_t &wdata, uint8_t &dcomp, uint8_t &zcomp, bool &nowrite,
5475 bool big_pix, bool cmpdst, uint8_t daddasel, uint8_t daddbsel, uint8_t daddmode, bool daddq_sel, uint8_t data_sel,
5476 uint8_t dbinh, uint8_t dend, uint8_t dstart, uint64_t dstd, uint32_t iinc, uint8_t lfu_func, uint64_t &patd, bool patdadd,
5477 bool phrase_mode, uint64_t srcd, bool srcdread, bool srczread, bool srcz2add, uint8_t zmode,
5478 bool bcompen, bool bkgwren, bool dcompen, uint8_t icount, uint8_t pixsize,
5479 uint64_t &srcz, uint64_t dstz, uint32_t zinc)
5480{
5481/*
5482 Stuff we absolutely *need* to have passed in/out:
5483IN:
5484 patdadd, dstd, srcd, patd, daddasel, daddbsel, daddmode, iinc, srcz1, srcz2, big_pix, phrase_mode, cmpdst
5485OUT:
5486 changed patd (wdata I guess...) (Nope. We pass it back directly now...)
5487*/
5488
5489// Source data registers
5490
5491/*Data_src := DATA_SRC (srcdlo, srcdhi, srcz[0..1], srczo[0..1], srczp[0..1], srcz1[0..1], srcz2[0..1], big_pix,
5492 clk, gpu_din, intld[0..3], local_data0, local_data1, srcd1ld[0..1], srcdread, srczread, srcshift[0..5],
5493 srcz1ld[0..1], srcz2add, srcz2ld[0..1], zedld[0..3], zpipe[0..1]);
5494Srcd[0-7] := JOIN (srcd[0-7], srcdlo{0-7});
5495Srcd[8-31] := JOIN (srcd[8-31], srcdlo{8-31});
5496Srcd[32-63] := JOIN (srcd[32-63], srcdhi{0-31});*/
5497
5498// Destination data registers
5499
5500/*Data_dst := DATA_DST (dstd[0..63], dstz[0..1], clk, dstdld[0..1], dstzld[0..1], load_data[0..1]);
5501Dstdlo := JOIN (dstdlo, dstd[0..31]);
5502Dstdhi := JOIN (dstdhi, dstd[32..63]);*/
5503
5504// Pattern and Color data registers
5505
5506// Looks like this is simply another register file for the pattern data registers. No adding or anything funky
5507// going on. Note that patd & patdv will output the same info.
5508// Patdldl/h (patdld[0..1]) can select the local_data bus to overwrite the current pattern data...
5509// Actually, it can be either patdld OR patdadd...!
5510/*Data_pat := DATA_PAT (colord[0..15], int0dp[8..10], int1dp[8..10], int2dp[8..10], int3dp[8..10], mixsel[0..2],
5511 patd[0..63], patdv[0..1], clk, colorld, dpipe[0], ext_int, gpu_din, intld[0..3], local_data0, local_data1,
5512 patdadd, patdld[0..1], reload, reset\);
5513Patdlo := JOIN (patdlo, patd[0..31]);
5514Patdhi := JOIN (patdhi, patd[32..63]);*/
5515
5516// Multiplying data Mixer (NOT IN JAGUAR I)
5517
5518/*Datamix := DATAMIX (patdo[0..1], clk, colord[0..15], dpipe[1], dstd[0..63], int0dp[8..10], int1dp[8..10],
5519 int2dp[8..10], int3dp[8..10], mixsel[0..2], patd[0..63], pdsel[0..1], srcd[0..63], textrgb, txtd[0..63]);*/
5520
5521// Logic function unit
5522
5523/*Lfu := LFU (lfu[0..1], srcdlo, srcdhi, dstdlo, dstdhi, lfu_func[0..3]);*/
5524////////////////////////////////////// C++ CODE //////////////////////////////////////
5525 uint64_t funcmask[2] = { 0, 0xFFFFFFFFFFFFFFFFLL };
5526 uint64_t func0 = funcmask[lfu_func & 0x01];
5527 uint64_t func1 = funcmask[(lfu_func >> 1) & 0x01];
5528 uint64_t func2 = funcmask[(lfu_func >> 2) & 0x01];
5529 uint64_t func3 = funcmask[(lfu_func >> 3) & 0x01];
5530 uint64_t lfu = (~srcd & ~dstd & func0) | (~srcd & dstd & func1) | (srcd & ~dstd & func2) | (srcd & dstd & func3);
5531//////////////////////////////////////////////////////////////////////////////////////
5532
5533// Increment and Step Registers
5534
5535// Does it do anything without the step add lines? Check it!
5536// No. This is pretty much just a register file without the Jaguar II lines...
5537/*Inc_step := INC_STEP (iinc, istep[0..31], zinc, zstep[0..31], clk, ext_int, gpu_din, iincld, iincldx, istepadd,
5538 istepfadd, istepld, istepdld, reload, reset\, zincld, zstepadd, zstepfadd, zstepld, zstepdld);
5539Istep := JOIN (istep, istep[0..31]);
5540Zstep := JOIN (zstep, zstep[0..31]);*/
5541
5542// Pixel data comparator
5543
5544/*Datacomp := DATACOMP (dcomp[0..7], cmpdst, dstdlo, dstdhi, patdlo, patdhi, srcdlo, srcdhi);*/
5545////////////////////////////////////// C++ CODE //////////////////////////////////////
5546 dcomp = 0;
5547 uint64_t cmpd = patd ^ (cmpdst ? dstd : srcd);
5548
5549 if ((cmpd & 0x00000000000000FFLL) == 0)
5550 dcomp |= 0x01;
5551 if ((cmpd & 0x000000000000FF00LL) == 0)
5552 dcomp |= 0x02;
5553 if ((cmpd & 0x0000000000FF0000LL) == 0)
5554 dcomp |= 0x04;
5555 if ((cmpd & 0x00000000FF000000LL) == 0)
5556 dcomp |= 0x08;
5557 if ((cmpd & 0x000000FF00000000LL) == 0)
5558 dcomp |= 0x10;
5559 if ((cmpd & 0x0000FF0000000000LL) == 0)
5560 dcomp |= 0x20;
5561 if ((cmpd & 0x00FF000000000000LL) == 0)
5562 dcomp |= 0x40;
5563 if ((cmpd & 0xFF00000000000000LL) == 0)
5564 dcomp |= 0x80;
5565//////////////////////////////////////////////////////////////////////////////////////
5566
5567// Zed comparator for Z-buffer operations
5568
5569/*Zedcomp := ZEDCOMP (zcomp[0..3], srczp[0..1], dstz[0..1], zmode[0..2]);*/
5570////////////////////////////////////// C++ CODE //////////////////////////////////////
5571//srczp is srcz pipelined, also it goes through a source shift as well...
5572/*The shift is basically like so (each piece is 16 bits long):
5573
5574 0 1 2 3 4 5 6
5575 srcz1lolo srcz1lohi srcz1hilo srcz1hihi srcrz2lolo srcz2lohi srcz2hilo
5576
5577with srcshift bits 4 & 5 selecting the start position
5578*/
5579//So... basically what we have here is:
5580 zcomp = 0;
5581
5582 if ((((srcz & 0x000000000000FFFFLL) < (dstz & 0x000000000000FFFFLL)) && (zmode & 0x01))
5583 || (((srcz & 0x000000000000FFFFLL) == (dstz & 0x000000000000FFFFLL)) && (zmode & 0x02))
5584 || (((srcz & 0x000000000000FFFFLL) > (dstz & 0x000000000000FFFFLL)) && (zmode & 0x04)))
5585 zcomp |= 0x01;
5586
5587 if ((((srcz & 0x00000000FFFF0000LL) < (dstz & 0x00000000FFFF0000LL)) && (zmode & 0x01))
5588 || (((srcz & 0x00000000FFFF0000LL) == (dstz & 0x00000000FFFF0000LL)) && (zmode & 0x02))
5589 || (((srcz & 0x00000000FFFF0000LL) > (dstz & 0x00000000FFFF0000LL)) && (zmode & 0x04)))
5590 zcomp |= 0x02;
5591
5592 if ((((srcz & 0x0000FFFF00000000LL) < (dstz & 0x0000FFFF00000000LL)) && (zmode & 0x01))
5593 || (((srcz & 0x0000FFFF00000000LL) == (dstz & 0x0000FFFF00000000LL)) && (zmode & 0x02))
5594 || (((srcz & 0x0000FFFF00000000LL) > (dstz & 0x0000FFFF00000000LL)) && (zmode & 0x04)))
5595 zcomp |= 0x04;
5596
5597 if ((((srcz & 0xFFFF000000000000LL) < (dstz & 0xFFFF000000000000LL)) && (zmode & 0x01))
5598 || (((srcz & 0xFFFF000000000000LL) == (dstz & 0xFFFF000000000000LL)) && (zmode & 0x02))
5599 || (((srcz & 0xFFFF000000000000LL) > (dstz & 0xFFFF000000000000LL)) && (zmode & 0x04)))
5600 zcomp |= 0x08;
5601
5602//TEMP, TO TEST IF ZCOMP IS THE CULPRIT...
5603//Nope, this is NOT the problem...
5604//zcomp=0;
5605// We'll do the comparison/bit/byte inhibits here, since that's the way it happens
5606// in the real thing (dcomp goes out to COMP_CTRL and back into DATA through dbinh)...
5607#if 1
5608 uint8_t dbinht;
5609// bool nowrite;
5610 COMP_CTRL(dbinht, nowrite,
5611 bcompen, true/*big_pix*/, bkgwren, dcomp, dcompen, icount, pixsize, phrase_mode, srcd & 0xFF, zcomp);
5612 dbinh = dbinht;
5613// dbinh = 0x00;
5614#endif
5615
5616#if 1
5617#ifdef VERBOSE_BLITTER_LOGGING
5618if (logBlit)
5619 WriteLog("\n[dcomp=%02X zcomp=%02X dbinh=%02X]\n", dcomp, zcomp, dbinh);
5620#endif
5621#endif
5622//////////////////////////////////////////////////////////////////////////////////////
5623
5624// 22 Mar 94
5625// The data initializer - allows all four initial values to be computed from one (NOT IN JAGUAR I)
5626
5627/*Datinit := DATINIT (initcin[0..3], initinc[0..63], initpix[0..15], a1_x[0..1], big_pix, clk, iinc, init_if, init_ii,
5628 init_zf, istep[0..31], zinc, zstep[0..31]);*/
5629
5630// Adder array for Z and intensity increments
5631
5632/*Addarray := ADDARRAY (addq[0..3], clk, daddasel[0..2], daddbsel[0..3], daddmode[0..2], dstdlo, dstdhi, iinc,
5633 initcin[0..3], initinc[0..63], initpix[0..15], istep, patdv[0..1], srcdlo, srcdhi, srcz1[0..1],
5634 srcz2[0..1], reset\, zinc, zstep);*/
5635/*void ADDARRAY(uint16_t * addq, uint8_t daddasel, uint8_t daddbsel, uint8_t daddmode,
5636 uint64_t dstd, uint32_t iinc, uint8_t initcin[], uint64_t initinc, uint16_t initpix,
5637 uint32_t istep, uint64_t patd, uint64_t srcd, uint64_t srcz1, uint64_t srcz2,
5638 uint32_t zinc, uint32_t zstep)*/
5639////////////////////////////////////// C++ CODE //////////////////////////////////////
5640 uint16_t addq[4];
5641 uint8_t initcin[4] = { 0, 0, 0, 0 };
5642 ADDARRAY(addq, daddasel, daddbsel, daddmode, dstd, iinc, initcin, 0, 0, 0, patd, srcd, 0, 0, 0, 0);
5643
5644 //This is normally done asynchronously above (thru local_data) when in patdadd mode...
5645//And now it's passed back to the caller to be persistent between calls...!
5646//But it's causing some serious fuck-ups in T2K now... !!! FIX !!! [DONE--???]
5647//Weird! It doesn't anymore...!
5648 if (patdadd)
5649 patd = ((uint64_t)addq[3] << 48) | ((uint64_t)addq[2] << 32) | ((uint64_t)addq[1] << 16) | (uint64_t)addq[0];
5650//////////////////////////////////////////////////////////////////////////////////////
5651
5652// Local data bus multiplexer
5653
5654/*Local_mux := LOCAL_MUX (local_data[0..1], load_data[0..1],
5655 addq[0..3], gpu_din, data[0..63], blitter_active, daddq_sel);
5656Local_data0 := JOIN (local_data0, local_data[0]);
5657Local_data1 := JOIN (local_data1, local_data[1]);*/
5658////////////////////////////////////// C++ CODE //////////////////////////////////////
5659//////////////////////////////////////////////////////////////////////////////////////
5660
5661// Data output multiplexer and tri-state drive
5662
5663/*Data_mux := DATA_MUX (wdata[0..63], addq[0..3], big_pix, dstdlo, dstdhi, dstz[0..1], data_sel[0..1], data_ena,
5664 dstart[0..5], dend[0..5], dbinh\[0..7], lfu[0..1], patdo[0..1], phrase_mode, srczo[0..1]);*/
5665////////////////////////////////////// C++ CODE //////////////////////////////////////
5666// NOTE: patdo comes from DATAMIX and can be considered the same as patd for Jaguar I
5667
5668//////////////////////////////////////////////////////////////////////////////////////
5669//}
5670
5671/*DEF DATA_MUX (
5672 wdata[0..63] // co-processor rwrite data bus
5673 :BUS;
5674INT16/ addq[0..3]
5675 big_pix // Pixel organisation is big-endian
5676INT32/ dstdlo
5677INT32/ dstdhi
5678INT32/ dstzlo
5679INT32/ dstzhi
5680 data_sel[0..1] // source of write data
5681 data_ena // enable write data onto read/write bus
5682 dstart[0..5] // start of changed write data
5683 dend[0..5] // end of changed write data
5684 dbinh\[0..7] // byte oriented changed data inhibits
5685INT32/ lfu[0..1]
5686INT32/ patd[0..1]
5687 phrase_mode // phrase write mode
5688INT32/ srczlo
5689INT32/ srczhi
5690 :IN);*/
5691
5692/*INT32/ addql[0..1], ddatlo, ddathi zero32
5693:LOCAL;
5694BEGIN
5695
5696Phrase_mode\ := INV1 (phrase_mode\, phrase_mode);
5697Zero := TIE0 (zero);
5698Zero32 := JOIN (zero32, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero, zero);*/
5699
5700/* Generate a changed data mask */
5701
5702/*Edis := OR6 (edis\, dend[0..5]);
5703Ecoarse := DECL38E (e_coarse\[0..7], dend[3..5], edis\);
5704E_coarse[0] := INV1 (e_coarse[0], e_coarse\[0]);
5705Efine := DECL38E (unused[0], e_fine\[1..7], dend[0..2], e_coarse[0]);*/
5706////////////////////////////////////// C++ CODE //////////////////////////////////////
5707 uint8_t decl38e[2][8] = { { 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF },
5708 { 0xFE, 0xFD, 0xFB, 0xF7, 0xEF, 0xDF, 0xBF, 0x7F } };
5709 uint8_t dech38[8] = { 0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80 };
5710 uint8_t dech38el[2][8] = { { 0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80 },
5711 { 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00 } };
5712
5713 int en = (dend & 0x3F ? 1 : 0);
5714 uint8_t e_coarse = decl38e[en][(dend & 0x38) >> 3]; // Actually, this is e_coarse inverted...
5715 uint8_t e_fine = decl38e[(e_coarse & 0x01) ^ 0x01][dend & 0x07];
5716 e_fine &= 0xFE;
5717//////////////////////////////////////////////////////////////////////////////////////
5718
5719/*Scoarse := DECH38 (s_coarse[0..7], dstart[3..5]);
5720Sfen\ := INV1 (sfen\, s_coarse[0]);
5721Sfine := DECH38EL (s_fine[0..7], dstart[0..2], sfen\);*/
5722////////////////////////////////////// C++ CODE //////////////////////////////////////
5723 uint8_t s_coarse = dech38[(dstart & 0x38) >> 3];
5724 uint8_t s_fine = dech38el[(s_coarse & 0x01) ^ 0x01][dstart & 0x07];
5725//////////////////////////////////////////////////////////////////////////////////////
5726
5727/*Maskt[0] := BUF1 (maskt[0], s_fine[0]);
5728Maskt[1-7] := OAN1P (maskt[1-7], maskt[0-6], s_fine[1-7], e_fine\[1-7]);*/
5729////////////////////////////////////// C++ CODE //////////////////////////////////////
5730 uint16_t maskt = s_fine & 0x0001;
5731 maskt |= (((maskt & 0x0001) || (s_fine & 0x02)) && (e_fine & 0x02) ? 0x0002 : 0x0000);
5732 maskt |= (((maskt & 0x0002) || (s_fine & 0x04)) && (e_fine & 0x04) ? 0x0004 : 0x0000);
5733 maskt |= (((maskt & 0x0004) || (s_fine & 0x08)) && (e_fine & 0x08) ? 0x0008 : 0x0000);
5734 maskt |= (((maskt & 0x0008) || (s_fine & 0x10)) && (e_fine & 0x10) ? 0x0010 : 0x0000);
5735 maskt |= (((maskt & 0x0010) || (s_fine & 0x20)) && (e_fine & 0x20) ? 0x0020 : 0x0000);
5736 maskt |= (((maskt & 0x0020) || (s_fine & 0x40)) && (e_fine & 0x40) ? 0x0040 : 0x0000);
5737 maskt |= (((maskt & 0x0040) || (s_fine & 0x80)) && (e_fine & 0x80) ? 0x0080 : 0x0000);
5738//////////////////////////////////////////////////////////////////////////////////////
5739
5740/* Produce a look-ahead on the ripple carry:
5741masktla = s_coarse[0] . /e_coarse[0] */
5742/*Masktla := AN2 (masktla, s_coarse[0], e_coarse\[0]);
5743Maskt[8] := OAN1P (maskt[8], masktla, s_coarse[1], e_coarse\[1]);
5744Maskt[9-14] := OAN1P (maskt[9-14], maskt[8-13], s_coarse[2-7], e_coarse\[2-7]);*/
5745////////////////////////////////////// C++ CODE //////////////////////////////////////
5746 maskt |= (((s_coarse & e_coarse & 0x01) || (s_coarse & 0x02)) && (e_coarse & 0x02) ? 0x0100 : 0x0000);
5747 maskt |= (((maskt & 0x0100) || (s_coarse & 0x04)) && (e_coarse & 0x04) ? 0x0200 : 0x0000);
5748 maskt |= (((maskt & 0x0200) || (s_coarse & 0x08)) && (e_coarse & 0x08) ? 0x0400 : 0x0000);
5749 maskt |= (((maskt & 0x0400) || (s_coarse & 0x10)) && (e_coarse & 0x10) ? 0x0800 : 0x0000);
5750 maskt |= (((maskt & 0x0800) || (s_coarse & 0x20)) && (e_coarse & 0x20) ? 0x1000 : 0x0000);
5751 maskt |= (((maskt & 0x1000) || (s_coarse & 0x40)) && (e_coarse & 0x40) ? 0x2000 : 0x0000);
5752 maskt |= (((maskt & 0x2000) || (s_coarse & 0x80)) && (e_coarse & 0x80) ? 0x4000 : 0x0000);
5753//////////////////////////////////////////////////////////////////////////////////////
5754
5755/* The bit terms are mirrored for big-endian pixels outside phrase
5756mode. The byte terms are mirrored for big-endian pixels in phrase
5757mode. */
5758
5759/*Mirror_bit := AN2M (mir_bit, phrase_mode\, big_pix);
5760Mirror_byte := AN2H (mir_byte, phrase_mode, big_pix);
5761
5762Masktb[14] := BUF1 (masktb[14], maskt[14]);
5763Masku[0] := MX4 (masku[0], maskt[0], maskt[7], maskt[14], zero, mir_bit, mir_byte);
5764Masku[1] := MX4 (masku[1], maskt[1], maskt[6], maskt[14], zero, mir_bit, mir_byte);
5765Masku[2] := MX4 (masku[2], maskt[2], maskt[5], maskt[14], zero, mir_bit, mir_byte);
5766Masku[3] := MX4 (masku[3], maskt[3], maskt[4], masktb[14], zero, mir_bit, mir_byte);
5767Masku[4] := MX4 (masku[4], maskt[4], maskt[3], masktb[14], zero, mir_bit, mir_byte);
5768Masku[5] := MX4 (masku[5], maskt[5], maskt[2], masktb[14], zero, mir_bit, mir_byte);
5769Masku[6] := MX4 (masku[6], maskt[6], maskt[1], masktb[14], zero, mir_bit, mir_byte);
5770Masku[7] := MX4 (masku[7], maskt[7], maskt[0], masktb[14], zero, mir_bit, mir_byte);
5771Masku[8] := MX2 (masku[8], maskt[8], maskt[13], mir_byte);
5772Masku[9] := MX2 (masku[9], maskt[9], maskt[12], mir_byte);
5773Masku[10] := MX2 (masku[10], maskt[10], maskt[11], mir_byte);
5774Masku[11] := MX2 (masku[11], maskt[11], maskt[10], mir_byte);
5775Masku[12] := MX2 (masku[12], maskt[12], maskt[9], mir_byte);
5776Masku[13] := MX2 (masku[13], maskt[13], maskt[8], mir_byte);
5777Masku[14] := MX2 (masku[14], maskt[14], maskt[0], mir_byte);*/
5778////////////////////////////////////// C++ CODE //////////////////////////////////////
5779 bool mir_bit = true/*big_pix*/ && !phrase_mode;
5780 bool mir_byte = true/*big_pix*/ && phrase_mode;
5781 uint16_t masku = maskt;
5782
5783 if (mir_bit)
5784 {
5785 masku &= 0xFF00;
5786 masku |= (maskt >> 7) & 0x0001;
5787 masku |= (maskt >> 5) & 0x0002;
5788 masku |= (maskt >> 3) & 0x0004;
5789 masku |= (maskt >> 1) & 0x0008;
5790 masku |= (maskt << 1) & 0x0010;
5791 masku |= (maskt << 3) & 0x0020;
5792 masku |= (maskt << 5) & 0x0040;
5793 masku |= (maskt << 7) & 0x0080;
5794 }
5795
5796 if (mir_byte)
5797 {
5798 masku = 0;
5799 masku |= (maskt >> 14) & 0x0001;
5800 masku |= (maskt >> 13) & 0x0002;
5801 masku |= (maskt >> 12) & 0x0004;
5802 masku |= (maskt >> 11) & 0x0008;
5803 masku |= (maskt >> 10) & 0x0010;
5804 masku |= (maskt >> 9) & 0x0020;
5805 masku |= (maskt >> 8) & 0x0040;
5806 masku |= (maskt >> 7) & 0x0080;
5807
5808 masku |= (maskt >> 5) & 0x0100;
5809 masku |= (maskt >> 3) & 0x0200;
5810 masku |= (maskt >> 1) & 0x0400;
5811 masku |= (maskt << 1) & 0x0800;
5812 masku |= (maskt << 3) & 0x1000;
5813 masku |= (maskt << 5) & 0x2000;
5814 masku |= (maskt << 7) & 0x4000;
5815 }
5816//////////////////////////////////////////////////////////////////////////////////////
5817
5818/* The maskt terms define the area for changed data, but the byte
5819inhibit terms can override these */
5820
5821/*Mask[0-7] := AN2 (mask[0-7], masku[0-7], dbinh\[0]);
5822Mask[8-14] := AN2H (mask[8-14], masku[8-14], dbinh\[1-7]);*/
5823////////////////////////////////////// C++ CODE //////////////////////////////////////
5824 uint16_t mask = masku & (!(dbinh & 0x01) ? 0xFFFF : 0xFF00);
5825 mask &= ~(((uint16_t)dbinh & 0x00FE) << 7);
5826//////////////////////////////////////////////////////////////////////////////////////
5827
5828/*Addql[0] := JOIN (addql[0], addq[0..1]);
5829Addql[1] := JOIN (addql[1], addq[2..3]);
5830
5831Dsel0b[0-1] := BUF8 (dsel0b[0-1], data_sel[0]);
5832Dsel1b[0-1] := BUF8 (dsel1b[0-1], data_sel[1]);
5833Ddatlo := MX4 (ddatlo, patd[0], lfu[0], addql[0], zero32, dsel0b[0], dsel1b[0]);
5834Ddathi := MX4 (ddathi, patd[1], lfu[1], addql[1], zero32, dsel0b[1], dsel1b[1]);*/
5835////////////////////////////////////// C++ CODE //////////////////////////////////////
5836 uint64_t dmux[4];
5837 dmux[0] = patd;
5838 dmux[1] = lfu;
5839 dmux[2] = ((uint64_t)addq[3] << 48) | ((uint64_t)addq[2] << 32) | ((uint64_t)addq[1] << 16) | (uint64_t)addq[0];
5840 dmux[3] = 0;
5841 uint64_t ddat = dmux[data_sel];
5842//////////////////////////////////////////////////////////////////////////////////////
5843
5844/*Zed_sel := AN2 (zed_sel, data_sel[0..1]);
5845Zed_selb[0-1] := BUF8 (zed_selb[0-1], zed_sel);
5846
5847Dat[0-7] := MX4 (dat[0-7], dstdlo{0-7}, ddatlo{0-7}, dstzlo{0-7}, srczlo{0-7}, mask[0-7], zed_selb[0]);
5848Dat[8-15] := MX4 (dat[8-15], dstdlo{8-15}, ddatlo{8-15}, dstzlo{8-15}, srczlo{8-15}, mask[8], zed_selb[0]);
5849Dat[16-23] := MX4 (dat[16-23], dstdlo{16-23}, ddatlo{16-23}, dstzlo{16-23}, srczlo{16-23}, mask[9], zed_selb[0]);
5850Dat[24-31] := MX4 (dat[24-31], dstdlo{24-31}, ddatlo{24-31}, dstzlo{24-31}, srczlo{24-31}, mask[10], zed_selb[0]);
5851Dat[32-39] := MX4 (dat[32-39], dstdhi{0-7}, ddathi{0-7}, dstzhi{0-7}, srczhi{0-7}, mask[11], zed_selb[1]);
5852Dat[40-47] := MX4 (dat[40-47], dstdhi{8-15}, ddathi{8-15}, dstzhi{8-15}, srczhi{8-15}, mask[12], zed_selb[1]);
5853Dat[48-55] := MX4 (dat[48-55], dstdhi{16-23}, ddathi{16-23}, dstzhi{16-23}, srczhi{16-23}, mask[13], zed_selb[1]);
5854Dat[56-63] := MX4 (dat[56-63], dstdhi{24-31}, ddathi{24-31}, dstzhi{24-31}, srczhi{24-31}, mask[14], zed_selb[1]);*/
5855////////////////////////////////////// C++ CODE //////////////////////////////////////
5856 wdata = ((ddat & mask) | (dstd & ~mask)) & 0x00000000000000FFLL;
5857 wdata |= (mask & 0x0100 ? ddat : dstd) & 0x000000000000FF00LL;
5858 wdata |= (mask & 0x0200 ? ddat : dstd) & 0x0000000000FF0000LL;
5859 wdata |= (mask & 0x0400 ? ddat : dstd) & 0x00000000FF000000LL;
5860 wdata |= (mask & 0x0800 ? ddat : dstd) & 0x000000FF00000000LL;
5861 wdata |= (mask & 0x1000 ? ddat : dstd) & 0x0000FF0000000000LL;
5862 wdata |= (mask & 0x2000 ? ddat : dstd) & 0x00FF000000000000LL;
5863 wdata |= (mask & 0x4000 ? ddat : dstd) & 0xFF00000000000000LL;
5864/*if (logBlit)
5865{
5866 printf("\n[ddat=%08X%08X dstd=%08X%08X wdata=%08X%08X mask=%04X]\n",
5867 (uint32_t)(ddat >> 32), (uint32_t)(ddat & 0xFFFFFFFF),
5868 (uint32_t)(dstd >> 32), (uint32_t)(dstd & 0xFFFFFFFF),
5869 (uint32_t)(wdata >> 32), (uint32_t)(wdata & 0xFFFFFFFF), mask);
5870 fflush(stdout);
5871}//*/
5872//This is a crappy way of handling this, but it should work for now...
5873 uint64_t zwdata;
5874 zwdata = ((srcz & mask) | (dstz & ~mask)) & 0x00000000000000FFLL;
5875 zwdata |= (mask & 0x0100 ? srcz : dstz) & 0x000000000000FF00LL;
5876 zwdata |= (mask & 0x0200 ? srcz : dstz) & 0x0000000000FF0000LL;
5877 zwdata |= (mask & 0x0400 ? srcz : dstz) & 0x00000000FF000000LL;
5878 zwdata |= (mask & 0x0800 ? srcz : dstz) & 0x000000FF00000000LL;
5879 zwdata |= (mask & 0x1000 ? srcz : dstz) & 0x0000FF0000000000LL;
5880 zwdata |= (mask & 0x2000 ? srcz : dstz) & 0x00FF000000000000LL;
5881 zwdata |= (mask & 0x4000 ? srcz : dstz) & 0xFF00000000000000LL;
5882if (logBlit)
5883{
5884 WriteLog("\n[srcz=%08X%08X dstz=%08X%08X zwdata=%08X%08X mask=%04X]\n",
5885 (uint32_t)(srcz >> 32), (uint32_t)(srcz & 0xFFFFFFFF),
5886 (uint32_t)(dstz >> 32), (uint32_t)(dstz & 0xFFFFFFFF),
5887 (uint32_t)(zwdata >> 32), (uint32_t)(zwdata & 0xFFFFFFFF), mask);
5888// fflush(stdout);
5889}//*/
5890 srcz = zwdata;
5891//////////////////////////////////////////////////////////////////////////////////////
5892
5893/*Data_enab[0-1] := BUF8 (data_enab[0-1], data_ena);
5894Datadrv[0-31] := TS (wdata[0-31], dat[0-31], data_enab[0]);
5895Datadrv[32-63] := TS (wdata[32-63], dat[32-63], data_enab[1]);
5896
5897Unused[0] := DUMMY (unused[0]);
5898
5899END;*/
5900}
5901
5902
5903/** COMP_CTRL - Comparator output control logic *****************
5904
5905This block is responsible for taking the comparator outputs and
5906using them as appropriate to inhibit writes. Two methods are
5907supported for inhibiting write data:
5908
5909- suppression of the inner loop controlled write operation
5910- a set of eight byte inhibit lines to write back dest data
5911
5912The first technique is used in pixel oriented modes, the second in
5913phrase mode, but the phrase mode form is only applicable to eight
5914and sixteen bit pixel modes.
5915
5916Writes can be suppressed by data being equal, by the Z comparator
5917conditions being met, or by the bit to pixel expansion scheme.
5918
5919Pipe-lining issues: the data derived comparator outputs are stable
5920until the next data read, well after the affected write from this
5921operation. However, the inner counter bits can count immediately
5922before the ack for the last write. Therefore, it is necessary to
5923delay bcompbit select terms by one inner loop pipe-line stage,
5924when generating the select for the data control - the output is
5925delayed one further tick to give it write data timing (2/34).
5926
5927There is also a problem with computed data - the new values are
5928calculated before the write associated with the old value has been
5929performed. This is taken care of within the zed comparator by
5930pipe-lining the comparator inputs where appropriate.
5931*/
5932
5933//#define LOG_COMP_CTRL
5934/*DEF COMP_CTRL (
5935 dbinh\[0..7] // destination byte inhibit lines
5936 nowrite // suppress inner loop write operation
5937 :OUT;
5938 bcompen // bit selector inhibit enable
5939 big_pix // pixels are big-endian
5940 bkgwren // enable dest data write in pix inhibit
5941 clk // co-processor clock
5942 dcomp[0..7] // output of data byte comparators
5943 dcompen // data comparator inhibit enable
5944 icount[0..2] // low bits of inner count
5945 pixsize[0..2] // destination pixel size
5946 phrase_mode // phrase write mode
5947 srcd[0..7] // bits to use for bit to byte expansion
5948 step_inner // inner loop advance
5949 zcomp[0..3] // output of word zed comparators
5950 :IN);*/
//
// COMP_CTRL - turn the data/Z/bit comparator outputs into write inhibits.
//
// Outputs:
//   dbinh       - the eight byte inhibit lines. The netlist generates them active
//                 low (dbinh\); they are inverted just before returning, so a set
//                 bit in the returned value means "inhibit this byte".
//   nowrite     - true when the inner loop write is to be suppressed. Every term
//                 feeding it requires !phrase_mode, and bkgwren forces it false.
// Inputs:
//   bcompen     - bit selector inhibit enable
//   big_pix     - pixels are big-endian (flips which srcd bit icount selects)
//   bkgwren     - enable dest data write in pixel inhibit
//   dcomp       - output of the data byte comparators (bit n = byte n matched)
//   dcompen     - data comparator inhibit enable
//   icount      - inner count; only the low three bits are used
//   pixsize     - destination pixel size (3 = 8-bit, 4 = 16-bit; bit 2 alone is
//                 tested for the phrase mode byte inhibits)
//   phrase_mode - phrase write mode
//   srcd        - bits to use for bit to byte expansion
//   zcomp       - output of the word zed comparators (bit n = word n)
//
// The clk and step_inner inputs of the netlist have no equivalent here: the one
// stage pipeline delay on bcompbit (bcompbitp) is not modelled, so winhibit uses
// the undelayed bcompbit.
//
void COMP_CTRL(uint8_t &dbinh, bool &nowrite,
	bool bcompen, bool big_pix, bool bkgwren, uint8_t dcomp, bool dcompen, uint8_t icount,
	uint8_t pixsize, bool phrase_mode, uint8_t srcd, uint8_t zcomp)
{
//BEGIN

/*Bkgwren\ := INV1 (bkgwren\, bkgwren);
Phrase_mode\ := INV1 (phrase_mode\, phrase_mode);
Pixsize\[0-2] := INV2 (pixsize\[0-2], pixsize[0-2]);*/

/* The bit comparator bits are derived from the source data, which
will have been suitably aligned for phrase mode. The contents of
the inner counter are used to select which bit to use.

When not in phrase mode the inner count value is used to select
one bit. It is assumed that the count has already occurred, so,
7 selects bit 0, etc. In big-endian pixel mode, this turns round,
so that a count of 7 selects bit 7.

In phrase mode, the eight bits are used directly, and this mode is
only applicable to 8-bit pixel mode (2/34) */

/*Bcompselt[0-2] := EO (bcompselt[0-2], icount[0-2], big_pix);
Bcompbit := MX8 (bcompbit, srcd[7], srcd[6], srcd[5],
 srcd[4], srcd[3], srcd[2], srcd[1], srcd[0], bcompselt[0..2]);
Bcompbit\ := INV1 (bcompbit\, bcompbit);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
#ifdef LOG_COMP_CTRL
	if (logBlit)
	{
		WriteLog("\n [bcompen=%s dcompen=%s phrase_mode=%s bkgwren=%s dcomp=%02X zcomp=%02X]", (bcompen ? "T" : "F"), (dcompen ? "T" : "F"), (phrase_mode ? "T" : "F"), (bkgwren ? "T" : "F"), dcomp, zcomp);
		WriteLog("\n ");
	}
#endif
	// XOR of the low count bits with big_pix; select value 0 picks srcd[7],
	// select value 7 picks srcd[0] (the MX8 input order above).
	const uint8_t bcompselt = (big_pix ? ~icount : icount) & 0x07;
	const bool bcompbit = (srcd & (0x80 >> bcompselt)) != 0;
//////////////////////////////////////////////////////////////////////////////////////

/* pipe-line the count */
/*Bcompsel[0-2] := FDSYNC (bcompsel[0-2], bcompselt[0-2], step_inner, clk);
Bcompbt := MX8 (bcompbitpt, srcd[7], srcd[6], srcd[5],
 srcd[4], srcd[3], srcd[2], srcd[1], srcd[0], bcompsel[0..2]);
Bcompbitp := FD1Q (bcompbitp, bcompbitpt, clk);
Bcompbitp\ := INV1 (bcompbitp\, bcompbitp);*/

/* For pixel mode, generate the write inhibit signal for all modes
on bit inhibit, for 8 and 16 bit modes on comparator inhibit, and
for 16 bit mode on Z inhibit

Nowrite = bcompen . /bcompbit . /phrase_mode
 + dcompen . dcomp[0] . /phrase_mode . pixsize = 011
 + dcompen . dcomp[0..1] . /phrase_mode . pixsize = 100
 + zcomp[0] . /phrase_mode . pixsize = 100
*/

/*Nowt0 := NAN3 (nowt[0], bcompen, bcompbit\, phrase_mode\);
Nowt1 := ND6 (nowt[1], dcompen, dcomp[0], phrase_mode\, pixsize\[2], pixsize[0..1]);
Nowt2 := ND7 (nowt[2], dcompen, dcomp[0..1], phrase_mode\, pixsize[2], pixsize\[0..1]);
Nowt3 := NAN5 (nowt[3], zcomp[0], phrase_mode\, pixsize[2], pixsize\[0..1]);
Nowt4 := NAN4 (nowt[4], nowt[0..3]);
Nowrite := AN2 (nowrite, nowt[4], bkgwren\);*/

/*Winht := NAN3 (winht, bcompen, bcompbitp\, phrase_mode\);
Winhibit := NAN4 (winhibit, winht, nowt[1..3]);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
	// In the netlist winhibit differs from nowt[4] only by using the pipelined
	// bcompbitp. That delay is not modelled, so both collapse to one expression
	// here and nowrite is simply winhibit gated by !bkgwren.
	const bool is8bpp = (pixsize == 3);
	const bool is16bpp = (pixsize == 4);
	const bool winhibit = !phrase_mode
		&& ((bcompen && !bcompbit)
			|| (dcompen && (dcomp & 0x01) && is8bpp)
			|| (dcompen && ((dcomp & 0x03) == 0x03) && is16bpp)
			|| ((zcomp & 0x01) && is16bpp));
	nowrite = winhibit && !bkgwren;
#ifdef LOG_COMP_CTRL
	if (logBlit)
		WriteLog("[nw=%s wi=%s]", (nowrite ? "T" : "F"), (winhibit ? "T" : "F"));
#endif
//////////////////////////////////////////////////////////////////////////////////////

/* For phrase mode, generate the byte inhibit signals for eight bit
mode 011, or sixteen bit mode 100
dbinh\[0] = pixsize[2] . zcomp[0]
 + pixsize[2] . dcomp[0] . dcomp[1] . dcompen
 + /pixsize[2] . dcomp[0] . dcompen
 + /srcd[0] . bcompen

Inhibits 0-3 are also used when not in phrase mode to write back
destination data.
*/

/*Srcd\[0-7] := INV1 (srcd\[0-7], srcd[0-7]);

Di0t0 := NAN2H (di0t[0], pixsize[2], zcomp[0]);
Di0t1 := NAN4H (di0t[1], pixsize[2], dcomp[0..1], dcompen);
Di0t2 := NAN2 (di0t[2], srcd\[0], bcompen);
Di0t3 := NAN3 (di0t[3], pixsize\[2], dcomp[0], dcompen);
Di0t4 := NAN4 (di0t[4], di0t[0..3]);
Dbinh[0] := ANR1P (dbinh\[0], di0t[4], phrase_mode, winhibit);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
	// dbinh_n accumulates the active low dbinh\ lines exactly as the netlist
	// defines them; the inversion to active high happens once at the end.
	// Each diNt0_1 term is shared by the two bytes of one 16-bit word.
	uint8_t dbinh_n = 0;
	const bool pixsize2 = (pixsize & 0x04) != 0;

	const bool di0t0_1 = pixsize2
		&& ((zcomp & 0x01) || ((dcomp & 0x01) && (dcomp & 0x02) && dcompen));
	const bool di0t4 = di0t0_1
		|| (!(srcd & 0x01) && bcompen)
		|| (!pixsize2 && (dcomp & 0x01) && dcompen);

	if (!((di0t4 && phrase_mode) || winhibit))
		dbinh_n |= 0x01;
#ifdef LOG_COMP_CTRL
	if (logBlit)
		WriteLog("[di0t0_1=%s di0t4=%s]", (di0t0_1 ? "T" : "F"), (di0t4 ? "T" : "F"));
#endif
//////////////////////////////////////////////////////////////////////////////////////

/*Di1t0 := NAN3 (di1t[0], pixsize\[2], dcomp[1], dcompen);
Di1t1 := NAN2 (di1t[1], srcd\[1], bcompen);
Di1t2 := NAN4 (di1t[2], di0t[0..1], di1t[0..1]);
Dbinh[1] := ANR1 (dbinh\[1], di1t[2], phrase_mode, winhibit);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
	const bool di1t2 = di0t0_1
		|| (!(srcd & 0x02) && bcompen)
		|| (!pixsize2 && (dcomp & 0x02) && dcompen);

	if (!((di1t2 && phrase_mode) || winhibit))
		dbinh_n |= 0x02;
#ifdef LOG_COMP_CTRL
	if (logBlit)
		WriteLog("[di1t2=%s]", (di1t2 ? "T" : "F"));
#endif
//////////////////////////////////////////////////////////////////////////////////////

/*Di2t0 := NAN2H (di2t[0], pixsize[2], zcomp[1]);
Di2t1 := NAN4H (di2t[1], pixsize[2], dcomp[2..3], dcompen);
Di2t2 := NAN2 (di2t[2], srcd\[2], bcompen);
Di2t3 := NAN3 (di2t[3], pixsize\[2], dcomp[2], dcompen);
Di2t4 := NAN4 (di2t[4], di2t[0..3]);
Dbinh[2] := ANR1 (dbinh\[2], di2t[4], phrase_mode, winhibit);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
//[bcompen=F dcompen=T phrase_mode=T bkgwren=F][nw=F wi=F]
//[di0t0_1=F di0t4=F][di1t2=F][di2t0_1=T di2t4=T][di3t2=T][di4t0_1=F di2t4=F][di5t2=F][di6t0_1=F di6t4=F][di7t2=F]
//[dcomp=$00 dbinh=$0C][7804780400007804] (icount=0005, inc=4)
	const bool di2t0_1 = pixsize2
		&& ((zcomp & 0x02) || ((dcomp & 0x04) && (dcomp & 0x08) && dcompen));
	const bool di2t4 = di2t0_1
		|| (!(srcd & 0x04) && bcompen)
		|| (!pixsize2 && (dcomp & 0x04) && dcompen);

	if (!((di2t4 && phrase_mode) || winhibit))
		dbinh_n |= 0x04;
#ifdef LOG_COMP_CTRL
	if (logBlit)
		WriteLog("[di2t0_1=%s di2t4=%s]", (di2t0_1 ? "T" : "F"), (di2t4 ? "T" : "F"));
#endif
//////////////////////////////////////////////////////////////////////////////////////

/*Di3t0 := NAN3 (di3t[0], pixsize\[2], dcomp[3], dcompen);
Di3t1 := NAN2 (di3t[1], srcd\[3], bcompen);
Di3t2 := NAN4 (di3t[2], di2t[0..1], di3t[0..1]);
Dbinh[3] := ANR1 (dbinh\[3], di3t[2], phrase_mode, winhibit);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
	const bool di3t2 = di2t0_1
		|| (!(srcd & 0x08) && bcompen)
		|| (!pixsize2 && (dcomp & 0x08) && dcompen);

	if (!((di3t2 && phrase_mode) || winhibit))
		dbinh_n |= 0x08;
#ifdef LOG_COMP_CTRL
	if (logBlit)
		WriteLog("[di3t2=%s]", (di3t2 ? "T" : "F"));
#endif
//////////////////////////////////////////////////////////////////////////////////////

/*Di4t0 := NAN2H (di4t[0], pixsize[2], zcomp[2]);
Di4t1 := NAN4H (di4t[1], pixsize[2], dcomp[4..5], dcompen);
Di4t2 := NAN2 (di4t[2], srcd\[4], bcompen);
Di4t3 := NAN3 (di4t[3], pixsize\[2], dcomp[4], dcompen);
Di4t4 := NAN4 (di4t[4], di4t[0..3]);
Dbinh[4] := NAN2 (dbinh\[4], di4t[4], phrase_mode);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
	// Inhibits 4-7 are plain NAN2s in the netlist: winhibit does not feed them.
	const bool di4t0_1 = pixsize2
		&& ((zcomp & 0x04) || ((dcomp & 0x10) && (dcomp & 0x20) && dcompen));
	const bool di4t4 = di4t0_1
		|| (!(srcd & 0x10) && bcompen)
		|| (!pixsize2 && (dcomp & 0x10) && dcompen);

	if (!(di4t4 && phrase_mode))
		dbinh_n |= 0x10;
#ifdef LOG_COMP_CTRL
	if (logBlit)
		// Label corrected: this value is di4t4 (it used to be printed as "di2t4").
		WriteLog("[di4t0_1=%s di4t4=%s]", (di4t0_1 ? "T" : "F"), (di4t4 ? "T" : "F"));
#endif
//////////////////////////////////////////////////////////////////////////////////////

/*Di5t0 := NAN3 (di5t[0], pixsize\[2], dcomp[5], dcompen);
Di5t1 := NAN2 (di5t[1], srcd\[5], bcompen);
Di5t2 := NAN4 (di5t[2], di4t[0..1], di5t[0..1]);
Dbinh[5] := NAN2 (dbinh\[5], di5t[2], phrase_mode);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
	const bool di5t2 = di4t0_1
		|| (!(srcd & 0x20) && bcompen)
		|| (!pixsize2 && (dcomp & 0x20) && dcompen);

	if (!(di5t2 && phrase_mode))
		dbinh_n |= 0x20;
#ifdef LOG_COMP_CTRL
	if (logBlit)
		WriteLog("[di5t2=%s]", (di5t2 ? "T" : "F"));
#endif
//////////////////////////////////////////////////////////////////////////////////////

/*Di6t0 := NAN2H (di6t[0], pixsize[2], zcomp[3]);
Di6t1 := NAN4H (di6t[1], pixsize[2], dcomp[6..7], dcompen);
Di6t2 := NAN2 (di6t[2], srcd\[6], bcompen);
Di6t3 := NAN3 (di6t[3], pixsize\[2], dcomp[6], dcompen);
Di6t4 := NAN4 (di6t[4], di6t[0..3]);
Dbinh[6] := NAN2 (dbinh\[6], di6t[4], phrase_mode);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
	const bool di6t0_1 = pixsize2
		&& ((zcomp & 0x08) || ((dcomp & 0x40) && (dcomp & 0x80) && dcompen));
	const bool di6t4 = di6t0_1
		|| (!(srcd & 0x40) && bcompen)
		|| (!pixsize2 && (dcomp & 0x40) && dcompen);

	if (!(di6t4 && phrase_mode))
		dbinh_n |= 0x40;
#ifdef LOG_COMP_CTRL
	if (logBlit)
		WriteLog("[di6t0_1=%s di6t4=%s]", (di6t0_1 ? "T" : "F"), (di6t4 ? "T" : "F"));
#endif
//////////////////////////////////////////////////////////////////////////////////////

/*Di7t0 := NAN3 (di7t[0], pixsize\[2], dcomp[7], dcompen);
Di7t1 := NAN2 (di7t[1], srcd\[7], bcompen);
Di7t2 := NAN4 (di7t[2], di6t[0..1], di7t[0..1]);
Dbinh[7] := NAN2 (dbinh\[7], di7t[2], phrase_mode);*/
////////////////////////////////////// C++ CODE //////////////////////////////////////
	const bool di7t2 = di6t0_1
		|| (!(srcd & 0x80) && bcompen)
		|| (!pixsize2 && (dcomp & 0x80) && dcompen);

	if (!(di7t2 && phrase_mode))
		dbinh_n |= 0x80;
#ifdef LOG_COMP_CTRL
	if (logBlit)
		WriteLog("[di7t2=%s]", (di7t2 ? "T" : "F"));
#endif
//////////////////////////////////////////////////////////////////////////////////////

//END;
	// Kludge kept from the original: hand the lines back active high (set bit =
	// byte inhibited) rather than as the active low dbinh\ of the netlist.
	dbinh = (uint8_t)~dbinh_n;
#ifdef LOG_COMP_CTRL
	if (logBlit)
		WriteLog("[dcomp=$%02X dbinh=$%02X]\n ", dcomp, dbinh);
#endif
}
6229
6230
6231////////////////////////////////////// C++ CODE //////////////////////////////////////
6232//////////////////////////////////////////////////////////////////////////////////////
6233
6234// !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!!
6235// !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!!
6236// !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!! TESTING !!!
6237
6238#endif
6239