2 * QEMU ATI SVGA emulation
5 * Copyright (c) 2019 BALATON Zoltan
7 * This work is licensed under the GNU GPL license version 2 or later.
10 #include "qemu/osdep.h"
14 #include "ui/pixel_ops.h"
15 #include "ui/console.h"
19 * This is 2D _acceleration_ and supposed to be fast. Therefore, don't try to
20 * reinvent the wheel (unlikely to get better with a naive implementation than
21 * existing libraries) and avoid (poorly) reimplementing gfx primitives.
22 * That is unnecessary and would become a performance problem. Instead, try to
23 * map to and reuse existing optimised facilities (e.g. pixman) wherever possible.
/*
 * Derive the bits-per-pixel value used by the 2D engine from the low four
 * bits of the dp_datatype register (the caller stores the result in an int
 * named bpp).
 *
 * A datatype that the switch does not recognise is reported through
 * qemu_log_mask(LOG_UNIMP, ...), presumably from the default case.
 *
 * NOTE(review): the case labels and return statements of this switch are not
 * visible in this listing, so the datatype to bpp mapping and the value
 * returned for an unknown datatype cannot be stated here. Confirm against the
 * complete file.
 */
27 static int ati_bpp_from_datatype(ATIVGAState
*s
)
/* Only the low nibble of dp_datatype selects the pixel format. */
29 switch (s
->regs
.dp_datatype
& 0xf) {
/* Unknown format: log it as unimplemented together with the raw nibble. */
40 qemu_log_mask(LOG_UNIMP
, "Unknown dst datatype %d\n",
41 s
->regs
.dp_datatype
& 0xf);
/*
 * Tests the GMC_DST_PITCH_OFFSET_CNTL bit of dp_gui_master_cntl.
 * The expansion refers to a variable named s, so it can only be used where
 * such a state pointer is in scope.
 * In ati_2d_blt a non-zero result selects the per-operation src/dst pitch and
 * offset registers, and zero selects default_pitch and default_offset.
 */
46 #define DEFAULT_CNTL (s->regs.dp_gui_master_cntl & GMC_DST_PITCH_OFFSET_CNTL)
/*
 * Execute the 2D operation currently described by the registers in s->regs.
 *
 * The destination rectangle, pitch and start address are derived from the
 * registers and checked against the end of VRAM. Failures are logged.
 * The operation is then selected by the ROP3 field of dp_mix. The code
 * visible here contains a source to destination copy path and a fill path.
 * Each tries pixman first (gated by bits of s->use_pixman) and has a plain C
 * fallback loop. A ROP that is not handled is logged as unimplemented.
 *
 * When the destination lies inside the displayed framebuffer area the
 * affected VRAM range is marked dirty, and the destination position
 * registers are updated afterwards.
 *
 * NOTE(review): this listing omits lines of the function (braces, case
 * labels, several conditions and returns). The comments below are limited to
 * what the visible lines establish, and anything else is marked as a review
 * note.
 */
48 void ati_2d_blt(ATIVGAState
*s
)
50 /* FIXME it is probably more complex than this and may need to be */
51 /* rewritten but for now as a start just to get some output: */
52 DisplaySurface
*ds
= qemu_console_surface(s
->vga
.con
);
53 DPRINTF("%p %u ds: %p %d %d rop: %x\n", s
->vga
.vram_ptr
,
54 s
->vga
.vbe_start_addr
, surface_data(ds
), surface_stride(ds
),
55 surface_bits_per_pixel(ds
),
56 (s
->regs
.dp_mix
& GMC_ROP3_MASK
) >> 16);
/*
 * Start coordinates of the destination rectangle. When the direction flag
 * is clear the start is computed as register + 1 - extent, otherwise the
 * register value is used as is.
 */
57 unsigned dst_x
= (s
->regs
.dp_cntl
& DST_X_LEFT_TO_RIGHT
?
58 s
->regs
.dst_x
: s
->regs
.dst_x
+ 1 - s
->regs
.dst_width
);
59 unsigned dst_y
= (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
?
60 s
->regs
.dst_y
: s
->regs
.dst_y
+ 1 - s
->regs
.dst_height
);
61 int bpp
= ati_bpp_from_datatype(s
);
/*
 * NOTE(review): the condition guarding this message is not visible here.
 * Presumably it is taken when bpp is zero. Confirm against the full file.
 */
63 qemu_log_mask(LOG_GUEST_ERROR
, "Invalid bpp\n");
/* DEFAULT_CNTL non-zero selects dst_pitch, otherwise default_pitch. */
66 int dst_stride
= DEFAULT_CNTL
? s
->regs
.dst_pitch
: s
->regs
.default_pitch
;
/* NOTE(review): guarding condition not visible, presumably dst_stride == 0. */
68 qemu_log_mask(LOG_GUEST_ERROR
, "Zero dest pitch\n");
/* Destination base address inside VRAM, chosen the same way as the pitch. */
71 uint8_t *dst_bits
= s
->vga
.vram_ptr
+ (DEFAULT_CNTL
?
72 s
->regs
.dst_offset
: s
->regs
.default_offset
);
/*
 * For the PCI_DEVICE_ID_ATI_RAGE128_PF device the destination is additionally
 * offset by the low 27 bits of crtc_offset.
 */
74 if (s
->dev_id
== PCI_DEVICE_ID_ATI_RAGE128_PF
) {
75 dst_bits
+= s
->regs
.crtc_offset
& 0x07ffffff;
/* One past the last byte of VRAM, used by the bounds checks below. */
78 uint8_t *end
= s
->vga
.vram_ptr
+ s
->vga
.vram_size
;
/*
 * Reject coordinates above 0x3fff and destinations reaching the end of VRAM.
 * NOTE(review): part of this condition is not visible in the listing.
 */
79 if (dst_x
> 0x3fff || dst_y
> 0x3fff || dst_bits
>= end
81 + (dst_y
+ s
->regs
.dst_height
) * dst_stride
>= end
) {
82 qemu_log_mask(LOG_UNIMP
, "blt outside vram not implemented\n");
85 DPRINTF("%d %d %d, %d %d %d, (%d,%d) -> (%d,%d) %dx%d %c %c\n",
86 s
->regs
.src_offset
, s
->regs
.dst_offset
, s
->regs
.default_offset
,
87 s
->regs
.src_pitch
, s
->regs
.dst_pitch
, s
->regs
.default_pitch
,
88 s
->regs
.src_x
, s
->regs
.src_y
, dst_x
, dst_y
,
89 s
->regs
.dst_width
, s
->regs
.dst_height
,
90 (s
->regs
.dp_cntl
& DST_X_LEFT_TO_RIGHT
? '>' : '<'),
91 (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
? 'v' : '^'));
/*
 * Dispatch on the raster operation (ROP3 field of dp_mix).
 * NOTE(review): the case labels are not visible in this listing.
 */
92 switch (s
->regs
.dp_mix
& GMC_ROP3_MASK
) {
/* Copy path: set when the pixman attempt fails. */
95 bool fallback
= false;
/* Source start coordinates, derived like dst_x and dst_y above. */
96 unsigned src_x
= (s
->regs
.dp_cntl
& DST_X_LEFT_TO_RIGHT
?
97 s
->regs
.src_x
: s
->regs
.src_x
+ 1 - s
->regs
.dst_width
);
98 unsigned src_y
= (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
?
99 s
->regs
.src_y
: s
->regs
.src_y
+ 1 - s
->regs
.dst_height
);
100 int src_stride
= DEFAULT_CNTL
?
101 s
->regs
.src_pitch
: s
->regs
.default_pitch
;
/* NOTE(review): guarding condition not visible, presumably src_stride == 0. */
103 qemu_log_mask(LOG_GUEST_ERROR
, "Zero source pitch\n");
106 uint8_t *src_bits
= s
->vga
.vram_ptr
+ (DEFAULT_CNTL
?
107 s
->regs
.src_offset
: s
->regs
.default_offset
);
/* Same crtc_offset adjustment as applied to the destination. */
109 if (s
->dev_id
== PCI_DEVICE_ID_ATI_RAGE128_PF
) {
110 src_bits
+= s
->regs
.crtc_offset
& 0x07ffffff;
/*
 * Bounds check for the source, mirroring the destination check.
 * NOTE(review): part of this condition is not visible in the listing.
 */
113 if (src_x
> 0x3fff || src_y
> 0x3fff || src_bits
>= end
115 + (src_y
+ s
->regs
.dst_height
) * src_stride
>= end
) {
116 qemu_log_mask(LOG_UNIMP
, "blt outside vram not implemented\n");
/* Strides are passed to pixman_blt in uint32_t units, so divide by four. */
120 src_stride
/= sizeof(uint32_t);
121 dst_stride
/= sizeof(uint32_t);
122 DPRINTF("pixman_blt(%p, %p, %d, %d, %d, %d, %d, %d, %d, %d, %d, %d)\n",
123 src_bits
, dst_bits
, src_stride
, dst_stride
, bpp
, bpp
,
124 src_x
, src_y
, dst_x
, dst_y
,
125 s
->regs
.dst_width
, s
->regs
.dst_height
);
/*
 * Direct pixman copy: only when bit 1 of use_pixman is set and the blit
 * runs left to right and top to bottom.
 */
127 if ((s
->use_pixman
& BIT(1)) &&
128 s
->regs
.dp_cntl
& DST_X_LEFT_TO_RIGHT
&&
129 s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
) {
130 fallback
= !pixman_blt((uint32_t *)src_bits
, (uint32_t *)dst_bits
,
131 src_stride
, dst_stride
, bpp
, bpp
,
132 src_x
, src_y
, dst_x
, dst_y
,
133 s
->regs
.dst_width
, s
->regs
.dst_height
);
/* Other directions with pixman enabled: copy through a temporary buffer. */
134 } else if (s
->use_pixman
& BIT(1)) {
135 /* FIXME: We only really need a temporary if src and dst overlap */
/*
 * llb is the number of bytes in one line of the rectangle, and tmp_stride is
 * that length rounded up to whole uint32_t units.
 * NOTE(review): the rest of the g_malloc size expression is not visible.
 */
136 int llb
= s
->regs
.dst_width
* (bpp
/ 8);
137 int tmp_stride
= DIV_ROUND_UP(llb
, sizeof(uint32_t));
138 uint32_t *tmp
= g_malloc(tmp_stride
* sizeof(uint32_t) *
/* First step: source rectangle into the temporary buffer. */
140 fallback
= !pixman_blt((uint32_t *)src_bits
, tmp
,
141 src_stride
, tmp_stride
, bpp
, bpp
,
143 s
->regs
.dst_width
, s
->regs
.dst_height
);
/*
 * Second step: temporary buffer into the destination.
 * NOTE(review): as listed, this assignment overwrites the result of the first
 * pixman_blt, and no g_free of tmp is visible. A guarding condition and the
 * free may be among the omitted lines. Confirm against the full file.
 */
145 fallback
= !pixman_blt(tmp
, (uint32_t *)dst_bits
,
146 tmp_stride
, dst_stride
, bpp
, bpp
,
148 s
->regs
.dst_width
, s
->regs
.dst_height
);
/*
 * C fallback: copy the rectangle one line at a time.
 * NOTE(review): the condition selecting this path is not visible here.
 * Pitches are converted back from uint32_t units to bytes because dst_bits
 * and src_bits are indexed as byte arrays below.
 */
157 unsigned int y
, i
, j
, bypp
= bpp
/ 8;
158 unsigned int src_pitch
= src_stride
* sizeof(uint32_t);
159 unsigned int dst_pitch
= dst_stride
* sizeof(uint32_t);
161 for (y
= 0; y
< s
->regs
.dst_height
; y
++) {
/*
 * Lines are visited in the order given by the Y direction flag.
 * NOTE(review): i and j are only advanced with += here, and their per-line
 * initialisation is not visible in this listing.
 */
164 if (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
) {
165 i
+= (dst_y
+ y
) * dst_pitch
;
166 j
+= (src_y
+ y
) * src_pitch
;
168 i
+= (dst_y
+ s
->regs
.dst_height
- 1 - y
) * dst_pitch
;
169 j
+= (src_y
+ s
->regs
.dst_height
- 1 - y
) * src_pitch
;
/* memmove is used, so source and destination lines may overlap. */
171 memmove(&dst_bits
[i
], &src_bits
[j
], s
->regs
.dst_width
* bypp
);
/*
 * Mark VRAM dirty only when the destination base lies inside the area that
 * starts at vbe_start_addr and spans YRES lines of vbe_line_offset bytes.
 */
174 if (dst_bits
>= s
->vga
.vram_ptr
+ s
->vga
.vbe_start_addr
&&
175 dst_bits
< s
->vga
.vram_ptr
+ s
->vga
.vbe_start_addr
+
176 s
->vga
.vbe_regs
[VBE_DISPI_INDEX_YRES
] * s
->vga
.vbe_line_offset
) {
/*
 * The dirty range is dst_height lines of surface_stride(ds) bytes.
 * NOTE(review): part of the start address expression is not visible.
 */
177 memory_region_set_dirty(&s
->vga
.vram
, s
->vga
.vbe_start_addr
+
179 dst_y
* surface_stride(ds
),
180 s
->regs
.dst_height
* surface_stride(ds
));
/*
 * Update the destination position registers: in the forward direction they
 * advance by the rectangle extent, otherwise they are set to the computed
 * start coordinate.
 */
182 s
->regs
.dst_x
= (s
->regs
.dp_cntl
& DST_X_LEFT_TO_RIGHT
?
183 dst_x
+ s
->regs
.dst_width
: dst_x
);
184 s
->regs
.dst_y
= (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
?
185 dst_y
+ s
->regs
.dst_height
: dst_y
);
/*
 * Fill path: choose the fill value according to the ROP.
 * NOTE(review): the case labels and the declaration of filler are not
 * visible in this listing.
 */
194 switch (s
->regs
.dp_mix
& GMC_ROP3_MASK
) {
/* Fill with the brush foreground colour register. */
196 filler
= s
->regs
.dp_brush_frgd_clr
;
/* Fill with 0xff in bits 24-31 plus the colour in palette bytes 0 to 2. */
199 filler
= 0xffUL
<< 24 | rgb_to_pixel32(s
->vga
.palette
[0],
200 s
->vga
.palette
[1], s
->vga
.palette
[2]);
/* Fill with 0xff in bits 24-31 plus the colour in palette bytes 3 to 5. */
203 filler
= 0xffUL
<< 24 | rgb_to_pixel32(s
->vga
.palette
[3],
204 s
->vga
.palette
[4], s
->vga
.palette
[5]);
/* The stride is passed to pixman_fill in uint32_t units. */
208 dst_stride
/= sizeof(uint32_t);
209 DPRINTF("pixman_fill(%p, %d, %d, %d, %d, %d, %d, %x)\n",
210 dst_bits
, dst_stride
, bpp
, dst_x
, dst_y
,
211 s
->regs
.dst_width
, s
->regs
.dst_height
, filler
);
/*
 * The C loop below runs when bit 0 of use_pixman is clear or when
 * pixman_fill reports failure. Short-circuit evaluation means pixman_fill is
 * not called at all when the bit is clear.
 */
213 if (!(s
->use_pixman
& BIT(0)) ||
214 !pixman_fill((uint32_t *)dst_bits
, dst_stride
, bpp
, dst_x
, dst_y
,
215 s
->regs
.dst_width
, s
->regs
.dst_height
, filler
))
218 /* fallback when pixman failed or we don't want to call it */
219 unsigned int x
, y
, i
, bypp
= bpp
/ 8;
220 unsigned int dst_pitch
= dst_stride
* sizeof(uint32_t);
221 for (y
= 0; y
< s
->regs
.dst_height
; y
++) {
/* Byte index of the first pixel of this line. */
222 i
= dst_x
* bypp
+ (dst_y
+ y
) * dst_pitch
;
223 for (x
= 0; x
< s
->regs
.dst_width
; x
++, i
+= bypp
) {
/* Store one pixel of bypp bytes (presumably host-endian, given the helper name). */
224 stn_he_p(&dst_bits
[i
], bypp
, filler
);
/* Same visible-area test and dirty marking as in the copy path. */
228 if (dst_bits
>= s
->vga
.vram_ptr
+ s
->vga
.vbe_start_addr
&&
229 dst_bits
< s
->vga
.vram_ptr
+ s
->vga
.vbe_start_addr
+
230 s
->vga
.vbe_regs
[VBE_DISPI_INDEX_YRES
] * s
->vga
.vbe_line_offset
) {
231 memory_region_set_dirty(&s
->vga
.vram
, s
->vga
.vbe_start_addr
+
233 dst_y
* surface_stride(ds
),
234 s
->regs
.dst_height
* surface_stride(ds
));
/*
 * NOTE(review): only the dst_y update is visible for the fill path. Whether
 * dst_x is also updated cannot be told from this listing.
 */
236 s
->regs
.dst_y
= (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
?
237 dst_y
+ s
->regs
.dst_height
: dst_y
);
/* A ROP not handled above is logged as unimplemented (presumably the default case). */
241 qemu_log_mask(LOG_UNIMP
, "Unimplemented ati_2d blt op %x\n",
242 (s
->regs
.dp_mix
& GMC_ROP3_MASK
) >> 16);