/*
 * QEMU ATI SVGA emulation
 *
 * Copyright (c) 2019 BALATON Zoltan
 *
 * This work is licensed under the GNU GPL license version 2 or later.
 */
10 #include "qemu/osdep.h"
14 #include "ui/pixel_ops.h"
15 #include "ui/console.h"
/*
 * This is 2D _acceleration_ and supposed to be fast. Therefore, don't try to
 * reinvent the wheel (unlikely to get better with a naive implementation than
 * existing libraries) and avoid (poorly) reimplementing gfx primitives.
 * That is unnecessary and would become a performance problem. Instead, try to
 * map to and reuse existing optimised facilities (e.g. pixman) wherever
 * possible.
 */
27 static int ati_bpp_from_datatype(ATIVGAState
*s
)
29 switch (s
->regs
.dp_datatype
& 0xf) {
40 qemu_log_mask(LOG_UNIMP
, "Unknown dst datatype %d\n",
41 s
->regs
.dp_datatype
& 0xf);
/*
 * Non-zero when the GMC_DST_PITCH_OFFSET_CNTL bit is set in
 * dp_gui_master_cntl. ati_2d_blt() uses it to choose between the dedicated
 * src/dst pitch and offset registers (bit set) and the default_pitch /
 * default_offset registers (bit clear).
 *
 * The expansion refers to a variable named `s` that must be in scope at the
 * point of use.
 */
#define DEFAULT_CNTL (s->regs.dp_gui_master_cntl & GMC_DST_PITCH_OFFSET_CNTL)
48 void ati_2d_blt(ATIVGAState
*s
)
50 /* FIXME it is probably more complex than this and may need to be */
51 /* rewritten but for now as a start just to get some output: */
52 DisplaySurface
*ds
= qemu_console_surface(s
->vga
.con
);
53 DPRINTF("%p %u ds: %p %d %d rop: %x\n", s
->vga
.vram_ptr
,
54 s
->vga
.vbe_start_addr
, surface_data(ds
), surface_stride(ds
),
55 surface_bits_per_pixel(ds
),
56 (s
->regs
.dp_mix
& GMC_ROP3_MASK
) >> 16);
57 unsigned dst_x
= (s
->regs
.dp_cntl
& DST_X_LEFT_TO_RIGHT
?
58 s
->regs
.dst_x
: s
->regs
.dst_x
+ 1 - s
->regs
.dst_width
);
59 unsigned dst_y
= (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
?
60 s
->regs
.dst_y
: s
->regs
.dst_y
+ 1 - s
->regs
.dst_height
);
61 int bpp
= ati_bpp_from_datatype(s
);
63 qemu_log_mask(LOG_GUEST_ERROR
, "Invalid bpp\n");
66 int dst_stride
= DEFAULT_CNTL
? s
->regs
.dst_pitch
: s
->regs
.default_pitch
;
68 qemu_log_mask(LOG_GUEST_ERROR
, "Zero dest pitch\n");
71 uint8_t *dst_bits
= s
->vga
.vram_ptr
+ (DEFAULT_CNTL
?
72 s
->regs
.dst_offset
: s
->regs
.default_offset
);
74 if (s
->dev_id
== PCI_DEVICE_ID_ATI_RAGE128_PF
) {
75 dst_bits
+= s
->regs
.crtc_offset
& 0x07ffffff;
78 uint8_t *end
= s
->vga
.vram_ptr
+ s
->vga
.vram_size
;
79 if (dst_x
> 0x3fff || dst_y
> 0x3fff || dst_bits
>= end
81 + (dst_y
+ s
->regs
.dst_height
) * dst_stride
>= end
) {
82 qemu_log_mask(LOG_UNIMP
, "blt outside vram not implemented\n");
85 DPRINTF("%d %d %d, %d %d %d, (%d,%d) -> (%d,%d) %dx%d %c %c\n",
86 s
->regs
.src_offset
, s
->regs
.dst_offset
, s
->regs
.default_offset
,
87 s
->regs
.src_pitch
, s
->regs
.dst_pitch
, s
->regs
.default_pitch
,
88 s
->regs
.src_x
, s
->regs
.src_y
, dst_x
, dst_y
,
89 s
->regs
.dst_width
, s
->regs
.dst_height
,
90 (s
->regs
.dp_cntl
& DST_X_LEFT_TO_RIGHT
? '>' : '<'),
91 (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
? 'v' : '^'));
92 switch (s
->regs
.dp_mix
& GMC_ROP3_MASK
) {
95 bool fallback
= false;
96 unsigned src_x
= (s
->regs
.dp_cntl
& DST_X_LEFT_TO_RIGHT
?
97 s
->regs
.src_x
: s
->regs
.src_x
+ 1 - s
->regs
.dst_width
);
98 unsigned src_y
= (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
?
99 s
->regs
.src_y
: s
->regs
.src_y
+ 1 - s
->regs
.dst_height
);
100 int src_stride
= DEFAULT_CNTL
?
101 s
->regs
.src_pitch
: s
->regs
.default_pitch
;
103 qemu_log_mask(LOG_GUEST_ERROR
, "Zero source pitch\n");
106 uint8_t *src_bits
= s
->vga
.vram_ptr
+ (DEFAULT_CNTL
?
107 s
->regs
.src_offset
: s
->regs
.default_offset
);
109 if (s
->dev_id
== PCI_DEVICE_ID_ATI_RAGE128_PF
) {
110 src_bits
+= s
->regs
.crtc_offset
& 0x07ffffff;
113 if (src_x
> 0x3fff || src_y
> 0x3fff || src_bits
>= end
115 + (src_y
+ s
->regs
.dst_height
) * src_stride
>= end
) {
116 qemu_log_mask(LOG_UNIMP
, "blt outside vram not implemented\n");
120 src_stride
/= sizeof(uint32_t);
121 dst_stride
/= sizeof(uint32_t);
122 DPRINTF("pixman_blt(%p, %p, %d, %d, %d, %d, %d, %d, %d, %d, %d, %d)\n",
123 src_bits
, dst_bits
, src_stride
, dst_stride
, bpp
, bpp
,
124 src_x
, src_y
, dst_x
, dst_y
,
125 s
->regs
.dst_width
, s
->regs
.dst_height
);
126 if ((s
->use_pixman
& BIT(1)) &&
127 s
->regs
.dp_cntl
& DST_X_LEFT_TO_RIGHT
&&
128 s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
) {
129 fallback
= !pixman_blt((uint32_t *)src_bits
, (uint32_t *)dst_bits
,
130 src_stride
, dst_stride
, bpp
, bpp
,
131 src_x
, src_y
, dst_x
, dst_y
,
132 s
->regs
.dst_width
, s
->regs
.dst_height
);
133 } else if (s
->use_pixman
& BIT(1)) {
134 /* FIXME: We only really need a temporary if src and dst overlap */
135 int llb
= s
->regs
.dst_width
* (bpp
/ 8);
136 int tmp_stride
= DIV_ROUND_UP(llb
, sizeof(uint32_t));
137 uint32_t *tmp
= g_malloc(tmp_stride
* sizeof(uint32_t) *
139 fallback
= !pixman_blt((uint32_t *)src_bits
, tmp
,
140 src_stride
, tmp_stride
, bpp
, bpp
,
142 s
->regs
.dst_width
, s
->regs
.dst_height
);
144 fallback
= !pixman_blt(tmp
, (uint32_t *)dst_bits
,
145 tmp_stride
, dst_stride
, bpp
, bpp
,
147 s
->regs
.dst_width
, s
->regs
.dst_height
);
154 unsigned int y
, i
, j
, bypp
= bpp
/ 8;
155 unsigned int src_pitch
= src_stride
* sizeof(uint32_t);
156 unsigned int dst_pitch
= dst_stride
* sizeof(uint32_t);
158 for (y
= 0; y
< s
->regs
.dst_height
; y
++) {
161 if (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
) {
162 i
+= (dst_y
+ y
) * dst_pitch
;
163 j
+= (src_y
+ y
) * src_pitch
;
165 i
+= (dst_y
+ s
->regs
.dst_height
- 1 - y
) * dst_pitch
;
166 j
+= (src_y
+ s
->regs
.dst_height
- 1 - y
) * src_pitch
;
168 memmove(&dst_bits
[i
], &src_bits
[j
], s
->regs
.dst_width
* bypp
);
171 if (dst_bits
>= s
->vga
.vram_ptr
+ s
->vga
.vbe_start_addr
&&
172 dst_bits
< s
->vga
.vram_ptr
+ s
->vga
.vbe_start_addr
+
173 s
->vga
.vbe_regs
[VBE_DISPI_INDEX_YRES
] * s
->vga
.vbe_line_offset
) {
174 memory_region_set_dirty(&s
->vga
.vram
, s
->vga
.vbe_start_addr
+
176 dst_y
* surface_stride(ds
),
177 s
->regs
.dst_height
* surface_stride(ds
));
179 s
->regs
.dst_x
= (s
->regs
.dp_cntl
& DST_X_LEFT_TO_RIGHT
?
180 dst_x
+ s
->regs
.dst_width
: dst_x
);
181 s
->regs
.dst_y
= (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
?
182 dst_y
+ s
->regs
.dst_height
: dst_y
);
191 switch (s
->regs
.dp_mix
& GMC_ROP3_MASK
) {
193 filler
= s
->regs
.dp_brush_frgd_clr
;
196 filler
= 0xffUL
<< 24 | rgb_to_pixel32(s
->vga
.palette
[0],
197 s
->vga
.palette
[1], s
->vga
.palette
[2]);
200 filler
= 0xffUL
<< 24 | rgb_to_pixel32(s
->vga
.palette
[3],
201 s
->vga
.palette
[4], s
->vga
.palette
[5]);
205 dst_stride
/= sizeof(uint32_t);
206 DPRINTF("pixman_fill(%p, %d, %d, %d, %d, %d, %d, %x)\n",
207 dst_bits
, dst_stride
, bpp
, dst_x
, dst_y
,
208 s
->regs
.dst_width
, s
->regs
.dst_height
, filler
);
209 if (!(s
->use_pixman
& BIT(0)) ||
210 !pixman_fill((uint32_t *)dst_bits
, dst_stride
, bpp
, dst_x
, dst_y
,
211 s
->regs
.dst_width
, s
->regs
.dst_height
, filler
)) {
212 /* fallback when pixman failed or we don't want to call it */
213 unsigned int x
, y
, i
, bypp
= bpp
/ 8;
214 unsigned int dst_pitch
= dst_stride
* sizeof(uint32_t);
215 for (y
= 0; y
< s
->regs
.dst_height
; y
++) {
216 i
= dst_x
* bypp
+ (dst_y
+ y
) * dst_pitch
;
217 for (x
= 0; x
< s
->regs
.dst_width
; x
++, i
+= bypp
) {
218 stn_he_p(&dst_bits
[i
], bypp
, filler
);
222 if (dst_bits
>= s
->vga
.vram_ptr
+ s
->vga
.vbe_start_addr
&&
223 dst_bits
< s
->vga
.vram_ptr
+ s
->vga
.vbe_start_addr
+
224 s
->vga
.vbe_regs
[VBE_DISPI_INDEX_YRES
] * s
->vga
.vbe_line_offset
) {
225 memory_region_set_dirty(&s
->vga
.vram
, s
->vga
.vbe_start_addr
+
227 dst_y
* surface_stride(ds
),
228 s
->regs
.dst_height
* surface_stride(ds
));
230 s
->regs
.dst_y
= (s
->regs
.dp_cntl
& DST_Y_TOP_TO_BOTTOM
?
231 dst_y
+ s
->regs
.dst_height
: dst_y
);
235 qemu_log_mask(LOG_UNIMP
, "Unimplemented ati_2d blt op %x\n",
236 (s
->regs
.dp_mix
& GMC_ROP3_MASK
) >> 16);