OSDN Git Service

ANDROID: Add target/device support am: 8884508fa6 am: cf0ceff91e am: 96f63775f7 am...
[android-x86/external-minigbm.git] / amdgpu.c
1 /*
2  * Copyright 2016 The Chromium OS Authors. All rights reserved.
3  * Use of this source code is governed by a BSD-style license that can be
4  * found in the LICENSE file.
5  */
6 #ifdef DRV_AMDGPU
7 #include <amdgpu.h>
8 #include <amdgpu_drm.h>
9 #include <errno.h>
10 #include <stdio.h>
11 #include <stdlib.h>
12 #include <string.h>
13 #include <sys/mman.h>
14 #include <xf86drm.h>
15
16 #include "dri.h"
17 #include "drv_priv.h"
18 #include "helpers.h"
19 #include "util.h"
20
21 // clang-format off
22 #define DRI_PATH STRINGIZE(DRI_DRIVER_DIR/radeonsi_dri.so)
23 // clang-format on
24
25 #define TILE_TYPE_LINEAR 0
26 /* DRI backend decides tiling in this case. */
27 #define TILE_TYPE_DRI 1
28
29 struct amdgpu_priv {
30         struct dri_driver dri;
31         int drm_version;
32 };
33
34 const static uint32_t render_target_formats[] = { DRM_FORMAT_ABGR8888, DRM_FORMAT_ARGB8888,
35                                                   DRM_FORMAT_RGB565, DRM_FORMAT_XBGR8888,
36                                                   DRM_FORMAT_XRGB8888 };
37
38 const static uint32_t texture_source_formats[] = { DRM_FORMAT_GR88,           DRM_FORMAT_R8,
39                                                    DRM_FORMAT_NV21,           DRM_FORMAT_NV12,
40                                                    DRM_FORMAT_YVU420_ANDROID, DRM_FORMAT_YVU420 };
41
42 static int amdgpu_init(struct driver *drv)
43 {
44         struct amdgpu_priv *priv;
45         drmVersionPtr drm_version;
46         struct format_metadata metadata;
47         uint64_t use_flags = BO_USE_RENDER_MASK;
48
49         priv = calloc(1, sizeof(struct amdgpu_priv));
50         if (!priv)
51                 return -ENOMEM;
52
53         drm_version = drmGetVersion(drv_get_fd(drv));
54         if (!drm_version) {
55                 free(priv);
56                 return -ENODEV;
57         }
58
59         priv->drm_version = drm_version->version_minor;
60         drmFreeVersion(drm_version);
61
62         drv->priv = priv;
63
64         if (dri_init(drv, DRI_PATH, "radeonsi")) {
65                 free(priv);
66                 drv->priv = NULL;
67                 return -ENODEV;
68         }
69
70         metadata.tiling = TILE_TYPE_LINEAR;
71         metadata.priority = 1;
72         metadata.modifier = DRM_FORMAT_MOD_LINEAR;
73
74         drv_add_combinations(drv, render_target_formats, ARRAY_SIZE(render_target_formats),
75                              &metadata, use_flags);
76
77         drv_add_combinations(drv, texture_source_formats, ARRAY_SIZE(texture_source_formats),
78                              &metadata, BO_USE_TEXTURE_MASK);
79
80         /*
81          * Chrome uses DMA-buf mmap to write to YV12 buffers, which are then accessed by the
82          * Video Encoder Accelerator (VEA). It could also support NV12 potentially in the future.
83          */
84         drv_modify_combination(drv, DRM_FORMAT_YVU420, &metadata, BO_USE_HW_VIDEO_ENCODER);
85         drv_modify_combination(drv, DRM_FORMAT_NV12, &metadata, BO_USE_HW_VIDEO_ENCODER);
86
87         /* Android CTS tests require this. */
88         drv_add_combination(drv, DRM_FORMAT_BGR888, &metadata, BO_USE_SW_MASK);
89
90         /* Linear formats supported by display. */
91         drv_modify_combination(drv, DRM_FORMAT_ARGB8888, &metadata, BO_USE_CURSOR | BO_USE_SCANOUT);
92         drv_modify_combination(drv, DRM_FORMAT_XRGB8888, &metadata, BO_USE_CURSOR | BO_USE_SCANOUT);
93         drv_modify_combination(drv, DRM_FORMAT_ABGR8888, &metadata, BO_USE_SCANOUT);
94         drv_modify_combination(drv, DRM_FORMAT_XBGR8888, &metadata, BO_USE_SCANOUT);
95
96         /* YUV formats for camera and display. */
97         drv_modify_combination(drv, DRM_FORMAT_NV12, &metadata,
98                                BO_USE_CAMERA_READ | BO_USE_CAMERA_WRITE | BO_USE_SCANOUT |
99                                    BO_USE_HW_VIDEO_DECODER);
100
101         drv_modify_combination(drv, DRM_FORMAT_NV21, &metadata, BO_USE_SCANOUT);
102
103         /*
104          * R8 format is used for Android's HAL_PIXEL_FORMAT_BLOB and is used for JPEG snapshots
105          * from camera.
106          */
107         drv_modify_combination(drv, DRM_FORMAT_R8, &metadata,
108                                BO_USE_CAMERA_READ | BO_USE_CAMERA_WRITE);
109
110         /*
111          * The following formats will be allocated by the DRI backend and may be potentially tiled.
112          * Since format modifier support hasn't been implemented fully yet, it's not
113          * possible to enumerate the different types of buffers (like i915 can).
114          */
115         use_flags &= ~BO_USE_RENDERSCRIPT;
116         use_flags &= ~BO_USE_SW_WRITE_OFTEN;
117         use_flags &= ~BO_USE_SW_READ_OFTEN;
118         use_flags &= ~BO_USE_LINEAR;
119
120         metadata.tiling = TILE_TYPE_DRI;
121         metadata.priority = 2;
122
123         drv_add_combinations(drv, render_target_formats, ARRAY_SIZE(render_target_formats),
124                              &metadata, use_flags);
125
126         /* Potentially tiled formats supported by display. */
127         drv_modify_combination(drv, DRM_FORMAT_ARGB8888, &metadata, BO_USE_CURSOR | BO_USE_SCANOUT);
128         drv_modify_combination(drv, DRM_FORMAT_XRGB8888, &metadata, BO_USE_CURSOR | BO_USE_SCANOUT);
129         drv_modify_combination(drv, DRM_FORMAT_ABGR8888, &metadata, BO_USE_SCANOUT);
130         drv_modify_combination(drv, DRM_FORMAT_XBGR8888, &metadata, BO_USE_SCANOUT);
131         return 0;
132 }
133
134 static void amdgpu_close(struct driver *drv)
135 {
136         dri_close(drv);
137         free(drv->priv);
138         drv->priv = NULL;
139 }
140
141 static int amdgpu_create_bo_linear(struct bo *bo, uint32_t width, uint32_t height, uint32_t format,
142                                    uint64_t use_flags)
143 {
144         int ret;
145         uint32_t plane, stride;
146         union drm_amdgpu_gem_create gem_create;
147
148         stride = drv_stride_from_format(format, width, 0);
149         stride = ALIGN(stride, 256);
150
151         drv_bo_from_format(bo, stride, height, format);
152
153         memset(&gem_create, 0, sizeof(gem_create));
154         gem_create.in.bo_size = bo->meta.total_size;
155         gem_create.in.alignment = 256;
156         gem_create.in.domain_flags = 0;
157
158         if (use_flags & (BO_USE_LINEAR | BO_USE_SW_MASK))
159                 gem_create.in.domain_flags |= AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED;
160
161         gem_create.in.domains = AMDGPU_GEM_DOMAIN_GTT;
162         if (!(use_flags & (BO_USE_SW_READ_OFTEN | BO_USE_SCANOUT)))
163                 gem_create.in.domain_flags |= AMDGPU_GEM_CREATE_CPU_GTT_USWC;
164
165         /* Allocate the buffer with the preferred heap. */
166         ret = drmCommandWriteRead(drv_get_fd(bo->drv), DRM_AMDGPU_GEM_CREATE, &gem_create,
167                                   sizeof(gem_create));
168         if (ret < 0)
169                 return ret;
170
171         for (plane = 0; plane < bo->meta.num_planes; plane++)
172                 bo->handles[plane].u32 = gem_create.out.handle;
173
174         bo->meta.format_modifiers[0] = DRM_FORMAT_MOD_LINEAR;
175
176         return 0;
177 }
178
179 static int amdgpu_create_bo(struct bo *bo, uint32_t width, uint32_t height, uint32_t format,
180                             uint64_t use_flags)
181 {
182         struct combination *combo;
183
184         combo = drv_get_combination(bo->drv, format, use_flags);
185         if (!combo)
186                 return -EINVAL;
187
188         if (combo->metadata.tiling == TILE_TYPE_DRI) {
189                 bool needs_alignment = false;
190 #ifdef __ANDROID__
191                 /*
192                  * Currently, the gralloc API doesn't differentiate between allocation time and map
193                  * time strides. A workaround for amdgpu DRI buffers is to always to align to 256 at
194                  * allocation time.
195                  *
196                  * See b/115946221,b/117942643
197                  */
198                 if (use_flags & (BO_USE_SW_MASK))
199                         needs_alignment = true;
200 #endif
201                 // See b/122049612
202                 if (use_flags & (BO_USE_SCANOUT))
203                         needs_alignment = true;
204
205                 if (needs_alignment) {
206                         uint32_t bytes_per_pixel = drv_bytes_per_pixel_from_format(format, 0);
207                         width = ALIGN(width, 256 / bytes_per_pixel);
208                 }
209
210                 return dri_bo_create(bo, width, height, format, use_flags);
211         }
212
213         return amdgpu_create_bo_linear(bo, width, height, format, use_flags);
214 }
215
216 static int amdgpu_create_bo_with_modifiers(struct bo *bo, uint32_t width, uint32_t height,
217                                            uint32_t format, const uint64_t *modifiers,
218                                            uint32_t count)
219 {
220         bool only_use_linear = true;
221
222         for (uint32_t i = 0; i < count; ++i)
223                 if (modifiers[i] != DRM_FORMAT_MOD_LINEAR)
224                         only_use_linear = false;
225
226         if (only_use_linear)
227                 return amdgpu_create_bo_linear(bo, width, height, format, BO_USE_SCANOUT);
228
229         return dri_bo_create_with_modifiers(bo, width, height, format, modifiers, count);
230 }
231
232 static int amdgpu_import_bo(struct bo *bo, struct drv_import_fd_data *data)
233 {
234         bool dri_tiling = data->format_modifiers[0] != DRM_FORMAT_MOD_LINEAR;
235         if (data->format_modifiers[0] == DRM_FORMAT_MOD_INVALID) {
236                 struct combination *combo;
237                 combo = drv_get_combination(bo->drv, data->format, data->use_flags);
238                 if (!combo)
239                         return -EINVAL;
240
241                 dri_tiling = combo->metadata.tiling == TILE_TYPE_DRI;
242         }
243
244         if (dri_tiling)
245                 return dri_bo_import(bo, data);
246         else
247                 return drv_prime_bo_import(bo, data);
248 }
249
250 static int amdgpu_destroy_bo(struct bo *bo)
251 {
252         if (bo->priv)
253                 return dri_bo_destroy(bo);
254         else
255                 return drv_gem_bo_destroy(bo);
256 }
257
258 static void *amdgpu_map_bo(struct bo *bo, struct vma *vma, size_t plane, uint32_t map_flags)
259 {
260         int ret;
261         union drm_amdgpu_gem_mmap gem_map;
262
263         if (bo->priv)
264                 return dri_bo_map(bo, vma, plane, map_flags);
265
266         memset(&gem_map, 0, sizeof(gem_map));
267         gem_map.in.handle = bo->handles[plane].u32;
268
269         ret = drmIoctl(bo->drv->fd, DRM_IOCTL_AMDGPU_GEM_MMAP, &gem_map);
270         if (ret) {
271                 drv_log("DRM_IOCTL_AMDGPU_GEM_MMAP failed\n");
272                 return MAP_FAILED;
273         }
274
275         vma->length = bo->meta.total_size;
276
277         return mmap(0, bo->meta.total_size, drv_get_prot(map_flags), MAP_SHARED, bo->drv->fd,
278                     gem_map.out.addr_ptr);
279 }
280
281 static int amdgpu_unmap_bo(struct bo *bo, struct vma *vma)
282 {
283         if (bo->priv)
284                 return dri_bo_unmap(bo, vma);
285         else
286                 return munmap(vma->addr, vma->length);
287 }
288
289 static int amdgpu_bo_invalidate(struct bo *bo, struct mapping *mapping)
290 {
291         int ret;
292         union drm_amdgpu_gem_wait_idle wait_idle;
293
294         if (bo->priv)
295                 return 0;
296
297         memset(&wait_idle, 0, sizeof(wait_idle));
298         wait_idle.in.handle = bo->handles[0].u32;
299         wait_idle.in.timeout = AMDGPU_TIMEOUT_INFINITE;
300
301         ret = drmCommandWriteRead(bo->drv->fd, DRM_AMDGPU_GEM_WAIT_IDLE, &wait_idle,
302                                   sizeof(wait_idle));
303
304         if (ret < 0) {
305                 drv_log("DRM_AMDGPU_GEM_WAIT_IDLE failed with %d\n", ret);
306                 return ret;
307         }
308
309         if (ret == 0 && wait_idle.out.status)
310                 drv_log("DRM_AMDGPU_GEM_WAIT_IDLE BO is busy\n");
311
312         return 0;
313 }
314
315 static uint32_t amdgpu_resolve_format(struct driver *drv, uint32_t format, uint64_t use_flags)
316 {
317         switch (format) {
318         case DRM_FORMAT_FLEX_IMPLEMENTATION_DEFINED:
319                 /* Camera subsystem requires NV12. */
320                 if (use_flags & (BO_USE_CAMERA_READ | BO_USE_CAMERA_WRITE))
321                         return DRM_FORMAT_NV12;
322                 /*HACK: See b/28671744 */
323                 return DRM_FORMAT_XBGR8888;
324         case DRM_FORMAT_FLEX_YCbCr_420_888:
325                 return DRM_FORMAT_NV12;
326         default:
327                 return format;
328         }
329 }
330
331 const struct backend backend_amdgpu = {
332         .name = "amdgpu",
333         .init = amdgpu_init,
334         .close = amdgpu_close,
335         .bo_create = amdgpu_create_bo,
336         .bo_create_with_modifiers = amdgpu_create_bo_with_modifiers,
337         .bo_destroy = amdgpu_destroy_bo,
338         .bo_import = amdgpu_import_bo,
339         .bo_map = amdgpu_map_bo,
340         .bo_unmap = amdgpu_unmap_bo,
341         .bo_invalidate = amdgpu_bo_invalidate,
342         .resolve_format = amdgpu_resolve_format,
343         .num_planes_from_modifier = dri_num_planes_from_modifier,
344 };
345
346 #endif