1 /*
2  * Copyright (C) 2019 Alyssa Rosenzweig
3  * Copyright (C) 2017-2018 Lyude Paul
4  * Copyright (C) 2019 Collabora, Ltd.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the "Software"),
8  * to deal in the Software without restriction, including without limitation
9  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10  * and/or sell copies of the Software, and to permit persons to whom the
11  * Software is furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice (including the next
14  * paragraph) shall be included in all copies or substantial portions of the
15  * Software.
16  *
17  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
20  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
23  * SOFTWARE.
24  */
25 
26 #include <stdio.h>
27 #include <stdlib.h>
28 #include <assert.h>
29 #include <stdint.h>
30 #include <string.h>
31 #include <sys/mman.h>
32 
33 #include "decode.h"
34 #include "util/macros.h"
35 #include "util/u_debug.h"
36 #include "util/u_dynarray.h"
37 #include "util/hash_table.h"
38 
39 FILE *pandecode_dump_stream;
40 
41 /* Memory handling */
42 
43 static struct hash_table_u64 *mmap_table;
44 
45 static struct util_dynarray ro_mappings;
46 
47 static struct pandecode_mapped_memory *
pandecode_find_mapped_gpu_mem_containing_rw(uint64_t addr)48 pandecode_find_mapped_gpu_mem_containing_rw(uint64_t addr)
49 {
50         return _mesa_hash_table_u64_search(mmap_table, addr & ~(4096 - 1));
51 }
52 
53 struct pandecode_mapped_memory *
pandecode_find_mapped_gpu_mem_containing(uint64_t addr)54 pandecode_find_mapped_gpu_mem_containing(uint64_t addr)
55 {
56         struct pandecode_mapped_memory *mem = pandecode_find_mapped_gpu_mem_containing_rw(addr);
57 
58         if (mem && mem->addr && !mem->ro) {
59                 mprotect(mem->addr, mem->length, PROT_READ);
60                 mem->ro = true;
61                 util_dynarray_append(&ro_mappings, struct pandecode_mapped_memory *, mem);
62         }
63 
64         return mem;
65 }
66 
67 void
pandecode_map_read_write(void)68 pandecode_map_read_write(void)
69 {
70         util_dynarray_foreach(&ro_mappings, struct pandecode_mapped_memory *, mem) {
71                 (*mem)->ro = false;
72                 mprotect((*mem)->addr, (*mem)->length, PROT_READ | PROT_WRITE);
73         }
74         util_dynarray_clear(&ro_mappings);
75 }
76 
77 static void
pandecode_add_name(struct pandecode_mapped_memory * mem,uint64_t gpu_va,const char * name)78 pandecode_add_name(struct pandecode_mapped_memory *mem, uint64_t gpu_va, const char *name)
79 {
80         if (!name) {
81                 /* If we don't have a name, assign one */
82 
83                 snprintf(mem->name, sizeof(mem->name) - 1,
84                          "memory_%" PRIx64, gpu_va);
85         } else {
86                 assert((strlen(name) + 1) < sizeof(mem->name));
87                 memcpy(mem->name, name, strlen(name) + 1);
88         }
89 }
90 
91 void
pandecode_inject_mmap(uint64_t gpu_va,void * cpu,unsigned sz,const char * name)92 pandecode_inject_mmap(uint64_t gpu_va, void *cpu, unsigned sz, const char *name)
93 {
94         /* First, search if we already mapped this and are just updating an address */
95 
96         struct pandecode_mapped_memory *existing =
97                 pandecode_find_mapped_gpu_mem_containing_rw(gpu_va);
98 
99         if (existing && existing->gpu_va == gpu_va) {
100                 existing->length = sz;
101                 existing->addr = cpu;
102                 pandecode_add_name(existing, gpu_va, name);
103                 return;
104         }
105 
106         /* Otherwise, add a fresh mapping */
107         struct pandecode_mapped_memory *mapped_mem = NULL;
108 
109         mapped_mem = calloc(1, sizeof(*mapped_mem));
110         mapped_mem->gpu_va = gpu_va;
111         mapped_mem->length = sz;
112         mapped_mem->addr = cpu;
113         pandecode_add_name(mapped_mem, gpu_va, name);
114 
115         /* Add it to the table */
116         assert((gpu_va & 4095) == 0);
117 
118         for (unsigned i = 0; i < sz; i += 4096)
119                 _mesa_hash_table_u64_insert(mmap_table, gpu_va + i, mapped_mem);
120 }
121 
122 void
pandecode_inject_free(uint64_t gpu_va,unsigned sz)123 pandecode_inject_free(uint64_t gpu_va, unsigned sz)
124 {
125         struct pandecode_mapped_memory *mem =
126                 pandecode_find_mapped_gpu_mem_containing_rw(gpu_va);
127 
128         if (!mem)
129                 return;
130 
131         assert(mem->gpu_va == gpu_va);
132         assert(mem->length == sz);
133 
134         free(mem);
135 
136         for (unsigned i = 0; i < sz; i += 4096)
137                 _mesa_hash_table_u64_remove(mmap_table, gpu_va + i);
138 }
139 
140 char *
pointer_as_memory_reference(uint64_t ptr)141 pointer_as_memory_reference(uint64_t ptr)
142 {
143         struct pandecode_mapped_memory *mapped;
144         char *out = malloc(128);
145 
146         /* Try to find the corresponding mapped zone */
147 
148         mapped = pandecode_find_mapped_gpu_mem_containing_rw(ptr);
149 
150         if (mapped) {
151                 snprintf(out, 128, "%s + %d", mapped->name, (int) (ptr - mapped->gpu_va));
152                 return out;
153         }
154 
155         /* Just use the raw address if other options are exhausted */
156 
157         snprintf(out, 128, "0x%" PRIx64, ptr);
158         return out;
159 
160 }
161 
162 static int pandecode_dump_frame_count = 0;
163 
164 static bool force_stderr = false;
165 
166 void
pandecode_dump_file_open(void)167 pandecode_dump_file_open(void)
168 {
169         if (pandecode_dump_stream)
170                 return;
171 
172         /* This does a getenv every frame, so it is possible to use
173          * setenv to change the base at runtime.
174          */
175         const char *dump_file_base = debug_get_option("PANDECODE_DUMP_FILE", "pandecode.dump");
176         if (force_stderr || !strcmp(dump_file_base, "stderr"))
177                 pandecode_dump_stream = stderr;
178         else {
179                 char buffer[1024];
180                 snprintf(buffer, sizeof(buffer), "%s.%04d", dump_file_base, pandecode_dump_frame_count);
181                 printf("pandecode: dump command stream to file %s\n", buffer);
182                 pandecode_dump_stream = fopen(buffer, "w");
183                 if (!pandecode_dump_stream)
184                         fprintf(stderr,
185                                 "pandecode: failed to open command stream log file %s\n",
186                                 buffer);
187         }
188 }
189 
190 static void
pandecode_dump_file_close(void)191 pandecode_dump_file_close(void)
192 {
193         if (pandecode_dump_stream && pandecode_dump_stream != stderr) {
194                 if (fclose(pandecode_dump_stream))
195                         perror("pandecode: dump file");
196 
197                 pandecode_dump_stream = NULL;
198         }
199 }
200 
201 void
pandecode_initialize(bool to_stderr)202 pandecode_initialize(bool to_stderr)
203 {
204         force_stderr = to_stderr;
205         mmap_table = _mesa_hash_table_u64_create(NULL);
206         util_dynarray_init(&ro_mappings, NULL);
207 }
208 
209 void
pandecode_next_frame(void)210 pandecode_next_frame(void)
211 {
212         pandecode_dump_file_close();
213         pandecode_dump_frame_count++;
214 }
215 
216 void
pandecode_close(void)217 pandecode_close(void)
218 {
219         _mesa_hash_table_u64_destroy(mmap_table);
220         util_dynarray_fini(&ro_mappings);
221         pandecode_dump_file_close();
222 }
223 
224 void pandecode_abort_on_fault_v4(mali_ptr jc_gpu_va);
225 void pandecode_abort_on_fault_v5(mali_ptr jc_gpu_va);
226 void pandecode_abort_on_fault_v6(mali_ptr jc_gpu_va);
227 void pandecode_abort_on_fault_v7(mali_ptr jc_gpu_va);
228 
229 void
pandecode_abort_on_fault(mali_ptr jc_gpu_va,unsigned gpu_id)230 pandecode_abort_on_fault(mali_ptr jc_gpu_va, unsigned gpu_id)
231 {
232         switch (pan_arch(gpu_id)) {
233         case 4: pandecode_abort_on_fault_v4(jc_gpu_va); return;
234         case 5: pandecode_abort_on_fault_v5(jc_gpu_va); return;
235         case 6: pandecode_abort_on_fault_v6(jc_gpu_va); return;
236         case 7: pandecode_abort_on_fault_v7(jc_gpu_va); return;
237         default: unreachable("Unsupported architecture");
238         }
239 }
240 
241 void pandecode_jc_v4(mali_ptr jc_gpu_va, unsigned gpu_id);
242 void pandecode_jc_v5(mali_ptr jc_gpu_va, unsigned gpu_id);
243 void pandecode_jc_v6(mali_ptr jc_gpu_va, unsigned gpu_id);
244 void pandecode_jc_v7(mali_ptr jc_gpu_va, unsigned gpu_id);
245 
246 void
pandecode_jc(mali_ptr jc_gpu_va,unsigned gpu_id)247 pandecode_jc(mali_ptr jc_gpu_va, unsigned gpu_id)
248 {
249         switch (pan_arch(gpu_id)) {
250         case 4: pandecode_jc_v4(jc_gpu_va, gpu_id); return;
251         case 5: pandecode_jc_v5(jc_gpu_va, gpu_id); return;
252         case 6: pandecode_jc_v6(jc_gpu_va, gpu_id); return;
253         case 7: pandecode_jc_v7(jc_gpu_va, gpu_id); return;
254         default: unreachable("Unsupported architecture");
255         }
256 }
257