2 * Copyright © 2010 Daniel Vetter
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
23 * $FreeBSD: src/sys/dev/drm2/i915/i915_gem_gtt.c,v 1.1 2012/05/22 11:07:44 kib Exp $
26 #include <sys/sfbuf.h>
29 #include <drm/i915_drm.h>
31 #include "intel_drv.h"
33 typedef uint32_t gtt_pte_t;
36 #define GEN6_GTT_ADDR_ENCODE(addr) ((addr) | (((addr) >> 28) & 0xff0))
38 #define GEN6_PDE_VALID (1 << 0)
39 /* gen6+ has bit 11-4 for physical addr bit 39-32 */
40 #define GEN6_PDE_ADDR_ENCODE(addr) GEN6_GTT_ADDR_ENCODE(addr)
42 #define GEN6_PTE_VALID (1 << 0)
43 #define GEN6_PTE_UNCACHED (1 << 1)
44 #define HSW_PTE_UNCACHED (0)
45 #define GEN6_PTE_CACHE_LLC (2 << 1)
46 #define GEN6_PTE_CACHE_LLC_MLC (3 << 1)
47 #define GEN6_PTE_ADDR_ENCODE(addr) GEN6_GTT_ADDR_ENCODE(addr)
49 static inline gtt_pte_t pte_encode(struct drm_device *dev,
51 enum i915_cache_level level)
53 gtt_pte_t pte = GEN6_PTE_VALID;
54 pte |= GEN6_PTE_ADDR_ENCODE(addr);
57 case I915_CACHE_LLC_MLC:
58 /* Haswell doesn't set L3 this way */
60 pte |= GEN6_PTE_CACHE_LLC;
62 pte |= GEN6_PTE_CACHE_LLC_MLC;
65 pte |= GEN6_PTE_CACHE_LLC;
69 pte |= HSW_PTE_UNCACHED;
71 pte |= GEN6_PTE_UNCACHED;
81 /* PPGTT support for Sandybdrige/Gen6 and later */
82 static void i915_ppgtt_clear_range(struct i915_hw_ppgtt *ppgtt,
87 gtt_pte_t scratch_pte;
89 unsigned act_pd = first_entry / I915_PPGTT_PT_ENTRIES;
90 unsigned first_pte = first_entry % I915_PPGTT_PT_ENTRIES;
93 scratch_pte = GEN6_GTT_ADDR_ENCODE(ppgtt->scratch_page_dma_addr);
94 scratch_pte |= GEN6_PTE_VALID | GEN6_PTE_CACHE_LLC;
97 last_pte = first_pte + num_entries;
98 if (last_pte > I915_PPGTT_PT_ENTRIES)
99 last_pte = I915_PPGTT_PT_ENTRIES;
101 sf = sf_buf_alloc(ppgtt->pt_pages[act_pd]);
102 pt_vaddr = (uint32_t *)(uintptr_t)sf_buf_kva(sf);
104 for (i = first_pte; i < last_pte; i++)
105 pt_vaddr[i] = scratch_pte;
109 num_entries -= last_pte - first_pte;
116 i915_gem_init_aliasing_ppgtt(struct drm_device *dev)
118 struct drm_i915_private *dev_priv;
119 struct i915_hw_ppgtt *ppgtt;
120 u_int first_pd_entry_in_global_pt, i;
122 dev_priv = dev->dev_private;
125 * ppgtt PDEs reside in the global gtt pagetable, which has 512*1024
126 * entries. For aliasing ppgtt support we just steal them at the end for
129 first_pd_entry_in_global_pt = 512 * 1024 - I915_PPGTT_PD_ENTRIES;
131 ppgtt = kmalloc(sizeof(*ppgtt), DRM_I915_GEM, M_WAITOK | M_ZERO);
133 ppgtt->num_pd_entries = I915_PPGTT_PD_ENTRIES;
134 ppgtt->pt_pages = kmalloc(sizeof(vm_page_t) * ppgtt->num_pd_entries,
135 DRM_I915_GEM, M_WAITOK | M_ZERO);
137 for (i = 0; i < ppgtt->num_pd_entries; i++) {
138 ppgtt->pt_pages[i] = vm_page_alloc(NULL, 0,
139 VM_ALLOC_NORMAL | VM_ALLOC_ZERO);
140 if (ppgtt->pt_pages[i] == NULL) {
141 dev_priv->mm.aliasing_ppgtt = ppgtt;
142 i915_gem_cleanup_aliasing_ppgtt(dev);
147 ppgtt->scratch_page_dma_addr = dev_priv->mm.gtt->scratch_page_dma;
149 i915_ppgtt_clear_range(ppgtt, 0, ppgtt->num_pd_entries *
150 I915_PPGTT_PT_ENTRIES);
151 ppgtt->pd_offset = (first_pd_entry_in_global_pt) * sizeof(uint32_t);
152 dev_priv->mm.aliasing_ppgtt = ppgtt;
157 i915_ppgtt_insert_pages(struct i915_hw_ppgtt *ppgtt, unsigned first_entry,
158 unsigned num_entries, vm_page_t *pages, uint32_t pte_flags)
160 uint32_t *pt_vaddr, pte;
162 unsigned act_pd, first_pte;
163 unsigned last_pte, i;
164 vm_paddr_t page_addr;
166 act_pd = first_entry / I915_PPGTT_PT_ENTRIES;
167 first_pte = first_entry % I915_PPGTT_PT_ENTRIES;
169 while (num_entries) {
170 last_pte = first_pte + num_entries;
171 if (last_pte > I915_PPGTT_PT_ENTRIES)
172 last_pte = I915_PPGTT_PT_ENTRIES;
174 sf = sf_buf_alloc(ppgtt->pt_pages[act_pd]);
175 pt_vaddr = (uint32_t *)(uintptr_t)sf_buf_kva(sf);
177 for (i = first_pte; i < last_pte; i++) {
178 page_addr = VM_PAGE_TO_PHYS(*pages);
179 pte = GEN6_PTE_ADDR_ENCODE(page_addr);
180 pt_vaddr[i] = pte | pte_flags;
187 num_entries -= last_pte - first_pte;
194 i915_ppgtt_bind_object(struct i915_hw_ppgtt *ppgtt,
195 struct drm_i915_gem_object *obj, enum i915_cache_level cache_level)
197 struct drm_device *dev;
198 struct drm_i915_private *dev_priv;
202 dev_priv = dev->dev_private;
203 pte_flags = GEN6_PTE_VALID;
205 switch (cache_level) {
206 case I915_CACHE_LLC_MLC:
207 pte_flags |= GEN6_PTE_CACHE_LLC_MLC;
210 pte_flags |= GEN6_PTE_CACHE_LLC;
212 case I915_CACHE_NONE:
213 pte_flags |= GEN6_PTE_UNCACHED;
219 i915_ppgtt_insert_pages(ppgtt, obj->gtt_space->start >> PAGE_SHIFT,
220 obj->base.size >> PAGE_SHIFT, obj->pages, pte_flags);
223 void i915_ppgtt_unbind_object(struct i915_hw_ppgtt *ppgtt,
224 struct drm_i915_gem_object *obj)
226 i915_ppgtt_clear_range(ppgtt, obj->gtt_space->start >> PAGE_SHIFT,
227 obj->base.size >> PAGE_SHIFT);
231 i915_gem_cleanup_aliasing_ppgtt(struct drm_device *dev)
233 struct drm_i915_private *dev_priv;
234 struct i915_hw_ppgtt *ppgtt;
238 dev_priv = dev->dev_private;
239 ppgtt = dev_priv->mm.aliasing_ppgtt;
242 dev_priv->mm.aliasing_ppgtt = NULL;
244 for (i = 0; i < ppgtt->num_pd_entries; i++) {
245 m = ppgtt->pt_pages[i];
247 vm_page_busy_wait(m, FALSE, "i915gem");
248 vm_page_unwire(m, 0);
252 drm_free(ppgtt->pt_pages, DRM_I915_GEM);
253 drm_free(ppgtt, DRM_I915_GEM);
258 cache_level_to_agp_type(struct drm_device *dev, enum i915_cache_level
262 switch (cache_level) {
263 case I915_CACHE_LLC_MLC:
264 if (INTEL_INFO(dev)->gen >= 6)
265 return (AGP_USER_CACHED_MEMORY_LLC_MLC);
267 * Older chipsets do not have this extra level of CPU
268 * cacheing, so fallthrough and request the PTE simply
272 return (AGP_USER_CACHED_MEMORY);
275 case I915_CACHE_NONE:
276 return (AGP_USER_MEMORY);
281 do_idling(struct drm_i915_private *dev_priv)
283 bool ret = dev_priv->mm.interruptible;
285 if (unlikely(dev_priv->mm.gtt->do_idle_maps)) {
286 dev_priv->mm.interruptible = false;
287 if (i915_gpu_idle(dev_priv->dev, false)) {
288 DRM_ERROR("Couldn't idle GPU\n");
289 /* Wait a bit, in hopes it avoids the hang */
298 undo_idling(struct drm_i915_private *dev_priv, bool interruptible)
301 if (unlikely(dev_priv->mm.gtt->do_idle_maps))
302 dev_priv->mm.interruptible = interruptible;
306 i915_gem_restore_gtt_mappings(struct drm_device *dev)
308 struct drm_i915_private *dev_priv;
309 struct drm_i915_gem_object *obj;
311 dev_priv = dev->dev_private;
313 /* First fill our portion of the GTT with scratch pages */
314 intel_gtt_clear_range(dev_priv->mm.gtt_start / PAGE_SIZE,
315 (dev_priv->mm.gtt_end - dev_priv->mm.gtt_start) / PAGE_SIZE);
317 list_for_each_entry(obj, &dev_priv->mm.gtt_list, gtt_list) {
318 i915_gem_clflush_object(obj);
319 i915_gem_gtt_rebind_object(obj, obj->cache_level);
322 intel_gtt_chipset_flush();
326 i915_gem_gtt_bind_object(struct drm_i915_gem_object *obj)
328 unsigned int agp_type;
330 agp_type = cache_level_to_agp_type(obj->base.dev, obj->cache_level);
331 intel_gtt_insert_pages(obj->gtt_space->start >> PAGE_SHIFT,
332 obj->base.size >> PAGE_SHIFT, obj->pages, agp_type);
337 i915_gem_gtt_rebind_object(struct drm_i915_gem_object *obj,
338 enum i915_cache_level cache_level)
340 struct drm_device *dev;
341 struct drm_i915_private *dev_priv;
342 unsigned int agp_type;
345 dev_priv = dev->dev_private;
346 agp_type = cache_level_to_agp_type(dev, cache_level);
348 intel_gtt_insert_pages(obj->gtt_space->start >> PAGE_SHIFT,
349 obj->base.size >> PAGE_SHIFT, obj->pages, agp_type);
353 i915_gem_gtt_unbind_object(struct drm_i915_gem_object *obj)
355 struct drm_device *dev = obj->base.dev;
356 struct drm_i915_private *dev_priv = dev->dev_private;
360 dev_priv = dev->dev_private;
362 interruptible = do_idling(dev_priv);
364 intel_gtt_clear_range(obj->gtt_space->start >> PAGE_SHIFT,
365 obj->base.size >> PAGE_SHIFT);
367 undo_idling(dev_priv, interruptible);
370 #define GFX_MODE_ENABLE(bit) (((bit) << 16) | (bit))
372 void i915_gem_init_ppgtt(struct drm_device *dev)
374 drm_i915_private_t *dev_priv = dev->dev_private;
376 struct intel_ring_buffer *ring;
377 struct i915_hw_ppgtt *ppgtt = dev_priv->mm.aliasing_ppgtt;
380 u_int first_pd_entry_in_global_pt, i;
385 first_pd_entry_in_global_pt = 512 * 1024 - I915_PPGTT_PD_ENTRIES;
386 for (i = 0; i < ppgtt->num_pd_entries; i++) {
387 pt_addr = VM_PAGE_TO_PHYS(ppgtt->pt_pages[i]);
388 pd_entry = GEN6_PDE_ADDR_ENCODE(pt_addr);
389 pd_entry |= GEN6_PDE_VALID;
390 intel_gtt_write(first_pd_entry_in_global_pt + i, pd_entry);
392 intel_gtt_read_pte(first_pd_entry_in_global_pt);
394 pd_offset = ppgtt->pd_offset;
395 pd_offset /= 64; /* in cachelines, */
398 if (INTEL_INFO(dev)->gen == 6) {
399 uint32_t ecochk = I915_READ(GAM_ECOCHK);
400 I915_WRITE(GAM_ECOCHK, ecochk | ECOCHK_SNB_BIT |
401 ECOCHK_PPGTT_CACHE64B);
402 I915_WRITE(GFX_MODE, GFX_MODE_ENABLE(GFX_PPGTT_ENABLE));
403 } else if (INTEL_INFO(dev)->gen >= 7) {
404 I915_WRITE(GAM_ECOCHK, ECOCHK_PPGTT_CACHE64B);
405 /* GFX_MODE is per-ring on gen7+ */
408 for (i = 0; i < I915_NUM_RINGS; i++) {
409 ring = &dev_priv->rings[i];
411 if (INTEL_INFO(dev)->gen >= 7)
412 I915_WRITE(RING_MODE_GEN7(ring),
413 GFX_MODE_ENABLE(GFX_PPGTT_ENABLE));
415 I915_WRITE(RING_PP_DIR_DCLV(ring), PP_DIR_DCLV_2G);
416 I915_WRITE(RING_PP_DIR_BASE(ring), pd_offset);