/**************************************************************************
 * Copyright (c) 2007, Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
 *
 **************************************************************************/
#include <drm/drmP.h>
#include "psb_drv.h"
#include "psb_reg.h"

/*
 * Code for the SGX MMU:
 */

/*
 * clflush on one processor only:
 * clflush should apparently flush the cache line on all processors in an
 * SMP system.
 */

/*
 * kmap atomic:
 * Use of the kmap_atomic slots must be completely encapsulated within a
 * spinlock, and no other functions that may be using the locks for other
 * purposes may be called from within the locked region.
 * Since the slots are per processor, this guarantees that we are the only
 * user.
 */
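
/*
 * The access pattern used by the helpers below is therefore:
 *
 *      spin_lock(&driver->lock);
 *      v = kmap_atomic(page);
 *      ... read or write page table entries through v ...
 *      kunmap_atomic(v);
 *      spin_unlock(&driver->lock);
 */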

/*
 * TODO: Inserting ptes from an interrupt handler:
 * This may be desirable for some SGX functionality where the GPU can fault in
 * needed pages. For that, we need an atomic insert_pages function that may
 * fail.
 * If it fails, the caller needs to insert the page using a workqueue function,
 * but on average it should be fast.
 */

struct psb_mmu_driver {
        /* Protects driver and pd structures. Always take in read mode
         * before taking the page table spinlock.
         */
        struct rw_semaphore sem;

        /* Protects page tables, directory tables and pt structures. */
        spinlock_t lock;

        atomic_t needs_tlbflush;

        uint8_t __iomem *register_map;
        struct psb_mmu_pd *default_pd;
        /*uint32_t bif_ctrl;*/
        int has_clflush;
        int clflush_add;
        unsigned long clflush_mask;

        struct drm_psb_private *dev_priv;
};

struct psb_mmu_pd;

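/*
 * The SGX MMU uses a two-level page table: a single page directory (pd)
 * page holds 1024 32-bit page directory entries, each pointing to a page
 * table (pt) page of 1024 32-bit page table entries mapping 4 KiB pages,
 * which covers a 4 GiB device virtual address space. Unless page faults
 * are trapped, entries for unmapped ranges point at the dummy_pt and
 * dummy_page pages.
 */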
struct psb_mmu_pt {
        struct psb_mmu_pd *pd;
        uint32_t index;
        uint32_t count;
        struct page *p;
        uint32_t *v;
};

struct psb_mmu_pd {
        struct psb_mmu_driver *driver;
        int hw_context;
        struct psb_mmu_pt **tables;
        struct page *p;
        struct page *dummy_pt;
        struct page *dummy_page;
        uint32_t pd_mask;
        uint32_t invalid_pde;
        uint32_t invalid_pte;
};

static inline uint32_t psb_mmu_pt_index(uint32_t offset)
{
        return (offset >> PSB_PTE_SHIFT) & 0x3FF;
}

static inline uint32_t psb_mmu_pd_index(uint32_t offset)
{
        return offset >> PSB_PDE_SHIFT;
}

static inline void psb_clflush(void *addr)
{
        __asm__ __volatile__("clflush (%0)\n" : : "r"(addr) : "memory");
}

static inline void psb_mmu_clflush(struct psb_mmu_driver *driver,
                                   void *addr)
{
        if (!driver->has_clflush)
                return;

        mb();
        psb_clflush(addr);
        mb();
}

static void psb_page_clflush(struct psb_mmu_driver *driver, struct page *page)
{
        uint32_t clflush_add = driver->clflush_add >> PAGE_SHIFT;
        uint32_t clflush_count = PAGE_SIZE / clflush_add;
        int i;
        uint8_t *clf;

        clf = kmap_atomic(page);
        mb();
        for (i = 0; i < clflush_count; ++i) {
                psb_clflush(clf);
                clf += clflush_add;
        }
        mb();
        kunmap_atomic(clf);
}

static void psb_pages_clflush(struct psb_mmu_driver *driver,
                              struct page *page[], unsigned long num_pages)
{
        int i;

        if (!driver->has_clflush)
                return;

        for (i = 0; i < num_pages; i++)
                psb_page_clflush(driver, *page++);
}

static void psb_mmu_flush_pd_locked(struct psb_mmu_driver *driver,
                                    int force)
{
        atomic_set(&driver->needs_tlbflush, 0);
}

static void psb_mmu_flush_pd(struct psb_mmu_driver *driver, int force)
{
        down_write(&driver->sem);
        psb_mmu_flush_pd_locked(driver, force);
        up_write(&driver->sem);
}

void psb_mmu_flush(struct psb_mmu_driver *driver, int rc_prot)
{
        if (rc_prot)
                down_write(&driver->sem);
        if (rc_prot)
                up_write(&driver->sem);
}

void psb_mmu_set_pd_context(struct psb_mmu_pd *pd, int hw_context)
{
        /*ttm_tt_cache_flush(&pd->p, 1);*/
        psb_pages_clflush(pd->driver, &pd->p, 1);
        down_write(&pd->driver->sem);
        wmb();
        psb_mmu_flush_pd_locked(pd->driver, 1);
        pd->hw_context = hw_context;
        up_write(&pd->driver->sem);
}

static inline unsigned long psb_pd_addr_end(unsigned long addr,
                                            unsigned long end)
{
        addr = (addr + PSB_PDE_MASK + 1) & ~PSB_PDE_MASK;
        return (addr < end) ? addr : end;
}

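/*
 * Build a page table entry from a page frame number and a PSB_MMU_*_MEMORY
 * type: the pfn goes in the upper bits and the valid/cached/read-only/
 * write-only flags in the low bits.
 */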
static inline uint32_t psb_mmu_mask_pte(uint32_t pfn, int type)
{
        uint32_t mask = PSB_PTE_VALID;

        if (type & PSB_MMU_CACHED_MEMORY)
                mask |= PSB_PTE_CACHED;
        if (type & PSB_MMU_RO_MEMORY)
                mask |= PSB_PTE_RO;
        if (type & PSB_MMU_WO_MEMORY)
                mask |= PSB_PTE_WO;

        return (pfn << PAGE_SHIFT) | mask;
}

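/*
 * Allocate a page directory along with its dummy page table and dummy page.
 * Unless trap_pagefaults is set, the invalid PDE/PTE values point at the
 * dummy pages so that stray accesses hit harmless memory instead of
 * faulting. The directory starts out unbound (hw_context == -1).
 */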
struct psb_mmu_pd *psb_mmu_alloc_pd(struct psb_mmu_driver *driver,
                                    int trap_pagefaults, int invalid_type)
{
        struct psb_mmu_pd *pd = kmalloc(sizeof(*pd), GFP_KERNEL);
        uint32_t *v;
        int i;

        if (!pd)
                return NULL;

        pd->p = alloc_page(GFP_DMA32);
        if (!pd->p)
                goto out_err1;
        pd->dummy_pt = alloc_page(GFP_DMA32);
        if (!pd->dummy_pt)
                goto out_err2;
        pd->dummy_page = alloc_page(GFP_DMA32);
        if (!pd->dummy_page)
                goto out_err3;

        if (!trap_pagefaults) {
                pd->invalid_pde =
                    psb_mmu_mask_pte(page_to_pfn(pd->dummy_pt),
                                     invalid_type);
                pd->invalid_pte =
                    psb_mmu_mask_pte(page_to_pfn(pd->dummy_page),
                                     invalid_type);
        } else {
                pd->invalid_pde = 0;
                pd->invalid_pte = 0;
        }

        v = kmap(pd->dummy_pt);
        for (i = 0; i < (PAGE_SIZE / sizeof(uint32_t)); ++i)
                v[i] = pd->invalid_pte;

        kunmap(pd->dummy_pt);

        v = kmap(pd->p);
        for (i = 0; i < (PAGE_SIZE / sizeof(uint32_t)); ++i)
                v[i] = pd->invalid_pde;

        kunmap(pd->p);

        clear_page(kmap(pd->dummy_page));
        kunmap(pd->dummy_page);

        pd->tables = vmalloc_user(sizeof(struct psb_mmu_pt *) * 1024);
        if (!pd->tables)
                goto out_err4;

        pd->hw_context = -1;
        pd->pd_mask = PSB_PTE_VALID;
        pd->driver = driver;

        return pd;

out_err4:
        __free_page(pd->dummy_page);
out_err3:
        __free_page(pd->dummy_pt);
out_err2:
        __free_page(pd->p);
out_err1:
        kfree(pd);
        return NULL;
}

static void psb_mmu_free_pt(struct psb_mmu_pt *pt)
{
        __free_page(pt->p);
        kfree(pt);
}

void psb_mmu_free_pagedir(struct psb_mmu_pd *pd)
{
        struct psb_mmu_driver *driver = pd->driver;
        struct psb_mmu_pt *pt;
        int i;

        down_write(&driver->sem);
        if (pd->hw_context != -1)
                psb_mmu_flush_pd_locked(driver, 1);

        /* Should take the spinlock here, but we don't need to do that
           since we have the semaphore in write mode. */

        for (i = 0; i < 1024; ++i) {
                pt = pd->tables[i];
                if (pt)
                        psb_mmu_free_pt(pt);
        }

        vfree(pd->tables);
        __free_page(pd->dummy_page);
        __free_page(pd->dummy_pt);
        __free_page(pd->p);
        kfree(pd);
        up_write(&driver->sem);
}

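/*
 * Allocate a page table for pd and initialize all of its entries to the
 * invalid PTE value. If the directory is bound to a hardware context, the
 * freshly written entries are clflushed so the GPU sees them.
 */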
static struct psb_mmu_pt *psb_mmu_alloc_pt(struct psb_mmu_pd *pd)
{
        struct psb_mmu_pt *pt = kmalloc(sizeof(*pt), GFP_KERNEL);
        void *v;
        uint32_t clflush_add = pd->driver->clflush_add >> PAGE_SHIFT;
        uint32_t clflush_count = PAGE_SIZE / clflush_add;
        spinlock_t *lock = &pd->driver->lock;
        uint8_t *clf;
        uint32_t *ptes;
        int i;

        if (!pt)
                return NULL;

        pt->p = alloc_page(GFP_DMA32);
        if (!pt->p) {
                kfree(pt);
                return NULL;
        }

        spin_lock(lock);

        v = kmap_atomic(pt->p);
        clf = (uint8_t *) v;
        ptes = (uint32_t *) v;
        for (i = 0; i < (PAGE_SIZE / sizeof(uint32_t)); ++i)
                *ptes++ = pd->invalid_pte;

        if (pd->driver->has_clflush && pd->hw_context != -1) {
                mb();
                for (i = 0; i < clflush_count; ++i) {
                        psb_clflush(clf);
                        clf += clflush_add;
                }
                mb();
        }

        kunmap_atomic(v);
        spin_unlock(lock);

        pt->count = 0;
        pt->pd = pd;
        pt->index = 0;

        return pt;
}

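/*
 * Return the page table covering addr, allocating and hooking up a new one
 * if necessary. On success the page table page is mapped through pt->v and
 * the driver spinlock is held; release both with psb_mmu_pt_unmap_unlock().
 * Returns NULL (with the lock dropped) if allocation fails.
 */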
static struct psb_mmu_pt *psb_mmu_pt_alloc_map_lock(struct psb_mmu_pd *pd,
                                                    unsigned long addr)
{
        uint32_t index = psb_mmu_pd_index(addr);
        struct psb_mmu_pt *pt;
        uint32_t *v;
        spinlock_t *lock = &pd->driver->lock;

        spin_lock(lock);
        pt = pd->tables[index];
        while (!pt) {
                spin_unlock(lock);
                pt = psb_mmu_alloc_pt(pd);
                if (!pt)
                        return NULL;
                spin_lock(lock);

                if (pd->tables[index]) {
                        spin_unlock(lock);
                        psb_mmu_free_pt(pt);
                        spin_lock(lock);
                        pt = pd->tables[index];
                        continue;
                }

                v = kmap_atomic(pd->p);
                pd->tables[index] = pt;
                v[index] = (page_to_pfn(pt->p) << 12) | pd->pd_mask;
                pt->index = index;

                if (pd->hw_context != -1) {
                        psb_mmu_clflush(pd->driver, (void *) &v[index]);
                        atomic_set(&pd->driver->needs_tlbflush, 1);
                }
                kunmap_atomic((void *) v);
        }
        pt->v = kmap_atomic(pt->p);
        return pt;
}

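/*
 * Like psb_mmu_pt_alloc_map_lock(), but never allocates: returns NULL with
 * the driver spinlock dropped if no page table exists for addr.
 */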
static struct psb_mmu_pt *psb_mmu_pt_map_lock(struct psb_mmu_pd *pd,
                                              unsigned long addr)
{
        uint32_t index = psb_mmu_pd_index(addr);
        struct psb_mmu_pt *pt;
        spinlock_t *lock = &pd->driver->lock;

        spin_lock(lock);
        pt = pd->tables[index];
        if (!pt) {
                spin_unlock(lock);
                return NULL;
        }
        pt->v = kmap_atomic(pt->p);
        return pt;
}

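/*
 * Unmap a page table previously returned by one of the map_lock helpers and
 * drop the driver spinlock. If the table no longer contains any valid
 * entries (count == 0), its directory entry is invalidated and the table is
 * freed.
 */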
static void psb_mmu_pt_unmap_unlock(struct psb_mmu_pt *pt)
{
        struct psb_mmu_pd *pd = pt->pd;
        uint32_t *v;

        kunmap_atomic(pt->v);
        if (pt->count == 0) {
                v = kmap_atomic(pd->p);
                v[pt->index] = pd->invalid_pde;
                pd->tables[pt->index] = NULL;

                if (pd->hw_context != -1) {
                        psb_mmu_clflush(pd->driver,
                                        (void *) &v[pt->index]);
                        atomic_set(&pd->driver->needs_tlbflush, 1);
                }
                kunmap_atomic(v);
                spin_unlock(&pd->driver->lock);
                psb_mmu_free_pt(pt);
                return;
        }
        spin_unlock(&pd->driver->lock);
}

static inline void psb_mmu_set_pte(struct psb_mmu_pt *pt,
                                   unsigned long addr, uint32_t pte)
{
        pt->v[psb_mmu_pt_index(addr)] = pte;
}

static inline void psb_mmu_invalidate_pte(struct psb_mmu_pt *pt,
                                          unsigned long addr)
{
        pt->v[psb_mmu_pt_index(addr)] = pt->pd->invalid_pte;
}

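/*
 * Write gtt_pages consecutive page directory entries, starting at the entry
 * covering mmu_offset, pointing each at successive pages beginning at
 * gtt_start, i.e. let the MMU share the GTT's page tables for that range.
 */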
void psb_mmu_mirror_gtt(struct psb_mmu_pd *pd,
                        uint32_t mmu_offset, uint32_t gtt_start,
                        uint32_t gtt_pages)
{
        uint32_t *v;
        uint32_t start = psb_mmu_pd_index(mmu_offset);
        struct psb_mmu_driver *driver = pd->driver;
        int num_pages = gtt_pages;

        down_read(&driver->sem);
        spin_lock(&driver->lock);

        v = kmap_atomic(pd->p);
        v += start;

        while (gtt_pages--) {
                *v++ = gtt_start | pd->pd_mask;
                gtt_start += PAGE_SIZE;
        }

        /*ttm_tt_cache_flush(&pd->p, num_pages);*/
        psb_pages_clflush(pd->driver, &pd->p, num_pages);
        kunmap_atomic(v);
        spin_unlock(&driver->lock);

        if (pd->hw_context != -1)
                atomic_set(&pd->driver->needs_tlbflush, 1);

        up_read(&pd->driver->sem);
        psb_mmu_flush_pd(pd->driver, 0);
}

struct psb_mmu_pd *psb_mmu_get_default_pd(struct psb_mmu_driver *driver)
{
        struct psb_mmu_pd *pd;

        /* down_read(&driver->sem); */
        pd = driver->default_pd;
        /* up_read(&driver->sem); */

        return pd;
}

void psb_mmu_driver_takedown(struct psb_mmu_driver *driver)
{
        psb_mmu_free_pagedir(driver->default_pd);
        kfree(driver);
}

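/*
 * Set up the MMU driver state: allocate the default page directory and, if
 * the CPU supports clflush, work out the cache line size so page table
 * updates can later be flushed one cache line at a time.
 */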
struct psb_mmu_driver *psb_mmu_driver_init(uint8_t __iomem *registers,
                                           int trap_pagefaults,
                                           int invalid_type,
                                           struct drm_psb_private *dev_priv)
{
        struct psb_mmu_driver *driver;

        driver = kmalloc(sizeof(*driver), GFP_KERNEL);

        if (!driver)
                return NULL;
        driver->dev_priv = dev_priv;

        driver->default_pd = psb_mmu_alloc_pd(driver, trap_pagefaults,
                                              invalid_type);
        if (!driver->default_pd)
                goto out_err1;

        spin_lock_init(&driver->lock);
        init_rwsem(&driver->sem);
        down_write(&driver->sem);
        driver->register_map = registers;
        atomic_set(&driver->needs_tlbflush, 1);

        driver->has_clflush = 0;

        if (boot_cpu_has(X86_FEATURE_CLFLSH)) {
                uint32_t tfms, misc, cap0, cap4, clflush_size;

                /*
                 * clflush size is determined at kernel setup for x86_64
                 * but not for i386. We have to do it here.
                 */

                cpuid(0x00000001, &tfms, &misc, &cap0, &cap4);
                clflush_size = ((misc >> 8) & 0xff) * 8;
                driver->has_clflush = 1;
                driver->clflush_add =
                    PAGE_SIZE * clflush_size / sizeof(uint32_t);
                driver->clflush_mask = driver->clflush_add - 1;
                driver->clflush_mask = ~driver->clflush_mask;
        }

        up_write(&driver->sem);
        return driver;

out_err1:
        kfree(driver);
        return NULL;
}

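/*
 * Flush the CPU cache lines holding the page table entries for a range of
 * mappings (optionally laid out as tiled rows) so the GPU observes the
 * updated PTEs.
 */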
static void psb_mmu_flush_ptes(struct psb_mmu_pd *pd,
                               unsigned long address, uint32_t num_pages,
                               uint32_t desired_tile_stride,
                               uint32_t hw_tile_stride)
{
        struct psb_mmu_pt *pt;
        uint32_t rows = 1;
        uint32_t i;
        unsigned long addr;
        unsigned long end;
        unsigned long next;
        unsigned long add;
        unsigned long row_add;
        unsigned long clflush_add = pd->driver->clflush_add;
        unsigned long clflush_mask = pd->driver->clflush_mask;

        if (!pd->driver->has_clflush) {
                /*ttm_tt_cache_flush(&pd->p, num_pages);*/
                psb_pages_clflush(pd->driver, &pd->p, num_pages);
                return;
        }

        if (hw_tile_stride)
                rows = num_pages / desired_tile_stride;
        else
                desired_tile_stride = num_pages;

        add = desired_tile_stride << PAGE_SHIFT;
        row_add = hw_tile_stride << PAGE_SHIFT;
        mb();
        for (i = 0; i < rows; ++i) {

                addr = address;
                end = addr + add;

                do {
                        next = psb_pd_addr_end(addr, end);
                        pt = psb_mmu_pt_map_lock(pd, addr);
                        if (!pt)
                                continue;
                        do {
                                psb_clflush(&pt->v[psb_mmu_pt_index(addr)]);
                        } while (addr += clflush_add,
                                 (addr & clflush_mask) < next);

                        psb_mmu_pt_unmap_unlock(pt);
                } while (addr = next, next != end);
                address += row_add;
        }
        mb();
}

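/*
 * Unmap num_pages pages starting at address by resetting their PTEs to the
 * invalid value, then flush the affected PTE cache lines and, for a bound
 * hardware context, the TLB.
 */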
void psb_mmu_remove_pfn_sequence(struct psb_mmu_pd *pd,
                                 unsigned long address, uint32_t num_pages)
{
        struct psb_mmu_pt *pt;
        unsigned long addr;
        unsigned long end;
        unsigned long next;
        unsigned long f_address = address;

        down_read(&pd->driver->sem);

        addr = address;
        end = addr + (num_pages << PAGE_SHIFT);

        do {
                next = psb_pd_addr_end(addr, end);
                pt = psb_mmu_pt_alloc_map_lock(pd, addr);
                if (!pt)
                        goto out;
                do {
                        psb_mmu_invalidate_pte(pt, addr);
                        --pt->count;
                } while (addr += PAGE_SIZE, addr < next);
                psb_mmu_pt_unmap_unlock(pt);

        } while (addr = next, next != end);

out:
        if (pd->hw_context != -1)
                psb_mmu_flush_ptes(pd, f_address, num_pages, 1, 1);

        up_read(&pd->driver->sem);

        if (pd->hw_context != -1)
                psb_mmu_flush(pd->driver, 0);

        return;
}

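/*
 * Unmap a (possibly tiled) range of pages: num_pages PTEs starting at
 * address, walked in rows of desired_tile_stride pages with successive rows
 * hw_tile_stride pages apart, are reset to the invalid value.
 */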
void psb_mmu_remove_pages(struct psb_mmu_pd *pd, unsigned long address,
                          uint32_t num_pages, uint32_t desired_tile_stride,
                          uint32_t hw_tile_stride)
{
        struct psb_mmu_pt *pt;
        uint32_t rows = 1;
        uint32_t i;
        unsigned long addr;
        unsigned long end;
        unsigned long next;
        unsigned long add;
        unsigned long row_add;
        unsigned long f_address = address;

        if (hw_tile_stride)
                rows = num_pages / desired_tile_stride;
        else
                desired_tile_stride = num_pages;

        add = desired_tile_stride << PAGE_SHIFT;
        row_add = hw_tile_stride << PAGE_SHIFT;

        /* down_read(&pd->driver->sem); */

        /* Make sure we only need to flush this processor's cache */

        for (i = 0; i < rows; ++i) {

                addr = address;
                end = addr + add;

                do {
                        next = psb_pd_addr_end(addr, end);
                        pt = psb_mmu_pt_map_lock(pd, addr);
                        if (!pt)
                                continue;
                        do {
                                psb_mmu_invalidate_pte(pt, addr);
                                --pt->count;
                        } while (addr += PAGE_SIZE, addr < next);
                        psb_mmu_pt_unmap_unlock(pt);

                } while (addr = next, next != end);
                address += row_add;
        }
        if (pd->hw_context != -1)
                psb_mmu_flush_ptes(pd, f_address, num_pages,
                                   desired_tile_stride, hw_tile_stride);

        /* up_read(&pd->driver->sem); */

        if (pd->hw_context != -1)
                psb_mmu_flush(pd->driver, 0);
}

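/*
 * Map num_pages physically contiguous pages, starting at start_pfn, at the
 * given device virtual address with the requested memory type. Returns 0 on
 * success or -ENOMEM if a page table could not be allocated.
 */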
int psb_mmu_insert_pfn_sequence(struct psb_mmu_pd *pd, uint32_t start_pfn,
                                unsigned long address, uint32_t num_pages,
                                int type)
{
        struct psb_mmu_pt *pt;
        uint32_t pte;
        unsigned long addr;
        unsigned long end;
        unsigned long next;
        unsigned long f_address = address;
        int ret = 0;

        down_read(&pd->driver->sem);

        addr = address;
        end = addr + (num_pages << PAGE_SHIFT);

        do {
                next = psb_pd_addr_end(addr, end);
                pt = psb_mmu_pt_alloc_map_lock(pd, addr);
                if (!pt) {
                        ret = -ENOMEM;
                        goto out;
                }
                do {
                        pte = psb_mmu_mask_pte(start_pfn++, type);
                        psb_mmu_set_pte(pt, addr, pte);
                        pt->count++;
                } while (addr += PAGE_SIZE, addr < next);
                psb_mmu_pt_unmap_unlock(pt);

        } while (addr = next, next != end);

out:
        if (pd->hw_context != -1)
                psb_mmu_flush_ptes(pd, f_address, num_pages, 1, 1);

        up_read(&pd->driver->sem);

        if (pd->hw_context != -1)
                psb_mmu_flush(pd->driver, 1);

        return ret;
}

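/*
 * Map an array of pages at the given device virtual address, optionally in
 * tiled rows of desired_tile_stride pages separated by hw_tile_stride pages.
 * Returns 0 on success, -EINVAL if num_pages is not a multiple of the tile
 * stride, or -ENOMEM if a page table could not be allocated.
 */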
int psb_mmu_insert_pages(struct psb_mmu_pd *pd, struct page **pages,
                         unsigned long address, uint32_t num_pages,
                         uint32_t desired_tile_stride,
                         uint32_t hw_tile_stride, int type)
{
        struct psb_mmu_pt *pt;
        uint32_t rows = 1;
        uint32_t i;
        uint32_t pte;
        unsigned long addr;
        unsigned long end;
        unsigned long next;
        unsigned long add;
        unsigned long row_add;
        unsigned long f_address = address;
        int ret = 0;

        if (hw_tile_stride) {
                if (num_pages % desired_tile_stride != 0)
                        return -EINVAL;
                rows = num_pages / desired_tile_stride;
        } else {
                desired_tile_stride = num_pages;
        }

        add = desired_tile_stride << PAGE_SHIFT;
        row_add = hw_tile_stride << PAGE_SHIFT;

        down_read(&pd->driver->sem);

        for (i = 0; i < rows; ++i) {

                addr = address;
                end = addr + add;

                do {
                        next = psb_pd_addr_end(addr, end);
                        pt = psb_mmu_pt_alloc_map_lock(pd, addr);
                        if (!pt) {
                                ret = -ENOMEM;
                                goto out;
                        }
                        do {
                                pte = psb_mmu_mask_pte(page_to_pfn(*pages++),
                                                       type);
                                psb_mmu_set_pte(pt, addr, pte);
                                pt->count++;
                        } while (addr += PAGE_SIZE, addr < next);
                        psb_mmu_pt_unmap_unlock(pt);

                } while (addr = next, next != end);

                address += row_add;
        }
out:
        if (pd->hw_context != -1)
                psb_mmu_flush_ptes(pd, f_address, num_pages,
                                   desired_tile_stride, hw_tile_stride);

        up_read(&pd->driver->sem);

        if (pd->hw_context != -1)
                psb_mmu_flush(pd->driver, 1);

        return ret;
}

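/*
 * Look up the page frame number that a device virtual address is mapped to.
 * Addresses covered only by the invalid (dummy) entries report the dummy
 * page's pfn; returns -EINVAL if the address is not mapped at all.
 */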
int psb_mmu_virtual_to_pfn(struct psb_mmu_pd *pd, uint32_t virtual,
                           unsigned long *pfn)
{
        int ret;
        struct psb_mmu_pt *pt;
        uint32_t tmp;
        spinlock_t *lock = &pd->driver->lock;

        down_read(&pd->driver->sem);
        pt = psb_mmu_pt_map_lock(pd, virtual);
        if (!pt) {
                uint32_t *v;

                spin_lock(lock);
                v = kmap_atomic(pd->p);
                tmp = v[psb_mmu_pd_index(virtual)];
                kunmap_atomic(v);
                spin_unlock(lock);

                if (tmp != pd->invalid_pde || !(tmp & PSB_PTE_VALID) ||
                    !(pd->invalid_pte & PSB_PTE_VALID)) {
                        ret = -EINVAL;
                        goto out;
                }
                ret = 0;
                *pfn = pd->invalid_pte >> PAGE_SHIFT;
                goto out;
        }
        tmp = pt->v[psb_mmu_pt_index(virtual)];
        if (!(tmp & PSB_PTE_VALID)) {
                ret = -EINVAL;
        } else {
                ret = 0;
                *pfn = tmp >> PAGE_SHIFT;
        }
        psb_mmu_pt_unmap_unlock(pt);
out:
        up_read(&pd->driver->sem);
        return ret;
}