m1n1/src/dart.c
Janne Grunau 0104abbea7 dart: Add dart_find_iova() to find unused IOVA space
Signed-off-by: Janne Grunau <j@jannau.net>
2022-04-19 21:29:30 +09:00

378 lines
9.9 KiB
C

/* SPDX-License-Identifier: MIT */
#include "dart.h"
#include "adt.h"
#include "assert.h"
#include "malloc.h"
#include "memory.h"
#include "string.h"
#include "utils.h"
#define DART_CONFIG 0x60
#define DART_CONFIG_LOCK BIT(15)
#define DART_ERROR 0x40
#define DART_ERROR_STREAM_SHIFT 24
#define DART_ERROR_STREAM_MASK 0xf
#define DART_ERROR_CODE_MASK 0xffffff
#define DART_ERROR_FLAG BIT(31)
#define DART_ERROR_READ_FAULT BIT(4)
#define DART_ERROR_WRITE_FAULT BIT(3)
#define DART_ERROR_NO_PTE BIT(2)
#define DART_ERROR_NO_PMD BIT(1)
#define DART_ERROR_NO_TTBR BIT(0)
#define DART_STREAM_SELECT 0x34
#define DART_STREAM_COMMAND 0x20
#define DART_STREAM_COMMAND_BUSY BIT(2)
#define DART_STREAM_COMMAND_INVALIDATE BIT(20)
#define DART_STREAM_COMMAND_BUSY_TIMEOUT 100
#define DART_STREAM_REMAP 0x80
#define DART_ERROR_ADDR_HI 0x54
#define DART_ERROR_ADDR_LO 0x50
#define DART_ENABLED_STREAMS 0xfc
#define DART_TCR(sid) (0x100 + 4 * (sid))
#define DART_TCR_TRANSLATE_ENABLE BIT(7)
#define DART_TCR_BYPASS_DART BIT(8)
#define DART_TCR_BYPASS_DAPF BIT(12)
#define DART_TTBR(sid, idx) (0x200 + 16 * (sid) + 4 * (idx))
#define DART_TTBR_VALID BIT(31)
#define DART_TTBR_ADDR GENMASK(30, 0)
#define DART_TTBR_SHIFT 12
#define DART_PTE_OFFSET_SHIFT 14
#define DART_PTE_SP_START GENMASK(63, 52)
#define DART_PTE_SP_END GENMASK(51, 40)
#define DART_PTE_OFFSET_T8020 GENMASK(39, 14)
#define DART_PTE_OFFSET_T6000 GENMASK(39, 10)
#define DART_PTE_VALID 0b11
struct dart_dev {
bool locked;
bool keep;
uintptr_t regs;
u8 device;
u64 offset_mask;
u64 *l1[4];
};
static void dart_tlb_invalidate(dart_dev_t *dart)
{
write32(dart->regs + DART_STREAM_SELECT, BIT(dart->device));
/* ensure that the DART can see the updated pagetables before invalidating */
dma_wmb();
write32(dart->regs + DART_STREAM_COMMAND, DART_STREAM_COMMAND_INVALIDATE);
if (poll32(dart->regs + DART_STREAM_COMMAND, DART_STREAM_COMMAND_BUSY, 0, 100))
printf("dart: DART_STREAM_COMMAND_BUSY did not clear.\n");
}
dart_dev_t *dart_init(uintptr_t base, u8 device, bool keep_pts)
{
dart_dev_t *dart = malloc(sizeof(*dart));
if (!dart)
return NULL;
memset(dart, 0, sizeof(*dart));
dart->regs = base;
dart->device = device;
if (read32(dart->regs + DART_CONFIG) & DART_CONFIG_LOCK)
dart->locked = true;
dart->offset_mask = DART_PTE_OFFSET_T8020;
dart->keep = keep_pts;
if (dart->locked || keep_pts) {
for (int i = 0; i < 4; i++) {
u32 ttbr = read32(dart->regs + DART_TTBR(device, i));
if (ttbr & DART_TTBR_VALID)
dart->l1[i] = (u64 *)((ttbr & DART_TTBR_ADDR) << DART_TTBR_SHIFT);
}
}
for (int i = 0; i < 4; i++) {
if (dart->l1[i])
continue;
dart->l1[i] = memalign(SZ_16K, SZ_16K);
if (!dart->l1[i])
goto error;
memset(dart->l1[i], 0, SZ_16K);
write32(dart->regs + DART_TTBR(device, i),
DART_TTBR_VALID | (((uintptr_t)dart->l1[i]) >> DART_TTBR_SHIFT));
}
if (!dart->locked && !keep_pts)
write32(dart->regs + DART_TCR(device), DART_TCR_TRANSLATE_ENABLE);
dart_tlb_invalidate(dart);
return dart;
error:
if (!dart->locked)
free(dart->l1);
free(dart);
return NULL;
}
dart_dev_t *dart_init_adt(const char *path, int instance, int device, bool keep_pts)
{
int dart_path[8];
int node = adt_path_offset_trace(adt, path, dart_path);
if (node < 0) {
printf("dart: Error getting DART node %s\n", path);
return NULL;
}
u64 base;
if (adt_get_reg(adt, dart_path, "reg", instance, &base, NULL) < 0) {
printf("dart: Error getting DART %s base address.\n", path);
return NULL;
}
dart_dev_t *dart = dart_init(base, device, keep_pts);
if (!dart)
return NULL;
if (adt_is_compatible(adt, node, "dart,t8020")) {
printf("dart: dart %s at 0x%lx is a t8020%s\n", path, base,
dart->locked ? " (locked)" : "");
dart->offset_mask = DART_PTE_OFFSET_T8020;
} else if (adt_is_compatible(adt, node, "dart,t6000")) {
printf("dart: dart %s at 0x%lx is a t6000%s\n", path, base,
dart->locked ? " (locked)" : "");
dart->offset_mask = DART_PTE_OFFSET_T6000;
}
return dart;
}
static u64 *dart_get_l2(dart_dev_t *dart, u32 idx)
{
int ttbr = idx >> 11;
idx &= 0x7ff;
if (dart->l1[ttbr][idx] & DART_PTE_VALID) {
u64 off = FIELD_GET(dart->offset_mask, dart->l1[ttbr][idx]) << DART_PTE_OFFSET_SHIFT;
return (u64 *)off;
}
u64 *tbl = memalign(SZ_16K, SZ_16K);
if (!tbl)
return NULL;
memset(tbl, 0, SZ_16K);
u64 offset = FIELD_PREP(dart->offset_mask, ((u64)tbl) >> DART_PTE_OFFSET_SHIFT);
dart->l1[ttbr][idx] = offset | DART_PTE_VALID;
return tbl;
}
static int dart_map_page(dart_dev_t *dart, uintptr_t iova, uintptr_t paddr)
{
u32 l1_index = (iova >> 25) & 0x1fff;
u32 l2_index = (iova >> 14) & 0x7ff;
u64 *l2 = dart_get_l2(dart, l1_index);
if (!l2) {
printf("dart: couldn't create l2 for iova %lx\n", iova);
return -1;
}
if (l2[l2_index] & DART_PTE_VALID) {
printf("dart: iova %lx already has a valid PTE: %lx\n", iova, l2[l2_index]);
return -1;
}
u64 offset = FIELD_PREP(dart->offset_mask, paddr >> DART_PTE_OFFSET_SHIFT);
l2[l2_index] = offset | FIELD_PREP(DART_PTE_SP_END, 0xfff) | FIELD_PREP(DART_PTE_SP_START, 0) |
DART_PTE_VALID;
return 0;
}
int dart_map(dart_dev_t *dart, uintptr_t iova, void *bfr, size_t len)
{
uintptr_t paddr = (uintptr_t)bfr;
u64 offset = 0;
if (len % SZ_16K)
return -1;
if (paddr % SZ_16K)
return -1;
if (iova % SZ_16K)
return -1;
while (offset < len) {
int ret = dart_map_page(dart, iova + offset, paddr + offset);
if (ret) {
dart_unmap(dart, iova, offset);
return ret;
}
offset += SZ_16K;
}
dart_tlb_invalidate(dart);
return 0;
}
static void dart_unmap_page(dart_dev_t *dart, uintptr_t iova)
{
u32 ttbr = (iova >> 36) & 0x3;
u32 l1_index = (iova >> 25) & 0x7ff;
u32 l2_index = (iova >> 14) & 0x7ff;
if (!(dart->l1[ttbr][l1_index] & DART_PTE_VALID))
return;
u64 *l2 = dart_get_l2(dart, l1_index);
l2[l2_index] = 0;
}
void dart_unmap(dart_dev_t *dart, uintptr_t iova, size_t len)
{
if (len % SZ_16K)
return;
if (iova % SZ_16K)
return;
while (len) {
dart_unmap_page(dart, iova);
len -= SZ_16K;
iova += SZ_16K;
}
dart_tlb_invalidate(dart);
}
static void *dart_translate_internal(dart_dev_t *dart, uintptr_t iova, int silent)
{
u32 ttbr = (iova >> 36) & 0x3;
u32 l1_index = (iova >> 25) & 0x7ff;
if (!(dart->l1[ttbr][l1_index] & DART_PTE_VALID) && !silent) {
printf("dart: l1 translation failure %x %lx\n", l1_index, iova);
return NULL;
}
u32 l2_index = (iova >> 14) & 0x7ff;
u64 *l2 =
(u64 *)(FIELD_GET(dart->offset_mask, dart->l1[ttbr][l1_index]) << DART_PTE_OFFSET_SHIFT);
if (!(l2[l2_index] & DART_PTE_VALID) && !silent) {
printf("dart: l2 translation failure\n");
return NULL;
}
u32 offset = iova & 0x3fff;
void *base = (void *)(FIELD_GET(dart->offset_mask, l2[l2_index]) << DART_PTE_OFFSET_SHIFT);
return base + offset;
}
void *dart_translate(dart_dev_t *dart, uintptr_t iova)
{
return dart_translate_internal(dart, iova, 0);
}
u64 dart_search(dart_dev_t *dart, void *paddr)
{
for (int ttbr = 0; ttbr < 4; ++ttbr) {
if (!dart->l1[ttbr])
continue;
for (u32 l1_index = 0; l1_index < 0x7ff; l1_index++) {
if (!(dart->l1[ttbr][l1_index] & DART_PTE_VALID))
continue;
u64 *l2 = (u64 *)(FIELD_GET(dart->offset_mask, dart->l1[ttbr][l1_index])
<< DART_PTE_OFFSET_SHIFT);
for (u32 l2_index = 0; l2_index < 0x7ff; l2_index++) {
if (!(l2[l2_index] & DART_PTE_VALID))
continue;
u64 *dst =
(u64 *)(FIELD_GET(dart->offset_mask, l2[l2_index]) << DART_PTE_OFFSET_SHIFT);
if (dst == paddr)
return ((u64)ttbr << 36) | ((u64)l1_index << 25) | (l2_index << 14);
}
}
}
return 0;
}
s64 dart_find_iova(dart_dev_t *dart, s64 start, size_t len)
{
if (len % SZ_16K)
return -1;
if (start < 0 || start % SZ_16K)
return -1;
uintptr_t end = 1LLU << 32;
uintptr_t iova = start;
while (iova + len <= end) {
if (dart_translate_internal(dart, iova, 1) == NULL) {
size_t size;
for (size = SZ_16K; size < len; size += SZ_16K) {
if (dart_translate_internal(dart, iova + size, 1) != NULL)
break;
}
if (size == len)
return iova;
iova += size + SZ_16K;
} else
iova += SZ_16K;
}
return -1;
}
void dart_shutdown(dart_dev_t *dart)
{
if (!dart->locked && !dart->keep)
write32(dart->regs + DART_TCR(dart->device), DART_TCR_BYPASS_DART | DART_TCR_BYPASS_DAPF);
for (int i = 0; i < 4; ++i)
if (is_heap(dart->l1[i]))
write32(dart->regs + DART_TTBR(dart->device, i), 0);
for (int ttbr = 0; ttbr < 4; ++ttbr) {
for (int i = 0; i < SZ_16K / 8; ++i) {
if (dart->l1[ttbr][i] & DART_PTE_VALID) {
void *l2 = dart_get_l2(dart, i);
if (is_heap(l2)) {
free(l2);
dart->l1[ttbr][i] = 0;
}
}
}
}
dart_tlb_invalidate(dart);
for (int i = 0; i < 4; ++i)
if (is_heap(dart->l1[i]))
free(dart->l1[i]);
free(dart);
}