/*-
* SPDX-License-Identifier: BSD-2-Clause
*
* Copyright (c) 2023-2025 Ruslan Bukin
*
* This work was supported by Innovate UK project 105694, "Digital Security
* by Design (DSbD) Technology Platform Prototype".
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
/* Hardware Trace (HWT) framework. */
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#define HWT_IOCTL_DEBUG
#undef HWT_IOCTL_DEBUG
#ifdef HWT_IOCTL_DEBUG
#define dprintf(fmt, ...) printf(fmt, ##__VA_ARGS__)
#else
#define dprintf(fmt, ...)
#endif
/* No real reason for these limitations just sanity checks. */
#define HWT_MAXBUFSIZE (32UL * 1024 * 1024 * 1024) /* 32 GB */
static MALLOC_DEFINE(M_HWT_IOCTL, "hwt_ioctl", "Hardware Trace");
/*
* Check if owner process *o can trace target process *t.
*/
static int
hwt_priv_check(struct proc *o, struct proc *t)
{
struct ucred *oc, *tc;
int error;
int i;
PROC_LOCK(o);
oc = o->p_ucred;
crhold(oc);
PROC_UNLOCK(o);
PROC_LOCK_ASSERT(t, MA_OWNED);
tc = t->p_ucred;
crhold(tc);
error = 0;
/*
* The effective uid of the HWT owner should match at least one
* of the effective / real / saved uids of the target process.
*/
if (oc->cr_uid != tc->cr_uid &&
oc->cr_uid != tc->cr_svuid &&
oc->cr_uid != tc->cr_ruid) {
error = EPERM;
goto done;
}
/*
* Everyone of the target's group ids must be in the owner's
* group list.
*/
for (i = 0; i < tc->cr_ngroups; i++)
if (!groupmember(tc->cr_groups[i], oc)) {
error = EPERM;
goto done;
}
/* Check the read and saved GIDs too. */
if (!groupmember(tc->cr_rgid, oc) ||
!groupmember(tc->cr_svgid, oc)) {
error = EPERM;
goto done;
}
done:
crfree(tc);
crfree(oc);
return (error);
}
static int
hwt_ioctl_alloc_mode_thread(struct thread *td, struct hwt_owner *ho,
struct hwt_backend *backend, struct hwt_alloc *halloc)
{
struct thread **threads, *td1;
struct hwt_record_entry *entry;
struct hwt_context *ctx, *ctx1;
struct hwt_thread *thr;
char path[MAXPATHLEN];
struct proc *p;
int thread_id;
int error;
int cnt;
int i;
/* Check if the owner have this pid configured already. */
ctx = hwt_owner_lookup_ctx(ho, halloc->pid);
if (ctx)
return (EEXIST);
/* Allocate a new HWT context. */
error = hwt_ctx_alloc(&ctx);
if (error)
return (error);
ctx->bufsize = halloc->bufsize;
ctx->pid = halloc->pid;
ctx->hwt_backend = backend;
ctx->hwt_owner = ho;
ctx->mode = HWT_MODE_THREAD;
ctx->hwt_td = td;
ctx->kqueue_fd = halloc->kqueue_fd;
error = copyout(&ctx->ident, halloc->ident, sizeof(int));
if (error) {
hwt_ctx_free(ctx);
return (error);
}
/* Now get the victim proc. */
p = pfind(halloc->pid);
if (p == NULL) {
hwt_ctx_free(ctx);
return (ENXIO);
}
/* Ensure we can trace it. */
error = hwt_priv_check(td->td_proc, p);
if (error) {
PROC_UNLOCK(p);
hwt_ctx_free(ctx);
return (error);
}
/* Ensure it is not being traced already. */
ctx1 = hwt_contexthash_lookup(p);
if (ctx1) {
refcount_release(&ctx1->refcnt);
PROC_UNLOCK(p);
hwt_ctx_free(ctx);
return (EEXIST);
}
/* Allocate hwt threads and buffers. */
cnt = 0;
FOREACH_THREAD_IN_PROC(p, td1) {
cnt += 1;
}
KASSERT(cnt > 0, ("no threads"));
threads = malloc(sizeof(struct thread *) * cnt, M_HWT_IOCTL,
M_NOWAIT | M_ZERO);
if (threads == NULL) {
PROC_UNLOCK(p);
hwt_ctx_free(ctx);
return (ENOMEM);
}
i = 0;
FOREACH_THREAD_IN_PROC(p, td1) {
threads[i++] = td1;
}
ctx->proc = p;
PROC_UNLOCK(p);
for (i = 0; i < cnt; i++) {
thread_id = atomic_fetchadd_int(&ctx->thread_counter, 1);
sprintf(path, "hwt_%d_%d", ctx->ident, thread_id);
error = hwt_thread_alloc(&thr, path, ctx->bufsize,
ctx->hwt_backend->kva_req);
if (error) {
free(threads, M_HWT_IOCTL);
hwt_ctx_free(ctx);
return (error);
}
/* Allocate backend-specific thread data. */
error = hwt_backend_thread_alloc(ctx, thr);
if (error != 0) {
dprintf("%s: failed to allocate thread backend data\n",
__func__);
free(threads, M_HWT_IOCTL);
hwt_ctx_free(ctx);
return (error);
}
/*
* Insert a THREAD_CREATE record so userspace picks up
* the thread's tracing buffers.
*/
entry = hwt_record_entry_alloc();
entry->record_type = HWT_RECORD_THREAD_CREATE;
entry->thread_id = thread_id;
thr->vm->ctx = ctx;
thr->td = threads[i];
thr->ctx = ctx;
thr->backend = ctx->hwt_backend;
thr->thread_id = thread_id;
HWT_CTX_LOCK(ctx);
hwt_thread_insert(ctx, thr, entry);
HWT_CTX_UNLOCK(ctx);
}
free(threads, M_HWT_IOCTL);
error = hwt_backend_init(ctx);
if (error) {
hwt_ctx_free(ctx);
return (error);
}
/* hwt_owner_insert_ctx? */
mtx_lock(&ho->mtx);
LIST_INSERT_HEAD(&ho->hwts, ctx, next_hwts);
mtx_unlock(&ho->mtx);
/*
* Hooks are now in action after this, but the ctx is not in RUNNING
* state.
*/
hwt_contexthash_insert(ctx);
p = pfind(halloc->pid);
if (p) {
p->p_flag2 |= P2_HWT;
PROC_UNLOCK(p);
}
return (0);
}
static int
hwt_ioctl_alloc_mode_cpu(struct thread *td, struct hwt_owner *ho,
struct hwt_backend *backend, struct hwt_alloc *halloc)
{
struct hwt_context *ctx;
struct hwt_cpu *cpu;
struct hwt_vm *vm;
char path[MAXPATHLEN];
size_t cpusetsize;
cpuset_t cpu_map;
int cpu_count = 0;
int cpu_id;
int error;
CPU_ZERO(&cpu_map);
cpusetsize = min(halloc->cpusetsize, sizeof(cpuset_t));
error = copyin(halloc->cpu_map, &cpu_map, cpusetsize);
if (error)
return (error);
CPU_FOREACH_ISSET(cpu_id, &cpu_map) {
#ifdef SMP
/* Ensure CPU is not halted. */
if (CPU_ISSET(cpu_id, &hlt_cpus_mask))
return (ENXIO);
#endif
#if 0
/* TODO: Check if the owner have this cpu configured already. */
ctx = hwt_owner_lookup_ctx_by_cpu(ho, halloc->cpu);
if (ctx)
return (EEXIST);
#endif
cpu_count++;
}
if (cpu_count == 0)
return (ENODEV);
/* Allocate a new HWT context. */
error = hwt_ctx_alloc(&ctx);
if (error)
return (error);
ctx->bufsize = halloc->bufsize;
ctx->hwt_backend = backend;
ctx->hwt_owner = ho;
ctx->mode = HWT_MODE_CPU;
ctx->cpu_map = cpu_map;
ctx->hwt_td = td;
ctx->kqueue_fd = halloc->kqueue_fd;
error = copyout(&ctx->ident, halloc->ident, sizeof(int));
if (error) {
hwt_ctx_free(ctx);
return (error);
}
CPU_FOREACH_ISSET(cpu_id, &cpu_map) {
sprintf(path, "hwt_%d_%d", ctx->ident, cpu_id);
error = hwt_vm_alloc(ctx->bufsize, ctx->hwt_backend->kva_req,
path, &vm);
if (error) {
/* TODO: remove all allocated cpus. */
hwt_ctx_free(ctx);
return (error);
}
cpu = hwt_cpu_alloc();
cpu->cpu_id = cpu_id;
cpu->vm = vm;
vm->cpu = cpu;
vm->ctx = ctx;
HWT_CTX_LOCK(ctx);
hwt_cpu_insert(ctx, cpu);
HWT_CTX_UNLOCK(ctx);
}
error = hwt_backend_init(ctx);
if (error) {
/* TODO: remove all allocated cpus. */
hwt_ctx_free(ctx);
return (error);
}
/* hwt_owner_insert_ctx? */
mtx_lock(&ho->mtx);
LIST_INSERT_HEAD(&ho->hwts, ctx, next_hwts);
mtx_unlock(&ho->mtx);
hwt_record_kernel_objects(ctx);
return (0);
}
static int
hwt_ioctl_alloc(struct thread *td, struct hwt_alloc *halloc)
{
char backend_name[HWT_BACKEND_MAXNAMELEN];
struct hwt_backend *backend;
struct hwt_owner *ho;
int error;
if (halloc->bufsize > HWT_MAXBUFSIZE)
return (EINVAL);
if (halloc->bufsize % PAGE_SIZE)
return (EINVAL);
if (halloc->backend_name == NULL)
return (EINVAL);
error = copyinstr(halloc->backend_name, (void *)backend_name,
HWT_BACKEND_MAXNAMELEN, NULL);
if (error)
return (error);
backend = hwt_backend_lookup(backend_name);
if (backend == NULL)
return (ENODEV);
/* First get the owner. */
ho = hwt_ownerhash_lookup(td->td_proc);
if (ho == NULL) {
/* Create a new owner. */
ho = hwt_owner_alloc(td->td_proc);
if (ho == NULL)
return (ENOMEM);
hwt_ownerhash_insert(ho);
}
switch (halloc->mode) {
case HWT_MODE_THREAD:
error = hwt_ioctl_alloc_mode_thread(td, ho, backend, halloc);
break;
case HWT_MODE_CPU:
error = hwt_ioctl_alloc_mode_cpu(td, ho, backend, halloc);
break;
default:
error = ENXIO;
};
return (error);
}
int
hwt_ioctl(struct cdev *dev, u_long cmd, caddr_t addr, int flags,
struct thread *td)
{
int error;
switch (cmd) {
case HWT_IOC_ALLOC:
/* Allocate HWT context. */
error = hwt_ioctl_alloc(td, (struct hwt_alloc *)addr);
return (error);
default:
return (ENXIO);
};
}