aa5e65dc08
The selftests report "Time namespaces are not supported" on LoongArch: (1) clone3 test # cd tools/testing/selftests/clone3 && make && ./clone3 ... # Time namespaces are not supported ok 18 # SKIP Skipping clone3() with CLONE_NEWTIME # Totals: pass:17 fail:0 xfail:0 xpass:0 skip:1 error:0 (2) timens test # cd tools/testing/selftests/timens && make && ./timens ... 1..0 # SKIP Time namespaces are not supported On LoongArch the current kernel does not support CONFIG_TIME_NS, which depends on GENERIC_VDSO_TIME_NS; select GENERIC_VDSO_TIME_NS to enable CONFIG_TIME_NS so that kernel/time/namespace.c is built. Additionally, some arch-dependent functions need to be defined for timens, such as __arch_get_timens_vdso_data(), arch_get_vdso_data() and vdso_join_timens(). At the same time, modify the layout of vvar to use one page for generic vdso data, add another page for timens vdso data, and assign LOONGARCH_VDSO_DATA_SIZE (which may exceed one page if it is expanded in the future) for LoongArch vdso data. Finally, add the callback function vvar_fault() and modify stack_top(). With this patch under CONFIG_TIME_NS: (1) clone3 test # cd tools/testing/selftests/clone3 && make && ./clone3 ... ok 18 [739] Result (0) matches expectation (0) # Totals: pass:18 fail:0 xfail:0 xpass:0 skip:0 error:0 (2) timens test # cd tools/testing/selftests/timens && make && ./timens ... # Totals: pass:10 fail:0 xfail:0 xpass:0 skip:0 error:0 Signed-off-by: Tiezhu Yang <yangtiezhu@loongson.cn> Signed-off-by: Huacai Chen <chenhuacai@loongson.cn>
210 lines
5.0 KiB
C
210 lines
5.0 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
/*
|
|
* Author: Huacai Chen <chenhuacai@loongson.cn>
|
|
* Copyright (C) 2020-2022 Loongson Technology Corporation Limited
|
|
*/
|
|
|
|
#include <linux/binfmts.h>
|
|
#include <linux/elf.h>
|
|
#include <linux/err.h>
|
|
#include <linux/init.h>
|
|
#include <linux/ioport.h>
|
|
#include <linux/kernel.h>
|
|
#include <linux/mm.h>
|
|
#include <linux/random.h>
|
|
#include <linux/sched.h>
|
|
#include <linux/slab.h>
|
|
#include <linux/time_namespace.h>
|
|
#include <linux/timekeeper_internal.h>
|
|
|
|
#include <asm/page.h>
|
|
#include <asm/vdso.h>
|
|
#include <vdso/helpers.h>
|
|
#include <vdso/vsyscall.h>
|
|
#include <generated/vdso-offsets.h>
|
|
|
|
extern char vdso_start[], vdso_end[];
|
|
|
|
/* Kernel-provided data used by the VDSO. */
|
|
static union {
|
|
u8 page[PAGE_SIZE];
|
|
struct vdso_data data[CS_BASES];
|
|
} generic_vdso_data __page_aligned_data;
|
|
|
|
static union {
|
|
u8 page[LOONGARCH_VDSO_DATA_SIZE];
|
|
struct loongarch_vdso_data vdata;
|
|
} loongarch_vdso_data __page_aligned_data;
|
|
|
|
static struct page *vdso_pages[] = { NULL };
|
|
struct vdso_data *vdso_data = generic_vdso_data.data;
|
|
struct vdso_pcpu_data *vdso_pdata = loongarch_vdso_data.vdata.pdata;
|
|
|
|
static int vdso_mremap(const struct vm_special_mapping *sm, struct vm_area_struct *new_vma)
|
|
{
|
|
current->mm->context.vdso = (void *)(new_vma->vm_start);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static vm_fault_t vvar_fault(const struct vm_special_mapping *sm,
|
|
struct vm_area_struct *vma, struct vm_fault *vmf)
|
|
{
|
|
unsigned long pfn;
|
|
struct page *timens_page = find_timens_vvar_page(vma);
|
|
|
|
switch (vmf->pgoff) {
|
|
case VVAR_GENERIC_PAGE_OFFSET:
|
|
if (!timens_page)
|
|
pfn = sym_to_pfn(vdso_data);
|
|
else
|
|
pfn = page_to_pfn(timens_page);
|
|
break;
|
|
#ifdef CONFIG_TIME_NS
|
|
case VVAR_TIMENS_PAGE_OFFSET:
|
|
/*
|
|
* If a task belongs to a time namespace then a namespace specific
|
|
* VVAR is mapped with the VVAR_GENERIC_PAGE_OFFSET and the real
|
|
* VVAR page is mapped with the VVAR_TIMENS_PAGE_OFFSET offset.
|
|
* See also the comment near timens_setup_vdso_data().
|
|
*/
|
|
if (!timens_page)
|
|
return VM_FAULT_SIGBUS;
|
|
else
|
|
pfn = sym_to_pfn(vdso_data);
|
|
break;
|
|
#endif /* CONFIG_TIME_NS */
|
|
case VVAR_LOONGARCH_PAGES_START ... VVAR_LOONGARCH_PAGES_END:
|
|
pfn = sym_to_pfn(&loongarch_vdso_data) + vmf->pgoff - VVAR_LOONGARCH_PAGES_START;
|
|
break;
|
|
default:
|
|
return VM_FAULT_SIGBUS;
|
|
}
|
|
|
|
return vmf_insert_pfn(vma, vmf->address, pfn);
|
|
}
|
|
|
|
struct loongarch_vdso_info vdso_info = {
|
|
.vdso = vdso_start,
|
|
.size = PAGE_SIZE,
|
|
.code_mapping = {
|
|
.name = "[vdso]",
|
|
.pages = vdso_pages,
|
|
.mremap = vdso_mremap,
|
|
},
|
|
.data_mapping = {
|
|
.name = "[vvar]",
|
|
.fault = vvar_fault,
|
|
},
|
|
.offset_sigreturn = vdso_offset_sigreturn,
|
|
};
|
|
|
|
/*
 * Initcall (registered with subsys_initcall) that prepares the vDSO:
 *  - BUGs unless both the image address and its size are page aligned;
 *  - records cpu_to_node() for every possible CPU in vdso_pdata[];
 *  - fills the code mapping's page array with the pages of the image.
 *
 * Always returns 0.
 */
static int __init init_vdso(void)
{
	unsigned long cpu, idx, first_pfn, nr_pages;

	BUG_ON(!PAGE_ALIGNED(vdso_info.vdso));
	BUG_ON(!PAGE_ALIGNED(vdso_info.size));

	for_each_possible_cpu(cpu)
		vdso_pdata[cpu].node = cpu_to_node(cpu);

	first_pfn = __phys_to_pfn(__pa_symbol(vdso_info.vdso));
	nr_pages = vdso_info.size / PAGE_SIZE;

	for (idx = 0; idx < nr_pages; idx++)
		vdso_info.code_mapping.pages[idx] = pfn_to_page(first_pfn + idx);

	return 0;
}
subsys_initcall(init_vdso);
|
|
|
|
#ifdef CONFIG_TIME_NS
|
|
/*
 * Returns @vvar_page reinterpreted as a pointer to struct vdso_data; the
 * address itself is returned unchanged.
 */
struct vdso_data *arch_get_vdso_data(void *vvar_page)
{
	struct vdso_data *vd = vvar_page;

	return vd;
}
|
|
|
|
/*
|
|
* The vvar mapping contains data for a specific time namespace, so when a
|
|
* task changes namespace we must unmap its vvar data for the old namespace.
|
|
* Subsequent faults will map in data for the new namespace.
|
|
*
|
|
* For more details see timens_setup_vdso_data().
|
|
*/
|
|
int vdso_join_timens(struct task_struct *task, struct time_namespace *ns)
|
|
{
|
|
struct mm_struct *mm = task->mm;
|
|
struct vm_area_struct *vma;
|
|
|
|
VMA_ITERATOR(vmi, mm, 0);
|
|
|
|
mmap_read_lock(mm);
|
|
for_each_vma(vmi, vma) {
|
|
if (vma_is_special_mapping(vma, &vdso_info.data_mapping))
|
|
zap_vma_pages(vma);
|
|
}
|
|
mmap_read_unlock(mm);
|
|
|
|
return 0;
|
|
}
|
|
#endif
|
|
|
|
static unsigned long vdso_base(void)
|
|
{
|
|
unsigned long base = STACK_TOP;
|
|
|
|
if (current->flags & PF_RANDOMIZE) {
|
|
base += get_random_u32_below(VDSO_RANDOMIZE_SIZE);
|
|
base = PAGE_ALIGN(base);
|
|
}
|
|
|
|
return base;
|
|
}
|
|
|
|
int arch_setup_additional_pages(struct linux_binprm *bprm, int uses_interp)
|
|
{
|
|
int ret;
|
|
unsigned long size, data_addr, vdso_addr;
|
|
struct mm_struct *mm = current->mm;
|
|
struct vm_area_struct *vma;
|
|
struct loongarch_vdso_info *info = current->thread.vdso;
|
|
|
|
if (mmap_write_lock_killable(mm))
|
|
return -EINTR;
|
|
|
|
/*
|
|
* Determine total area size. This includes the VDSO data itself
|
|
* and the data pages.
|
|
*/
|
|
size = VVAR_SIZE + info->size;
|
|
|
|
data_addr = get_unmapped_area(NULL, vdso_base(), size, 0, 0);
|
|
if (IS_ERR_VALUE(data_addr)) {
|
|
ret = data_addr;
|
|
goto out;
|
|
}
|
|
|
|
vma = _install_special_mapping(mm, data_addr, VVAR_SIZE,
|
|
VM_READ | VM_MAYREAD | VM_PFNMAP,
|
|
&info->data_mapping);
|
|
if (IS_ERR(vma)) {
|
|
ret = PTR_ERR(vma);
|
|
goto out;
|
|
}
|
|
|
|
vdso_addr = data_addr + VVAR_SIZE;
|
|
vma = _install_special_mapping(mm, vdso_addr, info->size,
|
|
VM_READ | VM_EXEC | VM_MAYREAD | VM_MAYWRITE | VM_MAYEXEC,
|
|
&info->code_mapping);
|
|
if (IS_ERR(vma)) {
|
|
ret = PTR_ERR(vma);
|
|
goto out;
|
|
}
|
|
|
|
mm->context.vdso = (void *)vdso_addr;
|
|
ret = 0;
|
|
|
|
out:
|
|
mmap_write_unlock(mm);
|
|
return ret;
|
|
}
|