| // SPDX-License-Identifier: GPL-2.0 |
| /* |
| * Basic resctrl file system operations |
| * |
| * Copyright (C) 2018 Intel Corporation |
| * |
| * Authors: |
| * Sai Praneeth Prakhya <sai.praneeth.prakhya@intel.com>, |
| * Fenghua Yu <fenghua.yu@intel.com> |
| */ |
| #include <fcntl.h> |
| #include <limits.h> |
| |
| #include "resctrl.h" |
| |
/*
 * find_resctrl_mount - Look for a mounted resctrl file system
 * @buffer:	Optional output; when non-NULL it receives the mount point of
 *		the first resctrl entry found (copied with a 256 byte limit)
 *
 * Scans /proc/mounts, where every entry has the form
 * "<device> <mount point> <fs type> ...", for an entry whose file system
 * type is "resctrl".
 *
 * Return: 0 if a resctrl mount was found, -ENXIO if /proc/mounts cannot be
 * opened, -ENOENT if no resctrl entry exists.
 */
static int find_resctrl_mount(char *buffer)
{
	char entry[256];
	char *where, *fstype;
	int status = -ENOENT;
	FILE *fp;

	fp = fopen("/proc/mounts", "r");
	if (fp == NULL) {
		perror("/proc/mounts");
		return -ENXIO;
	}

	while (fgets(entry, 256, fp) != NULL) {
		/* First field (device) is only skipped over */
		if (strtok(entry, " \t") == NULL)
			continue;

		where = strtok(NULL, " \t");
		if (where == NULL)
			continue;

		fstype = strtok(NULL, " \t");
		if (fstype == NULL || strcmp(fstype, "resctrl") != 0)
			continue;

		if (buffer != NULL)
			strncpy(buffer, where, 256);
		status = 0;
		break;
	}

	fclose(fp);

	return status;
}
| |
| /* |
| * mount_resctrlfs - Mount resctrl FS at /sys/fs/resctrl |
| * |
| * Mounts resctrl FS. Fails if resctrl FS is already mounted to avoid |
| * pre-existing settings interfering with the test results. |
| * |
| * Return: 0 on success, non-zero on failure |
| */ |
| int mount_resctrlfs(void) |
| { |
| int ret; |
| |
| ret = find_resctrl_mount(NULL); |
| if (ret != -ENOENT) |
| return -1; |
| |
| ksft_print_msg("Mounting resctrl to \"%s\"\n", RESCTRL_PATH); |
| ret = mount("resctrl", RESCTRL_PATH, "resctrl", 0, NULL); |
| if (ret) |
| perror("# mount"); |
| |
| return ret; |
| } |
| |
/*
 * umount_resctrlfs - Unmount resctrl FS if it is currently mounted
 *
 * Looks up the resctrl mount point and unmounts it. Having nothing mounted
 * is not an error.
 *
 * Return: 0 on success or when resctrl is not mounted, the (negative) error
 * from the mount lookup, or the (positive) errno of the failed umount().
 */
int umount_resctrlfs(void)
{
	char mountpoint[256];
	int saved_errno;
	int ret;

	ret = find_resctrl_mount(mountpoint);
	if (ret == -ENOENT)
		return 0;
	if (ret)
		return ret;

	if (umount(mountpoint)) {
		/* perror() may itself modify errno, so capture it first */
		saved_errno = errno;
		perror("# Unable to umount resctrl");

		return saved_errno;
	}

	return 0;
}
| |
| /* |
| * get_resource_id - Get socket number/l3 id for a specified CPU |
| * @cpu_no: CPU number |
| * @resource_id: Socket number or l3_id |
| * |
| * Return: >= 0 on success, < 0 on failure. |
| */ |
| int get_resource_id(int cpu_no, int *resource_id) |
| { |
| char phys_pkg_path[1024]; |
| FILE *fp; |
| |
| if (get_vendor() == ARCH_AMD) |
| sprintf(phys_pkg_path, "%s%d/cache/index3/id", |
| PHYS_ID_PATH, cpu_no); |
| else |
| sprintf(phys_pkg_path, "%s%d/topology/physical_package_id", |
| PHYS_ID_PATH, cpu_no); |
| |
| fp = fopen(phys_pkg_path, "r"); |
| if (!fp) { |
| perror("Failed to open physical_package_id"); |
| |
| return -1; |
| } |
| if (fscanf(fp, "%d", resource_id) <= 0) { |
| perror("Could not get socket number or l3 id"); |
| fclose(fp); |
| |
| return -1; |
| } |
| fclose(fp); |
| |
| return 0; |
| } |
| |
/*
 * get_cache_size - Get cache size for a specified CPU
 * @cpu_no:	CPU number
 * @cache_type:	Cache level, "L2" or "L3"
 * @cache_size:	Output: cache size in bytes
 *
 * Reads /sys/bus/cpu/devices/cpu<N>/cache/index<level>/size and converts
 * the decimal value with its optional 'K' or 'M' suffix into bytes.
 *
 * Return: = 0 on success, < 0 on failure.
 */
int get_cache_size(int cpu_no, char *cache_type, unsigned long *cache_size)
{
	char cache_path[1024], cache_str[64];
	int length, i, cache_num;
	FILE *fp;

	if (!cache_type || !cache_size)
		return -1;

	if (!strcmp(cache_type, "L3")) {
		cache_num = 3;
	} else if (!strcmp(cache_type, "L2")) {
		cache_num = 2;
	} else {
		/* Not a libc failure: errno is meaningless here, so no perror() */
		fprintf(stderr, "Invalid cache level\n");
		return -1;
	}

	sprintf(cache_path, "/sys/bus/cpu/devices/cpu%d/cache/index%d/size",
		cpu_no, cache_num);
	fp = fopen(cache_path, "r");
	if (!fp) {
		perror("Failed to open cache size");

		return -1;
	}
	/* Field width keeps the read inside cache_str (63 chars + NUL) */
	if (fscanf(fp, "%63s", cache_str) <= 0) {
		perror("Could not get cache_size");
		fclose(fp);

		return -1;
	}
	fclose(fp);

	length = (int)strlen(cache_str);

	*cache_size = 0;

	for (i = 0; i < length; i++) {
		if ((cache_str[i] >= '0') && (cache_str[i] <= '9'))
			*cache_size = *cache_size * 10 + (cache_str[i] - '0');
		else if (cache_str[i] == 'K')
			*cache_size = *cache_size * 1024;
		else if (cache_str[i] == 'M')
			*cache_size = *cache_size * 1024 * 1024;
		else
			break;
	}

	return 0;
}
| |
| #define CORE_SIBLINGS_PATH "/sys/bus/cpu/devices/cpu" |
| |
| /* |
| * get_cbm_mask - Get cbm mask for given cache |
| * @cache_type: Cache level L2/L3 |
| * @cbm_mask: cbm_mask returned as a string |
| * |
| * Return: = 0 on success, < 0 on failure. |
| */ |
| int get_cbm_mask(char *cache_type, char *cbm_mask) |
| { |
| char cbm_mask_path[1024]; |
| FILE *fp; |
| |
| if (!cbm_mask) |
| return -1; |
| |
| sprintf(cbm_mask_path, "%s/%s/cbm_mask", INFO_PATH, cache_type); |
| |
| fp = fopen(cbm_mask_path, "r"); |
| if (!fp) { |
| perror("Failed to open cache level"); |
| |
| return -1; |
| } |
| if (fscanf(fp, "%s", cbm_mask) <= 0) { |
| perror("Could not get max cbm_mask"); |
| fclose(fp); |
| |
| return -1; |
| } |
| fclose(fp); |
| |
| return 0; |
| } |
| |
| /* |
| * get_core_sibling - Get sibling core id from the same socket for given CPU |
| * @cpu_no: CPU number |
| * |
| * Return: > 0 on success, < 0 on failure. |
| */ |
| int get_core_sibling(int cpu_no) |
| { |
| char core_siblings_path[1024], cpu_list_str[64]; |
| int sibling_cpu_no = -1; |
| FILE *fp; |
| |
| sprintf(core_siblings_path, "%s%d/topology/core_siblings_list", |
| CORE_SIBLINGS_PATH, cpu_no); |
| |
| fp = fopen(core_siblings_path, "r"); |
| if (!fp) { |
| perror("Failed to open core siblings path"); |
| |
| return -1; |
| } |
| if (fscanf(fp, "%s", cpu_list_str) <= 0) { |
| perror("Could not get core_siblings list"); |
| fclose(fp); |
| |
| return -1; |
| } |
| fclose(fp); |
| |
| char *token = strtok(cpu_list_str, "-,"); |
| |
| while (token) { |
| sibling_cpu_no = atoi(token); |
| /* Skipping core 0 as we don't want to run test on core 0 */ |
| if (sibling_cpu_no != 0 && sibling_cpu_no != cpu_no) |
| break; |
| token = strtok(NULL, "-,"); |
| } |
| |
| return sibling_cpu_no; |
| } |
| |
/*
 * taskset_benchmark - Pin a PID (i.e. benchmark) to a single CPU
 * @bm_pid:	PID whose affinity is changed
 * @cpu_no:	The only CPU the PID is allowed to run on afterwards
 *
 * Return: 0 on success, non-zero on failure
 */
int taskset_benchmark(pid_t bm_pid, int cpu_no)
{
	cpu_set_t allowed;

	/* Affinity mask containing cpu_no and nothing else */
	CPU_ZERO(&allowed);
	CPU_SET(cpu_no, &allowed);

	if (sched_setaffinity(bm_pid, sizeof(cpu_set_t), &allowed) == 0)
		return 0;

	perror("Unable to taskset benchmark");

	return -1;
}
| |
/*
 * create_grp - Create a group only if one doesn't exist
 * @grp_name:	Name of the group; an empty name means "use the root group"
 * @grp:	Full path and name of the group
 * @parent_grp:	Full path and name of the parent group
 *
 * The parent directory is listed to find out whether an entry called
 * @grp_name is already present; only if it is missing is @grp created.
 *
 * Return: 0 on success, non-zero on failure
 */
static int create_grp(const char *grp_name, char *grp, const char *parent_grp)
{
	struct dirent *entry;
	int exists = 0;
	DIR *parent;

	/*
	 * resctrl FS is expected to be mounted at this point; an empty group
	 * name selects the root con_mon grp, for which nothing has to be made.
	 */
	if (strlen(grp_name) == 0)
		return 0;

	parent = opendir(parent_grp);
	if (parent == NULL) {
		perror("Unable to open resctrl for group");

		return -1;
	}

	/* Look for an existing entry with the requested name */
	while ((entry = readdir(parent)) != NULL) {
		if (strcmp(entry->d_name, grp_name) == 0) {
			exists = 1;
			break;
		}
	}
	closedir(parent);

	if (exists)
		return 0;

	/* Requested grp doesn't exist, hence create it */
	if (mkdir(grp, 0) == -1) {
		perror("Unable to create group");

		return -1;
	}

	return 0;
}
| |
/*
 * write_pid_to_tasks - Write a PID into a tasks file
 * @tasks:	Path of the tasks file
 * @pid:	PID to write, followed by a newline
 *
 * Return: 0 on success, -1 if the file cannot be opened or the write
 * (including the final flush on close) fails.
 */
static int write_pid_to_tasks(char *tasks, pid_t pid)
{
	FILE *fp;

	fp = fopen(tasks, "w");
	if (!fp) {
		perror("Failed to open tasks file");

		return -1;
	}
	if (fprintf(fp, "%d\n", (int)pid) < 0) {
		perror("Failed to wr pid to tasks file");
		fclose(fp);

		return -1;
	}
	/*
	 * stdio only buffers the data above; it reaches the file when the
	 * stream is flushed on close, so a rejected write shows up here.
	 */
	if (fclose(fp) == EOF) {
		perror("Failed to wr pid to tasks file");

		return -1;
	}

	return 0;
}
| |
| /* |
| * write_bm_pid_to_resctrl - Write a PID (i.e. benchmark) to resctrl FS |
| * @bm_pid: PID that should be written |
| * @ctrlgrp: Name of the control monitor group (con_mon grp) |
| * @mongrp: Name of the monitor group (mon grp) |
| * @resctrl_val: Resctrl feature (Eg: mbm, mba.. etc) |
| * |
| * If a con_mon grp is requested, create it and write pid to it, otherwise |
| * write pid to root con_mon grp. |
| * If a mon grp is requested, create it and write pid to it, otherwise |
| * pid is not written, this means that pid is in con_mon grp and hence |
| * should consult con_mon grp's mon_data directory for results. |
| * |
| * Return: 0 on success, non-zero on failure |
| */ |
| int write_bm_pid_to_resctrl(pid_t bm_pid, char *ctrlgrp, char *mongrp, |
| char *resctrl_val) |
| { |
| char controlgroup[128], monitorgroup[512], monitorgroup_p[256]; |
| char tasks[1024]; |
| int ret = 0; |
| |
| if (strlen(ctrlgrp)) |
| sprintf(controlgroup, "%s/%s", RESCTRL_PATH, ctrlgrp); |
| else |
| sprintf(controlgroup, "%s", RESCTRL_PATH); |
| |
| /* Create control and monitoring group and write pid into it */ |
| ret = create_grp(ctrlgrp, controlgroup, RESCTRL_PATH); |
| if (ret) |
| goto out; |
| sprintf(tasks, "%s/tasks", controlgroup); |
| ret = write_pid_to_tasks(tasks, bm_pid); |
| if (ret) |
| goto out; |
| |
| /* Create mon grp and write pid into it for "mbm" and "cmt" test */ |
| if (!strncmp(resctrl_val, CMT_STR, sizeof(CMT_STR)) || |
| !strncmp(resctrl_val, MBM_STR, sizeof(MBM_STR))) { |
| if (strlen(mongrp)) { |
| sprintf(monitorgroup_p, "%s/mon_groups", controlgroup); |
| sprintf(monitorgroup, "%s/%s", monitorgroup_p, mongrp); |
| ret = create_grp(mongrp, monitorgroup, monitorgroup_p); |
| if (ret) |
| goto out; |
| |
| sprintf(tasks, "%s/mon_groups/%s/tasks", |
| controlgroup, mongrp); |
| ret = write_pid_to_tasks(tasks, bm_pid); |
| if (ret) |
| goto out; |
| } |
| } |
| |
| out: |
| ksft_print_msg("Writing benchmark parameters to resctrl FS\n"); |
| if (ret) |
| perror("# writing to resctrlfs"); |
| |
| return ret; |
| } |
| |
| /* |
| * write_schemata - Update schemata of a con_mon grp |
| * @ctrlgrp: Name of the con_mon grp |
| * @schemata: Schemata that should be updated to |
| * @cpu_no: CPU number that the benchmark PID is binded to |
| * @resctrl_val: Resctrl feature (Eg: mbm, mba.. etc) |
| * |
| * Update schemata of a con_mon grp *only* if requested resctrl feature is |
| * allocation type |
| * |
| * Return: 0 on success, non-zero on failure |
| */ |
| int write_schemata(char *ctrlgrp, char *schemata, int cpu_no, char *resctrl_val) |
| { |
| char controlgroup[1024], reason[128], schema[1024] = {}; |
| int resource_id, fd, schema_len = -1, ret = 0; |
| |
| if (strncmp(resctrl_val, MBA_STR, sizeof(MBA_STR)) && |
| strncmp(resctrl_val, MBM_STR, sizeof(MBM_STR)) && |
| strncmp(resctrl_val, CAT_STR, sizeof(CAT_STR)) && |
| strncmp(resctrl_val, CMT_STR, sizeof(CMT_STR))) |
| return -ENOENT; |
| |
| if (!schemata) { |
| ksft_print_msg("Skipping empty schemata update\n"); |
| |
| return -1; |
| } |
| |
| if (get_resource_id(cpu_no, &resource_id) < 0) { |
| sprintf(reason, "Failed to get resource id"); |
| ret = -1; |
| |
| goto out; |
| } |
| |
| if (strlen(ctrlgrp) != 0) |
| sprintf(controlgroup, "%s/%s/schemata", RESCTRL_PATH, ctrlgrp); |
| else |
| sprintf(controlgroup, "%s/schemata", RESCTRL_PATH); |
| |
| if (!strncmp(resctrl_val, CAT_STR, sizeof(CAT_STR)) || |
| !strncmp(resctrl_val, CMT_STR, sizeof(CMT_STR))) |
| schema_len = snprintf(schema, sizeof(schema), "%s%d%c%s\n", |
| "L3:", resource_id, '=', schemata); |
| if (!strncmp(resctrl_val, MBA_STR, sizeof(MBA_STR)) || |
| !strncmp(resctrl_val, MBM_STR, sizeof(MBM_STR))) |
| schema_len = snprintf(schema, sizeof(schema), "%s%d%c%s\n", |
| "MB:", resource_id, '=', schemata); |
| if (schema_len < 0 || schema_len >= sizeof(schema)) { |
| snprintf(reason, sizeof(reason), |
| "snprintf() failed with return value : %d", schema_len); |
| ret = -1; |
| goto out; |
| } |
| |
| fd = open(controlgroup, O_WRONLY); |
| if (fd < 0) { |
| snprintf(reason, sizeof(reason), |
| "open() failed : %s", strerror(errno)); |
| ret = -1; |
| |
| goto err_schema_not_empty; |
| } |
| if (write(fd, schema, schema_len) < 0) { |
| snprintf(reason, sizeof(reason), |
| "write() failed : %s", strerror(errno)); |
| close(fd); |
| ret = -1; |
| |
| goto err_schema_not_empty; |
| } |
| close(fd); |
| |
| err_schema_not_empty: |
| schema[schema_len - 1] = 0; |
| out: |
| ksft_print_msg("Write schema \"%s\" to resctrl FS%s%s\n", |
| schema, ret ? " # " : "", |
| ret ? reason : ""); |
| |
| return ret; |
| } |
| |
| bool check_resctrlfs_support(void) |
| { |
| FILE *inf = fopen("/proc/filesystems", "r"); |
| DIR *dp; |
| char *res; |
| bool ret = false; |
| |
| if (!inf) |
| return false; |
| |
| res = fgrep(inf, "nodev\tresctrl\n"); |
| |
| if (res) { |
| ret = true; |
| free(res); |
| } |
| |
| fclose(inf); |
| |
| ksft_print_msg("%s Check kernel supports resctrl filesystem\n", |
| ret ? "Pass:" : "Fail:"); |
| |
| if (!ret) |
| return ret; |
| |
| dp = opendir(RESCTRL_PATH); |
| ksft_print_msg("%s Check resctrl mountpoint \"%s\" exists\n", |
| dp ? "Pass:" : "Fail:", RESCTRL_PATH); |
| if (dp) |
| closedir(dp); |
| |
| ksft_print_msg("resctrl filesystem %s mounted\n", |
| find_resctrl_mount(NULL) ? "not" : "is"); |
| |
| return ret; |
| } |
| |
/*
 * fgrep - Find the first line of a stream that starts with a given string
 * @inf:	Stream to read from, starting at its current position
 * @str:	Prefix every candidate line is compared against
 *
 * Lines are read in chunks of at most 255 characters; the trailing newline,
 * if any, is part of the line and therefore takes part in the comparison
 * when @str contains one.
 *
 * Return: heap-allocated copy of the matching line, to be released with
 * free(), or NULL if no line matches (or the copy cannot be allocated).
 */
char *fgrep(FILE *inf, const char *str)
{
	char line[256];
	size_t prefix_len = strlen(str);
	size_t copy_len;
	char *copy;

	while (fgets(line, 256, inf) != NULL) {
		if (strncmp(line, str, prefix_len) != 0)
			continue;

		/* Hand back a private copy, terminating NUL included */
		copy_len = strlen(line) + 1;
		copy = malloc(copy_len);
		if (copy != NULL)
			memcpy(copy, line, copy_len);

		return copy;
	}

	return NULL;
}
| |
| /* |
| * validate_resctrl_feature_request - Check if requested feature is valid. |
| * @resource: Required resource (e.g., MB, L3, L2, L3_MON, etc.) |
| * @feature: Required monitor feature (in mon_features file). Can only be |
| * set for L3_MON. Must be NULL for all other resources. |
| * |
| * Return: True if the resource/feature is supported, else false. False is |
| * also returned if resctrl FS is not mounted. |
| */ |
| bool validate_resctrl_feature_request(const char *resource, const char *feature) |
| { |
| char res_path[PATH_MAX]; |
| struct stat statbuf; |
| char *res; |
| FILE *inf; |
| int ret; |
| |
| if (!resource) |
| return false; |
| |
| ret = find_resctrl_mount(NULL); |
| if (ret) |
| return false; |
| |
| snprintf(res_path, sizeof(res_path), "%s/%s", INFO_PATH, resource); |
| |
| if (stat(res_path, &statbuf)) |
| return false; |
| |
| if (!feature) |
| return true; |
| |
| snprintf(res_path, sizeof(res_path), "%s/%s/mon_features", INFO_PATH, resource); |
| inf = fopen(res_path, "r"); |
| if (!inf) |
| return false; |
| |
| res = fgrep(inf, feature); |
| free(res); |
| fclose(inf); |
| |
| return !!res; |
| } |
| |
/*
 * filter_dmesg - Print the resctrl related lines of the kernel log
 *
 * Runs "dmesg" in a child process with its stdout connected to a pipe and
 * forwards every line containing "intel_rdt:" or "resctrl:" through
 * ksft_print_msg(). A line containing both markers is printed twice.
 *
 * Return: 0 on success, non-zero if the pipe, the child process or the
 * stream on top of the pipe cannot be set up.
 */
int filter_dmesg(void)
{
	char line[1024];
	FILE *fp;
	int pipefds[2];
	pid_t pid;
	int ret;

	ret = pipe(pipefds);
	if (ret) {
		perror("pipe");
		return ret;
	}
	/* Keep already buffered output from being duplicated by the child */
	fflush(stdout);
	pid = fork();
	if (pid < 0) {
		/*
		 * Must not fall through: a pid of -1 would make kill() and
		 * waitpid() below act on unrelated processes.
		 */
		perror("fork");
		close(pipefds[0]);
		close(pipefds[1]);

		return -1;
	}
	if (pid == 0) {
		close(pipefds[0]);
		if (dup2(pipefds[1], STDOUT_FILENO) < 0) {
			perror("dup2");
			exit(1);
		}
		execlp("dmesg", "dmesg", NULL);
		perror("executing dmesg");
		exit(1);
	}
	close(pipefds[1]);
	fp = fdopen(pipefds[0], "r");
	if (!fp) {
		perror("fdopen(pipe)");
		/* Release the read end and reap the child to avoid a zombie */
		close(pipefds[0]);
		kill(pid, SIGTERM);
		waitpid(pid, NULL, 0);

		return -1;
	}

	while (fgets(line, sizeof(line), fp)) {
		if (strstr(line, "intel_rdt:"))
			ksft_print_msg("dmesg: %s", line);
		if (strstr(line, "resctrl:"))
			ksft_print_msg("dmesg: %s", line);
	}
	fclose(fp);
	waitpid(pid, NULL, 0);

	return 0;
}
| |
/*
 * validate_bw_report_request - Check the requested bandwidth report type
 * @bw_report:	Report type; must be writable because "nt-writes" is
 *		rewritten in place to "writes"
 *
 * Accepted values are "reads", "writes", "nt-writes" and "total". Anything
 * else is reported on stderr.
 *
 * Return: 0 if the report type is accepted, -1 otherwise
 */
int validate_bw_report_request(char *bw_report)
{
	static const char * const accepted[] = { "reads", "writes", "total" };
	size_t i;

	/* "nt-writes" is an alias that is normalized to "writes" */
	if (!strcmp(bw_report, "nt-writes")) {
		strcpy(bw_report, "writes");
		return 0;
	}

	for (i = 0; i < sizeof(accepted) / sizeof(accepted[0]); i++) {
		if (!strcmp(bw_report, accepted[i]))
			return 0;
	}

	fprintf(stderr, "Requested iMC B/W report type unavailable\n");

	return -1;
}
| |
/*
 * perf_event_open - Invoke the perf_event_open system call
 * @hw_event:	Event attributes
 * @pid:	PID argument of the system call
 * @cpu:	CPU argument of the system call
 * @group_fd:	Group file descriptor argument of the system call
 * @flags:	Flags argument of the system call
 *
 * All arguments are handed to the system call unchanged.
 *
 * Return: the value returned by syscall(), converted to int
 */
int perf_event_open(struct perf_event_attr *hw_event, pid_t pid, int cpu,
		    int group_fd, unsigned long flags)
{
	return syscall(__NR_perf_event_open, hw_event, pid, cpu,
		       group_fd, flags);
}
| |
/*
 * count_bits - Count the bits that are set in a value
 * @n:	Value to inspect
 *
 * Return: number of 1 bits in @n
 */
unsigned int count_bits(unsigned long n)
{
	unsigned int set_bits = 0;

	/* n & (n - 1) clears the lowest set bit: one iteration per 1 bit */
	for (; n != 0; n &= n - 1)
		set_bits++;

	return set_bits;
}