/* * This file and its contents are supplied under the terms of the * Common Development and Distribution License ("CDDL"), version 1.0. * You may only use this file in accordance with the terms of version * 1.0 of the CDDL. * * A full copy of the text of the CDDL should have accompanied this * source. A copy of the CDDL is also available via the Internet at * http://www.illumos.org/license/CDDL. */ /* * Copyright 2017 Joyent, Inc. * Copyright 2021 Oxide Computer Company * Copyright 2022 Tintri by DDN, Inc. All rights reserved. */ /* * nvmeadm -- NVMe administration utility * * nvmeadm [-v] [-d] [-h] [[/][,...]] [args] * commands: list * identify * get-logpage * get-features [,...] * format ... * secure-erase ... * detach ... * attach ... * list-firmware ... * load-firmware ... * commit-firmware ... * activate-firmware ... */ #include #include #include #include #include #include #include #include #include #include #include "nvmeadm.h" struct nvme_feature { char *f_name; char *f_short; uint8_t f_feature; size_t f_bufsize; uint_t f_getflags; int (*f_get)(int, const nvme_feature_t *, const nvme_process_arg_t *); void (*f_print)(uint64_t, void *, size_t, nvme_identify_ctrl_t *, nvme_version_t *); }; #define NVMEADM_CTRL 1 #define NVMEADM_NS 2 #define NVMEADM_BOTH (NVMEADM_CTRL | NVMEADM_NS) struct nvmeadm_cmd { char *c_name; const char *c_desc; const char *c_flagdesc; int (*c_func)(int, const nvme_process_arg_t *); void (*c_usage)(const char *); boolean_t c_multi; void (*c_optparse)(nvme_process_arg_t *); }; static void usage(const nvmeadm_cmd_t *); static void nvme_walk(nvme_process_arg_t *, di_node_t); static boolean_t nvme_match(nvme_process_arg_t *); static int nvme_process(di_node_t, di_minor_t, void *); static int do_list(int, const nvme_process_arg_t *); static int do_identify(int, const nvme_process_arg_t *); static int do_get_logpage_error(int, const nvme_process_arg_t *); static int do_get_logpage_health(int, const nvme_process_arg_t *); static int do_get_logpage_fwslot(int, const nvme_process_arg_t *); static int do_get_logpage(int, const nvme_process_arg_t *); static int do_get_feat_common(int, const nvme_feature_t *, const nvme_process_arg_t *); static int do_get_feat_intr_vect(int, const nvme_feature_t *, const nvme_process_arg_t *); static int do_get_feat_temp_thresh(int, const nvme_feature_t *, const nvme_process_arg_t *); static int do_get_features(int, const nvme_process_arg_t *); static int do_format(int, const nvme_process_arg_t *); static int do_secure_erase(int, const nvme_process_arg_t *); static int do_attach_detach(int, const nvme_process_arg_t *); static int do_firmware_load(int, const nvme_process_arg_t *); static int do_firmware_commit(int, const nvme_process_arg_t *); static int do_firmware_activate(int, const nvme_process_arg_t *); static void optparse_list(nvme_process_arg_t *); static void usage_list(const char *); static void usage_identify(const char *); static void usage_get_logpage(const char *); static void usage_get_features(const char *); static void usage_format(const char *); static void usage_secure_erase(const char *); static void usage_attach_detach(const char *); static void usage_firmware_list(const char *); static void usage_firmware_load(const char *); static void usage_firmware_commit(const char *); static void usage_firmware_activate(const char *); int verbose; int debug; static int exitcode; static const nvmeadm_cmd_t nvmeadm_cmds[] = { { "list", "list controllers and namespaces", " -p\t\tprint parsable output\n" " -o field\tselect a field for parsable output\n", do_list, usage_list, B_TRUE, optparse_list }, { "identify", "identify controllers and/or namespaces", NULL, do_identify, usage_identify, B_TRUE }, { "get-logpage", "get a log page from controllers and/or namespaces", NULL, do_get_logpage, usage_get_logpage, B_TRUE }, { "get-features", "get features from controllers and/or namespaces", NULL, do_get_features, usage_get_features, B_TRUE }, { "format", "format namespace(s) of a controller", NULL, do_format, usage_format, B_FALSE }, { "secure-erase", "secure erase namespace(s) of a controller", " -c Do a cryptographic erase.", do_secure_erase, usage_secure_erase, B_FALSE }, { "detach", "detach blkdev(7d) from namespace(s) of a controller", NULL, do_attach_detach, usage_attach_detach, B_FALSE }, { "attach", "attach blkdev(7d) to namespace(s) of a controller", NULL, do_attach_detach, usage_attach_detach, B_FALSE }, { "list-firmware", "list firmware on a controller", NULL, do_get_logpage_fwslot, usage_firmware_list, B_FALSE }, { "load-firmware", "load firmware to a controller", NULL, do_firmware_load, usage_firmware_load, B_FALSE }, { "commit-firmware", "commit downloaded firmware to a slot of a controller", NULL, do_firmware_commit, usage_firmware_commit, B_FALSE }, { "activate-firmware", "activate a firmware slot of a controller", NULL, do_firmware_activate, usage_firmware_activate, B_FALSE }, { NULL, NULL, NULL, NULL, NULL, B_FALSE } }; static const nvme_feature_t features[] = { { "Arbitration", "", NVME_FEAT_ARBITRATION, 0, NVMEADM_CTRL, do_get_feat_common, nvme_print_feat_arbitration }, { "Power Management", "", NVME_FEAT_POWER_MGMT, 0, NVMEADM_CTRL, do_get_feat_common, nvme_print_feat_power_mgmt }, { "LBA Range Type", "range", NVME_FEAT_LBA_RANGE, NVME_LBA_RANGE_BUFSIZE, NVMEADM_NS, do_get_feat_common, nvme_print_feat_lba_range }, { "Temperature Threshold", "", NVME_FEAT_TEMPERATURE, 0, NVMEADM_CTRL, do_get_feat_temp_thresh, nvme_print_feat_temperature }, { "Error Recovery", "", NVME_FEAT_ERROR, 0, NVMEADM_CTRL, do_get_feat_common, nvme_print_feat_error }, { "Volatile Write Cache", "cache", NVME_FEAT_WRITE_CACHE, 0, NVMEADM_CTRL, do_get_feat_common, nvme_print_feat_write_cache }, { "Number of Queues", "queues", NVME_FEAT_NQUEUES, 0, NVMEADM_CTRL, do_get_feat_common, nvme_print_feat_nqueues }, { "Interrupt Coalescing", "coalescing", NVME_FEAT_INTR_COAL, 0, NVMEADM_CTRL, do_get_feat_common, nvme_print_feat_intr_coal }, { "Interrupt Vector Configuration", "vector", NVME_FEAT_INTR_VECT, 0, NVMEADM_CTRL, do_get_feat_intr_vect, nvme_print_feat_intr_vect }, { "Write Atomicity", "atomicity", NVME_FEAT_WRITE_ATOM, 0, NVMEADM_CTRL, do_get_feat_common, nvme_print_feat_write_atom }, { "Asynchronous Event Configuration", "event", NVME_FEAT_ASYNC_EVENT, 0, NVMEADM_CTRL, do_get_feat_common, nvme_print_feat_async_event }, { "Autonomous Power State Transition", "", NVME_FEAT_AUTO_PST, NVME_AUTO_PST_BUFSIZE, NVMEADM_CTRL, do_get_feat_common, nvme_print_feat_auto_pst }, { "Software Progress Marker", "progress", NVME_FEAT_PROGRESS, 0, NVMEADM_CTRL, do_get_feat_common, nvme_print_feat_progress }, { NULL, NULL, 0, 0, B_FALSE, NULL } }; int main(int argc, char **argv) { int c; const nvmeadm_cmd_t *cmd; di_node_t node; nvme_process_arg_t npa = { 0 }; int help = 0; char *tmp, *lasts = NULL; char *ctrl = NULL; while ((c = getopt(argc, argv, "dhv")) != -1) { switch (c) { case 'd': debug++; break; case 'v': verbose++; break; case 'h': help++; break; case '?': usage(NULL); exit(-1); } } if (optind == argc) { usage(NULL); if (help) exit(0); else exit(-1); } /* Look up the specified command in the command table. */ for (cmd = &nvmeadm_cmds[0]; cmd->c_name != NULL; cmd++) if (strcmp(cmd->c_name, argv[optind]) == 0) break; if (cmd->c_name == NULL) { usage(NULL); exit(-1); } if (help) { usage(cmd); exit(0); } npa.npa_cmd = cmd; optind++; /* * Store the remaining arguments for use by the command. Give the * command a chance to process the options across the board before going * into each controller. */ npa.npa_argc = argc - optind; npa.npa_argv = &argv[optind]; if (cmd->c_optparse != NULL) { cmd->c_optparse(&npa); } /* * All commands but "list" require a ctl/ns argument. However, this * should not be passed through to the command in its subsequent * arguments. */ if ((npa.npa_argc == 0 || (strncmp(npa.npa_argv[0], "nvme", 4) != 0)) && cmd->c_func != do_list) { warnx("missing controller/namespace name"); usage(cmd); exit(-1); } if (npa.npa_argc > 0) { ctrl = npa.npa_argv[0]; npa.npa_argv++; npa.npa_argc--; } else { ctrl = NULL; } /* * Make sure we're not running commands on multiple controllers that * aren't allowed to do that. */ if (ctrl != NULL && strchr(ctrl, ',') != NULL && cmd->c_multi == B_FALSE) { warnx("%s not allowed on multiple controllers", cmd->c_name); usage(cmd); exit(-1); } /* * Get controller/namespace arguments and run command. */ npa.npa_name = strtok_r(ctrl, ",", &lasts); do { if (npa.npa_name != NULL) { tmp = strchr(npa.npa_name, '/'); if (tmp != NULL) { *tmp++ = '\0'; npa.npa_nsid = tmp; npa.npa_isns = B_TRUE; } } if ((node = di_init("/", DINFOSUBTREE | DINFOMINOR)) == NULL) err(-1, "failed to initialize libdevinfo"); nvme_walk(&npa, node); di_fini(node); if (npa.npa_found == 0) { if (npa.npa_name != NULL) { warnx("%s%.*s%.*s: no such controller or " "namespace", npa.npa_name, npa.npa_isns ? -1 : 0, "/", npa.npa_isns ? -1 : 0, npa.npa_nsid); } else { warnx("no controllers found"); } exitcode--; } npa.npa_found = 0; npa.npa_name = strtok_r(NULL, ",", &lasts); } while (npa.npa_name != NULL); exit(exitcode); } static void nvme_oferr(const char *fmt, ...) { va_list ap; va_start(ap, fmt); verrx(-1, fmt, ap); } static void usage(const nvmeadm_cmd_t *cmd) { (void) fprintf(stderr, "usage:\n"); (void) fprintf(stderr, " %s -h %s\n", getprogname(), cmd != NULL ? cmd->c_name : "[]"); (void) fprintf(stderr, " %s [-dv] ", getprogname()); if (cmd != NULL) { cmd->c_usage(cmd->c_name); } else { (void) fprintf(stderr, " [/][,...] []\n"); (void) fprintf(stderr, "\n Manage NVMe controllers and namespaces.\n"); (void) fprintf(stderr, "\ncommands:\n"); for (cmd = &nvmeadm_cmds[0]; cmd->c_name != NULL; cmd++) (void) fprintf(stderr, " %-18s - %s\n", cmd->c_name, cmd->c_desc); } (void) fprintf(stderr, "\nflags:\n" " -h\t\tprint usage information\n" " -d\t\tprint information useful for debugging %s\n" " -v\t\tprint verbose information\n", getprogname()); if (cmd != NULL && cmd->c_flagdesc != NULL) (void) fprintf(stderr, "%s\n", cmd->c_flagdesc); } static boolean_t nvme_match(nvme_process_arg_t *npa) { char *name; char *nsid = NULL; if (npa->npa_name == NULL) return (B_TRUE); if (asprintf(&name, "%s%d", di_driver_name(npa->npa_node), di_instance(npa->npa_node)) < 0) err(-1, "nvme_match()"); if (strcmp(name, npa->npa_name) != 0) { free(name); return (B_FALSE); } free(name); if (npa->npa_isns) { if (npa->npa_nsid == NULL) return (B_TRUE); nsid = di_minor_name(npa->npa_minor); if (nsid == NULL || strcmp(npa->npa_nsid, nsid) != 0) return (B_FALSE); } return (B_TRUE); } char * nvme_dskname(const nvme_process_arg_t *npa) { char *path = NULL; di_node_t child; di_dim_t dim; char *addr; dim = di_dim_init(); for (child = di_child_node(npa->npa_node); child != DI_NODE_NIL; child = di_sibling_node(child)) { addr = di_bus_addr(child); if (addr == NULL) continue; if (addr[0] == 'w') addr++; if (strncasecmp(addr, di_minor_name(npa->npa_minor), strchrnul(addr, ',') - addr) != 0) continue; path = di_dim_path_dev(dim, di_driver_name(child), di_instance(child), "c"); /* * Error out if we didn't get a path, or if it's too short for * the following operations to be safe. */ if (path == NULL || strlen(path) < 2) goto fail; /* Chop off 's0' and get everything past the last '/' */ path[strlen(path) - 2] = '\0'; path = strrchr(path, '/'); if (path == NULL) goto fail; path++; break; } di_dim_fini(dim); return (path); fail: err(-1, "nvme_dskname"); } static int nvme_process(di_node_t node, di_minor_t minor, void *arg) { nvme_process_arg_t *npa = arg; int fd; npa->npa_node = node; npa->npa_minor = minor; if (!nvme_match(npa)) return (DI_WALK_CONTINUE); if ((fd = nvme_open(minor)) < 0) return (DI_WALK_CONTINUE); npa->npa_found++; npa->npa_path = di_devfs_path(node); if (npa->npa_path == NULL) goto out; npa->npa_version = nvme_version(fd); if (npa->npa_version == NULL) goto out; npa->npa_idctl = nvme_identify_ctrl(fd); if (npa->npa_idctl == NULL) goto out; npa->npa_idns = nvme_identify_nsid(fd); if (npa->npa_idns == NULL) goto out; if (npa->npa_isns) npa->npa_dsk = nvme_dskname(npa); exitcode += npa->npa_cmd->c_func(fd, npa); out: di_devfs_path_free(npa->npa_path); free(npa->npa_dsk); free(npa->npa_version); free(npa->npa_idctl); free(npa->npa_idns); npa->npa_version = NULL; npa->npa_idctl = NULL; npa->npa_idns = NULL; nvme_close(fd); return (DI_WALK_CONTINUE); } static void nvme_walk(nvme_process_arg_t *npa, di_node_t node) { char *minor_nodetype = DDI_NT_NVME_NEXUS; if (npa->npa_isns) minor_nodetype = DDI_NT_NVME_ATTACHMENT_POINT; (void) di_walk_minor(node, minor_nodetype, 0, npa, nvme_process); } static void usage_list(const char *c_name) { (void) fprintf(stderr, "%s " "[-p -o field[,...]] [[/][,...]\n\n" " List NVMe controllers and their namespaces. If no " "controllers and/or name-\n spaces are specified, all " "controllers and namespaces in the system will be\n " "listed.\n", c_name); } static void optparse_list(nvme_process_arg_t *npa) { int c; uint_t oflags = 0; boolean_t parse = B_FALSE; const char *fields = NULL; optind = 0; while ((c = getopt(npa->npa_argc, npa->npa_argv, ":o:p")) != -1) { switch (c) { case 'o': fields = optarg; break; case 'p': parse = B_TRUE; oflags |= OFMT_PARSABLE; break; case '?': errx(-1, "unknown list option: -%c", optopt); break; case ':': errx(-1, "option -%c requires an argument", optopt); default: break; } } if (fields != NULL && !parse) { errx(-1, "-o can only be used when in parsable mode (-p)"); } if (parse && fields == NULL) { errx(-1, "parsable mode (-p) requires one to specify output " "fields with -o"); } if (parse) { ofmt_status_t oferr; oferr = ofmt_open(fields, nvme_list_ofmt, oflags, 0, &npa->npa_ofmt); ofmt_check(oferr, B_TRUE, npa->npa_ofmt, nvme_oferr, warnx); } npa->npa_argc -= optind; npa->npa_argv += optind; } static int do_list_nsid(int fd, const nvme_process_arg_t *npa) { _NOTE(ARGUNUSED(fd)); const uint_t format = npa->npa_idns->id_flbas.lba_format; const uint_t bshift = npa->npa_idns->id_lbaf[format].lbaf_lbads; /* * Some devices have extra namespaces with illegal block sizes and * zero blocks. Don't list them when verbose operation isn't requested. */ if ((bshift < 9 || npa->npa_idns->id_nsize == 0) && verbose == 0) return (0); if (npa->npa_ofmt == NULL) { (void) printf(" %s/%s (%s): ", npa->npa_name, di_minor_name(npa->npa_minor), npa->npa_dsk != NULL ? npa->npa_dsk : "unattached"); nvme_print_nsid_summary(npa->npa_idns); } else { ofmt_print(npa->npa_ofmt, (void *)npa); } return (0); } static int do_list(int fd, const nvme_process_arg_t *npa) { _NOTE(ARGUNUSED(fd)); nvme_process_arg_t ns_npa = { 0 }; nvmeadm_cmd_t cmd = { 0 }; char *name; if (asprintf(&name, "%s%d", di_driver_name(npa->npa_node), di_instance(npa->npa_node)) < 0) err(-1, "do_list()"); if (npa->npa_ofmt == NULL) { (void) printf("%s: ", name); nvme_print_ctrl_summary(npa->npa_idctl, npa->npa_version); } ns_npa.npa_name = name; ns_npa.npa_isns = B_TRUE; ns_npa.npa_nsid = npa->npa_nsid; cmd = *(npa->npa_cmd); cmd.c_func = do_list_nsid; ns_npa.npa_cmd = &cmd; ns_npa.npa_ofmt = npa->npa_ofmt; ns_npa.npa_idctl = npa->npa_idctl; nvme_walk(&ns_npa, npa->npa_node); free(name); return (exitcode); } static void usage_identify(const char *c_name) { (void) fprintf(stderr, "%s [/][,...]\n\n" " Print detailed information about the specified NVMe " "controllers and/or name-\n spaces.\n", c_name); } static int do_identify(int fd, const nvme_process_arg_t *npa) { if (!npa->npa_isns) { nvme_capabilities_t *cap; cap = nvme_capabilities(fd); if (cap == NULL) return (-1); (void) printf("%s: ", npa->npa_name); nvme_print_identify_ctrl(npa->npa_idctl, cap, npa->npa_version); free(cap); } else { (void) printf("%s/%s: ", npa->npa_name, di_minor_name(npa->npa_minor)); nvme_print_identify_nsid(npa->npa_idns, npa->npa_version); } return (0); } static void usage_get_logpage(const char *c_name) { (void) fprintf(stderr, "%s [/][,...] \n\n" " Print the specified log page of the specified NVMe " "controllers and/or name-\n spaces. Supported log pages " "are error, health, and firmware.\n", c_name); } static void usage_firmware_list(const char *c_name) { (void) fprintf(stderr, "%s \n\n" " Print the log page that contains the list of firmware " "images installed on the specified NVMe controller.\n", c_name); } static int do_get_logpage_error(int fd, const nvme_process_arg_t *npa) { int nlog = npa->npa_idctl->id_elpe + 1; size_t bufsize = sizeof (nvme_error_log_entry_t) * nlog; nvme_error_log_entry_t *elog; if (npa->npa_isns) errx(-1, "Error Log not available on a per-namespace basis"); elog = nvme_get_logpage(fd, NVME_LOGPAGE_ERROR, &bufsize); if (elog == NULL) return (-1); nlog = bufsize / sizeof (nvme_error_log_entry_t); (void) printf("%s: ", npa->npa_name); nvme_print_error_log(nlog, elog, npa->npa_version); free(elog); return (0); } static int do_get_logpage_health(int fd, const nvme_process_arg_t *npa) { size_t bufsize = sizeof (nvme_health_log_t); nvme_health_log_t *hlog; if (npa->npa_isns) { if (npa->npa_idctl->id_lpa.lp_smart == 0) errx(-1, "SMART/Health information not available " "on a per-namespace basis on this controller"); } hlog = nvme_get_logpage(fd, NVME_LOGPAGE_HEALTH, &bufsize); if (hlog == NULL) return (-1); (void) printf("%s: ", npa->npa_name); nvme_print_health_log(hlog, npa->npa_idctl, npa->npa_version); free(hlog); return (0); } static int do_get_logpage_fwslot(int fd, const nvme_process_arg_t *npa) { size_t bufsize = sizeof (nvme_fwslot_log_t); nvme_fwslot_log_t *fwlog; if (npa->npa_isns) errx(-1, "Firmware Slot information not available on a " "per-namespace basis"); fwlog = nvme_get_logpage(fd, NVME_LOGPAGE_FWSLOT, &bufsize); if (fwlog == NULL) return (-1); (void) printf("%s: ", npa->npa_name); nvme_print_fwslot_log(fwlog, npa->npa_idctl); free(fwlog); return (0); } static int do_get_logpage(int fd, const nvme_process_arg_t *npa) { int ret = 0; int (*func)(int, const nvme_process_arg_t *); if (npa->npa_argc < 1) { warnx("missing logpage name"); usage(npa->npa_cmd); exit(-1); } if (strcmp(npa->npa_argv[0], "error") == 0) func = do_get_logpage_error; else if (strcmp(npa->npa_argv[0], "health") == 0) func = do_get_logpage_health; else if (strcmp(npa->npa_argv[0], "firmware") == 0) func = do_get_logpage_fwslot; else errx(-1, "invalid log page: %s", npa->npa_argv[0]); ret = func(fd, npa); return (ret); } static void usage_get_features(const char *c_name) { const nvme_feature_t *feat; (void) fprintf(stderr, "%s [/][,...] [[,...]]\n\n" " Print the specified features of the specified NVMe controllers " "and/or\n namespaces. Supported features are:\n\n", c_name); (void) fprintf(stderr, " %-35s %-14s %s\n", "FEATURE NAME", "SHORT NAME", "CONTROLLER/NAMESPACE"); for (feat = &features[0]; feat->f_feature != 0; feat++) { char *type; if ((feat->f_getflags & NVMEADM_BOTH) == NVMEADM_BOTH) type = "both"; else if ((feat->f_getflags & NVMEADM_CTRL) != 0) type = "controller only"; else type = "namespace only"; (void) fprintf(stderr, " %-35s %-14s %s\n", feat->f_name, feat->f_short, type); } } static int do_get_feat_common(int fd, const nvme_feature_t *feat, const nvme_process_arg_t *npa) { void *buf = NULL; size_t bufsize = feat->f_bufsize; uint64_t res; if (nvme_get_feature(fd, feat->f_feature, 0, &res, &bufsize, &buf) == B_FALSE) return (EINVAL); nvme_print(2, feat->f_name, -1, NULL); feat->f_print(res, buf, bufsize, npa->npa_idctl, npa->npa_version); free(buf); return (0); } static int do_get_feat_temp_thresh_one(int fd, const nvme_feature_t *feat, const char *label, uint16_t tmpsel, uint16_t thsel, const nvme_process_arg_t *npa) { uint64_t res; void *buf = NULL; size_t bufsize = feat->f_bufsize; nvme_temp_threshold_t tt; tt.r = 0; tt.b.tt_tmpsel = tmpsel; tt.b.tt_thsel = thsel; if (!nvme_get_feature(fd, feat->f_feature, tt.r, &res, &bufsize, &buf)) { return (EINVAL); } feat->f_print(res, (void *)label, 0, npa->npa_idctl, npa->npa_version); free(buf); return (0); } /* * In NVMe 1.2, the specification allowed for up to 8 sensors to be on the * device and changed the main device to have a composite temperature sensor. As * a result, there is a set of thresholds for each sensor. In addition, they * added both an over-temperature and under-temperature threshold. Since most * devices don't actually implement all the sensors, we get the health page and * see which sensors have a non-zero value to determine how to proceed. */ static int do_get_feat_temp_thresh(int fd, const nvme_feature_t *feat, const nvme_process_arg_t *npa) { int ret; size_t bufsize = sizeof (nvme_health_log_t); nvme_health_log_t *hlog; nvme_print(2, feat->f_name, -1, NULL); if ((ret = do_get_feat_temp_thresh_one(fd, feat, "Composite Over Temp. Threshold", 0, NVME_TEMP_THRESH_OVER, npa)) != 0) { return (ret); } if (!nvme_version_check(npa->npa_version, 1, 2)) { return (0); } if ((ret = do_get_feat_temp_thresh_one(fd, feat, "Composite Under Temp. Threshold", 0, NVME_TEMP_THRESH_UNDER, npa)) != 0) { return (ret); } hlog = nvme_get_logpage(fd, NVME_LOGPAGE_HEALTH, &bufsize); if (hlog == NULL) { warnx("failed to get health log page, unable to get " "thresholds for additional sensors"); return (0); } if (hlog->hl_temp_sensor_1 != 0) { (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 1 Over Temp. Threshold", 1, NVME_TEMP_THRESH_OVER, npa); (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 1 Under Temp. Threshold", 1, NVME_TEMP_THRESH_UNDER, npa); } if (hlog->hl_temp_sensor_2 != 0) { (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 2 Over Temp. Threshold", 2, NVME_TEMP_THRESH_OVER, npa); (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 2 Under Temp. Threshold", 2, NVME_TEMP_THRESH_UNDER, npa); } if (hlog->hl_temp_sensor_3 != 0) { (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 3 Over Temp. Threshold", 3, NVME_TEMP_THRESH_OVER, npa); (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 3 Under Temp. Threshold", 3, NVME_TEMP_THRESH_UNDER, npa); } if (hlog->hl_temp_sensor_4 != 0) { (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 4 Over Temp. Threshold", 4, NVME_TEMP_THRESH_OVER, npa); (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 4 Under Temp. Threshold", 4, NVME_TEMP_THRESH_UNDER, npa); } if (hlog->hl_temp_sensor_5 != 0) { (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 5 Over Temp. Threshold", 5, NVME_TEMP_THRESH_OVER, npa); (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 5 Under Temp. Threshold", 5, NVME_TEMP_THRESH_UNDER, npa); } if (hlog->hl_temp_sensor_6 != 0) { (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 6 Over Temp. Threshold", 6, NVME_TEMP_THRESH_OVER, npa); (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 6 Under Temp. Threshold", 6, NVME_TEMP_THRESH_UNDER, npa); } if (hlog->hl_temp_sensor_7 != 0) { (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 7 Over Temp. Threshold", 7, NVME_TEMP_THRESH_OVER, npa); (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 7 Under Temp. Threshold", 7, NVME_TEMP_THRESH_UNDER, npa); } if (hlog->hl_temp_sensor_8 != 0) { (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 8 Over Temp. Threshold", 8, NVME_TEMP_THRESH_OVER, npa); (void) do_get_feat_temp_thresh_one(fd, feat, "Temp. Sensor 8 Under Temp. Threshold", 8, NVME_TEMP_THRESH_UNDER, npa); } free(hlog); return (0); } static int do_get_feat_intr_vect(int fd, const nvme_feature_t *feat, const nvme_process_arg_t *npa) { uint64_t res; uint64_t arg; int intr_cnt; intr_cnt = nvme_intr_cnt(fd); if (intr_cnt == -1) return (EINVAL); nvme_print(2, feat->f_name, -1, NULL); for (arg = 0; arg < intr_cnt; arg++) { if (nvme_get_feature(fd, feat->f_feature, arg, &res, NULL, NULL) == B_FALSE) return (EINVAL); feat->f_print(res, NULL, 0, npa->npa_idctl, npa->npa_version); } return (0); } static int do_get_features(int fd, const nvme_process_arg_t *npa) { const nvme_feature_t *feat; char *f, *flist, *lasts; boolean_t header_printed = B_FALSE; if (npa->npa_argc > 1) errx(-1, "unexpected arguments"); /* * No feature list given, print all supported features. */ if (npa->npa_argc == 0) { (void) printf("%s: Get Features\n", npa->npa_name); for (feat = &features[0]; feat->f_feature != 0; feat++) { if ((npa->npa_isns && (feat->f_getflags & NVMEADM_NS) == 0) || (!npa->npa_isns && (feat->f_getflags & NVMEADM_CTRL) == 0)) continue; (void) feat->f_get(fd, feat, npa); } return (0); } /* * Process feature list. */ flist = strdup(npa->npa_argv[0]); if (flist == NULL) err(-1, "do_get_features"); for (f = strtok_r(flist, ",", &lasts); f != NULL; f = strtok_r(NULL, ",", &lasts)) { while (isspace(*f)) f++; for (feat = &features[0]; feat->f_feature != 0; feat++) { if (strncasecmp(feat->f_name, f, strlen(f)) == 0 || strncasecmp(feat->f_short, f, strlen(f)) == 0) break; } if (feat->f_feature == 0) { warnx("unknown feature %s", f); continue; } if ((npa->npa_isns && (feat->f_getflags & NVMEADM_NS) == 0) || (!npa->npa_isns && (feat->f_getflags & NVMEADM_CTRL) == 0)) { warnx("feature %s %s supported for namespaces", feat->f_name, (feat->f_getflags & NVMEADM_NS) != 0 ? "only" : "not"); continue; } if (!header_printed) { (void) printf("%s: Get Features\n", npa->npa_name); header_printed = B_TRUE; } if (feat->f_get(fd, feat, npa) != 0) { warnx("unsupported feature: %s", feat->f_name); continue; } } free(flist); return (0); } static int do_format_common(int fd, const nvme_process_arg_t *npa, unsigned long lbaf, unsigned long ses) { nvme_process_arg_t ns_npa = { 0 }; nvmeadm_cmd_t cmd = { 0 }; cmd = *(npa->npa_cmd); cmd.c_func = do_attach_detach; cmd.c_name = "detach"; ns_npa = *npa; ns_npa.npa_cmd = &cmd; if (do_attach_detach(fd, &ns_npa) != 0) return (exitcode); if (nvme_format_nvm(fd, lbaf, ses) == B_FALSE) { warn("%s failed", npa->npa_cmd->c_name); exitcode += -1; } cmd.c_name = "attach"; exitcode += do_attach_detach(fd, &ns_npa); return (exitcode); } static void usage_format(const char *c_name) { (void) fprintf(stderr, "%s [/] []\n\n" " Format one or all namespaces of the specified NVMe " "controller. Supported LBA\n formats can be queried with " "the \"%s identify\" command on the namespace\n to be " "formatted.\n", c_name, getprogname()); } static int do_format(int fd, const nvme_process_arg_t *npa) { unsigned long lbaf; if (npa->npa_idctl->id_oacs.oa_format == 0) errx(-1, "%s not supported", npa->npa_cmd->c_name); if (npa->npa_isns && npa->npa_idctl->id_fna.fn_format != 0) errx(-1, "%s not supported on individual namespace", npa->npa_cmd->c_name); if (npa->npa_argc > 0) { errno = 0; lbaf = strtoul(npa->npa_argv[0], NULL, 10); if (errno != 0 || lbaf > NVME_FRMT_MAX_LBAF) errx(-1, "invalid LBA format %d", lbaf + 1); if (npa->npa_idns->id_lbaf[lbaf].lbaf_ms != 0) errx(-1, "LBA formats with metadata not supported"); } else { lbaf = npa->npa_idns->id_flbas.lba_format; } return (do_format_common(fd, npa, lbaf, 0)); } static void usage_secure_erase(const char *c_name) { (void) fprintf(stderr, "%s [/] [-c]\n\n" " Secure-Erase one or all namespaces of the specified " "NVMe controller.\n", c_name); } static int do_secure_erase(int fd, const nvme_process_arg_t *npa) { unsigned long lbaf; uint8_t ses = NVME_FRMT_SES_USER; if (npa->npa_idctl->id_oacs.oa_format == 0) errx(-1, "%s not supported", npa->npa_cmd->c_name); if (npa->npa_isns && npa->npa_idctl->id_fna.fn_sec_erase != 0) errx(-1, "%s not supported on individual namespace", npa->npa_cmd->c_name); if (npa->npa_argc > 0) { if (strcmp(npa->npa_argv[0], "-c") == 0) ses = NVME_FRMT_SES_CRYPTO; else usage(npa->npa_cmd); } if (ses == NVME_FRMT_SES_CRYPTO && npa->npa_idctl->id_fna.fn_crypt_erase == 0) errx(-1, "cryptographic %s not supported", npa->npa_cmd->c_name); lbaf = npa->npa_idns->id_flbas.lba_format; return (do_format_common(fd, npa, lbaf, ses)); } static void usage_attach_detach(const char *c_name) { (void) fprintf(stderr, "%s [/]\n\n" " %c%s blkdev(7d) %s one or all namespaces of the " "specified NVMe controller.\n", c_name, toupper(c_name[0]), &c_name[1], c_name[0] == 'd' ? "from" : "to"); } static int do_attach_detach(int fd, const nvme_process_arg_t *npa) { char *c_name = npa->npa_cmd->c_name; if (!npa->npa_isns) { nvme_process_arg_t ns_npa = { 0 }; ns_npa.npa_name = npa->npa_name; ns_npa.npa_isns = B_TRUE; ns_npa.npa_cmd = npa->npa_cmd; nvme_walk(&ns_npa, npa->npa_node); return (exitcode); } else { if ((c_name[0] == 'd' ? nvme_detach : nvme_attach)(fd) == B_FALSE) { warn("%s failed", c_name); return (-1); } } return (0); } static void usage_firmware_load(const char *c_name) { (void) fprintf(stderr, "%s []\n\n" " Load firmware to offset .\n" " The firmware needs to be committed to a slot using " "\"nvmeadm commit-firmware\"\n command.\n", c_name); } /* * Read exactly len bytes, or until eof. */ static ssize_t read_block(int fd, char *buf, size_t len) { size_t remain; ssize_t bytes; remain = len; while (remain > 0) { bytes = read(fd, buf, remain); if (bytes == 0) break; if (bytes < 0) { if (errno == EINTR) continue; return (-1); } buf += bytes; remain -= bytes; } return (len - remain); } /* * Convert a string to a valid firmware upload offset (in bytes). */ static offset_t get_fw_offsetb(char *str) { longlong_t offsetb; char *valend; errno = 0; offsetb = strtoll(str, &valend, 0); if (errno != 0 || *valend != '\0' || offsetb < 0 || offsetb > NVME_FW_OFFSETB_MAX) errx(-1, "Offset must be numeric and in the range of 0 to %llu", NVME_FW_OFFSETB_MAX); if ((offsetb & NVME_DWORD_MASK) != 0) errx(-1, "Offset must be multiple of %d", NVME_DWORD_SIZE); return ((offset_t)offsetb); } #define FIRMWARE_READ_BLKSIZE (64 * 1024) /* 64K */ static int do_firmware_load(int fd, const nvme_process_arg_t *npa) { int fw_fd; ssize_t len; offset_t offset = 0; size_t size; uint16_t sc; char buf[FIRMWARE_READ_BLKSIZE]; if (npa->npa_argc > 2) errx(-1, "Too many arguments"); if (npa->npa_argc == 0) errx(-1, "Requires firmware file name, and an " "optional offset"); if (npa->npa_isns) errx(-1, "Firmware loading not available on a per-namespace " "basis"); if (npa->npa_argc == 2) offset = get_fw_offsetb(npa->npa_argv[1]); fw_fd = open(npa->npa_argv[0], O_RDONLY); if (fw_fd < 0) errx(-1, "Failed to open \"%s\": %s", npa->npa_argv[0], strerror(errno)); size = 0; do { len = read_block(fw_fd, buf, sizeof (buf)); if (len < 0) errx(-1, "Error reading \"%s\": %s", npa->npa_argv[0], strerror(errno)); if (len == 0) break; if (!nvme_firmware_load(fd, buf, len, offset, &sc)) errx(-1, "Error loading \"%s\": %s", npa->npa_argv[0], nvme_fw_error(errno, sc)); offset += len; size += len; } while (len == sizeof (buf)); (void) close(fw_fd); if (verbose) (void) printf("%zu bytes downloaded.\n", size); return (0); } /* * Convert str to a valid firmware slot number. */ static uint_t get_slot_number(char *str) { longlong_t slot; char *valend; errno = 0; slot = strtoll(str, &valend, 0); if (errno != 0 || *valend != '\0' || slot < NVME_FW_SLOT_MIN || slot > NVME_FW_SLOT_MAX) errx(-1, "Slot must be numeric and in the range of %d to %d", NVME_FW_SLOT_MIN, NVME_FW_SLOT_MAX); return ((uint_t)slot); } static void usage_firmware_commit(const char *c_name) { (void) fprintf(stderr, "%s \n\n" " Commit previously downloaded firmware to slot .\n" " The firmware is only activated after a " "\"nvmeadm activate-firmware\" command.\n", c_name); } static int do_firmware_commit(int fd, const nvme_process_arg_t *npa) { uint_t slot; uint16_t sc; if (npa->npa_argc > 1) errx(-1, "Too many arguments"); if (npa->npa_argc == 0) errx(-1, "Firmware slot number is required"); if (npa->npa_isns) errx(-1, "Firmware committing not available on a per-namespace " "basis"); slot = get_slot_number(npa->npa_argv[0]); if (slot == 1 && npa->npa_idctl->id_frmw.fw_readonly) errx(-1, "Cannot commit firmware to slot 1: slot is read-only"); if (!nvme_firmware_commit(fd, slot, NVME_FWC_SAVE, &sc)) errx(-1, "Failed to commit firmware to slot %u: %s", slot, nvme_fw_error(errno, sc)); if (verbose) (void) printf("Firmware committed to slot %u.\n", slot); return (0); } static void usage_firmware_activate(const char *c_name) { (void) fprintf(stderr, "%s \n\n" " Activate firmware in slot .\n" " The firmware will be in use after the next system reset.\n", c_name); } static int do_firmware_activate(int fd, const nvme_process_arg_t *npa) { uint_t slot; uint16_t sc; if (npa->npa_argc > 1) errx(-1, "Too many arguments"); if (npa->npa_argc == 0) errx(-1, "Firmware slot number is required"); if (npa->npa_isns) errx(-1, "Firmware activation not available on a per-namespace " "basis"); slot = get_slot_number(npa->npa_argv[0]); if (!nvme_firmware_commit(fd, slot, NVME_FWC_ACTIVATE, &sc)) errx(-1, "Failed to activate slot %u: %s", slot, nvme_fw_error(errno, sc)); if (verbose) printf("Slot %u activated: %s.\n", slot, nvme_fw_error(errno, sc)); return (0); } /* * While the NVME_VERSION_ATLEAST macro exists, specifying a version of 1.0 * causes GCC to helpfully flag the -Wtype-limits warning because a uint_t is * always >= 0. In many cases it's useful to always indicate what version * something was added in to simplify code (e.g. nvmeadm_print_bit) and we'd * rather just say it's version 1.0 rather than making folks realize that a * hardcoded true is equivalent. Therefore we have this function which can't * trigger this warning today (and adds a minor amount of type safety). If GCC * or clang get smart enough to see through this, then we'll have to just * disable the warning for the single minor comparison (and reformat this a bit * to minimize the impact). */ boolean_t nvme_version_check(nvme_version_t *vers, uint_t major, uint_t minor) { if (vers->v_major > major) { return (B_TRUE); } return (vers->v_major == major && vers->v_minor >= minor); }