]> git.ipfire.org Git - thirdparty/mdadm.git/blame - platform-intel.c
monitor: refactor checkpoint update
[thirdparty/mdadm.git] / platform-intel.c
CommitLineData
b390f610
DW
1/*
2 * Intel(R) Matrix Storage Manager hardware and firmware support routines
3 *
4 * Copyright (C) 2008 Intel Corporation
5 *
6 * This program is free software; you can redistribute it and/or modify it
7 * under the terms and conditions of the GNU General Public License,
8 * version 2, as published by the Free Software Foundation.
9 *
10 * This program is distributed in the hope it will be useful, but WITHOUT
11 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
13 * more details.
14 *
15 * You should have received a copy of the GNU General Public License along with
16 * this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
18 */
19#include "mdadm.h"
20#include "platform-intel.h"
21#include "probe_roms.h"
22#include <stdio.h>
23#include <stdlib.h>
24#include <string.h>
25#include <unistd.h>
26#include <dirent.h>
27#include <fcntl.h>
28#include <sys/mman.h>
29#include <sys/types.h>
30#include <sys/stat.h>
fc13853f
LM
31#include <limits.h>
32
d835518b
BK
33#define NVME_SUBSYS_PATH "/sys/devices/virtual/nvme-subsystem/"
34
9c747fa0
LM
35static int devpath_to_ll(const char *dev_path, const char *entry,
36 unsigned long long *val);
37
9bc4ae77 38static void free_sys_dev(struct sys_dev **list)
b390f610
DW
39{
40 while (*list) {
41 struct sys_dev *next = (*list)->next;
42
43 if ((*list)->path)
44 free((*list)->path);
45 free(*list);
46 *list = next;
47 }
48}
49
50struct sys_dev *find_driver_devices(const char *bus, const char *driver)
51{
52 /* search sysfs for devices driven by 'driver' */
30730cb8
AO
53 char path[PATH_MAX];
54 char link[PATH_MAX];
55 char *c, *p;
b390f610
DW
56 DIR *driver_dir;
57 struct dirent *de;
58 struct sys_dev *head = NULL;
59 struct sys_dev *list = NULL;
60f0f54d 60 struct sys_dev *vmd = NULL;
a8e5382a 61 enum sys_dev_type type;
9c747fa0 62 unsigned long long dev_id;
6b781d33 63 unsigned long long class;
a8e5382a
LM
64
65 if (strcmp(driver, "isci") == 0)
66 type = SYS_DEV_SAS;
75350d87
KF
67 else if (strcmp(driver, "ahci") == 0) {
68 vmd = find_driver_devices("pci", "vmd");
a8e5382a 69 type = SYS_DEV_SATA;
75350d87 70 } else if (strcmp(driver, "nvme") == 0) {
60f0f54d
PB
71 /* if looking for nvme devs, first look for vmd */
72 vmd = find_driver_devices("pci", "vmd");
614902f6 73 type = SYS_DEV_NVME;
60f0f54d
PB
74 } else if (strcmp(driver, "vmd") == 0)
75 type = SYS_DEV_VMD;
a8e5382a
LM
76 else
77 type = SYS_DEV_UNKNOWN;
b390f610
DW
78
79 sprintf(path, "/sys/bus/%s/drivers/%s", bus, driver);
80 driver_dir = opendir(path);
60f0f54d
PB
81 if (!driver_dir) {
82 if (vmd)
83 free_sys_dev(&vmd);
b390f610 84 return NULL;
60f0f54d 85 }
b390f610 86 for (de = readdir(driver_dir); de; de = readdir(driver_dir)) {
5a1920f2 87 int n;
60f0f54d 88 int skip = 0;
5a1920f2 89
b390f610
DW
90 /* is 'de' a device? check that the 'subsystem' link exists and
91 * that its target matches 'bus'
92 */
93 sprintf(path, "/sys/bus/%s/drivers/%s/%s/subsystem",
94 bus, driver, de->d_name);
5a1920f2 95 n = readlink(path, link, sizeof(link));
f21e18ca 96 if (n < 0 || n >= (int)sizeof(link))
b390f610 97 continue;
5a1920f2 98 link[n] = '\0';
b390f610
DW
99 c = strrchr(link, '/');
100 if (!c)
101 continue;
102 if (strncmp(bus, c+1, strlen(bus)) != 0)
103 continue;
104
a8e5382a
LM
105 sprintf(path, "/sys/bus/%s/drivers/%s/%s",
106 bus, driver, de->d_name);
107
60f0f54d
PB
108 /* if searching for nvme - skip vmd connected one */
109 if (type == SYS_DEV_NVME) {
110 struct sys_dev *dev;
111 char *rp = realpath(path, NULL);
112 for (dev = vmd; dev; dev = dev->next) {
113 if ((strncmp(dev->path, rp, strlen(dev->path)) == 0))
114 skip = 1;
115 }
116 free(rp);
117 }
118
75350d87
KF
119 /* change sata type if under a vmd controller */
120 if (type == SYS_DEV_SATA) {
121 struct sys_dev *dev;
122 char *rp = realpath(path, NULL);
123 for (dev = vmd; dev; dev = dev->next) {
124 if ((strncmp(dev->path, rp, strlen(dev->path)) == 0))
125 type = SYS_DEV_SATA_VMD;
126 }
127 free(rp);
128 }
129
60f0f54d
PB
130 /* if it's not Intel device or mark as VMD connected - skip it. */
131 if (devpath_to_vendor(path) != 0x8086 || skip == 1)
a8e5382a
LM
132 continue;
133
9c747fa0
LM
134 if (devpath_to_ll(path, "device", &dev_id) != 0)
135 continue;
136
6b781d33
AP
137 if (devpath_to_ll(path, "class", &class) != 0)
138 continue;
139
30730cb8
AO
140 /*
141 * Each VMD device (domain) adds separate PCI bus, it is better
142 * to store path as a path to that bus (easier further
143 * determination which NVMe dev is connected to this particular
144 * VMD domain).
145 */
146 if (type == SYS_DEV_VMD) {
147 sprintf(path, "/sys/bus/%s/drivers/%s/%s/domain/device",
148 bus, driver, de->d_name);
149 }
150 p = realpath(path, NULL);
151 if (p == NULL) {
152 pr_err("Unable to get real path for '%s'\n", path);
153 continue;
154 }
155
b390f610
DW
156 /* start / add list entry */
157 if (!head) {
503975b9 158 head = xmalloc(sizeof(*head));
b390f610
DW
159 list = head;
160 } else {
503975b9 161 list->next = xmalloc(sizeof(*head));
b390f610
DW
162 list = list->next;
163 }
164
165 if (!list) {
166 free_sys_dev(&head);
167 break;
168 }
169
9c747fa0 170 list->dev_id = (__u16) dev_id;
6b781d33 171 list->class = (__u32) class;
a8e5382a 172 list->type = type;
b390f610 173 list->next = NULL;
30730cb8
AO
174 list->path = p;
175
a8e5382a
LM
176 if ((list->pci_id = strrchr(list->path, '/')) != NULL)
177 list->pci_id++;
b390f610 178 }
2a17c77b 179 closedir(driver_dir);
60f0f54d 180
75350d87
KF
181 /* nvme vmd needs a list separate from sata vmd */
182 if (vmd && type == SYS_DEV_NVME) {
60f0f54d
PB
183 if (list)
184 list->next = vmd;
185 else
186 head = vmd;
187 }
188
b390f610
DW
189 return head;
190}
191
/* List built by the most recent scan in find_intel_devices(). */
static struct sys_dev *intel_devices;
/* time() value recorded when intel_devices was last rebuilt. */
static time_t valid_time;
9c747fa0 194
0858eccf
AP
195struct sys_dev *device_by_id(__u16 device_id)
196{
197 struct sys_dev *iter;
198
199 for (iter = intel_devices; iter != NULL; iter = iter->next)
200 if (iter->dev_id == device_id)
201 return iter;
202 return NULL;
203}
204
d3c11416
AO
205struct sys_dev *device_by_id_and_path(__u16 device_id, const char *path)
206{
207 struct sys_dev *iter;
208
209 for (iter = intel_devices; iter != NULL; iter = iter->next)
210 if ((iter->dev_id == device_id) && strstr(iter->path, path))
211 return iter;
212 return NULL;
213}
214
9c747fa0
LM
215static int devpath_to_ll(const char *dev_path, const char *entry, unsigned long long *val)
216{
dd5ab402 217 char path[strnlen(dev_path, PATH_MAX) + strnlen(entry, PATH_MAX) + 2];
9c747fa0
LM
218 int fd;
219 int n;
220
221 sprintf(path, "%s/%s", dev_path, entry);
222
223 fd = open(path, O_RDONLY);
224 if (fd < 0)
225 return -1;
226 n = sysfs_fd_get_ll(fd, val);
227 close(fd);
228 return n;
229}
230
60f0f54d 231__u16 devpath_to_vendor(const char *dev_path)
b390f610
DW
232{
233 char path[strlen(dev_path) + strlen("/vendor") + 1];
234 char vendor[7];
235 int fd;
236 __u16 id = 0xffff;
237 int n;
238
239 sprintf(path, "%s/vendor", dev_path);
240
241 fd = open(path, O_RDONLY);
242 if (fd < 0)
243 return 0xffff;
244
245 n = read(fd, vendor, sizeof(vendor));
246 if (n == sizeof(vendor)) {
247 vendor[n - 1] = '\0';
248 id = strtoul(vendor, NULL, 16);
249 }
250 close(fd);
251
252 return id;
253}
254
fcebeb77
MT
255/* Description: Read text value of dev_path/entry field
256 * Parameters:
257 * dev_path - sysfs path to the device
258 * entry - entry to be read
259 * buf - buffer for read value
260 * len - size of buf
261 * verbose - error logging level
262 */
263int devpath_to_char(const char *dev_path, const char *entry, char *buf, int len,
264 int verbose)
265{
266 char path[PATH_MAX];
267
268 snprintf(path, sizeof(path), "%s/%s", dev_path, entry);
269 if (load_sys(path, buf, len)) {
270 if (verbose)
271 pr_err("Cannot read %s, aborting\n", path);
272 return 1;
273 }
274
275 return 0;
276}
277
a8e5382a 278struct sys_dev *find_intel_devices(void)
b390f610 279{
614902f6 280 struct sys_dev *ahci, *isci, *nvme;
a8e5382a 281
9bc4ae77
N
282 if (valid_time > time(0) - 10)
283 return intel_devices;
284
285 if (intel_devices)
286 free_sys_dev(&intel_devices);
287
a8e5382a 288 isci = find_driver_devices("pci", "isci");
75350d87 289 /* Searching for AHCI will return list of SATA and SATA VMD controllers */
a8e5382a 290 ahci = find_driver_devices("pci", "ahci");
60f0f54d 291 /* Searching for NVMe will return list of NVMe and VMD controllers */
614902f6 292 nvme = find_driver_devices("pci", "nvme");
a8e5382a 293
614902f6
PB
294 if (!isci && !ahci) {
295 ahci = nvme;
296 } else if (!ahci) {
a8e5382a 297 ahci = isci;
614902f6
PB
298 struct sys_dev *elem = ahci;
299 while (elem->next)
300 elem = elem->next;
301 elem->next = nvme;
a8e5382a
LM
302 } else {
303 struct sys_dev *elem = ahci;
304 while (elem->next)
305 elem = elem->next;
306 elem->next = isci;
614902f6
PB
307 while (elem->next)
308 elem = elem->next;
309 elem->next = nvme;
a8e5382a 310 }
9bc4ae77
N
311 intel_devices = ahci;
312 valid_time = time(0);
313 return intel_devices;
b390f610
DW
314}
315
3c8bfb5d 316/*
fc13853f 317 * PCI Expansion ROM Data Structure Format */
3c8bfb5d
LM
318struct pciExpDataStructFormat {
319 __u8 ver[4];
320 __u16 vendorID;
321 __u16 deviceID;
6b781d33 322 __u16 devListOffset;
f666bcc6
PB
323 __u16 pciDataStructLen;
324 __u8 pciDataStructRev;
3c8bfb5d
LM
325} __attribute__ ((packed));
326
/* Head of the list of capability entries registered through add_orom(). */
struct orom_entry *orom_entries;
0858eccf 328
72a45777 329const struct orom_entry *get_orom_entry_by_device_id(__u16 dev_id)
6b781d33 330{
5e1d6128
AP
331 struct orom_entry *entry;
332 struct devid_list *devid;
6b781d33 333
5e1d6128
AP
334 for (entry = orom_entries; entry; entry = entry->next) {
335 for (devid = entry->devid_list; devid; devid = devid->next) {
336 if (devid->devid == dev_id)
72a45777 337 return entry;
6b781d33
AP
338 }
339 }
5e1d6128 340
6b781d33
AP
341 return NULL;
342}
343
72a45777
PB
344const struct imsm_orom *get_orom_by_device_id(__u16 dev_id)
345{
346 const struct orom_entry *entry = get_orom_entry_by_device_id(dev_id);
347
348 if (entry)
349 return &entry->orom;
350
351 return NULL;
352}
353
5e1d6128 354static struct orom_entry *add_orom(const struct imsm_orom *orom)
6b781d33 355{
5e1d6128
AP
356 struct orom_entry *list;
357 struct orom_entry *prev = NULL;
358
359 for (list = orom_entries; list; prev = list, list = list->next)
360 ;
361
362 list = xmalloc(sizeof(struct orom_entry));
363 list->orom = *orom;
364 list->devid_list = NULL;
365 list->next = NULL;
366
367 if (prev == NULL)
368 orom_entries = list;
369 else
370 prev->next = list;
371
372 return list;
6b781d33
AP
373}
374
5e1d6128 375static void add_orom_device_id(struct orom_entry *entry, __u16 dev_id)
6b781d33 376{
6b781d33
AP
377 struct devid_list *list;
378 struct devid_list *prev = NULL;
379
5e1d6128
AP
380 for (list = entry->devid_list; list; prev = list, list = list->next) {
381 if (list->devid == dev_id)
6b781d33 382 return;
6b781d33 383 }
5e1d6128
AP
384 list = xmalloc(sizeof(struct devid_list));
385 list->devid = dev_id;
386 list->next = NULL;
387
388 if (prev == NULL)
389 entry->devid_list = list;
390 else
391 prev->next = list;
6b781d33 392}
fc13853f 393
3c8bfb5d 394static int scan(const void *start, const void *end, const void *data)
b390f610
DW
395{
396 int offset;
6b781d33 397 const struct imsm_orom *imsm_mem = NULL;
b390f610 398 int len = (end - start);
3c8bfb5d
LM
399 struct pciExpDataStructFormat *ptr= (struct pciExpDataStructFormat *)data;
400
9c747fa0
LM
401 if (data + 0x18 > end) {
402 dprintf("cannot find pciExpDataStruct \n");
403 return 0;
404 }
405
3c8bfb5d
LM
406 dprintf("ptr->vendorID: %lx __le16_to_cpu(ptr->deviceID): %lx \n",
407 (ulong) __le16_to_cpu(ptr->vendorID),
408 (ulong) __le16_to_cpu(ptr->deviceID));
409
6b781d33 410 if (__le16_to_cpu(ptr->vendorID) != 0x8086)
3c8bfb5d 411 return 0;
b390f610 412
5c4cc0c8
RS
413 if (get_orom_by_device_id(ptr->deviceID))
414 return 0;
415
b390f610 416 for (offset = 0; offset < len; offset += 4) {
6b781d33
AP
417 const void *mem = start + offset;
418
419 if ((memcmp(mem, IMSM_OROM_SIGNATURE, 4) == 0)) {
420 imsm_mem = mem;
421 break;
b390f610
DW
422 }
423 }
6b781d33
AP
424
425 if (!imsm_mem)
426 return 0;
427
5e1d6128 428 struct orom_entry *orom = add_orom(imsm_mem);
6b781d33 429
f666bcc6
PB
430 /* only PciDataStructure with revision 3 and above supports devices list. */
431 if (ptr->pciDataStructRev >= 3 && ptr->devListOffset) {
6b781d33
AP
432 const __u16 *dev_list = (void *)ptr + ptr->devListOffset;
433 int i;
434
435 for (i = 0; dev_list[i] != 0; i++)
436 add_orom_device_id(orom, dev_list[i]);
437 } else {
438 add_orom_device_id(orom, __le16_to_cpu(ptr->deviceID));
439 }
440
b390f610
DW
441 return 0;
442}
443
6b781d33 444const struct imsm_orom *imsm_platform_test(struct sys_dev *hba)
fc13853f 445{
6b781d33
AP
446 struct imsm_orom orom = {
447 .signature = IMSM_OROM_SIGNATURE,
448 .rlc = IMSM_OROM_RLC_RAID0 | IMSM_OROM_RLC_RAID1 |
449 IMSM_OROM_RLC_RAID10 | IMSM_OROM_RLC_RAID5,
450 .sss = IMSM_OROM_SSS_4kB | IMSM_OROM_SSS_8kB |
451 IMSM_OROM_SSS_16kB | IMSM_OROM_SSS_32kB |
452 IMSM_OROM_SSS_64kB | IMSM_OROM_SSS_128kB |
453 IMSM_OROM_SSS_256kB | IMSM_OROM_SSS_512kB |
454 IMSM_OROM_SSS_1MB | IMSM_OROM_SSS_2MB,
455 .dpa = IMSM_OROM_DISKS_PER_ARRAY,
456 .tds = IMSM_OROM_TOTAL_DISKS,
457 .vpa = IMSM_OROM_VOLUMES_PER_ARRAY,
458 .vphba = IMSM_OROM_VOLUMES_PER_HBA
459 };
460 orom.attr = orom.rlc | IMSM_OROM_ATTR_ChecksumVerify;
fc13853f
LM
461
462 if (check_env("IMSM_TEST_OROM_NORAID5")) {
6b781d33 463 orom.rlc = IMSM_OROM_RLC_RAID0 | IMSM_OROM_RLC_RAID1 |
fc13853f
LM
464 IMSM_OROM_RLC_RAID10;
465 }
6b781d33
AP
466 if (check_env("IMSM_TEST_AHCI_EFI_NORAID5") && (hba->type == SYS_DEV_SAS)) {
467 orom.rlc = IMSM_OROM_RLC_RAID0 | IMSM_OROM_RLC_RAID1 |
fc13853f
LM
468 IMSM_OROM_RLC_RAID10;
469 }
6b781d33
AP
470 if (check_env("IMSM_TEST_SCU_EFI_NORAID5") && (hba->type == SYS_DEV_SATA)) {
471 orom.rlc = IMSM_OROM_RLC_RAID0 | IMSM_OROM_RLC_RAID1 |
fc13853f 472 IMSM_OROM_RLC_RAID10;
cceebc67
DW
473 }
474
5e1d6128 475 struct orom_entry *ret = add_orom(&orom);
6b781d33
AP
476
477 add_orom_device_id(ret, hba->dev_id);
478
5e1d6128 479 return &ret->orom;
fc13853f
LM
480}
481
6b781d33 482static const struct imsm_orom *find_imsm_hba_orom(struct sys_dev *hba)
fc13853f
LM
483{
484 unsigned long align;
485
6b781d33
AP
486 if (check_env("IMSM_TEST_OROM"))
487 return imsm_platform_test(hba);
fc13853f 488
fc13853f 489 /* return empty OROM capabilities in EFI test mode */
6b781d33 490 if (check_env("IMSM_TEST_AHCI_EFI") || check_env("IMSM_TEST_SCU_EFI"))
fc13853f
LM
491 return NULL;
492
9bc4ae77 493 find_intel_devices();
9c747fa0
LM
494
495 if (intel_devices == NULL)
b390f610
DW
496 return NULL;
497
498 /* scan option-rom memory looking for an imsm signature */
969c2555
DW
499 if (check_env("IMSM_SAFE_OROM_SCAN"))
500 align = 2048;
501 else
502 align = 512;
503 if (probe_roms_init(align) != 0)
b390f610
DW
504 return NULL;
505 probe_roms();
9c747fa0 506 /* ignore return value - True is returned if both adapater roms are found */
fc13853f 507 scan_adapter_roms(scan);
b390f610
DW
508 probe_roms_exit();
509
6b781d33 510 return get_orom_by_device_id(hba->dev_id);
fc13853f
LM
511}
512
1a901471
LM
/*
 * Build a struct efi_guid from its textual components: the first three
 * fields are stored least significant byte first, the remaining eight bytes
 * are stored as given.
 */
#define EFI_GUID(a, b, c, d0, d1, d2, d3, d4, d5, d6, d7) \
((struct efi_guid) \
{{ (a) & 0xff, ((a) >> 8) & 0xff, ((a) >> 16) & 0xff, ((a) >> 24) & 0xff, \
  (b) & 0xff, ((b) >> 8) & 0xff, \
  (c) & 0xff, ((c) >> 8) & 0xff, \
  (d0), (d1), (d2), (d3), (d4), (d5), (d6), (d7) }})

/* sysfs locations of EFI variables: old "vars" interface and efivarfs */
#define SYS_EFI_VAR_PATH	"/sys/firmware/efi/vars"
#define SYS_EFIVARS_PATH	"/sys/firmware/efi/efivars"

/* names of the EFI variables queried by find_imsm_efi() */
#define SCU_PROP		"RstScuV"
#define AHCI_PROP		"RstSataV"
#define AHCI_SSATA_PROP		"RstsSatV"
#define AHCI_TSATA_PROP		"RsttSatV"
#define VROC_VMD_PROP		"RstUefiV"
#define RST_VMD_PROP		"RstVmdV"

/* GUID appended to the variable names above */
#define VENDOR_GUID \
	EFI_GUID(0x193dfefa, 0xa445, 0x4302, 0x99, 0xd8, 0xef, 0x3a, 0xad, 0x1a, 0x04, 0xc6)

/* class value a SATA controller must report for find_imsm_efi() to query it */
#define PCI_CLASS_RAID_CNTRL	0x010400
5a6baf66 533
f94df5cf
MT
534static int read_efi_var(void *buffer, ssize_t buf_size,
535 const char *variable_name, struct efi_guid guid)
88605db9
AP
536{
537 char path[PATH_MAX];
538 char buf[GUID_STR_MAX];
539 int fd;
540 ssize_t n;
541
542 snprintf(path, PATH_MAX, "%s/%s-%s", SYS_EFIVARS_PATH, variable_name, guid_str(buf, guid));
543
544 fd = open(path, O_RDONLY);
545 if (fd < 0)
546 return 1;
547
548 /* read the variable attributes and ignore it */
549 n = read(fd, buf, sizeof(__u32));
550 if (n < 0) {
551 close(fd);
552 return 1;
553 }
554
555 /* read the variable data */
556 n = read(fd, buffer, buf_size);
557 close(fd);
558 if (n < buf_size)
559 return 1;
560
561 return 0;
562}
563
f94df5cf
MT
564static int read_efi_variable(void *buffer, ssize_t buf_size,
565 const char *variable_name, struct efi_guid guid)
5a6baf66 566{
5a6baf66
LM
567 char path[PATH_MAX];
568 char buf[GUID_STR_MAX];
aae4c111
HCP
569 int dfd;
570 ssize_t n, var_data_len;
571
88605db9
AP
572 /* Try to read the variable using the new efivarfs interface first.
573 * If that fails, fall back to the old sysfs-efivars interface. */
574 if (!read_efi_var(buffer, buf_size, variable_name, guid))
575 return 0;
576
aae4c111
HCP
577 snprintf(path, PATH_MAX, "%s/%s-%s/size", SYS_EFI_VAR_PATH, variable_name, guid_str(buf, guid));
578
579 dprintf("EFI VAR: path=%s\n", path);
580 /* get size of variable data */
581 dfd = open(path, O_RDONLY);
582 if (dfd < 0)
583 return 1;
584
585 n = read(dfd, &buf, sizeof(buf));
586 close(dfd);
587 if (n < 0)
588 return 1;
589 buf[n] = '\0';
590
591 errno = 0;
592 var_data_len = strtoul(buf, NULL, 16);
d7be7d87
JS
593 if ((errno == ERANGE && (var_data_len == LONG_MAX)) ||
594 (errno != 0 && var_data_len == 0))
aae4c111
HCP
595 return 1;
596
597 /* get data */
598 snprintf(path, PATH_MAX, "%s/%s-%s/data", SYS_EFI_VAR_PATH, variable_name, guid_str(buf, guid));
599
600 dprintf("EFI VAR: path=%s\n", path);
601 dfd = open(path, O_RDONLY);
602 if (dfd < 0)
603 return 1;
604
605 n = read(dfd, buffer, buf_size);
606 close(dfd);
607 if (n != var_data_len || n < buf_size) {
608 return 1;
609 }
610
611 return 0;
612}
5a6baf66 613
6b781d33 614const struct imsm_orom *find_imsm_efi(struct sys_dev *hba)
aae4c111 615{
6b781d33 616 struct imsm_orom orom;
5e1d6128 617 struct orom_entry *ret;
f94df5cf
MT
618 static const char * const sata_efivars[] = {AHCI_PROP, AHCI_SSATA_PROP,
619 AHCI_TSATA_PROP};
ea7a02a3 620 static const char * const vmd_efivars[] = {VROC_VMD_PROP, RST_VMD_PROP};
f94df5cf 621 unsigned long i;
5a6baf66 622
6b781d33
AP
623 if (check_env("IMSM_TEST_AHCI_EFI") || check_env("IMSM_TEST_SCU_EFI"))
624 return imsm_platform_test(hba);
5a6baf66 625
5a6baf66 626 /* OROM test is set, return that there is no EFI capabilities */
aae4c111 627 if (check_env("IMSM_TEST_OROM"))
5a6baf66 628 return NULL;
5a6baf66 629
f94df5cf
MT
630 switch (hba->type) {
631 case SYS_DEV_SAS:
632 if (!read_efi_variable(&orom, sizeof(orom), SCU_PROP,
633 VENDOR_GUID))
634 break;
81188ef8 635
f94df5cf
MT
636 return NULL;
637 case SYS_DEV_SATA:
638 if (hba->class != PCI_CLASS_RAID_CNTRL)
639 return NULL;
81188ef8 640
f94df5cf
MT
641 for (i = 0; i < ARRAY_SIZE(sata_efivars); i++) {
642 if (!read_efi_variable(&orom, sizeof(orom),
643 sata_efivars[i], VENDOR_GUID))
644 break;
81188ef8 645
81188ef8 646 }
f94df5cf
MT
647 if (i == ARRAY_SIZE(sata_efivars))
648 return NULL;
81188ef8 649
f94df5cf
MT
650 break;
651 case SYS_DEV_VMD:
75350d87 652 case SYS_DEV_SATA_VMD:
ea7a02a3
OJ
653 for (i = 0; i < ARRAY_SIZE(vmd_efivars); i++) {
654 if (!read_efi_variable(&orom, sizeof(orom),
655 vmd_efivars[i], VENDOR_GUID))
656 break;
657 }
658
659 if (i == ARRAY_SIZE(vmd_efivars))
660 return NULL;
661
662 break;
f94df5cf
MT
663 default:
664 return NULL;
665 }
5a6baf66 666
6b781d33
AP
667 ret = add_orom(&orom);
668 add_orom_device_id(ret, hba->dev_id);
60f0f54d 669 ret->type = hba->type;
6b781d33 670
5e1d6128 671 return &ret->orom;
fc13853f
LM
672}
673
614902f6
PB
674const struct imsm_orom *find_imsm_nvme(struct sys_dev *hba)
675{
5e1d6128 676 static struct orom_entry *nvme_orom;
614902f6
PB
677
678 if (hba->type != SYS_DEV_NVME)
679 return NULL;
680
681 if (!nvme_orom) {
682 struct imsm_orom nvme_orom_compat = {
683 .signature = IMSM_NVME_OROM_COMPAT_SIGNATURE,
684 .rlc = IMSM_OROM_RLC_RAID0 | IMSM_OROM_RLC_RAID1 |
685 IMSM_OROM_RLC_RAID10 | IMSM_OROM_RLC_RAID5,
686 .sss = IMSM_OROM_SSS_4kB | IMSM_OROM_SSS_8kB |
687 IMSM_OROM_SSS_16kB | IMSM_OROM_SSS_32kB |
688 IMSM_OROM_SSS_64kB | IMSM_OROM_SSS_128kB,
689 .dpa = IMSM_OROM_DISKS_PER_ARRAY_NVME,
690 .tds = IMSM_OROM_TOTAL_DISKS_NVME,
691 .vpa = IMSM_OROM_VOLUMES_PER_ARRAY,
692 .vphba = IMSM_OROM_TOTAL_DISKS_NVME / 2 * IMSM_OROM_VOLUMES_PER_ARRAY,
693 .attr = IMSM_OROM_ATTR_2TB | IMSM_OROM_ATTR_2TB_DISK,
0858eccf 694 .driver_features = IMSM_OROM_CAPABILITIES_EnterpriseSystem
614902f6
PB
695 };
696 nvme_orom = add_orom(&nvme_orom_compat);
697 }
698 add_orom_device_id(nvme_orom, hba->dev_id);
60f0f54d 699 nvme_orom->type = SYS_DEV_NVME;
5e1d6128 700 return &nvme_orom->orom;
614902f6
PB
701}
702
8d1114be
MG
/* offset passed to pread() by read_vmd_register() */
#define VMD_REGISTER_OFFSET		0x3FC
/* SKU field of the register value, decoded in add_vmd_orom() */
#define VMD_REGISTER_SKU_SHIFT		1
#define VMD_REGISTER_SKU_MASK		(0x00000007)
#define VMD_REGISTER_SKU_PREMIUM	2
/* major/minor version fields of the same register value */
#define MD_REGISTER_VER_MAJOR_SHIFT	4
#define MD_REGISTER_VER_MAJOR_MASK	(0x0000000F)
#define MD_REGISTER_VER_MINOR_SHIFT	8
#define MD_REGISTER_VER_MINOR_MASK	(0x0000000F)
711
712/*
713 * read_vmd_register() - Reads VMD register and writes contents to buff ptr
714 * @buff: buffer for vmd register data, should be the size of uint32_t
715 *
716 * Return: 0 on success, 1 on error
717 */
718int read_vmd_register(uint32_t *buff, struct sys_dev *hba)
719{
720 int fd;
721 char vmd_pci_config_path[PATH_MAX];
722
723 if (!vmd_domain_to_controller(hba, vmd_pci_config_path))
724 return 1;
725
726 strncat(vmd_pci_config_path, "/config", PATH_MAX - strnlen(vmd_pci_config_path, PATH_MAX));
727
728 fd = open(vmd_pci_config_path, O_RDONLY);
729 if (fd < 0)
730 return 1;
731
732 if (pread(fd, buff, sizeof(uint32_t), VMD_REGISTER_OFFSET) != sizeof(uint32_t)) {
733 close(fd);
734 return 1;
735 }
736 close(fd);
737 return 0;
738}
739
740/*
741 * add_vmd_orom() - Adds VMD orom cap to orom list, writes orom_entry ptr into vmd_orom
742 * @vmd_orom: pointer to orom entry pointer
743 *
744 * Return: 0 on success, 1 on error
745 */
746int add_vmd_orom(struct orom_entry **vmd_orom, struct sys_dev *hba)
747{
748 uint8_t sku;
749 uint32_t vmd_register_data;
750 struct imsm_orom vmd_orom_cap = {
751 .signature = IMSM_VMD_OROM_COMPAT_SIGNATURE,
752 .sss = IMSM_OROM_SSS_4kB | IMSM_OROM_SSS_8kB |
753 IMSM_OROM_SSS_16kB | IMSM_OROM_SSS_32kB |
754 IMSM_OROM_SSS_64kB | IMSM_OROM_SSS_128kB,
755 .dpa = IMSM_OROM_DISKS_PER_ARRAY_NVME,
756 .tds = IMSM_OROM_TOTAL_DISKS_VMD,
757 .vpa = IMSM_OROM_VOLUMES_PER_ARRAY,
758 .vphba = IMSM_OROM_VOLUMES_PER_HBA_VMD,
759 .attr = IMSM_OROM_ATTR_2TB | IMSM_OROM_ATTR_2TB_DISK,
760 .driver_features = IMSM_OROM_CAPABILITIES_EnterpriseSystem |
761 IMSM_OROM_CAPABILITIES_TPV
762 };
763
764 if (read_vmd_register(&vmd_register_data, hba) != 0)
765 return 1;
766
767 sku = (uint8_t)((vmd_register_data >> VMD_REGISTER_SKU_SHIFT) &
768 VMD_REGISTER_SKU_MASK);
769
770 if (sku == VMD_REGISTER_SKU_PREMIUM)
771 vmd_orom_cap.rlc = IMSM_OROM_RLC_RAID0 | IMSM_OROM_RLC_RAID1 |
772 IMSM_OROM_RLC_RAID10 | IMSM_OROM_RLC_RAID5;
773 else
774 vmd_orom_cap.rlc = IMSM_OROM_RLC_RAID_CNG;
775
776 vmd_orom_cap.major_ver = (uint8_t)
777 ((vmd_register_data >> MD_REGISTER_VER_MAJOR_SHIFT) &
778 MD_REGISTER_VER_MAJOR_MASK);
779 vmd_orom_cap.minor_ver = (uint8_t)
780 ((vmd_register_data >> MD_REGISTER_VER_MINOR_SHIFT) &
781 MD_REGISTER_VER_MINOR_MASK);
782
783 *vmd_orom = add_orom(&vmd_orom_cap);
784
785 return 0;
786}
787
788const struct imsm_orom *find_imsm_vmd(struct sys_dev *hba)
789{
790 static struct orom_entry *vmd_orom;
791
792 if (hba->type != SYS_DEV_VMD)
793 return NULL;
794
795 if (!vmd_orom && add_vmd_orom(&vmd_orom, hba) != 0)
796 return NULL;
797
798 add_orom_device_id(vmd_orom, hba->dev_id);
799 vmd_orom->type = SYS_DEV_VMD;
800 return &vmd_orom->orom;
801}
802
6b781d33 803const struct imsm_orom *find_imsm_capability(struct sys_dev *hba)
fc13853f 804{
6b781d33
AP
805 const struct imsm_orom *cap = get_orom_by_device_id(hba->dev_id);
806
807 if (cap)
808 return cap;
fc13853f 809
614902f6
PB
810 if (hba->type == SYS_DEV_NVME)
811 return find_imsm_nvme(hba);
8d1114be
MG
812
813 cap = find_imsm_efi(hba);
814 if (cap)
5a6baf66 815 return cap;
8d1114be
MG
816
817 if (hba->type == SYS_DEV_VMD) {
818 cap = find_imsm_vmd(hba);
819 if (cap)
820 return cap;
821 }
822
823 cap = find_imsm_hba_orom(hba);
824 if (cap)
fc13853f 825 return cap;
614902f6 826
b390f610
DW
827 return NULL;
828}
25921536 829
d835518b
BK
830/* Check whether the nvme device is represented by nvme subsytem,
831 * if yes virtual path should be changed to hardware device path,
832 * to allow IMSM capabilities detection.
833 * Returns:
834 * hardware path to device - if the device is represented via
835 * nvme virtual subsytem
836 * NULL - if the device is not represented via nvme virtual subsytem
837 */
838char *get_nvme_multipath_dev_hw_path(const char *dev_path)
839{
840 DIR *dir;
841 struct dirent *ent;
842 char *rp = NULL;
843
844 if (strncmp(dev_path, NVME_SUBSYS_PATH, strlen(NVME_SUBSYS_PATH)) != 0)
845 return NULL;
846
847 dir = opendir(dev_path);
848 if (!dir)
849 return NULL;
850
851 for (ent = readdir(dir); ent; ent = readdir(dir)) {
852 char buf[strlen(dev_path) + strlen(ent->d_name) + 1];
853
854 /* Check if dir is a controller, ignore namespaces*/
855 if (!(strncmp(ent->d_name, "nvme", 4) == 0) ||
856 (strrchr(ent->d_name, 'n') != &ent->d_name[0]))
857 continue;
858
859 sprintf(buf, "%s/%s", dev_path, ent->d_name);
860 rp = realpath(buf, NULL);
861 break;
862 }
863
864 closedir(dir);
865 return rp;
866}
867
7c798f87
MT
868/* Description: Return part or whole realpath for the dev
869 * Parameters:
870 * dev - the device to be quered
871 * dev_level - level of "/device" entries. It allows to caller to access
872 * virtual or physical devices which are on "path" to quered
873 * one.
874 * buf - optional, must be PATH_MAX size. If set, then will be used.
875 */
876char *devt_to_devpath(dev_t dev, int dev_level, char *buf)
25921536 877{
7c798f87
MT
878 char device[PATH_MAX];
879 char *hw_path;
880 int i;
881 unsigned long device_free_len = sizeof(device) - 1;
882 char dev_str[] = "/device";
883 unsigned long dev_str_len = strlen(dev_str);
884
885 snprintf(device, sizeof(device), "/sys/dev/block/%d:%d", major(dev),
886 minor(dev));
887
888 /* If caller wants block device, return path to it even if it is exposed
889 * via virtual layer.
890 */
891 if (dev_level == 0)
892 return realpath(device, buf);
25921536 893
7c798f87
MT
894 device_free_len -= strlen(device);
895 for (i = 0; i < dev_level; i++) {
896 if (device_free_len < dev_str_len)
897 return NULL;
d835518b 898
7c798f87 899 strncat(device, dev_str, device_free_len);
d835518b 900
7c798f87
MT
901 /* Resolve nvme-subsystem abstraction if needed
902 */
903 device_free_len -= dev_str_len;
904 if (i == 0) {
905 char rp[PATH_MAX];
906
907 if (!realpath(device, rp))
908 return NULL;
909 hw_path = get_nvme_multipath_dev_hw_path(rp);
910 if (hw_path) {
911 strcpy(device, hw_path);
912 device_free_len = sizeof(device) -
913 strlen(device) - 1;
914 free(hw_path);
915 }
916 }
d835518b
BK
917 }
918
7c798f87 919 return realpath(device, buf);
25921536
DW
920}
921
/*
 * diskfd_to_devpath() - devt_to_devpath() for an open file descriptor.
 *
 * Return: the device path for the block device behind @fd, or NULL when
 * fstat() fails, @fd is not a block device, or devt_to_devpath() fails.
 */
char *diskfd_to_devpath(int fd, int dev_level, char *buf)
{
	struct stat st;

	if (fstat(fd, &st) != 0 || !S_ISBLK(st.st_mode))
		return NULL;

	return devt_to_devpath(st.st_rdev, dev_level, buf);
}
936
/*
 * path_attached_to_hba() - check whether a disk path lies below an hba path.
 *
 * Return: 1 when IMSM_TEST_AHCI_DEV or IMSM_TEST_SCU_DEV is set, or when
 * @disk_path starts with @hba_path; 0 otherwise (including NULL arguments).
 */
int path_attached_to_hba(const char *disk_path, const char *hba_path)
{
	/* test modes treat every disk as attached */
	if (check_env("IMSM_TEST_AHCI_DEV") || check_env("IMSM_TEST_SCU_DEV"))
		return 1;

	if (!disk_path || !hba_path)
		return 0;

	dprintf("hba: %s - disk: %s\n", hba_path, disk_path);

	return strncmp(disk_path, hba_path, strlen(hba_path)) == 0;
}
956
/*
 * devt_attached_to_hba() - path_attached_to_hba() for a device number.
 *
 * The disk path is resolved one "/device" level up and freed before
 * returning.
 */
int devt_attached_to_hba(dev_t dev, const char *hba_path)
{
	char *resolved = devt_to_devpath(dev, 1, NULL);
	int attached = path_attached_to_hba(resolved, hba_path);

	/* free(NULL) is a no-op */
	free(resolved);

	return attached;
}
967
/*
 * disk_attached_to_hba() - path_attached_to_hba() for an open descriptor.
 *
 * The disk path is resolved one "/device" level up and freed before
 * returning.
 */
int disk_attached_to_hba(int fd, const char *hba_path)
{
	char *resolved = diskfd_to_devpath(fd, 1, NULL);
	int attached = path_attached_to_hba(resolved, hba_path);

	/* free(NULL) is a no-op */
	free(resolved);

	return attached;
}
60f0f54d
PB
978
979char *vmd_domain_to_controller(struct sys_dev *hba, char *buf)
980{
981 struct dirent *ent;
982 DIR *dir;
983 char path[PATH_MAX];
984
985 if (!hba)
986 return NULL;
987
988 if (hba->type != SYS_DEV_VMD)
989 return NULL;
990
991 dir = opendir("/sys/bus/pci/drivers/vmd");
b9135011
JS
992 if (!dir)
993 return NULL;
60f0f54d 994
b9135011 995 for (ent = readdir(dir); ent; ent = readdir(dir)) {
60f0f54d
PB
996 sprintf(path, "/sys/bus/pci/drivers/vmd/%s/domain/device",
997 ent->d_name);
998
999 if (!realpath(path, buf))
1000 continue;
1001
1002 if (strncmp(buf, hba->path, strlen(buf)) == 0) {
1003 sprintf(path, "/sys/bus/pci/drivers/vmd/%s", ent->d_name);
b9135011 1004 closedir(dir);
7071320a 1005 return realpath(path, buf);
60f0f54d
PB
1006 }
1007 }
b9135011
JS
1008
1009 closedir(dir);
60f0f54d
PB
1010 return NULL;
1011}
8662f92d
MT
1012
1013/* Scan over all controller's namespaces and compare nsid value to verify if
1014 * current one is supported. The routine doesn't check IMSM capabilities for
1015 * namespace. Only one nvme namespace is supported by IMSM.
1016 * Paramteres:
1017 * fd - open descriptor to the nvme namespace
1018 * verbose - error logging level
a8f3cfd5 1019 * Returns:
8662f92d
MT
1020 * 1 - if namespace is supported
1021 * 0 - otherwise
a8f3cfd5 1022 */
8662f92d 1023int imsm_is_nvme_namespace_supported(int fd, int verbose)
a8f3cfd5 1024{
8662f92d
MT
1025 DIR *dir = NULL;
1026 struct dirent *ent;
1027 char cntrl_path[PATH_MAX];
1028 char ns_path[PATH_MAX];
1029 unsigned long long lowest_nsid = ULLONG_MAX;
1030 unsigned long long this_nsid;
1031 int rv = 0;
a8f3cfd5 1032
a8f3cfd5 1033
8662f92d
MT
1034 if (!diskfd_to_devpath(fd, 1, cntrl_path) ||
1035 !diskfd_to_devpath(fd, 0, ns_path)) {
1036 if (verbose)
1037 pr_err("Cannot get device paths\n");
1038 goto abort;
1039 }
a8f3cfd5 1040
a8f3cfd5 1041
8662f92d 1042 if (devpath_to_ll(ns_path, "nsid", &this_nsid)) {
a8f3cfd5 1043 if (verbose)
8662f92d
MT
1044 pr_err("Cannot read nsid value for %s",
1045 basename(ns_path));
1046 goto abort;
a8f3cfd5 1047 }
8662f92d
MT
1048
1049 dir = opendir(cntrl_path);
1050 if (!dir)
1051 goto abort;
1052
1053 /* The lowest nvme namespace is supported */
1054 for (ent = readdir(dir); ent; ent = readdir(dir)) {
1055 unsigned long long curr_nsid;
1056 char curr_ns_path[PATH_MAX + 256];
1057
1058 if (!strstr(ent->d_name, "nvme"))
1059 continue;
1060
1061 snprintf(curr_ns_path, sizeof(curr_ns_path), "%s/%s",
1062 cntrl_path, ent->d_name);
1063
1064 if (devpath_to_ll(curr_ns_path, "nsid", &curr_nsid))
1065 goto abort;
1066
1067 if (lowest_nsid > curr_nsid)
1068 lowest_nsid = curr_nsid;
1069 }
1070
1071 if (this_nsid == lowest_nsid)
1072 rv = 1;
1073 else if (verbose)
1074 pr_err("IMSM is supported on the lowest NVMe namespace\n");
1075
1076abort:
1077 if (dir)
1078 closedir(dir);
1079
1080 return rv;
a8f3cfd5 1081}
d835518b
BK
1082
1083/* Verify if multipath is supported by NVMe controller
1084 * Returns:
1085 * 0 - not supported
1086 * 1 - supported
1087 */
1088int is_multipath_nvme(int disk_fd)
1089{
d835518b 1090 char ns_path[PATH_MAX];
d835518b 1091
7c798f87 1092 if (!diskfd_to_devpath(disk_fd, 0, ns_path))
d835518b
BK
1093 return 0;
1094
1095 if (strncmp(ns_path, NVME_SUBSYS_PATH, strlen(NVME_SUBSYS_PATH)) == 0)
1096 return 1;
1097
1098 return 0;
1099}