]> git.ipfire.org Git - thirdparty/mdadm.git/blob - platform-intel.c
IncRemove: Set "auto-read" only after successful excl open.
[thirdparty/mdadm.git] / platform-intel.c
1 /*
2 * Intel(R) Matrix Storage Manager hardware and firmware support routines
3 *
4 * Copyright (C) 2008 Intel Corporation
5 *
6 * This program is free software; you can redistribute it and/or modify it
7 * under the terms and conditions of the GNU General Public License,
8 * version 2, as published by the Free Software Foundation.
9 *
10 * This program is distributed in the hope it will be useful, but WITHOUT
11 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
13 * more details.
14 *
15 * You should have received a copy of the GNU General Public License along with
16 * this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
18 */
19 #include "mdadm.h"
20 #include "platform-intel.h"
21 #include "probe_roms.h"
22 #include <stdio.h>
23 #include <stdlib.h>
24 #include <string.h>
25 #include <unistd.h>
26 #include <dirent.h>
27 #include <fcntl.h>
28 #include <sys/mman.h>
29 #include <sys/types.h>
30 #include <sys/stat.h>
31 #include <limits.h>
32
/* Read the sysfs attribute 'entry' found under 'dev_path' into *val. */
static int devpath_to_ll(const char *dev_path,
			 const char *entry,
			 unsigned long long *val);

/* Read the 'vendor' attribute found under 'dev_path'. */
static __u16 devpath_to_vendor(const char *dev_path);
37
38 static void free_sys_dev(struct sys_dev **list)
39 {
40 while (*list) {
41 struct sys_dev *next = (*list)->next;
42
43 if ((*list)->path)
44 free((*list)->path);
45 free(*list);
46 *list = next;
47 }
48 }
49
50 struct sys_dev *find_driver_devices(const char *bus, const char *driver)
51 {
52 /* search sysfs for devices driven by 'driver' */
53 char path[292];
54 char link[256];
55 char *c;
56 DIR *driver_dir;
57 struct dirent *de;
58 struct sys_dev *head = NULL;
59 struct sys_dev *list = NULL;
60 enum sys_dev_type type;
61 unsigned long long dev_id;
62 unsigned long long class;
63
64 if (strcmp(driver, "isci") == 0)
65 type = SYS_DEV_SAS;
66 else if (strcmp(driver, "ahci") == 0)
67 type = SYS_DEV_SATA;
68 else if (strcmp(driver, "nvme") == 0)
69 type = SYS_DEV_NVME;
70 else
71 type = SYS_DEV_UNKNOWN;
72
73 sprintf(path, "/sys/bus/%s/drivers/%s", bus, driver);
74 driver_dir = opendir(path);
75 if (!driver_dir)
76 return NULL;
77 for (de = readdir(driver_dir); de; de = readdir(driver_dir)) {
78 int n;
79
80 /* is 'de' a device? check that the 'subsystem' link exists and
81 * that its target matches 'bus'
82 */
83 sprintf(path, "/sys/bus/%s/drivers/%s/%s/subsystem",
84 bus, driver, de->d_name);
85 n = readlink(path, link, sizeof(link));
86 if (n < 0 || n >= (int)sizeof(link))
87 continue;
88 link[n] = '\0';
89 c = strrchr(link, '/');
90 if (!c)
91 continue;
92 if (strncmp(bus, c+1, strlen(bus)) != 0)
93 continue;
94
95 sprintf(path, "/sys/bus/%s/drivers/%s/%s",
96 bus, driver, de->d_name);
97
98 /* if it's not Intel device skip it. */
99 if (devpath_to_vendor(path) != 0x8086)
100 continue;
101
102 if (devpath_to_ll(path, "device", &dev_id) != 0)
103 continue;
104
105 if (devpath_to_ll(path, "class", &class) != 0)
106 continue;
107
108 /* start / add list entry */
109 if (!head) {
110 head = xmalloc(sizeof(*head));
111 list = head;
112 } else {
113 list->next = xmalloc(sizeof(*head));
114 list = list->next;
115 }
116
117 if (!list) {
118 free_sys_dev(&head);
119 break;
120 }
121
122 list->dev_id = (__u16) dev_id;
123 list->class = (__u32) class;
124 list->type = type;
125 list->path = realpath(path, NULL);
126 list->next = NULL;
127 if ((list->pci_id = strrchr(list->path, '/')) != NULL)
128 list->pci_id++;
129 }
130 closedir(driver_dir);
131 return head;
132 }
133
/* Device list cached by find_intel_devices() (static storage: starts NULL) */
static struct sys_dev *intel_devices;
/* time() at which the cached list was last rebuilt (starts at 0) */
static time_t valid_time;
136
137 struct sys_dev *device_by_id(__u16 device_id)
138 {
139 struct sys_dev *iter;
140
141 for (iter = intel_devices; iter != NULL; iter = iter->next)
142 if (iter->dev_id == device_id)
143 return iter;
144 return NULL;
145 }
146
/*
 * Open "<dev_path>/<entry>" and parse it with sysfs_fd_get_ll() into *val.
 *
 * Returns -1 when the attribute cannot be opened, otherwise whatever
 * sysfs_fd_get_ll() returned.
 */
static int devpath_to_ll(const char *dev_path, const char *entry, unsigned long long *val)
{
	/* both components, the '/' separator and the terminating NUL */
	char attr_path[strlen(dev_path) + strlen(entry) + 2];
	int attr_fd;
	int rc;

	sprintf(attr_path, "%s/%s", dev_path, entry);

	attr_fd = open(attr_path, O_RDONLY);
	if (attr_fd < 0)
		return -1;

	rc = sysfs_fd_get_ll(attr_fd, val);
	close(attr_fd);

	return rc;
}
162
/*
 * Read "<dev_path>/vendor" and return the id parsed from it as hex.
 *
 * Returns 0xffff when the attribute cannot be opened or when fewer than
 * seven bytes (e.g. "0x8086\n") could be read from it.
 */
static __u16 devpath_to_vendor(const char *dev_path)
{
	static const char attr[] = "/vendor";
	/* sizeof(attr) already accounts for the terminating NUL */
	char attr_path[strlen(dev_path) + sizeof(attr)];
	char text[7];
	__u16 vendor_id = 0xffff;
	int attr_fd;

	strcpy(attr_path, dev_path);
	strcat(attr_path, attr);

	attr_fd = open(attr_path, O_RDONLY);
	if (attr_fd < 0)
		return vendor_id;

	if (read(attr_fd, text, sizeof(text)) == (ssize_t)sizeof(text)) {
		/* the seventh byte is overwritten to terminate the string */
		text[sizeof(text) - 1] = '\0';
		vendor_id = strtoul(text, NULL, 16);
	}
	close(attr_fd);

	return vendor_id;
}
186
187 struct sys_dev *find_intel_devices(void)
188 {
189 struct sys_dev *ahci, *isci, *nvme;
190
191 if (valid_time > time(0) - 10)
192 return intel_devices;
193
194 if (intel_devices)
195 free_sys_dev(&intel_devices);
196
197 isci = find_driver_devices("pci", "isci");
198 ahci = find_driver_devices("pci", "ahci");
199 nvme = find_driver_devices("pci", "nvme");
200
201 if (!isci && !ahci) {
202 ahci = nvme;
203 } else if (!ahci) {
204 ahci = isci;
205 struct sys_dev *elem = ahci;
206 while (elem->next)
207 elem = elem->next;
208 elem->next = nvme;
209 } else {
210 struct sys_dev *elem = ahci;
211 while (elem->next)
212 elem = elem->next;
213 elem->next = isci;
214 while (elem->next)
215 elem = elem->next;
216 elem->next = nvme;
217 }
218 intel_devices = ahci;
219 valid_time = time(0);
220 return intel_devices;
221 }
222
/*
 * PCI Expansion ROM Data Structure Format
 *
 * Declared packed, so the members are laid out back to back without
 * padding.
 */
struct pciExpDataStructFormat {
	__u8  ver[4];
	__u16 vendorID;
	__u16 deviceID;
	__u16 devListOffset;
	__u16 pciDataStructLen;
	__u8  pciDataStructRev;
} __attribute__ ((packed));
233
/* Head of the list of capability entries; add_orom() appends to it */
struct orom_entry *orom_entries;
235
236 const struct imsm_orom *get_orom_by_device_id(__u16 dev_id)
237 {
238 struct orom_entry *entry;
239 struct devid_list *devid;
240
241 for (entry = orom_entries; entry; entry = entry->next) {
242 for (devid = entry->devid_list; devid; devid = devid->next) {
243 if (devid->devid == dev_id)
244 return &entry->orom;
245 }
246 }
247
248 return NULL;
249 }
250
251 static struct orom_entry *add_orom(const struct imsm_orom *orom)
252 {
253 struct orom_entry *list;
254 struct orom_entry *prev = NULL;
255
256 for (list = orom_entries; list; prev = list, list = list->next)
257 ;
258
259 list = xmalloc(sizeof(struct orom_entry));
260 list->orom = *orom;
261 list->devid_list = NULL;
262 list->next = NULL;
263
264 if (prev == NULL)
265 orom_entries = list;
266 else
267 prev->next = list;
268
269 return list;
270 }
271
272 static void add_orom_device_id(struct orom_entry *entry, __u16 dev_id)
273 {
274 struct devid_list *list;
275 struct devid_list *prev = NULL;
276
277 for (list = entry->devid_list; list; prev = list, list = list->next) {
278 if (list->devid == dev_id)
279 return;
280 }
281 list = xmalloc(sizeof(struct devid_list));
282 list->devid = dev_id;
283 list->next = NULL;
284
285 if (prev == NULL)
286 entry->devid_list = list;
287 else
288 prev->next = list;
289 }
290
291 static int scan(const void *start, const void *end, const void *data)
292 {
293 int offset;
294 const struct imsm_orom *imsm_mem = NULL;
295 int len = (end - start);
296 struct pciExpDataStructFormat *ptr= (struct pciExpDataStructFormat *)data;
297
298 if (data + 0x18 > end) {
299 dprintf("cannot find pciExpDataStruct \n");
300 return 0;
301 }
302
303 dprintf("ptr->vendorID: %lx __le16_to_cpu(ptr->deviceID): %lx \n",
304 (ulong) __le16_to_cpu(ptr->vendorID),
305 (ulong) __le16_to_cpu(ptr->deviceID));
306
307 if (__le16_to_cpu(ptr->vendorID) != 0x8086)
308 return 0;
309
310 for (offset = 0; offset < len; offset += 4) {
311 const void *mem = start + offset;
312
313 if ((memcmp(mem, IMSM_OROM_SIGNATURE, 4) == 0)) {
314 imsm_mem = mem;
315 break;
316 }
317 }
318
319 if (!imsm_mem)
320 return 0;
321
322 struct orom_entry *orom = add_orom(imsm_mem);
323
324 /* only PciDataStructure with revision 3 and above supports devices list. */
325 if (ptr->pciDataStructRev >= 3 && ptr->devListOffset) {
326 const __u16 *dev_list = (void *)ptr + ptr->devListOffset;
327 int i;
328
329 for (i = 0; dev_list[i] != 0; i++)
330 add_orom_device_id(orom, dev_list[i]);
331 } else {
332 add_orom_device_id(orom, __le16_to_cpu(ptr->deviceID));
333 }
334
335 return 0;
336 }
337
338 const struct imsm_orom *imsm_platform_test(struct sys_dev *hba)
339 {
340 struct imsm_orom orom = {
341 .signature = IMSM_OROM_SIGNATURE,
342 .rlc = IMSM_OROM_RLC_RAID0 | IMSM_OROM_RLC_RAID1 |
343 IMSM_OROM_RLC_RAID10 | IMSM_OROM_RLC_RAID5,
344 .sss = IMSM_OROM_SSS_4kB | IMSM_OROM_SSS_8kB |
345 IMSM_OROM_SSS_16kB | IMSM_OROM_SSS_32kB |
346 IMSM_OROM_SSS_64kB | IMSM_OROM_SSS_128kB |
347 IMSM_OROM_SSS_256kB | IMSM_OROM_SSS_512kB |
348 IMSM_OROM_SSS_1MB | IMSM_OROM_SSS_2MB,
349 .dpa = IMSM_OROM_DISKS_PER_ARRAY,
350 .tds = IMSM_OROM_TOTAL_DISKS,
351 .vpa = IMSM_OROM_VOLUMES_PER_ARRAY,
352 .vphba = IMSM_OROM_VOLUMES_PER_HBA
353 };
354 orom.attr = orom.rlc | IMSM_OROM_ATTR_ChecksumVerify;
355
356 if (check_env("IMSM_TEST_OROM_NORAID5")) {
357 orom.rlc = IMSM_OROM_RLC_RAID0 | IMSM_OROM_RLC_RAID1 |
358 IMSM_OROM_RLC_RAID10;
359 }
360 if (check_env("IMSM_TEST_AHCI_EFI_NORAID5") && (hba->type == SYS_DEV_SAS)) {
361 orom.rlc = IMSM_OROM_RLC_RAID0 | IMSM_OROM_RLC_RAID1 |
362 IMSM_OROM_RLC_RAID10;
363 }
364 if (check_env("IMSM_TEST_SCU_EFI_NORAID5") && (hba->type == SYS_DEV_SATA)) {
365 orom.rlc = IMSM_OROM_RLC_RAID0 | IMSM_OROM_RLC_RAID1 |
366 IMSM_OROM_RLC_RAID10;
367 }
368
369 struct orom_entry *ret = add_orom(&orom);
370
371 add_orom_device_id(ret, hba->dev_id);
372
373 return &ret->orom;
374 }
375
376 static const struct imsm_orom *find_imsm_hba_orom(struct sys_dev *hba)
377 {
378 unsigned long align;
379
380 if (check_env("IMSM_TEST_OROM"))
381 return imsm_platform_test(hba);
382
383 /* return empty OROM capabilities in EFI test mode */
384 if (check_env("IMSM_TEST_AHCI_EFI") || check_env("IMSM_TEST_SCU_EFI"))
385 return NULL;
386
387 find_intel_devices();
388
389 if (intel_devices == NULL)
390 return NULL;
391
392 /* scan option-rom memory looking for an imsm signature */
393 if (check_env("IMSM_SAFE_OROM_SCAN"))
394 align = 2048;
395 else
396 align = 512;
397 if (probe_roms_init(align) != 0)
398 return NULL;
399 probe_roms();
400 /* ignore return value - True is returned if both adapater roms are found */
401 scan_adapter_roms(scan);
402 probe_roms_exit();
403
404 return get_orom_by_device_id(hba->dev_id);
405 }
406
/* Buffer size for a GUID string, according to the GUID format
 * "xxxxxxxx-xxxx-xxxx-xxxx-xxxxxxxxxxxx": 36 characters plus the NUL
 */
#define GUID_STR_MAX	37

/* Build a struct efi_guid: a, b and c are stored least significant byte
 * first, d0..d7 are stored as given.
 */
#define EFI_GUID(a, b, c, d0, d1, d2, d3, d4, d5, d6, d7) \
((struct efi_guid) \
{{ (a) & 0xff, ((a) >> 8) & 0xff, ((a) >> 16) & 0xff, ((a) >> 24) & 0xff, \
  (b) & 0xff, ((b) >> 8) & 0xff, \
  (c) & 0xff, ((c) >> 8) & 0xff, \
  (d0), (d1), (d2), (d3), (d4), (d5), (d6), (d7) }})

/* sysfs locations of the two EFI variable interfaces */
#define SYS_EFI_VAR_PATH	"/sys/firmware/efi/vars"
#define SYS_EFIVARS_PATH	"/sys/firmware/efi/efivars"

/* names of the EFI variables read by find_imsm_efi() */
#define SCU_PROP		"RstScuV"
#define AHCI_PROP		"RstSataV"
#define AHCI_SSATA_PROP		"RstsSatV"
#define AHCI_CSATA_PROP		"RstCSatV"

/* vendor GUID under which those variables are looked up */
#define VENDOR_GUID \
	EFI_GUID(0x193dfefa, 0xa445, 0x4302, 0x99, 0xd8, 0xef, 0x3a, 0xad, 0x1a, 0x04, 0xc6)

#define PCI_CLASS_RAID_CNTRL	0x010400
428
429 static int read_efi_var(void *buffer, ssize_t buf_size, char *variable_name, struct efi_guid guid)
430 {
431 char path[PATH_MAX];
432 char buf[GUID_STR_MAX];
433 int fd;
434 ssize_t n;
435
436 snprintf(path, PATH_MAX, "%s/%s-%s", SYS_EFIVARS_PATH, variable_name, guid_str(buf, guid));
437
438 fd = open(path, O_RDONLY);
439 if (fd < 0)
440 return 1;
441
442 /* read the variable attributes and ignore it */
443 n = read(fd, buf, sizeof(__u32));
444 if (n < 0) {
445 close(fd);
446 return 1;
447 }
448
449 /* read the variable data */
450 n = read(fd, buffer, buf_size);
451 close(fd);
452 if (n < buf_size)
453 return 1;
454
455 return 0;
456 }
457
458 static int read_efi_variable(void *buffer, ssize_t buf_size, char *variable_name, struct efi_guid guid)
459 {
460 char path[PATH_MAX];
461 char buf[GUID_STR_MAX];
462 int dfd;
463 ssize_t n, var_data_len;
464
465 /* Try to read the variable using the new efivarfs interface first.
466 * If that fails, fall back to the old sysfs-efivars interface. */
467 if (!read_efi_var(buffer, buf_size, variable_name, guid))
468 return 0;
469
470 snprintf(path, PATH_MAX, "%s/%s-%s/size", SYS_EFI_VAR_PATH, variable_name, guid_str(buf, guid));
471
472 dprintf("EFI VAR: path=%s\n", path);
473 /* get size of variable data */
474 dfd = open(path, O_RDONLY);
475 if (dfd < 0)
476 return 1;
477
478 n = read(dfd, &buf, sizeof(buf));
479 close(dfd);
480 if (n < 0)
481 return 1;
482 buf[n] = '\0';
483
484 errno = 0;
485 var_data_len = strtoul(buf, NULL, 16);
486 if ((errno == ERANGE && (var_data_len == LONG_MAX))
487 || (errno != 0 && var_data_len == 0))
488 return 1;
489
490 /* get data */
491 snprintf(path, PATH_MAX, "%s/%s-%s/data", SYS_EFI_VAR_PATH, variable_name, guid_str(buf, guid));
492
493 dprintf("EFI VAR: path=%s\n", path);
494 dfd = open(path, O_RDONLY);
495 if (dfd < 0)
496 return 1;
497
498 n = read(dfd, buffer, buf_size);
499 close(dfd);
500 if (n != var_data_len || n < buf_size) {
501 return 1;
502 }
503
504 return 0;
505 }
506
507 const struct imsm_orom *find_imsm_efi(struct sys_dev *hba)
508 {
509 struct imsm_orom orom;
510 struct orom_entry *ret;
511 int err;
512
513 if (check_env("IMSM_TEST_AHCI_EFI") || check_env("IMSM_TEST_SCU_EFI"))
514 return imsm_platform_test(hba);
515
516 /* OROM test is set, return that there is no EFI capabilities */
517 if (check_env("IMSM_TEST_OROM"))
518 return NULL;
519
520 if (hba->type == SYS_DEV_SATA && hba->class != PCI_CLASS_RAID_CNTRL)
521 return NULL;
522
523 err = read_efi_variable(&orom, sizeof(orom), hba->type == SYS_DEV_SAS ? SCU_PROP : AHCI_PROP, VENDOR_GUID);
524
525 /* try to read variable for second AHCI controller */
526 if (err && hba->type == SYS_DEV_SATA)
527 err = read_efi_variable(&orom, sizeof(orom), AHCI_SSATA_PROP, VENDOR_GUID);
528
529 /* try to read variable for combined AHCI controllers */
530 if (err && hba->type == SYS_DEV_SATA) {
531 static struct orom_entry *csata;
532
533 err = read_efi_variable(&orom, sizeof(orom), AHCI_CSATA_PROP, VENDOR_GUID);
534 if (!err) {
535 if (!csata)
536 csata = add_orom(&orom);
537 add_orom_device_id(csata, hba->dev_id);
538 return &csata->orom;
539 }
540 }
541
542 if (err)
543 return NULL;
544
545 ret = add_orom(&orom);
546 add_orom_device_id(ret, hba->dev_id);
547
548 return &ret->orom;
549 }
550
551 const struct imsm_orom *find_imsm_nvme(struct sys_dev *hba)
552 {
553 static struct orom_entry *nvme_orom;
554
555 if (hba->type != SYS_DEV_NVME)
556 return NULL;
557
558 if (!nvme_orom) {
559 struct imsm_orom nvme_orom_compat = {
560 .signature = IMSM_NVME_OROM_COMPAT_SIGNATURE,
561 .rlc = IMSM_OROM_RLC_RAID0 | IMSM_OROM_RLC_RAID1 |
562 IMSM_OROM_RLC_RAID10 | IMSM_OROM_RLC_RAID5,
563 .sss = IMSM_OROM_SSS_4kB | IMSM_OROM_SSS_8kB |
564 IMSM_OROM_SSS_16kB | IMSM_OROM_SSS_32kB |
565 IMSM_OROM_SSS_64kB | IMSM_OROM_SSS_128kB,
566 .dpa = IMSM_OROM_DISKS_PER_ARRAY_NVME,
567 .tds = IMSM_OROM_TOTAL_DISKS_NVME,
568 .vpa = IMSM_OROM_VOLUMES_PER_ARRAY,
569 .vphba = IMSM_OROM_TOTAL_DISKS_NVME / 2 * IMSM_OROM_VOLUMES_PER_ARRAY,
570 .attr = IMSM_OROM_ATTR_2TB | IMSM_OROM_ATTR_2TB_DISK,
571 .driver_features = IMSM_OROM_CAPABILITIES_EnterpriseSystem
572 };
573 nvme_orom = add_orom(&nvme_orom_compat);
574 }
575 add_orom_device_id(nvme_orom, hba->dev_id);
576 return &nvme_orom->orom;
577 }
578
579 const struct imsm_orom *find_imsm_capability(struct sys_dev *hba)
580 {
581 const struct imsm_orom *cap = get_orom_by_device_id(hba->dev_id);
582
583 if (cap)
584 return cap;
585
586 if (hba->type == SYS_DEV_NVME)
587 return find_imsm_nvme(hba);
588 if ((cap = find_imsm_efi(hba)) != NULL)
589 return cap;
590 if ((cap = find_imsm_hba_orom(hba)) != NULL)
591 return cap;
592
593 return NULL;
594 }
595
/*
 * Return the canonical path of "/sys/dev/block/<major>:<minor>/device"
 * for 'dev', as produced by realpath(path, NULL): a malloc'ed string the
 * caller must free, or NULL when the path cannot be resolved.
 */
char *devt_to_devpath(dev_t dev)
{
	/* 46 bytes hold the fixed text plus two full-width "%d" fields */
	char sysfs_link[46];

	snprintf(sysfs_link, sizeof(sysfs_link), "/sys/dev/block/%d:%d/device",
		 major(dev), minor(dev));

	return realpath(sysfs_link, NULL);
}
603
/*
 * Return the device path for the block device open on 'fd', as given by
 * devt_to_devpath().  Returns NULL when fstat() fails or 'fd' does not
 * refer to a block device.
 */
char *diskfd_to_devpath(int fd)
{
	struct stat info;

	if (fstat(fd, &info) == 0 && S_ISBLK(info.st_mode))
		return devt_to_devpath(info.st_rdev);

	return NULL;
}
618
/*
 * Tell whether 'disk_path' lies below 'hba_path', i.e. whether
 * 'disk_path' begins with 'hba_path'.
 *
 * Returns 1 unconditionally when IMSM_TEST_AHCI_DEV or IMSM_TEST_SCU_DEV
 * is set, 0 when either path is NULL, and otherwise 1 or 0 depending on
 * the prefix comparison.
 */
int path_attached_to_hba(const char *disk_path, const char *hba_path)
{
	if (check_env("IMSM_TEST_AHCI_DEV") || check_env("IMSM_TEST_SCU_DEV"))
		return 1;

	if (!disk_path || !hba_path)
		return 0;

	dprintf("hba: %s - disk: %s\n", hba_path, disk_path);

	return strncmp(disk_path, hba_path, strlen(hba_path)) == 0;
}
638
/*
 * Tell whether the block device 'dev' is attached to the controller at
 * 'hba_path'; see path_attached_to_hba() for the return value.
 */
int devt_attached_to_hba(dev_t dev, const char *hba_path)
{
	char *resolved = devt_to_devpath(dev);
	int attached = path_attached_to_hba(resolved, hba_path);

	/* free(NULL) is a no-op, so a failed lookup needs no special case */
	free(resolved);

	return attached;
}
649
/*
 * Tell whether the disk open on 'fd' is attached to the controller at
 * 'hba_path'; see path_attached_to_hba() for the return value.
 */
int disk_attached_to_hba(int fd, const char *hba_path)
{
	char *resolved = diskfd_to_devpath(fd);
	int attached = path_attached_to_hba(resolved, hba_path);

	/* free(NULL) is a no-op, so a failed lookup needs no special case */
	free(resolved);

	return attached;
}