2 * Hypervisor filesystem for Linux on s390. Diag 204 and 224
5 * Copyright IBM Corp. 2006, 2008
9 #define KMSG_COMPONENT "hypfs"
10 #define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
12 #include <linux/types.h>
13 #include <linux/errno.h>
14 #include <linux/slab.h>
15 #include <linux/string.h>
16 #include <linux/vmalloc.h>
18 #include <asm/ebcdic.h>
21 #define LPAR_NAME_LEN 8 /* lpar name len in diag 204 data */
22 #define CPU_NAME_LEN 16 /* type name len of cpus in diag224 name table */
23 #define TMP_SIZE 64 /* size of temporary buffers */
25 #define DBFS_D204_HDR_VERSION 0
27 /* diag 204 subcodes */
35 /* The two available diag 204 data formats */
41 /* bit is set in flags when physical cpu info is included in diag 204 data */
42 #define LPAR_PHYS_FLG 0x80
44 static char *diag224_cpu_names; /* diag 224 name table */
45 static enum diag204_sc diag204_store_sc; /* used subcode for store */
46 static enum diag204_format diag204_info_type; /* used diag 204 data format */
48 static void *diag204_buf; /* 4K aligned buffer for diag204 data */
49 static void *diag204_buf_vmalloc; /* vmalloc pointer for diag204 data */
50 static int diag204_buf_pages; /* number of pages for diag204 data */
52 static struct dentry *dbfs_d204_file;
55 * DIAG 204 data structures and member access functions.
57 * Since we have two different diag 204 data formats for old and new s390
58 * machines, we do not access the structs directly, but use getter functions for
59 * each struct member instead. This should make the code more readable.
62 /* Time information block */
71 } __attribute__ ((packed));
73 struct x_info_blk_hdr {
82 } __attribute__ ((packed));
84 static inline int info_blk_hdr__size(enum diag204_format type)
86 if (type == INFO_SIMPLE)
87 return sizeof(struct info_blk_hdr);
89 return sizeof(struct x_info_blk_hdr);
92 static inline __u8 info_blk_hdr__npar(enum diag204_format type, void *hdr)
94 if (type == INFO_SIMPLE)
95 return ((struct info_blk_hdr *)hdr)->npar;
97 return ((struct x_info_blk_hdr *)hdr)->npar;
100 static inline __u8 info_blk_hdr__flags(enum diag204_format type, void *hdr)
102 if (type == INFO_SIMPLE)
103 return ((struct info_blk_hdr *)hdr)->flags;
105 return ((struct x_info_blk_hdr *)hdr)->flags;
108 static inline __u16 info_blk_hdr__pcpus(enum diag204_format type, void *hdr)
110 if (type == INFO_SIMPLE)
111 return ((struct info_blk_hdr *)hdr)->phys_cpus;
113 return ((struct x_info_blk_hdr *)hdr)->phys_cpus;
116 /* Partition header */
122 char part_name[LPAR_NAME_LEN];
123 } __attribute__ ((packed));
131 char part_name[LPAR_NAME_LEN];
141 } __attribute__ ((packed));
143 static inline int part_hdr__size(enum diag204_format type)
145 if (type == INFO_SIMPLE)
146 return sizeof(struct part_hdr);
148 return sizeof(struct x_part_hdr);
151 static inline __u8 part_hdr__rcpus(enum diag204_format type, void *hdr)
153 if (type == INFO_SIMPLE)
154 return ((struct part_hdr *)hdr)->cpus;
156 return ((struct x_part_hdr *)hdr)->rcpus;
159 static inline void part_hdr__part_name(enum diag204_format type, void *hdr,
162 if (type == INFO_SIMPLE)
163 memcpy(name, ((struct part_hdr *)hdr)->part_name,
166 memcpy(name, ((struct x_part_hdr *)hdr)->part_name,
168 EBCASC(name, LPAR_NAME_LEN);
169 name[LPAR_NAME_LEN] = 0;
181 } __attribute__ ((packed));
200 } __attribute__ ((packed));
204 static inline int cpu_info__size(enum diag204_format type)
206 if (type == INFO_SIMPLE)
207 return sizeof(struct cpu_info);
209 return sizeof(struct x_cpu_info);
212 static inline __u8 cpu_info__ctidx(enum diag204_format type, void *hdr)
214 if (type == INFO_SIMPLE)
215 return ((struct cpu_info *)hdr)->ctidx;
217 return ((struct x_cpu_info *)hdr)->ctidx;
220 static inline __u16 cpu_info__cpu_addr(enum diag204_format type, void *hdr)
222 if (type == INFO_SIMPLE)
223 return ((struct cpu_info *)hdr)->cpu_addr;
225 return ((struct x_cpu_info *)hdr)->cpu_addr;
228 static inline __u64 cpu_info__acc_time(enum diag204_format type, void *hdr)
230 if (type == INFO_SIMPLE)
231 return ((struct cpu_info *)hdr)->acc_time;
233 return ((struct x_cpu_info *)hdr)->acc_time;
236 static inline __u64 cpu_info__lp_time(enum diag204_format type, void *hdr)
238 if (type == INFO_SIMPLE)
239 return ((struct cpu_info *)hdr)->lp_time;
241 return ((struct x_cpu_info *)hdr)->lp_time;
244 static inline __u64 cpu_info__online_time(enum diag204_format type, void *hdr)
246 if (type == INFO_SIMPLE)
247 return 0; /* online_time not available in simple info */
249 return ((struct x_cpu_info *)hdr)->online_time;
252 /* Physical header */
259 } __attribute__ ((packed));
267 } __attribute__ ((packed));
269 static inline int phys_hdr__size(enum diag204_format type)
271 if (type == INFO_SIMPLE)
272 return sizeof(struct phys_hdr);
274 return sizeof(struct x_phys_hdr);
277 static inline __u8 phys_hdr__cpus(enum diag204_format type, void *hdr)
279 if (type == INFO_SIMPLE)
280 return ((struct phys_hdr *)hdr)->cpus;
282 return ((struct x_phys_hdr *)hdr)->cpus;
285 /* Physical CPU info block */
294 } __attribute__ ((packed));
303 } __attribute__ ((packed));
305 static inline int phys_cpu__size(enum diag204_format type)
307 if (type == INFO_SIMPLE)
308 return sizeof(struct phys_cpu);
310 return sizeof(struct x_phys_cpu);
313 static inline __u16 phys_cpu__cpu_addr(enum diag204_format type, void *hdr)
315 if (type == INFO_SIMPLE)
316 return ((struct phys_cpu *)hdr)->cpu_addr;
318 return ((struct x_phys_cpu *)hdr)->cpu_addr;
321 static inline __u64 phys_cpu__mgm_time(enum diag204_format type, void *hdr)
323 if (type == INFO_SIMPLE)
324 return ((struct phys_cpu *)hdr)->mgm_time;
326 return ((struct x_phys_cpu *)hdr)->mgm_time;
329 static inline __u64 phys_cpu__ctidx(enum diag204_format type, void *hdr)
331 if (type == INFO_SIMPLE)
332 return ((struct phys_cpu *)hdr)->ctidx;
334 return ((struct x_phys_cpu *)hdr)->ctidx;
337 /* Diagnose 204 functions */
339 static int diag204(unsigned long subcode, unsigned long size, void *addr)
341 register unsigned long _subcode asm("0") = subcode;
342 register unsigned long _size asm("1") = size;
345 " diag %2,%0,0x204\n"
348 : "+d" (_subcode), "+d" (_size) : "d" (addr) : "memory");
355 * For the old diag subcode 4 with simple data format we have to use real
356 * memory. If we use subcode 6 or 7 with extended data format, we can (and
357 * should) use vmalloc, since we need a lot of memory in that case. Currently
361 static void diag204_free_buffer(void)
365 if (diag204_buf_vmalloc) {
366 vfree(diag204_buf_vmalloc);
367 diag204_buf_vmalloc = NULL;
369 free_pages((unsigned long) diag204_buf, 0);
374 static void *page_align_ptr(void *ptr)
376 return (void *) PAGE_ALIGN((unsigned long) ptr);
379 static void *diag204_alloc_vbuf(int pages)
381 /* The buffer has to be page aligned! */
382 diag204_buf_vmalloc = vmalloc(PAGE_SIZE * (pages + 1));
383 if (!diag204_buf_vmalloc)
384 return ERR_PTR(-ENOMEM);
385 diag204_buf = page_align_ptr(diag204_buf_vmalloc);
386 diag204_buf_pages = pages;
390 static void *diag204_alloc_rbuf(void)
392 diag204_buf = (void*)__get_free_pages(GFP_KERNEL,0);
394 return ERR_PTR(-ENOMEM);
395 diag204_buf_pages = 1;
399 static void *diag204_get_buffer(enum diag204_format fmt, int *pages)
402 *pages = diag204_buf_pages;
405 if (fmt == INFO_SIMPLE) {
407 return diag204_alloc_rbuf();
408 } else {/* INFO_EXT */
409 *pages = diag204((unsigned long)SUBC_RSI |
410 (unsigned long)INFO_EXT, 0, NULL);
412 return ERR_PTR(-ENOSYS);
414 return diag204_alloc_vbuf(*pages);
419 * diag204_probe() has to find out which type of diagnose 204 implementation
420 * we have on our machine. Currently there are three possible scenarios:
421 * - subcode 4 + simple data format (only one page)
422 * - subcode 4-6 + extended data format
423 * - subcode 4-7 + extended data format
425 * Subcode 5 is used to retrieve the size of the data provided by subcodes
426 * 6 and 7. Subcode 7 basically has the same function as subcode 6. In addition
427 * to subcode 6, it also provides information about secondary cpus.
428 * In order to get as much information as possible, we first try
429 * subcode 7, then 6 and if both fail, we use subcode 4.
432 static int diag204_probe(void)
437 buf = diag204_get_buffer(INFO_EXT, &pages);
439 if (diag204((unsigned long)SUBC_STIB7 |
440 (unsigned long)INFO_EXT, pages, buf) >= 0) {
441 diag204_store_sc = SUBC_STIB7;
442 diag204_info_type = INFO_EXT;
445 if (diag204((unsigned long)SUBC_STIB6 |
446 (unsigned long)INFO_EXT, pages, buf) >= 0) {
447 diag204_store_sc = SUBC_STIB6;
448 diag204_info_type = INFO_EXT;
451 diag204_free_buffer();
454 /* subcodes 6 and 7 failed, now try subcode 4 */
456 buf = diag204_get_buffer(INFO_SIMPLE, &pages);
461 if (diag204((unsigned long)SUBC_STIB4 |
462 (unsigned long)INFO_SIMPLE, pages, buf) >= 0) {
463 diag204_store_sc = SUBC_STIB4;
464 diag204_info_type = INFO_SIMPLE;
473 diag204_free_buffer();
478 static int diag204_do_store(void *buf, int pages)
482 rc = diag204((unsigned long) diag204_store_sc |
483 (unsigned long) diag204_info_type, pages, buf);
484 return rc < 0 ? -ENOSYS : 0;
487 static void *diag204_store(void)
492 buf = diag204_get_buffer(diag204_info_type, &pages);
495 rc = diag204_do_store(buf, pages);
502 /* Diagnose 224 functions */
504 static int diag224(void *ptr)
506 int rc = -EOPNOTSUPP;
509 " diag %1,%2,0x224\n"
513 : "+d" (rc) :"d" (0), "d" (ptr) : "memory");
517 static int diag224_get_name_table(void)
519 /* memory must be below 2GB */
520 diag224_cpu_names = kmalloc(PAGE_SIZE, GFP_KERNEL | GFP_DMA);
521 if (!diag224_cpu_names)
523 if (diag224(diag224_cpu_names)) {
524 kfree(diag224_cpu_names);
527 EBCASC(diag224_cpu_names + 16, (*diag224_cpu_names + 1) * 16);
531 static void diag224_delete_name_table(void)
533 kfree(diag224_cpu_names);
536 static int diag224_idx2name(int index, char *name)
538 memcpy(name, diag224_cpu_names + ((index + 1) * CPU_NAME_LEN),
540 name[CPU_NAME_LEN] = 0;
545 struct dbfs_d204_hdr {
546 u64 len; /* Length of d204 buffer without header */
547 u16 version; /* Version of header */
548 u8 sc; /* Used subcode */
550 } __attribute__ ((packed));
553 struct dbfs_d204_hdr hdr; /* 64 byte header */
554 char buf[]; /* d204 buffer */
555 } __attribute__ ((packed));
557 static int dbfs_d204_create(void **data, void **data_free_ptr, size_t *size)
559 struct dbfs_d204 *d204;
563 buf_size = PAGE_SIZE * (diag204_buf_pages + 1) + sizeof(d204->hdr);
564 base = vzalloc(buf_size);
567 d204 = page_align_ptr(base + sizeof(d204->hdr)) - sizeof(d204->hdr);
568 rc = diag204_do_store(d204->buf, diag204_buf_pages);
573 d204->hdr.version = DBFS_D204_HDR_VERSION;
574 d204->hdr.len = PAGE_SIZE * diag204_buf_pages;
575 d204->hdr.sc = diag204_store_sc;
577 *data_free_ptr = base;
578 *size = d204->hdr.len + sizeof(struct dbfs_d204_hdr);
582 static struct hypfs_dbfs_file dbfs_file_d204 = {
584 .data_create = dbfs_d204_create,
588 __init int hypfs_diag_init(void)
592 if (diag204_probe()) {
593 pr_err("The hardware system does not support hypfs\n");
596 if (diag204_info_type == INFO_EXT) {
597 rc = hypfs_dbfs_create_file(&dbfs_file_d204);
601 if (MACHINE_IS_LPAR) {
602 rc = diag224_get_name_table();
604 pr_err("The hardware system does not provide all "
605 "functions required by hypfs\n");
606 debugfs_remove(dbfs_d204_file);
613 void hypfs_diag_exit(void)
615 debugfs_remove(dbfs_d204_file);
616 diag224_delete_name_table();
617 diag204_free_buffer();
618 hypfs_dbfs_remove_file(&dbfs_file_d204);
622 * Functions to create the directory structure
623 * *******************************************
626 static int hypfs_create_cpu_files(struct dentry *cpus_dir, void *cpu_info)
628 struct dentry *cpu_dir;
629 char buffer[TMP_SIZE];
632 snprintf(buffer, TMP_SIZE, "%d", cpu_info__cpu_addr(diag204_info_type,
634 cpu_dir = hypfs_mkdir(cpus_dir, buffer);
635 rc = hypfs_create_u64(cpu_dir, "mgmtime",
636 cpu_info__acc_time(diag204_info_type, cpu_info) -
637 cpu_info__lp_time(diag204_info_type, cpu_info));
640 rc = hypfs_create_u64(cpu_dir, "cputime",
641 cpu_info__lp_time(diag204_info_type, cpu_info));
644 if (diag204_info_type == INFO_EXT) {
645 rc = hypfs_create_u64(cpu_dir, "onlinetime",
646 cpu_info__online_time(diag204_info_type,
651 diag224_idx2name(cpu_info__ctidx(diag204_info_type, cpu_info), buffer);
652 rc = hypfs_create_str(cpu_dir, "type", buffer);
656 static void *hypfs_create_lpar_files(struct dentry *systems_dir, void *part_hdr)
658 struct dentry *cpus_dir;
659 struct dentry *lpar_dir;
660 char lpar_name[LPAR_NAME_LEN + 1];
664 part_hdr__part_name(diag204_info_type, part_hdr, lpar_name);
665 lpar_name[LPAR_NAME_LEN] = 0;
666 lpar_dir = hypfs_mkdir(systems_dir, lpar_name);
667 if (IS_ERR(lpar_dir))
669 cpus_dir = hypfs_mkdir(lpar_dir, "cpus");
670 if (IS_ERR(cpus_dir))
672 cpu_info = part_hdr + part_hdr__size(diag204_info_type);
673 for (i = 0; i < part_hdr__rcpus(diag204_info_type, part_hdr); i++) {
675 rc = hypfs_create_cpu_files(cpus_dir, cpu_info);
678 cpu_info += cpu_info__size(diag204_info_type);
683 static int hypfs_create_phys_cpu_files(struct dentry *cpus_dir, void *cpu_info)
685 struct dentry *cpu_dir;
686 char buffer[TMP_SIZE];
689 snprintf(buffer, TMP_SIZE, "%i", phys_cpu__cpu_addr(diag204_info_type,
691 cpu_dir = hypfs_mkdir(cpus_dir, buffer);
693 return PTR_ERR(cpu_dir);
694 rc = hypfs_create_u64(cpu_dir, "mgmtime",
695 phys_cpu__mgm_time(diag204_info_type, cpu_info));
698 diag224_idx2name(phys_cpu__ctidx(diag204_info_type, cpu_info), buffer);
699 rc = hypfs_create_str(cpu_dir, "type", buffer);
703 static void *hypfs_create_phys_files(struct dentry *parent_dir, void *phys_hdr)
707 struct dentry *cpus_dir;
709 cpus_dir = hypfs_mkdir(parent_dir, "cpus");
710 if (IS_ERR(cpus_dir))
712 cpu_info = phys_hdr + phys_hdr__size(diag204_info_type);
713 for (i = 0; i < phys_hdr__cpus(diag204_info_type, phys_hdr); i++) {
715 rc = hypfs_create_phys_cpu_files(cpus_dir, cpu_info);
718 cpu_info += phys_cpu__size(diag204_info_type);
723 int hypfs_diag_create_files(struct dentry *root)
725 struct dentry *systems_dir, *hyp_dir;
726 void *time_hdr, *part_hdr;
730 buffer = diag204_store();
732 return PTR_ERR(buffer);
734 systems_dir = hypfs_mkdir(root, "systems");
735 if (IS_ERR(systems_dir)) {
736 rc = PTR_ERR(systems_dir);
739 time_hdr = (struct x_info_blk_hdr *)buffer;
740 part_hdr = time_hdr + info_blk_hdr__size(diag204_info_type);
741 for (i = 0; i < info_blk_hdr__npar(diag204_info_type, time_hdr); i++) {
742 part_hdr = hypfs_create_lpar_files(systems_dir, part_hdr);
743 if (IS_ERR(part_hdr)) {
744 rc = PTR_ERR(part_hdr);
748 if (info_blk_hdr__flags(diag204_info_type, time_hdr) & LPAR_PHYS_FLG) {
749 ptr = hypfs_create_phys_files(root, part_hdr);
755 hyp_dir = hypfs_mkdir(root, "hyp");
756 if (IS_ERR(hyp_dir)) {
757 rc = PTR_ERR(hyp_dir);
760 ptr = hypfs_create_str(hyp_dir, "type", "LPAR Hypervisor");