2 * arch/s390/hypfs/hypfs_diag.c
3 * Hypervisor filesystem for Linux on s390. Diag 204 and 224
6 * Copyright IBM Corp. 2006, 2008
7 * Author(s): Michael Holzheu <holzheu@de.ibm.com>
10 #define KMSG_COMPONENT "hypfs"
11 #define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
13 #include <linux/types.h>
14 #include <linux/errno.h>
15 #include <linux/slab.h>
16 #include <linux/string.h>
17 #include <linux/vmalloc.h>
19 #include <asm/ebcdic.h>
/* Fixed field widths and scratch-buffer size used throughout this file. */
13 #define LPAR_NAME_LEN 8 /* lpar name len in diag 204 data */
14 #define CPU_NAME_LEN 16 /* type name len of cpus in diag224 name table */
15 #define TMP_SIZE 64 /* size of temporary buffers */
/* Value written to dbfs_d204_hdr.version by dbfs_d204_open(). */
16 #define DBFS_D204_HDR_VERSION 0
28 /* diag 204 subcodes */
36 /* The two available diag 204 data formats */
42 /* Bit is set in flags when physical cpu info is included in diag 204 data */
43 #define LPAR_PHYS_FLG 0x80
/*
 * File-scope state shared by the diag 204 / diag 224 helpers below.
 * diag204_store_sc and diag204_info_type are set by diag204_probe();
 * the buffer variables are managed by the diag204_alloc_*() and
 * diag204_free_buffer() helpers.
 */
45 static char *diag224_cpu_names; /* diag 224 name table */
46 static enum diag204_sc diag204_store_sc; /* used subcode for store */
47 static enum diag204_format diag204_info_type; /* used diag 204 data format */
49 static void *diag204_buf; /* 4K aligned buffer for diag204 data */
50 static void *diag204_buf_vmalloc; /* vmalloc pointer for diag204 data */
51 static int diag204_buf_pages; /* number of pages for diag204 data */
/* debugfs entry created in hypfs_dbfs_init(), removed in hypfs_diag_exit() */
53 static struct dentry *dbfs_d204_file;
56 * DIAG 204 data structures and member access functions.
58 * Since we have two different diag 204 data formats for old and new s390
59 * machines, we do not access the structs directly, but use getter functions for
60 * each struct member instead. This should make the code more readable.
63 /* Time information block */
72 } __attribute__ ((packed));
74 struct x_info_blk_hdr {
83 } __attribute__ ((packed));
/*
 * Size in bytes of the info block header for the given data format:
 * sizeof(struct info_blk_hdr) for INFO_SIMPLE, otherwise
 * sizeof(struct x_info_blk_hdr).
 */
85 static inline int info_blk_hdr__size(enum diag204_format type)
87 if (type == INFO_SIMPLE)
88 return sizeof(struct info_blk_hdr);
90 return sizeof(struct x_info_blk_hdr);
/*
 * Read the npar member of the info block header at @hdr, interpreting
 * @hdr as struct info_blk_hdr for INFO_SIMPLE and as
 * struct x_info_blk_hdr otherwise. hypfs_diag_create_files() uses the
 * result as the bound of its partition loop.
 */
93 static inline __u8 info_blk_hdr__npar(enum diag204_format type, void *hdr)
95 if (type == INFO_SIMPLE)
96 return ((struct info_blk_hdr *)hdr)->npar;
98 return ((struct x_info_blk_hdr *)hdr)->npar;
/*
 * Read the flags member of the info block header at @hdr for the given
 * data format. hypfs_diag_create_files() tests the result against
 * LPAR_PHYS_FLG.
 */
101 static inline __u8 info_blk_hdr__flags(enum diag204_format type, void *hdr)
103 if (type == INFO_SIMPLE)
104 return ((struct info_blk_hdr *)hdr)->flags;
106 return ((struct x_info_blk_hdr *)hdr)->flags;
/*
 * Read the phys_cpus member of the info block header at @hdr for the
 * given data format.
 */
109 static inline __u16 info_blk_hdr__pcpus(enum diag204_format type, void *hdr)
111 if (type == INFO_SIMPLE)
112 return ((struct info_blk_hdr *)hdr)->phys_cpus;
114 return ((struct x_info_blk_hdr *)hdr)->phys_cpus;
117 /* Partition header */
123 char part_name[LPAR_NAME_LEN];
124 } __attribute__ ((packed));
132 char part_name[LPAR_NAME_LEN];
142 } __attribute__ ((packed));
/*
 * Size in bytes of the partition header for the given data format:
 * sizeof(struct part_hdr) for INFO_SIMPLE, otherwise
 * sizeof(struct x_part_hdr).
 */
144 static inline int part_hdr__size(enum diag204_format type)
146 if (type == INFO_SIMPLE)
147 return sizeof(struct part_hdr);
149 return sizeof(struct x_part_hdr);
/*
 * CPU count of the partition header at @hdr. Note the member differs by
 * format: the simple header is read through ->cpus, the extended header
 * through ->rcpus. hypfs_create_lpar_files() uses the result as the
 * bound of its per-CPU loop.
 */
152 static inline __u8 part_hdr__rcpus(enum diag204_format type, void *hdr)
154 if (type == INFO_SIMPLE)
155 return ((struct part_hdr *)hdr)->cpus;
157 return ((struct x_part_hdr *)hdr)->rcpus;
/*
 * Copy the part_name field of the partition header at @hdr into @name,
 * run EBCASC() over the first LPAR_NAME_LEN bytes (presumably an
 * EBCDIC-to-ASCII conversion from <asm/ebcdic.h> -- confirm there) and
 * NUL-terminate the result.
 *
 * Because name[LPAR_NAME_LEN] is written, @name must provide at least
 * LPAR_NAME_LEN + 1 bytes. The remaining parameter(s) and the memcpy
 * length arguments are on lines not visible in this listing.
 */
160 static inline void part_hdr__part_name(enum diag204_format type, void *hdr,
163 if (type == INFO_SIMPLE)
164 memcpy(name, ((struct part_hdr *)hdr)->part_name,
167 memcpy(name, ((struct x_part_hdr *)hdr)->part_name,
169 EBCASC(name, LPAR_NAME_LEN);
170 name[LPAR_NAME_LEN] = 0;
182 } __attribute__ ((packed));
201 } __attribute__ ((packed));
/*
 * Size in bytes of one per-partition CPU info entry for the given data
 * format: sizeof(struct cpu_info) for INFO_SIMPLE, otherwise
 * sizeof(struct x_cpu_info).
 */
205 static inline int cpu_info__size(enum diag204_format type)
207 if (type == INFO_SIMPLE)
208 return sizeof(struct cpu_info);
210 return sizeof(struct x_cpu_info);
/*
 * Read the ctidx member of the CPU info entry at @hdr for the given
 * data format. hypfs_create_cpu_files() passes the result to
 * diag224_idx2name() as the name-table index.
 */
213 static inline __u8 cpu_info__ctidx(enum diag204_format type, void *hdr)
215 if (type == INFO_SIMPLE)
216 return ((struct cpu_info *)hdr)->ctidx;
218 return ((struct x_cpu_info *)hdr)->ctidx;
/*
 * Read the cpu_addr member of the CPU info entry at @hdr for the given
 * data format. hypfs_create_cpu_files() formats it as the directory
 * name of the CPU.
 */
221 static inline __u16 cpu_info__cpu_addr(enum diag204_format type, void *hdr)
223 if (type == INFO_SIMPLE)
224 return ((struct cpu_info *)hdr)->cpu_addr;
226 return ((struct x_cpu_info *)hdr)->cpu_addr;
/*
 * Read the acc_time member of the CPU info entry at @hdr for the given
 * data format. hypfs_create_cpu_files() reports acc_time - lp_time as
 * "mgmtime".
 */
229 static inline __u64 cpu_info__acc_time(enum diag204_format type, void *hdr)
231 if (type == INFO_SIMPLE)
232 return ((struct cpu_info *)hdr)->acc_time;
234 return ((struct x_cpu_info *)hdr)->acc_time;
/*
 * Read the lp_time member of the CPU info entry at @hdr for the given
 * data format. hypfs_create_cpu_files() reports it as "cputime".
 */
237 static inline __u64 cpu_info__lp_time(enum diag204_format type, void *hdr)
239 if (type == INFO_SIMPLE)
240 return ((struct cpu_info *)hdr)->lp_time;
242 return ((struct x_cpu_info *)hdr)->lp_time;
/*
 * Read the online_time member of the extended CPU info entry at @hdr.
 * The simple format has no such member, so 0 is returned for
 * INFO_SIMPLE without touching @hdr.
 */
245 static inline __u64 cpu_info__online_time(enum diag204_format type, void *hdr)
247 if (type == INFO_SIMPLE)
248 return 0; /* online_time not available in simple info */
250 return ((struct x_cpu_info *)hdr)->online_time;
253 /* Physical header */
260 } __attribute__ ((packed));
268 } __attribute__ ((packed));
/*
 * Size in bytes of the physical header for the given data format:
 * sizeof(struct phys_hdr) for INFO_SIMPLE, otherwise
 * sizeof(struct x_phys_hdr).
 */
270 static inline int phys_hdr__size(enum diag204_format type)
272 if (type == INFO_SIMPLE)
273 return sizeof(struct phys_hdr);
275 return sizeof(struct x_phys_hdr);
/*
 * Read the cpus member of the physical header at @hdr for the given
 * data format. hypfs_create_phys_files() uses the result as the bound
 * of its physical-CPU loop.
 */
278 static inline __u8 phys_hdr__cpus(enum diag204_format type, void *hdr)
280 if (type == INFO_SIMPLE)
281 return ((struct phys_hdr *)hdr)->cpus;
283 return ((struct x_phys_hdr *)hdr)->cpus;
286 /* Physical CPU info block */
295 } __attribute__ ((packed));
304 } __attribute__ ((packed));
/*
 * Size in bytes of one physical CPU info entry for the given data
 * format: sizeof(struct phys_cpu) for INFO_SIMPLE, otherwise
 * sizeof(struct x_phys_cpu).
 */
306 static inline int phys_cpu__size(enum diag204_format type)
308 if (type == INFO_SIMPLE)
309 return sizeof(struct phys_cpu);
311 return sizeof(struct x_phys_cpu);
/*
 * Read the cpu_addr member of the physical CPU entry at @hdr for the
 * given data format. hypfs_create_phys_cpu_files() formats it as the
 * directory name of the CPU.
 */
314 static inline __u16 phys_cpu__cpu_addr(enum diag204_format type, void *hdr)
316 if (type == INFO_SIMPLE)
317 return ((struct phys_cpu *)hdr)->cpu_addr;
319 return ((struct x_phys_cpu *)hdr)->cpu_addr;
/*
 * Read the mgm_time member of the physical CPU entry at @hdr for the
 * given data format. hypfs_create_phys_cpu_files() reports it as
 * "mgmtime".
 */
322 static inline __u64 phys_cpu__mgm_time(enum diag204_format type, void *hdr)
324 if (type == INFO_SIMPLE)
325 return ((struct phys_cpu *)hdr)->mgm_time;
327 return ((struct x_phys_cpu *)hdr)->mgm_time;
/*
 * Read the ctidx member of the physical CPU entry at @hdr for the given
 * data format. hypfs_create_phys_cpu_files() passes the result to
 * diag224_idx2name() as the name-table index.
 *
 * NOTE(review): this getter returns __u64 whereas cpu_info__ctidx()
 * returns __u8; the member's declared type is not visible in this
 * listing -- confirm whether the wider return type is intentional.
 */
330 static inline __u64 phys_cpu__ctidx(enum diag204_format type, void *hdr)
332 if (type == INFO_SIMPLE)
333 return ((struct phys_cpu *)hdr)->ctidx;
335 return ((struct x_phys_cpu *)hdr)->ctidx;
338 /* Diagnose 204 functions */
/*
 * Issue the "diag ...,0x204" instruction.
 *
 * @subcode is pinned to register 0 and @size to register 1; both are
 * read-write asm operands ("+d"), while @addr is an input operand. The
 * asm statement declares a "memory" clobber.
 *
 * The return statement is not visible in this listing. Callers in this
 * file treat a negative result as failure, and diag204_get_buffer()
 * uses the result of the SUBC_RSI call as a page count.
 */
340 static int diag204(unsigned long subcode, unsigned long size, void *addr)
342 register unsigned long _subcode asm("0") = subcode;
343 register unsigned long _size asm("1") = size;
346 " diag %2,%0,0x204\n"
349 : "+d" (_subcode), "+d" (_size) : "d" (addr) : "memory");
356 * For the old diag subcode 4 with simple data format we have to use real
357 * memory. If we use subcode 6 or 7 with extended data format, we can (and
358 * should) use vmalloc, since we need a lot of memory in that case. Currently
/*
 * Release the diag 204 data buffer.
 *
 * When diag204_buf_vmalloc is set, the vmalloc area is freed with
 * vfree() and the pointer reset to NULL. The free_pages() call releases
 * diag204_buf as an order-0 page allocation; it presumably sits in the
 * else branch for buffers obtained via diag204_alloc_rbuf() -- the
 * branch structure is on lines not visible in this listing.
 */
362 static void diag204_free_buffer(void)
366 if (diag204_buf_vmalloc) {
367 vfree(diag204_buf_vmalloc);
368 diag204_buf_vmalloc = NULL;
370 free_pages((unsigned long) diag204_buf, 0);
/*
 * Return @ptr passed through PAGE_ALIGN(), cast back to a pointer.
 * Used to derive a page-aligned start inside a larger allocation.
 */
375 static void *page_align_ptr(void *ptr)
377 return (void *) PAGE_ALIGN((unsigned long) ptr);
/*
 * Allocate the diag 204 buffer with vmalloc().
 *
 * One page more than @pages is allocated so that the page-aligned
 * pointer stored in diag204_buf still has @pages pages behind it; the
 * raw vmalloc pointer is kept in diag204_buf_vmalloc for freeing, and
 * diag204_buf_pages records @pages.
 *
 * Returns ERR_PTR(-ENOMEM) if vmalloc() fails. The success return is on
 * a line not visible in this listing.
 */
380 static void *diag204_alloc_vbuf(int pages)
382 /* The buffer has to be page aligned! */
383 diag204_buf_vmalloc = vmalloc(PAGE_SIZE * (pages + 1));
384 if (!diag204_buf_vmalloc)
385 return ERR_PTR(-ENOMEM);
386 diag204_buf = page_align_ptr(diag204_buf_vmalloc);
387 diag204_buf_pages = pages;
/*
 * Allocate the diag 204 buffer as a single order-0 page via
 * __get_free_pages(GFP_KERNEL, 0) and record a size of one page in
 * diag204_buf_pages.
 *
 * ERR_PTR(-ENOMEM) is returned on an error path whose condition is not
 * visible in this listing (presumably a failed allocation); the success
 * return is not visible either.
 */
391 static void *diag204_alloc_rbuf(void)
393 diag204_buf = (void*)__get_free_pages(GFP_KERNEL,0);
395 return ERR_PTR(-ENOMEM);
396 diag204_buf_pages = 1;
/*
 * Obtain the diag 204 data buffer for format @fmt and report its size
 * in pages through @pages.
 *
 * Visible behaviour:
 *  - *pages is set from diag204_buf_pages (presumably when a buffer
 *    already exists; the guarding condition is not visible here).
 *  - INFO_SIMPLE: allocate via diag204_alloc_rbuf().
 *  - otherwise: ask diag204() with SUBC_RSI | INFO_EXT for the required
 *    number of pages, then allocate via diag204_alloc_vbuf(*pages).
 *    ERR_PTR(-ENOSYS) is returned on an error path whose condition is
 *    not visible in this listing.
 */
400 static void *diag204_get_buffer(enum diag204_format fmt, int *pages)
403 *pages = diag204_buf_pages;
406 if (fmt == INFO_SIMPLE) {
408 return diag204_alloc_rbuf();
409 } else {/* INFO_EXT */
410 *pages = diag204((unsigned long)SUBC_RSI |
411 (unsigned long)INFO_EXT, 0, NULL);
413 return ERR_PTR(-ENOSYS);
415 return diag204_alloc_vbuf(*pages);
420 * diag204_probe() has to find out which type of diagnose 204 implementation
421 * we have on our machine. Currently there are three possible scenarios:
422 * - subcode 4 + simple data format (only one page)
423 * - subcode 4-6 + extended data format
424 * - subcode 4-7 + extended data format
426 * Subcode 5 is used to retrieve the size of the data, provided by subcodes
427 * 6 and 7. Subcode 7 basically has the same function as subcode 6. In addition
428 * to subcode 6 it also provides information about secondary cpus.
429 * In order to get as much information as possible, we first try
430 * subcode 7, then 6 and if both fail, we use subcode 4.
/*
 * Detect which diag 204 subcode and data format the machine supports
 * and record the choice in diag204_store_sc / diag204_info_type.
 *
 * Order of attempts, each considered successful when diag204() returns
 * a non-negative value:
 *   1. SUBC_STIB7 with INFO_EXT
 *   2. SUBC_STIB6 with INFO_EXT
 *   3. SUBC_STIB4 with INFO_SIMPLE (after freeing the extended buffer
 *      and obtaining a simple one)
 *
 * Return values, error checks on the buffers and the jumps between the
 * steps are on lines not visible in this listing.
 */
433 static int diag204_probe(void)
438 buf = diag204_get_buffer(INFO_EXT, &pages);
440 if (diag204((unsigned long)SUBC_STIB7 |
441 (unsigned long)INFO_EXT, pages, buf) >= 0) {
442 diag204_store_sc = SUBC_STIB7;
443 diag204_info_type = INFO_EXT;
446 if (diag204((unsigned long)SUBC_STIB6 |
447 (unsigned long)INFO_EXT, pages, buf) >= 0) {
448 diag204_store_sc = SUBC_STIB6;
449 diag204_info_type = INFO_EXT;
452 diag204_free_buffer();
455 /* subcodes 6 and 7 failed, now try subcode 4 */
457 buf = diag204_get_buffer(INFO_SIMPLE, &pages);
462 if (diag204((unsigned long)SUBC_STIB4 |
463 (unsigned long)INFO_SIMPLE, pages, buf) >= 0) {
464 diag204_store_sc = SUBC_STIB4;
465 diag204_info_type = INFO_SIMPLE;
474 diag204_free_buffer();
/*
 * Store diag 204 data into @buf (@pages pages) using the subcode and
 * data format selected by diag204_probe().
 *
 * Returns 0 on success, or -ENOSYS when diag204() reports a negative
 * result.
 */
479 static int diag204_do_store(void *buf, int pages)
483 rc = diag204((unsigned long) diag204_store_sc |
484 (unsigned long) diag204_info_type, pages, buf);
485 return rc < 0 ? -ENOSYS : 0;
/*
 * Obtain the buffer for the probed data format and fill it via
 * diag204_do_store().
 *
 * Error checks and the return statements are not visible in this
 * listing; hypfs_diag_create_files() treats the result as either a
 * buffer pointer or an ERR_PTR value.
 */
488 static void *diag204_store(void)
493 buf = diag204_get_buffer(diag204_info_type, &pages);
496 rc = diag204_do_store(buf, pages);
503 /* Diagnose 224 functions */
/*
 * Issue the "diag ...,0x224" instruction with operands 0 and @ptr.
 *
 * rc starts out as -EOPNOTSUPP and is a read-write asm operand, so the
 * asm sequence may replace it; the lines that do so and the return
 * statement are not visible in this listing. diag224_get_name_table()
 * treats any non-zero result as failure.
 */
505 static int diag224(void *ptr)
507 int rc = -EOPNOTSUPP;
510 " diag %1,%2,0x224\n"
514 : "+d" (rc) :"d" (0), "d" (ptr) : "memory");
/*
 * Allocate one page for the diag 224 CPU name table (GFP_DMA, since the
 * memory must be below 2GB), fill it via diag224() and convert the
 * entries with EBCASC().
 *
 * The conversion starts at byte offset 16 and covers
 * (first byte of the table + 1) * 16 bytes; the first byte presumably
 * holds an entry count/index -- TODO confirm against the diag 224
 * specification. The literal 16 matches CPU_NAME_LEN.
 *
 * On diag224() failure the table is freed again. Return values are on
 * lines not visible in this listing.
 */
518 static int diag224_get_name_table(void)
520 /* memory must be below 2GB */
521 diag224_cpu_names = kmalloc(PAGE_SIZE, GFP_KERNEL | GFP_DMA);
522 if (!diag224_cpu_names)
524 if (diag224(diag224_cpu_names)) {
525 kfree(diag224_cpu_names);
528 EBCASC(diag224_cpu_names + 16, (*diag224_cpu_names + 1) * 16);
/* Free the name table allocated by diag224_get_name_table(). */
532 static void diag224_delete_name_table(void)
534 kfree(diag224_cpu_names);
/*
 * Copy the CPU type name for @index from the diag 224 name table into
 * @name and NUL-terminate it.
 *
 * The entry is read at offset (index + 1) * CPU_NAME_LEN. Because
 * name[CPU_NAME_LEN] is written, @name must provide at least
 * CPU_NAME_LEN + 1 bytes. The memcpy length argument, any further
 * processing and the return value are on lines not visible here.
 *
 * NOTE(review): no bounds check on @index is visible; the table is one
 * page (see diag224_get_name_table()) -- confirm callers cannot pass an
 * index beyond it.
 */
537 static int diag224_idx2name(int index, char *name)
539 memcpy(name, diag224_cpu_names + ((index + 1) * CPU_NAME_LEN),
541 name[CPU_NAME_LEN] = 0;
/*
 * Header placed in front of the raw diag 204 data exported through
 * debugfs; filled in by dbfs_d204_open(). Packed, so the layout has no
 * compiler padding. (At least one member line is not visible in this
 * listing.)
 */
546 struct dbfs_d204_hdr {
547 u64 len; /* Length of d204 buffer without header */
548 u16 version; /* Version of header */
549 u8 sc; /* Used subcode */
551 } __attribute__ ((packed));
/*
 * Members of the debugfs export record: the header followed directly by
 * the diag 204 data as a flexible array member. The opening line of
 * this struct is not visible in this listing; other code refers to it
 * as struct dbfs_d204.
 */
554 struct dbfs_d204_hdr hdr; /* 64 byte header */
555 char buf[]; /* d204 buffer */
556 } __attribute__ ((packed));
/*
 * Per-open state of the debugfs file, stored in file->private_data by
 * dbfs_d204_open() and read back in dbfs_d204_read() and
 * dbfs_d204_release().
 */
558 struct dbfs_d204_private {
559 struct dbfs_d204 *d204; /* Aligned d204 data with header */
560 void *base; /* Base pointer (needed for vfree) */
/*
 * open() handler of the debugfs "diag_204" file: take a snapshot of the
 * diag 204 data for this open file.
 *
 * Steps visible in this listing:
 *  - allocate the zeroed private structure;
 *  - vmalloc() and clear a buffer of diag204_buf_pages + 1 pages plus
 *    room for the header (the extra page allows for alignment);
 *  - position d204 inside that buffer (the statement starting at line
 *    579 continues on a line not shown here);
 *  - store the diag 204 data into d204->buf and fill in the header
 *    (version, length in bytes, used subcode);
 *  - attach the private data to @file and finish via nonseekable_open().
 *
 * Failures jump to the fail_vfree_base / fail_kfree_data labels, whose
 * bodies are not visible in this listing.
 */
563 static int dbfs_d204_open(struct inode *inode, struct file *file)
565 struct dbfs_d204_private *data;
566 struct dbfs_d204 *d204;
569 data = kzalloc(sizeof(*data), GFP_KERNEL);
572 buf_size = PAGE_SIZE * (diag204_buf_pages + 1) + sizeof(d204->hdr);
573 data->base = vmalloc(buf_size);
576 goto fail_kfree_data;
578 memset(data->base, 0, buf_size);
579 d204 = page_align_ptr(data->base + sizeof(d204->hdr))
581 rc = diag204_do_store(&d204->buf, diag204_buf_pages);
583 goto fail_vfree_base;
584 d204->hdr.version = DBFS_D204_HDR_VERSION;
585 d204->hdr.len = PAGE_SIZE * diag204_buf_pages;
586 d204->hdr.sc = diag204_store_sc;
588 file->private_data = data;
589 return nonseekable_open(inode, file);
/*
 * release() handler of the debugfs "diag_204" file. Only the retrieval
 * of the per-open private data is visible in this listing; presumably
 * the buffers allocated in dbfs_d204_open() are freed on the lines not
 * shown -- confirm against the full source.
 */
598 static int dbfs_d204_release(struct inode *inode, struct file *file)
600 struct dbfs_d204_private *data = file->private_data;
/*
 * read() handler of the debugfs "diag_204" file: copy from the snapshot
 * taken at open time to user space via simple_read_from_buffer().
 * The readable region is the header followed by hdr.len bytes of data.
 */
607 static ssize_t dbfs_d204_read(struct file *file, char __user *buf,
608 size_t size, loff_t *ppos)
610 struct dbfs_d204_private *data = file->private_data;
612 return simple_read_from_buffer(buf, size, ppos, data->d204,
613 data->d204->hdr.len +
614 sizeof(data->d204->hdr));
/* File operations of the debugfs "diag_204" file (see hypfs_dbfs_init()). */
617 static const struct file_operations dbfs_d204_ops = {
618 .open = dbfs_d204_open,
619 .read = dbfs_d204_read,
620 .release = dbfs_d204_release,
/*
 * Create the debugfs file "diag_204" (mode 0400) in hypfs_dbfs_dir,
 * backed by dbfs_d204_ops, and remember its dentry in dbfs_d204_file.
 *
 * Returns the PTR_ERR() code if debugfs_create_file() yields an error
 * pointer; the success return is on a line not visible in this listing.
 */
623 static int hypfs_dbfs_init(void)
625 dbfs_d204_file = debugfs_create_file("diag_204", 0400, hypfs_dbfs_dir,
626 NULL, &dbfs_d204_ops);
627 if (IS_ERR(dbfs_d204_file))
628 return PTR_ERR(dbfs_d204_file);
/*
 * Module-init time setup of the diag backend:
 *  1. probe the diag 204 variant (logs an error if unsupported);
 *  2. fetch the diag 224 CPU name table (on the visible error path the
 *     diag 204 buffer is freed and an error is logged);
 *  3. for the extended data format only, create the debugfs file.
 *
 * Return statements and the conditions around the diag204_free_buffer()
 * calls are on lines not visible in this listing.
 */
632 __init int hypfs_diag_init(void)
636 if (diag204_probe()) {
637 pr_err("The hardware system does not support hypfs\n");
640 rc = diag224_get_name_table();
642 diag204_free_buffer();
643 pr_err("The hardware system does not provide all "
644 "functions required by hypfs\n");
646 if (diag204_info_type == INFO_EXT) {
647 rc = hypfs_dbfs_init();
649 diag204_free_buffer();
/*
 * Tear down what hypfs_diag_init() set up: remove the debugfs file,
 * free the diag 224 name table and release the diag 204 buffer.
 */
654 void hypfs_diag_exit(void)
656 debugfs_remove(dbfs_d204_file);
657 diag224_delete_name_table();
658 diag204_free_buffer();
662 * Functions to create the directory structure
663 * *******************************************
/*
 * Create the hypfs directory for one logical CPU of a partition below
 * @cpus_dir, named after the CPU address found in @cpu_info, and
 * populate it with:
 *   "mgmtime"    - acc_time minus lp_time
 *   "cputime"    - lp_time
 *   "onlinetime" - online_time (extended data format only)
 *   "type"       - CPU type name looked up through diag224_idx2name()
 *
 * Error checks on the individual create calls and the return statements
 * are on lines not visible in this listing.
 *
 * NOTE(review): going by the embedded original line numbers (675 is
 * directly followed by 676), the result of hypfs_mkdir() is used
 * without an IS_ERR() check, whereas hypfs_create_phys_cpu_files()
 * returns PTR_ERR(cpu_dir) on failure. Consider adding the same check
 * here.
 */
666 static int hypfs_create_cpu_files(struct super_block *sb,
667 struct dentry *cpus_dir, void *cpu_info)
669 struct dentry *cpu_dir;
670 char buffer[TMP_SIZE];
673 snprintf(buffer, TMP_SIZE, "%d", cpu_info__cpu_addr(diag204_info_type,
675 cpu_dir = hypfs_mkdir(sb, cpus_dir, buffer);
676 rc = hypfs_create_u64(sb, cpu_dir, "mgmtime",
677 cpu_info__acc_time(diag204_info_type, cpu_info) -
678 cpu_info__lp_time(diag204_info_type, cpu_info));
681 rc = hypfs_create_u64(sb, cpu_dir, "cputime",
682 cpu_info__lp_time(diag204_info_type, cpu_info));
685 if (diag204_info_type == INFO_EXT) {
686 rc = hypfs_create_u64(sb, cpu_dir, "onlinetime",
687 cpu_info__online_time(diag204_info_type,
692 diag224_idx2name(cpu_info__ctidx(diag204_info_type, cpu_info), buffer);
693 rc = hypfs_create_str(sb, cpu_dir, "type", buffer);
/*
 * Create the hypfs subtree for one partition: a directory below
 * @systems_dir named after the partition, a "cpus" directory inside it,
 * and one entry per CPU created by hypfs_create_cpu_files().
 *
 * The CPU info entries start directly after the partition header
 * (@part_hdr plus part_hdr__size()) and are walked in steps of
 * cpu_info__size(); the offset is computed with arithmetic on the
 * void pointer @part_hdr.
 *
 * Error handling and the return statements are on lines not visible in
 * this listing; hypfs_diag_create_files() assigns the result to its
 * partition-header cursor and checks it with IS_ERR().
 */
699 static void *hypfs_create_lpar_files(struct super_block *sb,
700 struct dentry *systems_dir, void *part_hdr)
702 struct dentry *cpus_dir;
703 struct dentry *lpar_dir;
704 char lpar_name[LPAR_NAME_LEN + 1];
/* part_hdr__part_name() already NUL-terminates; line 709 repeats that. */
708 part_hdr__part_name(diag204_info_type, part_hdr, lpar_name);
709 lpar_name[LPAR_NAME_LEN] = 0;
710 lpar_dir = hypfs_mkdir(sb, systems_dir, lpar_name);
711 if (IS_ERR(lpar_dir))
713 cpus_dir = hypfs_mkdir(sb, lpar_dir, "cpus");
714 if (IS_ERR(cpus_dir))
716 cpu_info = part_hdr + part_hdr__size(diag204_info_type);
717 for (i = 0; i < part_hdr__rcpus(diag204_info_type, part_hdr); i++) {
719 rc = hypfs_create_cpu_files(sb, cpus_dir, cpu_info);
722 cpu_info += cpu_info__size(diag204_info_type);
/*
 * Create the hypfs directory for one physical CPU below @cpus_dir,
 * named after the CPU address found in @cpu_info, and populate it with:
 *   "mgmtime" - mgm_time of the physical CPU entry
 *   "type"    - CPU type name looked up through diag224_idx2name()
 *
 * Returns PTR_ERR(cpu_dir) when the directory cannot be created (the
 * guarding condition is on a line not visible here). Checks on the
 * create calls and the final return are not visible in this listing.
 */
727 static int hypfs_create_phys_cpu_files(struct super_block *sb,
728 struct dentry *cpus_dir, void *cpu_info)
730 struct dentry *cpu_dir;
731 char buffer[TMP_SIZE];
734 snprintf(buffer, TMP_SIZE, "%i", phys_cpu__cpu_addr(diag204_info_type,
736 cpu_dir = hypfs_mkdir(sb, cpus_dir, buffer);
738 return PTR_ERR(cpu_dir);
739 rc = hypfs_create_u64(sb, cpu_dir, "mgmtime",
740 phys_cpu__mgm_time(diag204_info_type, cpu_info));
743 diag224_idx2name(phys_cpu__ctidx(diag204_info_type, cpu_info), buffer);
744 rc = hypfs_create_str(sb, cpu_dir, "type", buffer);
/*
 * Create the "cpus" directory for the physical CPUs below @parent_dir
 * and one entry per physical CPU via hypfs_create_phys_cpu_files().
 *
 * The physical CPU entries start directly after the physical header
 * (@phys_hdr plus phys_hdr__size()) and are walked in steps of
 * phys_cpu__size(); phys_hdr__cpus() gives the entry count.
 *
 * Error handling and the return statements are on lines not visible in
 * this listing.
 */
750 static void *hypfs_create_phys_files(struct super_block *sb,
751 struct dentry *parent_dir, void *phys_hdr)
755 struct dentry *cpus_dir;
757 cpus_dir = hypfs_mkdir(sb, parent_dir, "cpus");
758 if (IS_ERR(cpus_dir))
760 cpu_info = phys_hdr + phys_hdr__size(diag204_info_type);
761 for (i = 0; i < phys_hdr__cpus(diag204_info_type, phys_hdr); i++) {
763 rc = hypfs_create_phys_cpu_files(sb, cpus_dir, cpu_info);
766 cpu_info += phys_cpu__size(diag204_info_type);
771 int hypfs_diag_create_files(struct super_block *sb, struct dentry *root)
773 struct dentry *systems_dir, *hyp_dir;
774 void *time_hdr, *part_hdr;
778 buffer = diag204_store();
780 return PTR_ERR(buffer);
782 systems_dir = hypfs_mkdir(sb, root, "systems");
783 if (IS_ERR(systems_dir)) {
784 rc = PTR_ERR(systems_dir);
787 time_hdr = (struct x_info_blk_hdr *)buffer;
788 part_hdr = time_hdr + info_blk_hdr__size(diag204_info_type);
789 for (i = 0; i < info_blk_hdr__npar(diag204_info_type, time_hdr); i++) {
790 part_hdr = hypfs_create_lpar_files(sb, systems_dir, part_hdr);
791 if (IS_ERR(part_hdr)) {
792 rc = PTR_ERR(part_hdr);
796 if (info_blk_hdr__flags(diag204_info_type, time_hdr) & LPAR_PHYS_FLG) {
797 ptr = hypfs_create_phys_files(sb, root, part_hdr);
803 hyp_dir = hypfs_mkdir(sb, root, "hyp");
804 if (IS_ERR(hyp_dir)) {
805 rc = PTR_ERR(hyp_dir);
808 ptr = hypfs_create_str(sb, hyp_dir, "type", "LPAR Hypervisor");