powerpc/hv_gpci: Add sysfs file inside hv_gpci device to show affinity domain via...
[linux-block.git] / arch / powerpc / perf / hv-gpci.c
index 7ff8ff3509f5f6f2f414b6475a86b051a30c335e..de2e1aee9e2cd6710e25e40cf0561666af719d20 100644 (file)
@@ -102,6 +102,293 @@ static ssize_t cpumask_show(struct device *dev,
        return cpumap_print_to_pagebuf(true, buf, &hv_gpci_cpumask);
 }
 
+/*
+ * Interface attribute array index to store system information.
+ * These are the positions inside interface_attrs[] at which
+ * add_sysinfo_interface_files() stores the system information attributes,
+ * so they have to line up with the NULL placeholder entries reserved in
+ * that array. INTERFACE_NULL_ATTR is one past the last system information
+ * slot and serves as the exclusive upper bound when an index is validated.
+ */
+#define INTERFACE_PROCESSOR_BUS_TOPOLOGY_ATTR  6
+#define INTERFACE_PROCESSOR_CONFIG_ATTR                7
+#define INTERFACE_AFFINITY_DOMAIN_VIA_VP_ATTR  8
+#define INTERFACE_NULL_ATTR                    9
+
+/*
+ * Counter request value to retrieve system information.
+ * The enumerators index sysinfo_counter_request[], which holds the counter
+ * request value handed to the H_GET_PERF_COUNTER_INFO hcall for each kind of
+ * system information. add_sysinfo_interface_files() walks this table and the
+ * INTERFACE_*_ATTR slots with the same loop index, so the enumerator order
+ * has to follow the INTERFACE_*_ATTR order.
+ */
+enum {
+       PROCESSOR_BUS_TOPOLOGY,
+       PROCESSOR_CONFIG,
+       AFFINITY_DOMAIN_VIA_VP, /* affinity domain via virtual processor */
+};
+
+static int sysinfo_counter_request[] = {
+       [PROCESSOR_BUS_TOPOLOGY] = 0xD0,
+       [PROCESSOR_CONFIG] = 0x90,
+       [AFFINITY_DOMAIN_VIA_VP] = 0xA0,
+};
+
+/*
+ * Per-cpu scratch buffer handed to the H_GET_PERF_COUNTER_INFO hcall.
+ * Users obtain it with get_cpu_var() and have to release it again with
+ * put_cpu_var() on every exit path.
+ */
+static DEFINE_PER_CPU(char, hv_gpci_reqb[HGPCI_REQ_BUFFER_SIZE]) __aligned(sizeof(uint64_t));
+
+/*
+ * Issue one H_GET_PERF_COUNTER_INFO hcall and append its result to @buf.
+ *
+ * @req:             counter request value
+ * @starting_index:  starting index for the request
+ * @secondary_index: secondary index for the request
+ * @buf:             output buffer, at most PAGE_SIZE bytes are used
+ * @n:               in/out, number of bytes already stored in @buf
+ * @arg:             request buffer passed to (and filled in by) the hcall
+ *
+ * Each returned counter_value element is emitted as one line made of two
+ * hex digits per byte.
+ *
+ * Returns 0 on success, H_PARAMETER when only a partial result was returned
+ * and further requests are needed, or a negative errno (-EPERM, -EIO,
+ * -EFBIG) carried in the unsigned long return value.
+ */
+static unsigned long systeminfo_gpci_request(u32 req, u32 starting_index,
+                       u16 secondary_index, char *buf,
+                       size_t *n, struct hv_gpci_request_buffer *arg)
+{
+       unsigned long ret;
+       size_t i, j;
+       size_t nr_elements, element_size, line_len;
+
+       arg->params.counter_request = cpu_to_be32(req);
+       arg->params.starting_index = cpu_to_be32(starting_index);
+       arg->params.secondary_index = cpu_to_be16(secondary_index);
+
+       ret = plpar_hcall_norets(H_GET_PERF_COUNTER_INFO,
+                       virt_to_phys(arg), HGPCI_REQ_BUFFER_SIZE);
+
+       /*
+        * ret value as 'H_PARAMETER' corresponds to 'GEN_BUF_TOO_SMALL',
+        * which means that the current buffer size cannot accommodate
+        * all the information and a partial buffer is returned.
+        * The hcall failed for any ret value other than H_SUCCESS or
+        * H_PARAMETER.
+        *
+        * ret value as H_AUTHORITY implies that the partition is not
+        * permitted to retrieve performance information, and the
+        * "Enable Performance Information Collection" option has to be set.
+        */
+       if (ret == H_AUTHORITY)
+               return -EPERM;
+
+       /*
+        * The hcall can fail with other ret values like
+        * H_PRIVILEGE/H_HARDWARE because of an invalid buffer-length/address
+        * or due to some hardware error.
+        */
+       if (ret && (ret != H_PARAMETER))
+               return -EIO;
+
+       /*
+        * The hcall populates 'returned_values' with the number of
+        * counter_value array elements it returned and 'cv_element_size'
+        * with the size of one such element.
+        */
+       nr_elements = be16_to_cpu(arg->params.returned_values);
+       element_size = be16_to_cpu(arg->params.cv_element_size);
+
+       /* Two hex digits per byte plus the terminating newline. */
+       line_len = 2 * element_size + 1;
+
+       for (i = 0; i < nr_elements; i++) {
+               /*
+                * Check the space before formatting the element, so that
+                * nothing is ever written past PAGE_SIZE. One byte is kept
+                * for the NUL that sprintf() appends.
+                */
+               if (*n + line_len >= PAGE_SIZE) {
+                       pr_info("System information exceeds PAGE_SIZE\n");
+                       return -EFBIG;
+               }
+
+               for (j = i * element_size; j < (i + 1) * element_size; j++)
+                       *n += sprintf(buf + *n,  "%02x", (u8)arg->bytes[j]);
+               *n += sprintf(buf + *n,  "\n");
+       }
+
+       return ret;
+}
+
+/*
+ * sysfs show() handler for the processor_bus_topology file.
+ *
+ * Issues counter request 0xD0 ('Processor_bus_topology') and writes the
+ * returned elements to @buf as hex text. For this request the starting
+ * index is the starting hardware chip id.
+ *
+ * Returns the number of bytes written to @buf, or a negative errno.
+ */
+static ssize_t processor_bus_topology_show(struct device *dev, struct device_attribute *attr,
+                               char *buf)
+{
+       struct hv_gpci_request_buffer *arg;
+       unsigned long ret;
+       u32 starting_index = 0;
+       size_t n = 0;
+
+       arg = (void *)get_cpu_var(hv_gpci_reqb);
+
+       /*
+        * ret value as 'H_PARAMETER' corresponds to 'GEN_BUF_TOO_SMALL', which
+        * implies that the buffer can't accommodate all the information and a
+        * partial buffer is returned. Keep issuing requests with the next
+        * starting index until all the information has been retrieved.
+        */
+       for (;;) {
+               int returned_values, elementsize;
+               const u8 *last;
+
+               memset(arg, 0, HGPCI_REQ_BUFFER_SIZE);
+
+               ret = systeminfo_gpci_request(sysinfo_counter_request[PROCESSOR_BUS_TOPOLOGY],
+                               starting_index, 0, buf, &n, arg);
+
+               if (ret != H_PARAMETER)
+                       break;
+
+               returned_values = be16_to_cpu(arg->params.returned_values);
+               elementsize = be16_to_cpu(arg->params.cv_element_size);
+
+               /*
+                * The next starting index is derived from the last returned
+                * element. Without at least one element of four bytes there
+                * is nothing valid to read, and no way to make progress.
+                */
+               if (!returned_values || elementsize < 4) {
+                       ret = -EIO;
+                       break;
+               }
+
+               /*
+                * Since the starting index value is part of the counter_value
+                * buffer elements, use the (big endian) starting index of the
+                * last element plus 1 for the subsequent hcall.
+                */
+               last = (const u8 *)&arg->bytes[(returned_values - 1) * elementsize];
+               starting_index = (((u32)last[0] << 24) | ((u32)last[1] << 16) |
+                               ((u32)last[2] << 8) | (u32)last[3]) + 1;
+       }
+
+       /* Release the per-cpu buffer on every path, success included. */
+       put_cpu_var(hv_gpci_reqb);
+
+       if (ret)
+               return ret;
+
+       return n;
+}
+
+/*
+ * sysfs show() handler for the processor_config file.
+ *
+ * Issues counter request 0x90 ('Processor_config') and writes the returned
+ * elements to @buf as hex text. For this request the starting index is the
+ * starting hardware processor index.
+ *
+ * Returns the number of bytes written to @buf, or a negative errno.
+ */
+static ssize_t processor_config_show(struct device *dev, struct device_attribute *attr,
+                                       char *buf)
+{
+       struct hv_gpci_request_buffer *arg;
+       unsigned long ret;
+       u32 starting_index = 0;
+       size_t n = 0;
+
+       arg = (void *)get_cpu_var(hv_gpci_reqb);
+
+       /*
+        * ret value as 'H_PARAMETER' corresponds to 'GEN_BUF_TOO_SMALL', which
+        * implies that the buffer can't accommodate all the information and a
+        * partial buffer is returned. Keep issuing requests with the next
+        * starting index until all the information has been retrieved.
+        */
+       for (;;) {
+               int returned_values, elementsize;
+               const u8 *last;
+
+               memset(arg, 0, HGPCI_REQ_BUFFER_SIZE);
+
+               ret = systeminfo_gpci_request(sysinfo_counter_request[PROCESSOR_CONFIG],
+                               starting_index, 0, buf, &n, arg);
+
+               if (ret != H_PARAMETER)
+                       break;
+
+               returned_values = be16_to_cpu(arg->params.returned_values);
+               elementsize = be16_to_cpu(arg->params.cv_element_size);
+
+               /*
+                * The next starting index is derived from the last returned
+                * element. Without at least one element of four bytes there
+                * is nothing valid to read, and no way to make progress.
+                */
+               if (!returned_values || elementsize < 4) {
+                       ret = -EIO;
+                       break;
+               }
+
+               /*
+                * Since the starting index is part of the counter_value
+                * buffer elements, use the (big endian) starting index of the
+                * last element plus 1 for the subsequent hcall.
+                */
+               last = (const u8 *)&arg->bytes[(returned_values - 1) * elementsize];
+               starting_index = (((u32)last[0] << 24) | ((u32)last[1] << 16) |
+                               ((u32)last[2] << 8) | (u32)last[3]) + 1;
+       }
+
+       /* Release the per-cpu buffer on every path, success included. */
+       put_cpu_var(hv_gpci_reqb);
+
+       if (ret)
+               return ret;
+
+       return n;
+}
+
+/*
+ * sysfs show() handler for the affinity_domain_via_virtual_processor file.
+ *
+ * Issues counter request 0xA0
+ * ('Affinity_domain_information_by_virtual_processor') and writes the
+ * returned elements to @buf as hex text. For this request the starting index
+ * points to the partition id and the secondary index to the corresponding
+ * virtual processor index.
+ *
+ * Returns the number of bytes written to @buf, or a negative errno.
+ */
+static ssize_t affinity_domain_via_virtual_processor_show(struct device *dev,
+                       struct device_attribute *attr, char *buf)
+{
+       struct hv_gpci_request_buffer *arg;
+       unsigned long ret;
+       u32 starting_index = 0;
+       u16 secondary_index = 0;
+       size_t n = 0;
+
+       arg = (void *)get_cpu_var(hv_gpci_reqb);
+
+       /*
+        * ret value as 'H_PARAMETER' corresponds to 'GEN_BUF_TOO_SMALL', which
+        * implies that the buffer can't accommodate all the information and a
+        * partial buffer is returned. Keep issuing requests with the next
+        * secondary index until all the information has been retrieved.
+        */
+       for (;;) {
+               int returned_values, elementsize;
+               const u8 *last;
+
+               memset(arg, 0, HGPCI_REQ_BUFFER_SIZE);
+
+               ret = systeminfo_gpci_request(sysinfo_counter_request[AFFINITY_DOMAIN_VIA_VP],
+                               starting_index, secondary_index, buf, &n, arg);
+
+               if (ret != H_PARAMETER)
+                       break;
+
+               returned_values = be16_to_cpu(arg->params.returned_values);
+               elementsize = be16_to_cpu(arg->params.cv_element_size);
+
+               /*
+                * The next indexes are derived from the last returned
+                * element. Without at least one element of four bytes there
+                * is nothing valid to read, and no way to make progress.
+                */
+               if (!returned_values || elementsize < 4) {
+                       ret = -EIO;
+                       break;
+               }
+
+               /*
+                * Since the starting index and secondary index are part of the
+                * counter_value buffer elements, reuse the (big endian)
+                * starting index of the last element as is, and use its
+                * secondary index plus 1 for the subsequent hcall.
+                */
+               last = (const u8 *)&arg->bytes[(returned_values - 1) * elementsize];
+               starting_index = ((u32)last[0] << 8) | (u32)last[1];
+               secondary_index = (((u32)last[2] << 8) | (u32)last[3]) + 1;
+       }
+
+       /* Release the per-cpu buffer on every path, success included. */
+       put_cpu_var(hv_gpci_reqb);
+
+       if (ret)
+               return ret;
+
+       return n;
+}
+
 static DEVICE_ATTR_RO(kernel_version);
 static DEVICE_ATTR_RO(cpumask);
 
@@ -118,6 +405,21 @@ static struct attribute *interface_attrs[] = {
        &hv_caps_attr_expanded.attr,
        &hv_caps_attr_lab.attr,
        &hv_caps_attr_collect_privileged.attr,
+       /*
+        * This NULL is a placeholder for the processor_bus_topology
+        * attribute, set in init function if applicable.
+        */
+       NULL,
+       /*
+        * This NULL is a placeholder for the processor_config
+        * attribute, set in init function if applicable.
+        */
+       NULL,
+       /*
+        * This NULL is a placeholder for the affinity_domain_via_virtual_processor
+        * attribute, set in init function if applicable.
+        */
+       NULL,
        NULL,
 };
 
@@ -143,8 +445,6 @@ static const struct attribute_group *attr_groups[] = {
        NULL,
 };
 
-static DEFINE_PER_CPU(char, hv_gpci_reqb[HGPCI_REQ_BUFFER_SIZE]) __aligned(sizeof(uint64_t));
-
 static unsigned long single_gpci_request(u32 req, u32 starting_index,
                u16 secondary_index, u8 version_in, u32 offset, u8 length,
                u64 *value)
@@ -325,6 +625,99 @@ static int hv_gpci_cpu_hotplug_init(void)
                          ppc_hv_gpci_cpu_offline);
 }
 
+/*
+ * Probe the hypervisor for the counter request @req and, when the hcall
+ * returns success, H_AUTHORITY or H_PARAMETER, allocate the read-only
+ * device attribute that belongs to the interface_attrs[] slot
+ * @sysinfo_interface_group_index.
+ *
+ * Returns the newly allocated attribute (owned by the caller), or NULL when
+ * the index is out of range, the hcall returned any other value, or the
+ * allocation failed.
+ */
+static struct device_attribute *sysinfo_device_attr_create(int
+               sysinfo_interface_group_index, u32 req)
+{
+       struct hv_gpci_request_buffer *reqb;
+       struct device_attribute *dattr;
+       unsigned long hret;
+
+       if (!(sysinfo_interface_group_index >= INTERFACE_PROCESSOR_BUS_TOPOLOGY_ATTR &&
+                       sysinfo_interface_group_index < INTERFACE_NULL_ATTR)) {
+               pr_info("Wrong interface group index for system information\n");
+               return NULL;
+       }
+
+       /* Probe the counter request with an otherwise zeroed request buffer */
+       reqb = (void *)get_cpu_var(hv_gpci_reqb);
+       memset(reqb, 0, HGPCI_REQ_BUFFER_SIZE);
+       reqb->params.counter_request = cpu_to_be32(req);
+       hret = plpar_hcall_norets(H_GET_PERF_COUNTER_INFO,
+                       virt_to_phys(reqb), HGPCI_REQ_BUFFER_SIZE);
+       put_cpu_var(hv_gpci_reqb);
+
+       /* Any other return value means no attribute gets created */
+       if (hret && hret != H_AUTHORITY && hret != H_PARAMETER) {
+               pr_devel("hcall failed, with error: 0x%lx\n", hret);
+               return NULL;
+       }
+
+       dattr = kzalloc(sizeof(*dattr), GFP_KERNEL);
+       if (!dattr)
+               return NULL;
+
+       sysfs_attr_init(&dattr->attr);
+       dattr->attr.mode = 0444;
+
+       /* Name and show() handler depend on the slot being filled */
+       if (sysinfo_interface_group_index == INTERFACE_PROCESSOR_BUS_TOPOLOGY_ATTR) {
+               dattr->attr.name = "processor_bus_topology";
+               dattr->show = processor_bus_topology_show;
+       } else if (sysinfo_interface_group_index == INTERFACE_PROCESSOR_CONFIG_ATTR) {
+               dattr->attr.name = "processor_config";
+               dattr->show = processor_config_show;
+       } else if (sysinfo_interface_group_index == INTERFACE_AFFINITY_DOMAIN_VIA_VP_ATTR) {
+               dattr->attr.name = "affinity_domain_via_virtual_processor";
+               dattr->show = affinity_domain_via_virtual_processor_show;
+       }
+
+       return dattr;
+}
+
+/*
+ * Create the device attributes for all system information counter requests
+ * and publish them in the interface_attrs[] attribute array.
+ *
+ * The attributes are added only if creation succeeded for every counter
+ * request value; on the first failure the attributes created so far are
+ * freed and interface_attrs[] is left untouched.
+ */
+static void add_sysinfo_interface_files(void)
+{
+       struct device_attribute *attr[INTERFACE_NULL_ATTR - INTERFACE_PROCESSOR_BUS_TOPOLOGY_ATTR];
+       const int nr_files = INTERFACE_NULL_ATTR - INTERFACE_PROCESSOR_BUS_TOPOLOGY_ATTR;
+       int idx;
+
+       /* First pass: create one device attribute per counter request value */
+       for (idx = 0; idx < nr_files; idx++) {
+               attr[idx] = sysinfo_device_attr_create(idx + INTERFACE_PROCESSOR_BUS_TOPOLOGY_ATTR,
+                               sysinfo_counter_request[idx]);
+               if (attr[idx])
+                       continue;
+
+               /* Creation failed: drop everything created before this slot */
+               while (--idx >= 0)
+                       kfree(attr[idx]);
+               return;
+       }
+
+       /* Second pass: everything succeeded, fill the placeholder slots */
+       for (idx = 0; idx < nr_files; idx++)
+               interface_attrs[idx + INTERFACE_PROCESSOR_BUS_TOPOLOGY_ATTR] = &attr[idx]->attr;
+}
+
 static int hv_gpci_init(void)
 {
        int r;
@@ -388,6 +781,10 @@ static int hv_gpci_init(void)
        if (r)
                return r;
 
+       /* sysinfo interface files are only available for power10 and above platforms */
+       if (PVR_VER(mfspr(SPRN_PVR)) >= PVR_POWER10)
+               add_sysinfo_interface_files();
+
        return 0;
 }