LCOV - code coverage report
Current view: top level - plugins/perfmon/intel/bundle - iio_bw.c (source / functions) Hit Total Coverage
Test: coverage-filtered.info Lines: 4 96 4.2 %
Date: 2023-07-05 22:20:52 Functions: 3 8 37.5 %

          Line data    Source code
       1             : /*
       2             :  * Copyright (c) 2021 Intel and/or its affiliates.
       3             :  * Licensed under the Apache License, Version 2.0 (the "License");
       4             :  * you may not use this file except in compliance with the License.
       5             :  * You may obtain a copy of the License at:
       6             :  *
       7             :  *     http://www.apache.org/licenses/LICENSE-2.0
       8             :  *
       9             :  * Unless required by applicable law or agreed to in writing, software
      10             :  * distributed under the License is distributed on an "AS IS" BASIS,
      11             :  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
      12             :  * See the License for the specific language governing permissions and
      13             :  * limitations under the License.
      14             :  */
      15             : 
      16             : #include <perfmon/perfmon.h>
      17             : #include <perfmon/intel/uncore.h>
      18             : #include <vlib/pci/pci.h>
      19             : #include <vppinfra/format.h>
      20             : #include <linux/limits.h>
      21             : #include <fcntl.h>
      22             : #include <math.h>
      23             : 
      24             : typedef struct
      25             : {
      26             :   u8 socket_id;
      27             :   u8 sad_id;
      28             :   u8 iio_unit_id;
      29             : } iio_uncore_sad_t;
      30             : typedef u32 index_t;
      31             : 
      32             : static const char *procfs_pci_path = "/proc/bus/pci";
      33             : 
      34             : #define PCM_INTEL_PCI_VENDOR_ID        0x8086
      35             : #define SNR_ICX_SAD_CONTROL_CFG_OFFSET 0x3F4
      36             : #define SNR_ICX_MESH2IIO_MMAP_DID      0x09A2
      37             : 
      38             : static const u8 icx_sad_to_pmu_id_mapping[] = { 5, 0, 1, 2, 3, 4 };
      39             : 
      40             : static const char *iio_bw_footer_message =
      41             :   "* this bundle currently only measures x8 and x16 PCIe devices on Port #0\n"
      42             :   "or Port #2. Please see the \"Intel® Xeon® Processor Scalable Memory\n"
      43             :   "Family Uncore Performance Monitoring Reference Manual(336274)\"\n"
      44             :   "Section 2.4 for more information.";
      45             : 
      46             : static u32
      47           0 : get_sad_ctrl_cfg (vlib_pci_addr_t *addr)
      48             : {
      49           0 :   int fd = 0;
      50             :   u32 value;
      51           0 :   u8 *dev_node_name = format (0, "%s/%02x/%02x.%x", procfs_pci_path, addr->bus,
      52           0 :                               addr->slot, addr->function);
      53             : 
      54           0 :   fd = open ((char *) dev_node_name, O_RDWR);
      55           0 :   if (fd < 0)
      56           0 :     return -1;
      57             : 
      58           0 :   if (pread (fd, &value, sizeof (u32), SNR_ICX_SAD_CONTROL_CFG_OFFSET) <
      59             :       sizeof (u32))
      60           0 :     value = -1;
      61             : 
      62           0 :   close (fd);
      63             : 
      64           0 :   return value;
      65             : }
      66             : 
      67             : static u64
      68           0 : get_bus_to_sad_mappings (vlib_main_t *vm, index_t **ph, iio_uncore_sad_t **pp)
      69             : {
      70           0 :   index_t *h = 0;
      71           0 :   iio_uncore_sad_t *p = 0, *e = 0;
      72           0 :   vlib_pci_addr_t *addr = 0, *addrs;
      73             : 
      74           0 :   addrs = vlib_pci_get_all_dev_addrs ();
      75             : 
      76           0 :   vec_foreach (addr, addrs)
      77             :     {
      78             :       vlib_pci_device_info_t *d;
      79           0 :       d = vlib_pci_get_device_info (vm, addr, 0);
      80             : 
      81           0 :       if (!d)
      82           0 :         continue;
      83             : 
      84           0 :       if (d->vendor_id == PCM_INTEL_PCI_VENDOR_ID &&
      85           0 :           d->device_id == SNR_ICX_MESH2IIO_MMAP_DID)
      86             :         {
      87             : 
      88           0 :           u32 sad_ctrl_cfg = get_sad_ctrl_cfg (addr);
      89           0 :           if (sad_ctrl_cfg == 0xFFFFFFFF)
      90             :             {
      91           0 :               vlib_pci_free_device_info (d);
      92           0 :               continue;
      93             :             }
      94             : 
      95           0 :           pool_get_zero (p, e);
      96             : 
      97           0 :           e->socket_id = (sad_ctrl_cfg & 0xf);
      98           0 :           e->sad_id = (sad_ctrl_cfg >> 4) & 0x7;
      99           0 :           e->iio_unit_id = icx_sad_to_pmu_id_mapping[e->sad_id];
     100             : 
     101           0 :           hash_set (h, addr->bus, e - p);
     102             :         }
     103             : 
     104           0 :       vlib_pci_free_device_info (d);
     105             :     }
     106             : 
     107           0 :   vec_free (addrs);
     108             : 
     109           0 :   *ph = h;
     110           0 :   *pp = p;
     111             : 
     112           0 :   return 0;
     113             : }
     114             : 
     115             : u8 *
     116           0 : format_stack_socket (u8 *s, va_list *va)
     117             : {
     118           0 :   iio_uncore_sad_t *e, *p = va_arg (*va, iio_uncore_sad_t *);
     119           0 :   index_t *h = va_arg (*va, index_t *);
     120           0 :   vlib_pci_addr_t root_bus, *addr = va_arg (*va, vlib_pci_addr_t *);
     121           0 :   clib_error_t *err = vlib_pci_get_device_root_bus (addr, &root_bus);
     122           0 :   if (err)
     123             :     {
     124           0 :       clib_error_free (err);
     125           0 :       return s;
     126             :     }
     127             : 
     128           0 :   uword *pu = hash_get (h, root_bus.bus);
     129           0 :   if (pu)
     130             :     {
     131           0 :       e = pool_elt_at_index (p, (index_t) pu[0]);
     132             : 
     133           0 :       s = format (s, "IIO%u/%u", e->socket_id, e->iio_unit_id);
     134             :     }
     135             :   else
     136             :     {
     137           0 :       s = format (s, "[ERR: hash lookup for bus '%u' failed]", root_bus.bus);
     138             :     }
     139           0 :   return s;
     140             : }
     141             : 
     142             : static clib_error_t *
     143           0 : init_intel_uncore_iio_bw (vlib_main_t *vm, struct perfmon_bundle *b)
     144             : {
     145           0 :   index_t *h = 0;
     146           0 :   iio_uncore_sad_t *p = 0;
     147           0 :   vlib_pci_addr_t *addr = 0, *addrs;
     148           0 :   u8 *s = 0;
     149             : 
     150           0 :   get_bus_to_sad_mappings (vm, &h, &p);
     151             : 
     152           0 :   s = format (0, "%-10s%-5s%-13s%-12s%-14s%-16s%s\n", "Stack", "Port",
     153             :               "Address", "VID:PID", "Link Speed", "Driver", "Product Name");
     154             : 
     155           0 :   addrs = vlib_pci_get_all_dev_addrs ();
     156             : 
     157           0 :   vec_foreach (addr, addrs)
     158             :     {
     159             :       vlib_pci_device_info_t *d;
     160           0 :       d = vlib_pci_get_device_info (vm, addr, 0);
     161             : 
     162           0 :       if (!d)
     163           0 :         continue;
     164             : 
     165           0 :       if (d->device_class != PCI_CLASS_NETWORK_ETHERNET)
     166           0 :         continue;
     167             : 
     168           0 :       s = format (
     169             :         s, "%-10U%-5U%-13U%04x:%04x   %-14U%-16s%v\n", format_stack_socket, p,
     170             :         h, addr, format_vlib_pci_link_port, d, format_vlib_pci_addr, addr,
     171           0 :         d->vendor_id, d->device_id, format_vlib_pci_link_speed, d,
     172           0 :         d->driver_name ? (char *) d->driver_name : "", d->product_name);
     173             : 
     174           0 :       vlib_pci_free_device_info (d);
     175             :     }
     176             : 
     177           0 :   b->footer = (char *) format (s, "\n%s", iio_bw_footer_message);
     178             : 
     179           0 :   vec_free (addrs);
     180           0 :   pool_free (p);
     181           0 :   hash_free (h);
     182             : 
     183           0 :   return 0;
     184             : }
     185             : 
     186             : static u8 *
     187           0 : format_intel_uncore_iio_bw (u8 *s, va_list *args)
     188             : {
     189           0 :   perfmon_reading_t *r = va_arg (*args, perfmon_reading_t *);
     190           0 :   int col = va_arg (*args, int);
     191           0 :   f64 tr = r->time_running * 1e-9;
     192           0 :   f64 value = 0;
     193             : 
     194           0 :   switch (col)
     195             :     {
     196           0 :     case 0:
     197           0 :       s = format (s, "%9.2f", tr);
     198           0 :       break;
     199           0 :     default:
     200           0 :       if (r->time_running)
     201             :         {
     202           0 :           value = r->value[col - 1] * 4 / tr;
     203             : 
     204           0 :           if (value > 1.0e6)
     205           0 :             s = format (s, "%9.0fM", value * 1e-6);
     206           0 :           else if (value > 1.0e3)
     207           0 :             s = format (s, "%9.0fK", value * 1e-3);
     208             :           else
     209           0 :             s = format (s, "%9.0f ", value);
     210             :         }
     211             : 
     212           0 :       break;
     213             :     }
     214             : 
     215           0 :   return s;
     216             : }
     217             : 
     218             : /*
     219             :  * This bundle is currently only supported and tested on Intel Icelake.
     220             :  */
     221             : static int
     222        2236 : is_icelake ()
     223             : {
     224        2236 :   return clib_cpu_supports_avx512_bitalg () && !clib_cpu_supports_movdir64b ();
     225             : }
     226             : 
     227             : static perfmon_cpu_supports_t iio_bw_cpu_supports[] = {
     228             :   { is_icelake, PERFMON_BUNDLE_TYPE_SYSTEM }
     229             : };
     230             : 
     231         559 : PERFMON_REGISTER_BUNDLE (intel_uncore_iio_bw_pci) = {
     232             :   .name = "iio-bandwidth-pci",
     233             :   .description = "pci iio memory reads and writes per iio stack *",
     234             :   .source = "intel-uncore",
     235             :   .events[0] = INTEL_UNCORE_E_IIO_UNC_IIO_DATA_REQ_OF_CPU_PART0_RD,
     236             :   .events[1] = INTEL_UNCORE_E_IIO_UNC_IIO_DATA_REQ_BY_CPU_PART0_WR,
     237             :   .events[2] = INTEL_UNCORE_E_IIO_UNC_IIO_DATA_REQ_BY_CPU_PART2_RD,
     238             :   .events[3] = INTEL_UNCORE_E_IIO_UNC_IIO_DATA_REQ_BY_CPU_PART2_WR,
     239             :   .n_events = 4,
     240             :   .cpu_supports = iio_bw_cpu_supports,
     241             :   .n_cpu_supports = ARRAY_LEN (iio_bw_cpu_supports),
     242             :   .format_fn = format_intel_uncore_iio_bw,
     243             :   .init_fn = init_intel_uncore_iio_bw,
     244             :   .column_headers = PERFMON_STRINGS ("RunTime", "PCIe Rd/P0", "PCIe Wr/P0",
     245             :                                      "PCIe Rd/P2", "PCIe Wr/P2")
     246             : };
     247             : 
     248         559 : PERFMON_REGISTER_BUNDLE (intel_uncore_iio_bw_cpu) = {
     249             :   .name = "iio-bandwidth-cpu",
     250             :   .description = "cpu iio memory reads and writes per iio stack *",
     251             :   .source = "intel-uncore",
     252             :   .events[0] = INTEL_UNCORE_E_IIO_UNC_IIO_DATA_REQ_BY_CPU_PART0_RD,
     253             :   .events[1] = INTEL_UNCORE_E_IIO_UNC_IIO_DATA_REQ_BY_CPU_PART0_WR,
     254             :   .events[2] = INTEL_UNCORE_E_IIO_UNC_IIO_DATA_REQ_BY_CPU_PART2_RD,
     255             :   .events[3] = INTEL_UNCORE_E_IIO_UNC_IIO_DATA_REQ_BY_CPU_PART2_WR,
     256             :   .n_events = 4,
     257             :   .cpu_supports = iio_bw_cpu_supports,
     258             :   .n_cpu_supports = ARRAY_LEN (iio_bw_cpu_supports),
     259             :   .format_fn = format_intel_uncore_iio_bw,
     260             :   .init_fn = init_intel_uncore_iio_bw,
     261             :   .column_headers = PERFMON_STRINGS ("RunTime", "CPU Rd/P0", "CPU Wr/P0",
     262             :                                      "CPU Rd/P2", "CPU Wr/P2")
     263             : };

Generated by: LCOV version 1.14