intel_rdt: refactor pids monitoring code.

[collectd.git] / src / intel_rdt.c
diff --git a/src/intel_rdt.c b/src/intel_rdt.c

index a3f77c9..b0adf05 100644 (file)
--- a/src/intel_rdt.c
+++ b/src/intel_rdt.c
@@ -1,7 +1,7 @@
  /**
   * collectd - src/intel_rdt.c
   *
  /**
   * collectd - src/intel_rdt.c
   *
- * Copyright(c) 2016 Intel Corporation. All rights reserved.
+ * Copyright(c) 2016-2018 Intel Corporation. All rights reserved.
   *
   * Permission is hereby granted, free of charge, to any person obtaining a copy
   * of this software and associated documentation files (the "Software"), to deal
   *
   * Permission is hereby granted, free of charge, to any person obtaining a copy
   * of this software and associated documentation files (the "Software"), to deal
@@ -23,242 +23,385 @@
   *
   * Authors:
   *   Serhiy Pshyk <serhiyx.pshyk@intel.com>
   *
   * Authors:
   *   Serhiy Pshyk <serhiyx.pshyk@intel.com>
+ *   Starzyk, Mateusz <mateuszx.starzyk@intel.com>
+ *   Wojciech Andralojc <wojciechx.andralojc@intel.com>
   **/
  
   **/
  
-#include "common.h"
  #include "collectd.h"
  #include "collectd.h"
-
+#include "utils/common/common.h"
+#include "utils/config_cores/config_cores.h"
+#include "utils_proc_pids.h"
  #include <pqos.h>
  
  #define RDT_PLUGIN "intel_rdt"
  
  #include <pqos.h>
  
  #define RDT_PLUGIN "intel_rdt"
  
+/* libpqos v2.0 or newer is required for process monitoring*/
+#undef LIBPQOS2
+#if defined(PQOS_VERSION) && PQOS_VERSION >= 20000
+#define LIBPQOS2
+#endif
+
+#define RDT_PLUGIN "intel_rdt"
+
  #define RDT_MAX_SOCKETS 8
  #define RDT_MAX_SOCKET_CORES 64
  #define RDT_MAX_CORES (RDT_MAX_SOCKET_CORES * RDT_MAX_SOCKETS)
  
  #define RDT_MAX_SOCKETS 8
  #define RDT_MAX_SOCKET_CORES 64
  #define RDT_MAX_CORES (RDT_MAX_SOCKET_CORES * RDT_MAX_SOCKETS)
  
+#ifdef LIBPQOS2
+/*
+ * Process name inside comm file is limited to 16 chars.
+ * More info here: http://man7.org/linux/man-pages/man5/proc.5.html
+ */
+#define RDT_MAX_NAMES_GROUPS 64
+#define RDT_PROC_PATH "/proc"
+#endif /* LIBPQOS2 */
+
  typedef enum {
    UNKNOWN = 0,
    CONFIGURATION_ERROR,
  } rdt_config_status;
  
  typedef enum {
    UNKNOWN = 0,
    CONFIGURATION_ERROR,
  } rdt_config_status;
  
-struct rdt_core_group_s {
+#ifdef LIBPQOS2
+struct rdt_name_group_s {
    char *desc;
    char *desc;
-  size_t num_cores;
-  unsigned *cores;
+  size_t num_names;
+  char **names;
+  proc_pids_t *proc_pids_array;
+  size_t monitored_pids_count;
    enum pqos_mon_event events;
  };
    enum pqos_mon_event events;
  };
-typedef struct rdt_core_group_s rdt_core_group_t;
+typedef struct rdt_name_group_s rdt_name_group_t;
+#endif /* LIBPQOS2 */
  
  struct rdt_ctx_s {
  
  struct rdt_ctx_s {
-  rdt_core_group_t cgroups[RDT_MAX_CORES];
-  struct pqos_mon_data *pgroups[RDT_MAX_CORES];
-  size_t num_groups;
+  core_groups_list_t cores;
+  enum pqos_mon_event events[RDT_MAX_CORES];
+  struct pqos_mon_data *pcgroups[RDT_MAX_CORES];
+#ifdef LIBPQOS2
+  rdt_name_group_t ngroups[RDT_MAX_NAMES_GROUPS];
+  struct pqos_mon_data *pngroups[RDT_MAX_NAMES_GROUPS];
+  size_t num_ngroups;
+#endif /* LIBPQOS2 */
    const struct pqos_cpuinfo *pqos_cpu;
    const struct pqos_cap *pqos_cap;
    const struct pqos_capability *cap_mon;
  };
  typedef struct rdt_ctx_s rdt_ctx_t;
  
    const struct pqos_cpuinfo *pqos_cpu;
    const struct pqos_cap *pqos_cap;
    const struct pqos_capability *cap_mon;
  };
  typedef struct rdt_ctx_s rdt_ctx_t;
  
-static rdt_ctx_t *g_rdt = NULL;
+static rdt_ctx_t *g_rdt;
  
  static rdt_config_status g_state = UNKNOWN;
  
  
  static rdt_config_status g_state = UNKNOWN;
  
-static int isdup(const uint64_t *nums, size_t size, uint64_t val) {
-  for (size_t i = 0; i < size; i++)
-    if (nums[i] == val)
-      return 1;
-  return 0;
+static int g_interface = -1;
+
+/*
+ * Dispatch a single DERIVE sample to collectd. `cgroup' is used as the plugin
+ * instance, `type' as the value type and `type_instance' (may be NULL) as the
+ * type instance.
+ */
+static void rdt_submit_derive(const char *cgroup, const char *type,
+                              const char *type_instance, derive_t value) {
+  value_t sample = {.derive = value};
+  value_list_t vl = VALUE_LIST_INIT;
+
+  vl.values = &sample;
+  vl.values_len = 1;
+
+  sstrncpy(vl.plugin, RDT_PLUGIN, sizeof(vl.plugin));
+  sstrncpy(vl.type, type, sizeof(vl.type));
+  if (type_instance != NULL)
+    sstrncpy(vl.type_instance, type_instance, sizeof(vl.type_instance));
+  snprintf(vl.plugin_instance, sizeof(vl.plugin_instance), "%s", cgroup);
+
+  plugin_dispatch_values(&vl);
  }
  
  }
  
-static int strtouint64(const char *s, uint64_t *n) {
-  char *endptr = NULL;
+/*
+ * Dispatch a single GAUGE sample to collectd. `cgroup' is used as the plugin
+ * instance, `type' as the value type and `type_instance' (may be NULL) as the
+ * type instance.
+ */
+static void rdt_submit_gauge(const char *cgroup, const char *type,
+                             const char *type_instance, gauge_t value) {
+  value_t sample = {.gauge = value};
+  value_list_t vl = VALUE_LIST_INIT;
  
  
-  assert(s != NULL);
-  assert(n != NULL);
+  vl.values = &sample;
+  vl.values_len = 1;
  
  
-  *n = strtoull(s, &endptr, 0);
+  sstrncpy(vl.plugin, RDT_PLUGIN, sizeof(vl.plugin));
+  sstrncpy(vl.type, type, sizeof(vl.type));
+  if (type_instance != NULL)
+    sstrncpy(vl.type_instance, type_instance, sizeof(vl.type_instance));
+  snprintf(vl.plugin_instance, sizeof(vl.plugin_instance), "%s", cgroup);
  
  
-  if (!(*s != '\0' && *endptr == '\0')) {
-    DEBUG(RDT_PLUGIN ": Error converting '%s' to unsigned number.", s);
-    return -EINVAL;
+  plugin_dispatch_values(&vl);
+}
+
+#if COLLECT_DEBUG
+/*
+ * Debug helper: log every configured core group (description, member cores
+ * and monitored event mask). Does nothing when the plugin context has not
+ * been allocated.
+ */
+static void rdt_dump_cgroups(void) {
+  char cores[RDT_MAX_CORES * 4];
+
+  if (g_rdt == NULL)
+    return;
+
+  DEBUG(RDT_PLUGIN ": Core Groups Dump");
+  DEBUG(RDT_PLUGIN ":  groups count: %" PRIsz, g_rdt->cores.num_cgroups);
+
+  for (size_t i = 0; i < g_rdt->cores.num_cgroups; i++) {
+    core_group_t *cgroup = g_rdt->cores.cgroups + i;
+
+    /* Build the " c0 c1 ..." list. The size handed to snprintf() always
+     * leaves room for the terminator, so an over-long list is truncated. */
+    memset(cores, 0, sizeof(cores));
+    for (size_t j = 0; j < cgroup->num_cores; j++) {
+      const size_t used = strlen(cores);
+      snprintf(cores + used, sizeof(cores) - used - 1, " %d", cgroup->cores[j]);
+    }
+
+    /* PRIsz is used for every size_t in this function (was a bare %zu). */
+    DEBUG(RDT_PLUGIN ":  group[%" PRIsz "]:", i);
+    DEBUG(RDT_PLUGIN ":    description: %s", cgroup->desc);
+    DEBUG(RDT_PLUGIN ":    cores: %s", cores);
+    DEBUG(RDT_PLUGIN ":    events: 0x%X", g_rdt->events[i]);
+  }
+}
+
+#ifdef LIBPQOS2
+/*
+ * Debug helper: log every configured process-name group (description, process
+ * names and monitored event mask). Does nothing when the plugin context has
+ * not been allocated.
+ */
+static void rdt_dump_ngroups(void) {
+  if (g_rdt == NULL)
+    return;
+
+  DEBUG(RDT_PLUGIN ": Process Names Groups Dump");
+  DEBUG(RDT_PLUGIN ":  groups count: %" PRIsz, g_rdt->num_ngroups);
+
+  for (size_t idx = 0; idx < g_rdt->num_ngroups; idx++) {
+    const rdt_name_group_t *ngroup = &g_rdt->ngroups[idx];
+    /* Zeroed for every group; holds the " name1 name2 ..." list. */
+    char names[DATA_MAX_NAME_LEN] = {0};
+
+    for (size_t k = 0; k < ngroup->num_names; k++) {
+      const size_t used = strlen(names);
+      snprintf(names + used, sizeof(names) - used - 1, " %s", ngroup->names[k]);
+    }
+
+    DEBUG(RDT_PLUGIN ":  group[%d]:", (int)idx);
+    DEBUG(RDT_PLUGIN ":    description: %s", ngroup->desc);
+    DEBUG(RDT_PLUGIN ":    process names:%s", names);
+    DEBUG(RDT_PLUGIN ":    events: 0x%X", ngroup->events);
+  }
+}
+#endif /* LIBPQOS2 */
+
+static inline double bytes_to_kb(const double bytes) { return bytes / 1024.0; } /* bytes -> units of 1024 bytes */
+
+static inline double bytes_to_mb(const double bytes) {
+  return bytes / (1024.0 * 1024.0); /* bytes -> units of 1024 * 1024 bytes */
+}
+
+/*
+ * Debug helper: log the most recently polled values of every monitored core
+ * group. Does nothing when the plugin context has not been allocated.
+ *
+ * CORE - monitored group of cores
+ * RMID - Resource Monitoring ID associated with the monitored group
+ *        This is not available for monitoring with resource control
+ * LLC - last level cache occupancy
+ * MBL - local memory bandwidth
+ * MBR - remote memory bandwidth
+ */
+static void rdt_dump_cores_data(void) {
+  /* The RMID column is dropped when the resctrl monitoring interface is in
+   * use; that interface constant is only referenced in libpqos v2 builds. */
+  int show_rmid = 1;
+
+  if (g_rdt == NULL)
+    return;
+
+#ifdef LIBPQOS2
+  if (g_interface == PQOS_INTER_OS_RESCTRL_MON)
+    show_rmid = 0;
+#endif /* LIBPQOS2 */
+
+  if (show_rmid) {
+    DEBUG(RDT_PLUGIN ":  CORE     RMID    LLC[KB]   MBL[MB]    MBR[MB]");
+  } else {
+    DEBUG(RDT_PLUGIN ":  CORE     LLC[KB]   MBL[MB]    MBR[MB]");
+  }
+
+  /* size_t index: num_cgroups is a size_t (it is printed with PRIsz). */
+  for (size_t i = 0; i < g_rdt->cores.num_cgroups; i++) {
+    const struct pqos_mon_data *group = g_rdt->pcgroups[i];
+
+    /* Skip groups that have no monitoring data attached. */
+    if (group == NULL)
+      continue;
+
+    const struct pqos_event_values *pv = &group->values;
+    const double llc = bytes_to_kb(pv->llc);
+    const double mbr = bytes_to_mb(pv->mbm_remote_delta);
+    const double mbl = bytes_to_mb(pv->mbm_local_delta);
+
+    if (show_rmid) {
+      DEBUG(RDT_PLUGIN ": [%s] %8u %10.1f %10.1f %10.1f",
+            g_rdt->cores.cgroups[i].desc, group->poll_ctx[0].rmid, llc, mbl,
+            mbr);
+    } else {
+      DEBUG(RDT_PLUGIN ": [%s] %10.1f %10.1f %10.1f",
+            g_rdt->cores.cgroups[i].desc, llc, mbl, mbr);
+    }
+  }
+}
+
+#ifdef LIBPQOS2
+static void rdt_dump_pids_data(void) {
+  /*
+   * Debug helper: log the PIDs and the most recently polled values of every
+   * process-name group.
+   *
+   * NAME - monitored group of processes
+   * PIDs - list of PID numbers in the NAME group
+   * LLC - last level cache occupancy
+   * MBL - local memory bandwidth
+   * MBR - remote memory bandwidth
+   */
+
+  if (g_rdt == NULL)
+    return;
+
+  DEBUG(RDT_PLUGIN ":  NAME     PIDs");
+  char pids[DATA_MAX_NAME_LEN];
+  for (size_t i = 0; i < g_rdt->num_ngroups; ++i) {
+    proc_pids_t *proc_pids = g_rdt->ngroups[i].proc_pids_array;
+
+    memset(pids, 0, sizeof(pids));
+    /* proc_pids_array is NULL until the PID lists have been set up; such a
+     * group is printed with an empty PID list instead of being dereferenced. */
+    for (size_t j = 0; proc_pids != NULL && j < g_rdt->ngroups[i].num_names;
+         ++j) {
+      pids_list_t *list = proc_pids[j].pids;
+      while (list != NULL) {
+        snprintf(pids + strlen(pids), sizeof(pids) - strlen(pids) - 1, " %u",
+                 list->pid);
+        list = list->next;
+      }
+    }
+    DEBUG(RDT_PLUGIN ":  [%s] %s", g_rdt->ngroups[i].desc, pids);
+  }
+
+  DEBUG(RDT_PLUGIN ":  NAME    LLC[KB]   MBL[MB]    MBR[MB]");
+  for (size_t i = 0; i < g_rdt->num_ngroups; i++) {
+
+    /* Skip groups that have no monitoring data attached. */
+    if (g_rdt->pngroups[i] == NULL)
+      continue;
+
+    const struct pqos_event_values *pv = &g_rdt->pngroups[i]->values;
+
+    double llc = bytes_to_kb(pv->llc);
+    double mbr = bytes_to_mb(pv->mbm_remote_delta);
+    double mbl = bytes_to_mb(pv->mbm_local_delta);
+
+    DEBUG(RDT_PLUGIN ":  [%s] %10.1f %10.1f %10.1f", g_rdt->ngroups[i].desc,
+          llc, mbl, mbr);
    }
    }
+}
+#endif /* LIBPQOS2 */
+#endif /* COLLECT_DEBUG */
+
+#ifdef LIBPQOS2
+/*
+ * Return 1 when `name' matches one of the first `size' entries of `names'
+ * (only the first MAX_PROC_NAME_LEN characters are compared), 0 otherwise.
+ */
+static int isdupstr(const char *names[], const size_t size, const char *name) {
+  for (size_t idx = 0; idx < size; idx++) {
+    if (0 == strncmp(name, names[idx], (size_t)MAX_PROC_NAME_LEN))
+      return 1;
+  }
  
    return 0;
  }
  
  /*
   * NAME
  
    return 0;
  }
  
  /*
   * NAME
- *   strlisttonums
+ *   strlisttoarray
   *
   * DESCRIPTION
   *
   * DESCRIPTION
- *   Converts string of characters representing list of numbers into array of
- *   numbers. Allowed formats are:
- *     0,1,2,3
- *     0-10,20-18
- *     1,3,5-8,10,0x10-12
- *
- *   Numbers can be in decimal or hexadecimal format.
+ *   Converts string representing list of strings into array of strings.
+ *   Allowed format is:
+ *     name,name1,name2,name3
   *
   * PARAMETERS
   *
   * PARAMETERS
- *   `s'         String representing list of unsigned numbers.
- *   `nums'      Array to put converted numeric values into.
- *   `max'       Maximum number of elements that nums can accommodate.
+ *   `str_list'  String representing list of strings.
+ *   `names'     Array to put extracted strings into.
+ *   `names_num' Variable to put number of extracted strings.
   *
   * RETURN VALUE
   *
   * RETURN VALUE
- *    Number of elements placed into nums.
+ *    0 on success, negative error code (-EINVAL, -ENOMEM) on failure.
   */
   */
-static size_t strlisttonums(char *s, uint64_t *nums, size_t max) {
-  int ret;
-  size_t index = 0;
+static int strlisttoarray(char *str_list, char ***names, size_t *names_num) {
    char *saveptr = NULL;
  
    char *saveptr = NULL;
  
-  if (s == NULL || nums == NULL || max == 0)
-    return index;
+  /* names_num is dereferenced below, so it is validated with the others. */
+  if (str_list == NULL || names == NULL || names_num == NULL)
+    return -EINVAL;
  
  
-  for (;;) {
-    char *p = NULL;
-    char *token = NULL;
+  if (strstr(str_list, ",,")) {
+    /* strtok ignores empty words between separators.
+     * This condition handles that by rejecting strings
+     * with consecutive separators */
+    ERROR(RDT_PLUGIN ": Empty process name");
+    return -EINVAL;
+  }
  
  
-    token = strtok_r(s, ",", &saveptr);
+  for (;;) {
+    char *token = strtok_r(str_list, ",", &saveptr);
      if (token == NULL)
        break;
  
      if (token == NULL)
        break;
  
-    s = NULL;
+    str_list = NULL;
  
      while (isspace(*token))
        token++;
  
      while (isspace(*token))
        token++;
+
      if (*token == '\0')
        continue;
  
      if (*token == '\0')
        continue;
  
-    p = strchr(token, '-');
-    if (p != NULL) {
-      uint64_t n, start, end;
-      *p = '\0';
-      ret = strtouint64(token, &start);
-      if (ret < 0)
-        return 0;
-      ret = strtouint64(p + 1, &end);
-      if (ret < 0)
-        return 0;
-      if (start > end) {
-        return 0;
-      }
-      for (n = start; n <= end; n++) {
-        if (!(isdup(nums, index, n))) {
-          nums[index] = n;
-          index++;
-        }
-        if (index >= max)
-          return index;
-      }
+    if ((isdupstr((const char **)*names, *names_num, token))) {
+      /* str_list is always NULL at this point (it was reset for strtok_r
+       * above), so it must not be passed to "%s". Only the offending name is
+       * reported here; the caller logs the complete group string. */
+      ERROR(RDT_PLUGIN ": Duplicated process name \'%s\'", token);
+      return -EINVAL;
      } else {
      } else {
-      uint64_t val;
-
-      ret = strtouint64(token, &val);
-      if (ret < 0)
-        return 0;
-
-      if (!(isdup(nums, index, val))) {
-        nums[index] = val;
-        index++;
+      if (0 != strarray_add(names, names_num, token)) {
+        ERROR(RDT_PLUGIN ": Error allocating process name string");
+        return -ENOMEM;
        }
        }
-      if (index >= max)
-        return index;
      }
    }
  
      }
    }
  
-  return index;
+  return 0;
  }
  
  /*
   * NAME
  }
  
  /*
   * NAME
- *   cgroup_cmp
+ *   ngroup_cmp
   *
   * DESCRIPTION
   *
   * DESCRIPTION
- *   Function to compare cores in 2 core groups.
+ *   Function to compare names in two name groups.
   *
   * PARAMETERS
   *
   * PARAMETERS
- *   `cg_a'      Pointer to core group a.
- *   `cg_b'      Pointer to core group b.
+ *   `ng_a'      Pointer to name group a.
+ *   `ng_b'      Pointer to name group b.
   *
   * RETURN VALUE
   *
   * RETURN VALUE
- *    1 if both groups contain the same cores
- *    0 if none of their cores match
- *    -1 if some but not all cores match
+ *    1 if both groups contain the same names
+ *    0 if none of their names match
+ *    -1 if some but not all names match
   */
   */
-static int cgroup_cmp(const rdt_core_group_t *cg_a,
-                      const rdt_core_group_t *cg_b) {
-  int found = 0;
+static int ngroup_cmp(const rdt_name_group_t *ng_a,
+                      const rdt_name_group_t *ng_b) {
+  /* Number of (a, b) name pairs that compare equal; kept as size_t so it can
+   * be compared with the group sizes without any conversion. */
+  size_t found = 0;
  
  
-  assert(cg_a != NULL);
-  assert(cg_b != NULL);
+  assert(ng_a != NULL);
+  assert(ng_b != NULL);
  
  
-  const int sz_a = cg_a->num_cores;
-  const int sz_b = cg_b->num_cores;
-  const unsigned *tab_a = cg_a->cores;
-  const unsigned *tab_b = cg_b->cores;
+  /* num_names is already a size_t: no narrowing cast through unsigned. */
+  const size_t sz_a = ng_a->num_names;
+  const size_t sz_b = ng_b->num_names;
+  const char **tab_a = (const char **)ng_a->names;
+  const char **tab_b = (const char **)ng_b->names;
  
  
-  for (int i = 0; i < sz_a; i++) {
-    for (int j = 0; j < sz_b; j++)
-      if (tab_a[i] == tab_b[j])
+  for (size_t i = 0; i < sz_a; i++) {
+    for (size_t j = 0; j < sz_b; j++)
+      if (strncmp(tab_a[i], tab_b[j], (size_t)MAX_PROC_NAME_LEN) == 0)
          found++;
    }
          found++;
    }
-  /* if no cores are the same */
+  /* if no names are the same */
    if (!found)
      return 0;
    if (!found)
      return 0;
-  /* if group contains same cores */
-  if (sz_a == sz_b && sz_b == found)
+  /* if group contains same names */
+  if (sz_a == sz_b && sz_b == found)
      return 1;
      return 1;
-  /* if not all cores are the same */
+  /* if not all names are the same */
    return -1;
  }
  
    return -1;
  }
  
-static int cgroup_set(rdt_core_group_t *cg, char *desc, uint64_t *cores,
-                      size_t num_cores) {
-  assert(cg != NULL);
-  assert(desc != NULL);
-  assert(cores != NULL);
-  assert(num_cores > 0);
-
-  cg->cores = calloc(num_cores, sizeof(unsigned));
-  if (cg->cores == NULL) {
-    ERROR(RDT_PLUGIN ": Error allocating core group table");
-    return -ENOMEM;
-  }
-  cg->num_cores = num_cores;
-  cg->desc = strdup(desc);
-  if (cg->desc == NULL) {
-    ERROR(RDT_PLUGIN ": Error allocating core group description");
-    sfree(cg->cores);
-    return -ENOMEM;
-  }
-
-  for (size_t i = 0; i < num_cores; i++)
-    cg->cores[i] = (unsigned)cores[i];
-
-  return 0;
-}
-
  /*
   * NAME
  /*
   * NAME
- *   oconfig_to_cgroups
+ *   oconfig_to_ngroups
   *
   * DESCRIPTION
   *
   * DESCRIPTION
- *   Function to set the descriptions and cores for each core group.
+ *   Function to set the descriptions and names for each process names group.
   *   Takes a config option containing list of strings that are used to set
   *   Takes a config option containing list of strings that are used to set
- *   core group values.
+ *   process group values.
   *
   * PARAMETERS
   *
   * PARAMETERS
- *   `item'        Config option containing core groups.
- *   `groups'      Table of core groups to set values in.
- *   `max_groups'  Maximum number of core groups allowed.
+ *   `item'        Config option containing process names groups.
+ *   `groups'      Table of process name groups to set values in.
+ *   `max_groups'  Maximum number of process name groups allowed.
   *
   * RETURN VALUE
   *
   * RETURN VALUE
- *   On success, the number of core groups set up. On error, appropriate
+ *   On success, the number of name groups set up. On error, appropriate
   *   negative error value.
   */
   *   negative error value.
   */
-static int oconfig_to_cgroups(oconfig_item_t *item, rdt_core_group_t *groups,
-                              size_t max_groups) {
+static int oconfig_to_ngroups(const oconfig_item_t *item,
+                              rdt_name_group_t *groups,
+                              const size_t max_groups) {
    int index = 0;
  
    assert(groups != NULL);
    int index = 0;
  
    assert(groups != NULL);
@@ -267,32 +410,37 @@ static int oconfig_to_cgroups(oconfig_item_t *item, rdt_core_group_t *groups,
  
    for (int j = 0; j < item->values_num; j++) {
      int ret;
  
    for (int j = 0; j < item->values_num; j++) {
      int ret;
-    size_t n;
-    uint64_t cores[RDT_MAX_CORES] = {0};
      char value[DATA_MAX_NAME_LEN];
  
      if ((item->values[j].value.string == NULL) ||
      char value[DATA_MAX_NAME_LEN];
  
      if ((item->values[j].value.string == NULL) ||
-        (strlen(item->values[j].value.string) == 0))
-      continue;
+        (strlen(item->values[j].value.string) == 0)) {
+      ERROR(RDT_PLUGIN ": Error - empty group");
+      return -EINVAL;
+    }
  
      sstrncpy(value, item->values[j].value.string, sizeof(value));
  
  
      sstrncpy(value, item->values[j].value.string, sizeof(value));
  
-    n = strlisttonums(value, cores, STATIC_ARRAY_SIZE(cores));
-    if (n == 0) {
-      ERROR(RDT_PLUGIN ": Error parsing core group (%s)",
+    ret = strlisttoarray(value, &groups[index].names, &groups[index].num_names);
+    if (ret != 0 || groups[index].num_names == 0) {
+      ERROR(RDT_PLUGIN ": Error parsing process names group (%s)",
              item->values[j].value.string);
        return -EINVAL;
      }
  
              item->values[j].value.string);
        return -EINVAL;
      }
  
-    /* set core group info */
-    ret = cgroup_set(&groups[index], item->values[j].value.string, cores, n);
-    if (ret < 0)
-      return ret;
+    /* set group description info */
+    groups[index].desc = sstrdup(item->values[j].value.string);
+    if (groups[index].desc == NULL) {
+      ERROR(RDT_PLUGIN ": Error allocating name group description");
+      return -ENOMEM;
+    }
+
+    groups[index].proc_pids_array = NULL;
+    groups[index].monitored_pids_count = 0;
  
      index++;
  
  
      index++;
  
-    if (index >= max_groups) {
-      WARNING(RDT_PLUGIN ": Too many core groups configured");
+    if (index >= (const int)max_groups) {
+      WARNING(RDT_PLUGIN ": Too many process names groups configured");
        return index;
      }
    }
        return index;
      }
    }
@@ -300,95 +448,475 @@ static int oconfig_to_cgroups(oconfig_item_t *item, rdt_core_group_t *groups,
    return index;
  }
  
    return index;
  }
  
-#if COLLECT_DEBUG
-static void rdt_dump_cgroups(void) {
-  char cores[RDT_MAX_CORES * 4];
+/*
+ * Release everything held by the process-name groups of `rdt': description,
+ * name array, per-name PID lists and the pqos monitoring data. All
+ * RDT_MAX_NAMES_GROUPS slots are visited, configured or not, and each slot is
+ * left in a state that is safe to free again.
+ */
+static void rdt_free_ngroups(rdt_ctx_t *rdt) {
+  for (int i = 0; i < RDT_MAX_NAMES_GROUPS; i++) {
+    if (rdt->ngroups[i].desc)
+      DEBUG(RDT_PLUGIN ": Freeing pids \'%s\' group\'s data...",
+            rdt->ngroups[i].desc);
+    sfree(rdt->ngroups[i].desc);
+    strarray_free(rdt->ngroups[i].names, rdt->ngroups[i].num_names);
+    /* strarray_free() receives the pointer by value, so clear it here;
+     * otherwise a second call would hand the freed array to it again. */
+    rdt->ngroups[i].names = NULL;
+
+    if (rdt->ngroups[i].proc_pids_array) {
+      for (size_t j = 0; j < rdt->ngroups[i].num_names; ++j) {
+        if (NULL == rdt->ngroups[i].proc_pids_array[j].pids)
+          continue;
+        pids_list_free(rdt->ngroups[i].proc_pids_array[j].pids);
+      }
  
  
-  if (g_rdt == NULL)
-    return;
+      sfree(rdt->ngroups[i].proc_pids_array);
+    }
+    rdt->ngroups[i].num_names = 0;
+    /* The read path selects groups to poll by a non-zero
+     * monitored_pids_count; reset it together with the monitoring data. */
+    rdt->ngroups[i].monitored_pids_count = 0;
+    sfree(rdt->pngroups[i]);
+  }
+}
  
  
-  DEBUG(RDT_PLUGIN ": Core Groups Dump");
-  DEBUG(RDT_PLUGIN ":  groups count: %zu", g_rdt->num_groups);
+static int rdt_config_ngroups(rdt_ctx_t *rdt, const oconfig_item_t *item) {
+  int n = 0;
+  enum pqos_mon_event events = 0;
  
  
-  for (int i = 0; i < g_rdt->num_groups; i++) {
+  if (item == NULL) {
+    DEBUG(RDT_PLUGIN ": ngroups_config: Invalid argument.");
+    return -EINVAL;
+  }
  
  
-    memset(cores, 0, sizeof(cores));
-    for (int j = 0; j < g_rdt->cgroups[i].num_cores; j++) {
-      snprintf(cores + strlen(cores), sizeof(cores) - strlen(cores) - 1, " %d",
-               g_rdt->cgroups[i].cores[j]);
+  DEBUG(RDT_PLUGIN ": Process names groups [%d]:", item->values_num);
+  for (int j = 0; j < item->values_num; j++) {
+    if (item->values[j].type != OCONFIG_TYPE_STRING) {
+      ERROR(RDT_PLUGIN
+            ": given process names group value is not a string [idx=%d]",
+            j);
+      return -EINVAL;
      }
      }
+    DEBUG(RDT_PLUGIN ":  [%d]: %s", j, item->values[j].value.string);
+  }
  
  
-    DEBUG(RDT_PLUGIN ":  group[%d]:", i);
-    DEBUG(RDT_PLUGIN ":    description: %s", g_rdt->cgroups[i].desc);
-    DEBUG(RDT_PLUGIN ":    cores: %s", cores);
-    DEBUG(RDT_PLUGIN ":    events: 0x%X", g_rdt->cgroups[i].events);
+  n = oconfig_to_ngroups(item, rdt->ngroups, RDT_MAX_NAMES_GROUPS);
+  if (n < 0) {
+    rdt_free_ngroups(rdt);
+    ERROR(RDT_PLUGIN ": Error parsing process name groups configuration.");
+    return -EINVAL;
    }
  
    }
  
-  return;
-}
+  /* validate configured process name values */
+  for (int group_idx = 0; group_idx < n; group_idx++) {
+    DEBUG(RDT_PLUGIN ":  checking group [%d]: %s", group_idx,
+          rdt->ngroups[group_idx].desc);
+    for (size_t name_idx = 0; name_idx < rdt->ngroups[group_idx].num_names;
+         name_idx++) {
+      DEBUG(RDT_PLUGIN ":    checking process name [%zu]: %s", name_idx,
+            rdt->ngroups[group_idx].names[name_idx]);
+      if (!is_proc_name_valid(rdt->ngroups[group_idx].names[name_idx])) {
+        ERROR(RDT_PLUGIN ": Process name group '%s' contains invalid name '%s'",
+              rdt->ngroups[group_idx].desc,
+              rdt->ngroups[group_idx].names[name_idx]);
+        rdt_free_ngroups(rdt);
+        return -EINVAL;
+      }
+    }
+  }
  
  
-static inline double bytes_to_kb(const double bytes) { return bytes / 1024.0; }
+  if (n == 0) {
+    ERROR(RDT_PLUGIN ": Empty process name groups configured.");
+    return -EINVAL;
+  }
  
  
-static inline double bytes_to_mb(const double bytes) {
-  return bytes / (1024.0 * 1024.0);
+  /* Get all available events on this platform */
+  for (unsigned i = 0; i < rdt->cap_mon->u.mon->num_events; i++)
+    events |= rdt->cap_mon->u.mon->events[i].type;
+
+  events &= ~(PQOS_PERF_EVENT_LLC_MISS);
+
+  DEBUG(RDT_PLUGIN ": Available events to monitor: %#x", events);
+
+  rdt->num_ngroups = n;
+  for (int i = 0; i < n; i++) {
+    for (int j = 0; j < i; j++) {
+      int found = ngroup_cmp(&rdt->ngroups[j], &rdt->ngroups[i]);
+      if (found != 0) {
+        rdt_free_ngroups(rdt);
+        ERROR(RDT_PLUGIN
+              ": Cannot monitor same process name in different groups.");
+        return -EINVAL;
+      }
+    }
+
+    rdt->ngroups[i].events = events;
+    rdt->pngroups[i] = calloc(1, sizeof(*rdt->pngroups[i]));
+    if (rdt->pngroups[i] == NULL) {
+      rdt_free_ngroups(rdt);
+      ERROR(RDT_PLUGIN
+            ": Failed to allocate memory for process name monitoring data.");
+      return -ENOMEM;
+    }
+  }
+
+  return 0;
  }
  
  }
  
-static void rdt_dump_data(void) {
-  /*
-   * CORE - monitored group of cores
-   * RMID - Resource Monitoring ID associated with the monitored group
-   * LLC - last level cache occupancy
-   * MBL - local memory bandwidth
-   * MBR - remote memory bandwidth
+static int rdt_refresh_ngroup(rdt_name_group_t *ngroup,
+                              struct pqos_mon_data *group_mon_data) {
+
+  int result = 0;
+
+  if (NULL == ngroup)
+    return -1;
+
+  if (NULL == ngroup->proc_pids_array) {
+    ERROR(RDT_PLUGIN
+          ": rdt_refresh_ngroup: \'%s\' uninitialized process pids array.",
+          ngroup->desc);
+
+    return -1;
+  }
+
+  DEBUG(RDT_PLUGIN ": rdt_refresh_ngroup: \'%s\' process names group.",
+        ngroup->desc);
+
+  proc_pids_t *proc_pids_array_prev = ngroup->proc_pids_array;
+  proc_pids_t *proc_pids_array_curr = NULL;
+
+  int fetch_result =
+      fetch_pids_for_procs(RDT_PROC_PATH, (const char **)ngroup->names,
+                           ngroup->num_names, &proc_pids_array_curr);
+
+  if (0 != fetch_result) {
+    ERROR(RDT_PLUGIN ": rdt_refresh_ngroup: \'%s\' failed to fetch PIDs.",
+          ngroup->desc);
+    return fetch_result;
+  }
+
+  pids_list_t *new_pids = NULL;
+  pid_t *new_pids_array = NULL;
+  size_t new_pids_count = 0;
+
+  pids_list_t *lost_pids = NULL;
+  pid_t *lost_pids_array = NULL;
+  size_t lost_pids_count = 0;
+
+  for (size_t i = 0; i < ngroup->num_names; ++i) {
+    if (NULL == proc_pids_array_prev[i].pids &&
+        NULL == proc_pids_array_curr[i].pids)
+      continue;
+    int diff_result = pids_list_diff(
+        proc_pids_array_prev[i].pids, proc_pids_array_curr[i].pids, &new_pids,
+        &new_pids_count, &lost_pids, &lost_pids_count);
+    if (0 != diff_result) {
+      ERROR(RDT_PLUGIN
+            ": rdt_refresh_ngroup: \'%s\'. Error [%d] during PID diff.",
+            ngroup->desc, diff_result);
+      result = -1;
+      goto cleanup;
+    }
+  }
+
+  DEBUG(RDT_PLUGIN ": rdt_refresh_ngroup: \'%s\' process names group, added: "
+                   "%u, removed: %u.",
+        ngroup->desc, (unsigned)new_pids_count, (unsigned)lost_pids_count);
+
+  if (new_pids && new_pids_count > 0) {
+    new_pids_array = malloc(new_pids_count * sizeof(pid_t));
+    if (new_pids_array == NULL) {
+      ERROR(RDT_PLUGIN ": rdt_refresh_ngroup: \'%s\'. Memory "
+                       "allocation failed",
+            ngroup->desc);
+      result = -1;
+      goto cleanup;
+    }
+    pids_list_to_array(new_pids_array, new_pids, new_pids_count);
+
+    /* no pids are monitored for this group yet: start monitoring */
+    if (0 == ngroup->monitored_pids_count) {
+
+      int start_result =
+          pqos_mon_start_pids(new_pids_count, new_pids_array, ngroup->events,
+                              (void *)ngroup->desc, group_mon_data);
+      if (PQOS_RETVAL_OK == start_result) {
+        ngroup->monitored_pids_count = new_pids_count;
+      } else {
+        ERROR(RDT_PLUGIN ": rdt_refresh_ngroup: \'%s\'. Error [%d] while "
+                         "STARTING pids monitoring",
+              ngroup->desc, start_result);
+        result = -1;
+        goto pqos_error_recovery;
+      }
+
+    } else {
+
+      int add_result =
+          pqos_mon_add_pids(new_pids_count, new_pids_array, group_mon_data);
+      if (PQOS_RETVAL_OK == add_result)
+        ngroup->monitored_pids_count += new_pids_count;
+      else {
+        ERROR(RDT_PLUGIN
+              ": rdt_refresh_ngroup: \'%s\'. Error [%d] while ADDING pids.",
+              ngroup->desc, add_result);
+        result = -1;
+        goto pqos_error_recovery;
+      }
+    }
+  }
+
+  if (lost_pids && lost_pids_count > 0) {
+    lost_pids_array = malloc(lost_pids_count * sizeof(pid_t));
+    if (lost_pids_array == NULL) {
+      ERROR(RDT_PLUGIN ": rdt_refresh_ngroup: \'%s\'. Memory "
+                       "allocation failed",
+            ngroup->desc);
+      result = -1;
+      goto cleanup;
+    }
+    pids_list_to_array(lost_pids_array, lost_pids, lost_pids_count);
+
+    if (lost_pids_count == ngroup->monitored_pids_count) {
+      /* all pids for this group are lost: stop monitoring */
+      int stop_result = pqos_mon_stop(group_mon_data);
+      if (PQOS_RETVAL_OK != stop_result) {
+        ERROR(RDT_PLUGIN ": rdt_refresh_ngroup: \'%s\'. Error [%d] while "
+                         "STOPPING monitoring",
+              ngroup->desc, stop_result);
+        result = -1;
+        goto pqos_error_recovery;
+      }
+      ngroup->monitored_pids_count = 0;
+    } else {
+      assert(lost_pids_count < ngroup->monitored_pids_count);
+      int remove_result = pqos_mon_remove_pids(lost_pids_count, lost_pids_array,
+                                               group_mon_data);
+      if (PQOS_RETVAL_OK == remove_result) {
+        ngroup->monitored_pids_count -= lost_pids_count;
+      } else {
+        ERROR(RDT_PLUGIN
+              ": rdt_refresh_ngroup: \'%s\'. Error [%d] while REMOVING pids.",
+              ngroup->desc, remove_result);
+        result = -1;
+        goto pqos_error_recovery;
+      }
+    }
+  }
+
+  if (new_pids_count > 0 || lost_pids_count > 0)
+    ngroup->proc_pids_array = proc_pids_array_curr;
+
+  goto cleanup;
+
+pqos_error_recovery:
+  /* Why?
+   * Resources might be temporarily unavailable.
+   *
+   * How?
+   * Collectd will halt the reading thread for this
+   * plugin if it returns an error.
+   * Consecutive errors will be increasing the read period
+   * up to 1 day interval.
+   * On pqos error stop monitoring current group
+   * and reset the proc_pids array
+   * monitoring will be restarted on next collectd read cycle
     */
     */
-  DEBUG("  CORE     RMID    LLC[KB]   MBL[MB]    MBR[MB]");
-  for (int i = 0; i < g_rdt->num_groups; i++) {
+  DEBUG(RDT_PLUGIN ": rdt_refresh_ngroup: \'%s\' group RESET after error.",
+        ngroup->desc);
+  pqos_mon_stop(group_mon_data);
+  for (size_t i = 0; i < ngroup->num_names; ++i) {
+    if (ngroup->proc_pids_array[i].pids)
+      pids_list_free(ngroup->proc_pids_array[i].pids);
+  }
+  sfree(ngroup->proc_pids_array);
  
  
-    const struct pqos_event_values *pv = &g_rdt->pgroups[i]->values;
+  initialize_proc_pids((const char **)ngroup->names, ngroup->num_names,
+                       &ngroup->proc_pids_array);
+  ngroup->monitored_pids_count = 0;
  
  
-    double llc = bytes_to_kb(pv->llc);
-    double mbr = bytes_to_mb(pv->mbm_remote_delta);
-    double mbl = bytes_to_mb(pv->mbm_local_delta);
+cleanup:
+  if (ngroup->proc_pids_array == proc_pids_array_curr) {
+    assert(proc_pids_array_curr);
+    /* new list was successfully saved, free the old one */
+    for (size_t i = 0; i < ngroup->num_names; ++i)
+      if (proc_pids_array_prev[i].pids)
+        pids_list_free(proc_pids_array_prev[i].pids);
  
  
-    DEBUG(" [%s] %8u %10.1f %10.1f %10.1f", g_rdt->cgroups[i].desc,
-          g_rdt->pgroups[i]->poll_ctx[0].rmid, llc, mbl, mbr);
+    sfree(proc_pids_array_prev);
+
+  } else {
+    /* new list was not saved. Free the new list, keep the old one*/
+    for (size_t i = 0; i < ngroup->num_names; ++i)
+      if (proc_pids_array_curr[i].pids)
+        pids_list_free(proc_pids_array_curr[i].pids);
+
+    sfree(proc_pids_array_curr);
    }
    }
+
+  if (new_pids)
+    pids_list_free(new_pids);
+
+  if (new_pids_array)
+    free(new_pids_array);
+
+  if (lost_pids)
+    pids_list_free(lost_pids);
+
+  if (lost_pids_array)
+    free(lost_pids_array);
+
+  return result;
  }
  }
+
+static int read_pids_data() {
+
+  if (0 == g_rdt->num_ngroups) {
+    DEBUG(RDT_PLUGIN ": read_pids_data: not configured - PIDs read skipped");
+    return 0;
+  }
+
+  DEBUG(RDT_PLUGIN ": read_pids_data: Scanning active groups");
+  struct pqos_mon_data *active_groups[RDT_MAX_NAMES_GROUPS] = {0};
+  size_t active_group_idx = 0;
+  for (size_t pngroups_idx = 0;
+       pngroups_idx < STATIC_ARRAY_SIZE(g_rdt->pngroups); ++pngroups_idx)
+    if (0 != g_rdt->ngroups[pngroups_idx].monitored_pids_count)
+      active_groups[active_group_idx++] = g_rdt->pngroups[pngroups_idx];
+
+  int ret = 0;
+
+  if (0 == active_group_idx) {
+    DEBUG(RDT_PLUGIN ": read_pids_data: no active groups - PIDs read skipped");
+    goto groups_refresh;
+  }
+
+  DEBUG(RDT_PLUGIN ": read_pids_data: PIDs data polling");
+
+  int poll_result = pqos_mon_poll(active_groups, active_group_idx);
+  if (poll_result != PQOS_RETVAL_OK) {
+    ERROR(RDT_PLUGIN ": read_pids_data: Failed to poll monitoring data for "
+                     "pids. Error [%d].",
+          poll_result);
+    ret = -poll_result;
+    goto groups_refresh;
+  }
+
+  for (size_t i = 0; i < g_rdt->num_ngroups; i++) {
+    enum pqos_mon_event mbm_events =
+        (PQOS_MON_EVENT_LMEM_BW | PQOS_MON_EVENT_TMEM_BW |
+         PQOS_MON_EVENT_RMEM_BW);
+
+    if (g_rdt->pngroups[i] == NULL ||
+        g_rdt->ngroups[i].monitored_pids_count == 0)
+      continue;
+
+    const struct pqos_event_values *pv = &g_rdt->pngroups[i]->values;
+
+    /* Submit only monitored events data */
+
+    if (g_rdt->ngroups[i].events & PQOS_MON_EVENT_L3_OCCUP)
+      rdt_submit_gauge(g_rdt->ngroups[i].desc, "bytes", "llc", pv->llc);
+
+    if (g_rdt->ngroups[i].events & PQOS_PERF_EVENT_IPC)
+      rdt_submit_gauge(g_rdt->ngroups[i].desc, "ipc", NULL, pv->ipc);
+
+    if (g_rdt->ngroups[i].events & mbm_events) {
+      rdt_submit_derive(g_rdt->ngroups[i].desc, "memory_bandwidth", "local",
+                        pv->mbm_local_delta);
+      rdt_submit_derive(g_rdt->ngroups[i].desc, "memory_bandwidth", "remote",
+                        pv->mbm_remote_delta);
+    }
+  }
+
+#if COLLECT_DEBUG
+  rdt_dump_pids_data();
  #endif /* COLLECT_DEBUG */
  
  #endif /* COLLECT_DEBUG */
  
-static void rdt_free_cgroups(void) {
-  for (int i = 0; i < RDT_MAX_CORES; i++) {
-    sfree(g_rdt->cgroups[i].desc);
+groups_refresh:
+  for (size_t i = 0; i < g_rdt->num_ngroups; i++) {
+    int refresh_result =
+        rdt_refresh_ngroup(&(g_rdt->ngroups[i]), g_rdt->pngroups[i]);
+
+    if (0 != refresh_result) {
+      ERROR(RDT_PLUGIN ": read_pids_data: NGroup %zu refresh failed. Error: %d",
+            i, refresh_result);
+      if (0 == ret) {
+        /* refresh error will be escalated only if there were no
+         * errors before.
+         */
+        ret = refresh_result;
+      }
+    }
+  }
  
  
-    sfree(g_rdt->cgroups[i].cores);
-    g_rdt->cgroups[i].num_cores = 0;
+  assert(ret <= 0);
+  return ret;
+}
  
  
-    sfree(g_rdt->pgroups[i]);
+static void rdt_init_pids_monitoring() {
+  for (size_t group_idx = 0; group_idx < g_rdt->num_ngroups; group_idx++) {
+    /*
+     * Prepare every configured name group (g_rdt->ngroups) for PIDs
+     * monitoring: build its proc_pids array with initialize_proc_pids(),
+     * then attempt a first rdt_refresh_ngroup() on it.
+     * Nothing is returned to the caller; failures are only logged.
+     *
+     * Each group must have a non-NULL proc_pids array.
+     * The initial refresh is not mandatory for proper
+     * PIDs statistics detection, so a failed refresh is reported
+     * with ERROR() and the loop simply moves on to the next group.
+     */
+    rdt_name_group_t *ng = &g_rdt->ngroups[group_idx];
+    int init_result = initialize_proc_pids((const char **)ng->names,
+                                           ng->num_names, &ng->proc_pids_array);
+    if (0 != init_result) {
+      ERROR(RDT_PLUGIN
+            ": Initialization of proc_pids for group %zu failed. Error: %d",
+            group_idx, init_result);
+      continue; /* initialization failed: skip the refresh for this group */
+    }
+
+    int refresh_result = rdt_refresh_ngroup(&(g_rdt->ngroups[group_idx]),
+                                            g_rdt->pngroups[group_idx]);
+    if (0 != refresh_result) /* log only; remaining groups are still set up */
+      ERROR(RDT_PLUGIN ": Initial refresh of group %zu failed. Error: %d",
+            group_idx, refresh_result);
+  }
+}
+#endif /* LIBPQOS2 */
+
+static void rdt_free_cgroups(void) {
+  config_cores_cleanup(&g_rdt->cores);
+  for (int i = 0; i < RDT_MAX_CORES; i++) {
+    sfree(g_rdt->pcgroups[i]);
    }
  }
  
  static int rdt_default_cgroups(void) {
    }
  }
  
  static int rdt_default_cgroups(void) {
-  int ret;
+  unsigned num_cores = g_rdt->pqos_cpu->num_cores;
+
+  g_rdt->cores.cgroups = calloc(num_cores, sizeof(*(g_rdt->cores.cgroups)));
+  if (g_rdt->cores.cgroups == NULL) {
+    ERROR(RDT_PLUGIN ": Error allocating core groups array");
+    return -ENOMEM;
+  }
+  g_rdt->cores.num_cgroups = num_cores;
  
    /* configure each core in separate group */
  
    /* configure each core in separate group */
-  for (unsigned i = 0; i < g_rdt->pqos_cpu->num_cores; i++) {
+  for (unsigned i = 0; i < num_cores; i++) {
+    core_group_t *cgroup = g_rdt->cores.cgroups + i;
      char desc[DATA_MAX_NAME_LEN];
      char desc[DATA_MAX_NAME_LEN];
-    uint64_t core = i;
-
-    snprintf(desc, sizeof(desc), "%d", g_rdt->pqos_cpu->cores[i].lcore);
  
      /* set core group info */
  
      /* set core group info */
-    ret = cgroup_set(&g_rdt->cgroups[i], desc, &core, 1);
-    if (ret < 0)
-      return ret;
+    cgroup->cores = calloc(1, sizeof(*cgroup->cores));
+    if (cgroup->cores == NULL) {
+      ERROR(RDT_PLUGIN ": Error allocating cores array");
+      rdt_free_cgroups();
+      return -ENOMEM;
+    }
+    cgroup->num_cores = 1;
+    cgroup->cores[0] = i;
+
+    snprintf(desc, sizeof(desc), "%d", g_rdt->pqos_cpu->cores[i].lcore);
+    cgroup->desc = strdup(desc);
+    if (cgroup->desc == NULL) {
+      ERROR(RDT_PLUGIN ": Error allocating core group description");
+      rdt_free_cgroups();
+      return -ENOMEM;
+    }
    }
  
    }
  
-  return g_rdt->pqos_cpu->num_cores;
+  return num_cores;
  }
  
  }
  
-static int rdt_is_core_id_valid(int core_id) {
+static int rdt_is_core_id_valid(unsigned int core_id) {
  
  
-  for (int i = 0; i < g_rdt->pqos_cpu->num_cores; i++)
+  for (unsigned int i = 0; i < g_rdt->pqos_cpu->num_cores; i++)
      if (core_id == g_rdt->pqos_cpu->cores[i].lcore)
        return 1;
  
      if (core_id == g_rdt->pqos_cpu->cores[i].lcore)
        return 1;
  
@@ -396,38 +924,23 @@ static int rdt_is_core_id_valid(int core_id) {
  }
  
  static int rdt_config_cgroups(oconfig_item_t *item) {
  }
  
  static int rdt_config_cgroups(oconfig_item_t *item) {
-  int n = 0;
+  size_t n = 0;
    enum pqos_mon_event events = 0;
  
    enum pqos_mon_event events = 0;
  
-  if (item == NULL) {
-    DEBUG(RDT_PLUGIN ": cgroups_config: Invalid argument.");
-    return -EINVAL;
-  }
-
-  DEBUG(RDT_PLUGIN ": Core groups [%d]:", item->values_num);
-  for (int j = 0; j < item->values_num; j++) {
-    if (item->values[j].type != OCONFIG_TYPE_STRING) {
-      ERROR(RDT_PLUGIN ": given core group value is not a string [idx=%d]", j);
-      return -EINVAL;
-    }
-    DEBUG(RDT_PLUGIN ":  [%d]: %s", j, item->values[j].value.string);
-  }
-
-  n = oconfig_to_cgroups(item, g_rdt->cgroups, g_rdt->pqos_cpu->num_cores);
-  if (n < 0) {
+  if (config_cores_parse(item, &g_rdt->cores) < 0) {
      rdt_free_cgroups();
      ERROR(RDT_PLUGIN ": Error parsing core groups configuration.");
      return -EINVAL;
    }
      rdt_free_cgroups();
      ERROR(RDT_PLUGIN ": Error parsing core groups configuration.");
      return -EINVAL;
    }
+  n = g_rdt->cores.num_cgroups;
  
    /* validate configured core id values */
  
    /* validate configured core id values */
-  for (int group_idx = 0; group_idx < n; group_idx++) {
-    for (int core_idx = 0; core_idx < g_rdt->cgroups[group_idx].num_cores;
-         core_idx++) {
-      if (!rdt_is_core_id_valid(g_rdt->cgroups[group_idx].cores[core_idx])) {
-        ERROR(RDT_PLUGIN ": Core group '%s' contains invalid core id '%d'",
-                g_rdt->cgroups[group_idx].desc,
-                (int)g_rdt->cgroups[group_idx].cores[core_idx]);
+  for (size_t group_idx = 0; group_idx < n; group_idx++) {
+    core_group_t *cgroup = g_rdt->cores.cgroups + group_idx;
+    for (size_t core_idx = 0; core_idx < cgroup->num_cores; core_idx++) {
+      if (!rdt_is_core_id_valid(cgroup->cores[core_idx])) {
+        ERROR(RDT_PLUGIN ": Core group '%s' contains invalid core id '%u'",
+              cgroup->desc, cgroup->cores[core_idx]);
          rdt_free_cgroups();
          return -EINVAL;
        }
          rdt_free_cgroups();
          return -EINVAL;
        }
@@ -436,18 +949,19 @@ static int rdt_config_cgroups(oconfig_item_t *item) {
  
    if (n == 0) {
      /* create default core groups if "Cores" config option is empty */
  
    if (n == 0) {
      /* create default core groups if "Cores" config option is empty */
-    n = rdt_default_cgroups();
-    if (n < 0) {
+    int ret = rdt_default_cgroups();
+    if (ret < 0) {
        rdt_free_cgroups();
        ERROR(RDT_PLUGIN ": Error creating default core groups configuration.");
        rdt_free_cgroups();
        ERROR(RDT_PLUGIN ": Error creating default core groups configuration.");
-      return n;
+      return ret;
      }
      }
+    n = (size_t)ret;
      INFO(RDT_PLUGIN
           ": No core groups configured. Default core groups created.");
    }
  
    /* Get all available events on this platform */
      INFO(RDT_PLUGIN
           ": No core groups configured. Default core groups created.");
    }
  
    /* Get all available events on this platform */
-  for (int i = 0; i < g_rdt->cap_mon->u.mon->num_events; i++)
+  for (unsigned int i = 0; i < g_rdt->cap_mon->u.mon->num_events; i++)
      events |= g_rdt->cap_mon->u.mon->events[i].type;
  
    events &= ~(PQOS_PERF_EVENT_LLC_MISS);
      events |= g_rdt->cap_mon->u.mon->events[i].type;
  
    events &= ~(PQOS_PERF_EVENT_LLC_MISS);
@@ -456,11 +970,12 @@ static int rdt_config_cgroups(oconfig_item_t *item) {
          g_rdt->pqos_cpu->num_cores);
    DEBUG(RDT_PLUGIN ": Available events to monitor: %#x", events);
  
          g_rdt->pqos_cpu->num_cores);
    DEBUG(RDT_PLUGIN ": Available events to monitor: %#x", events);
  
-  g_rdt->num_groups = n;
+  g_rdt->cores.num_cgroups = n;
    for (int i = 0; i < n; i++) {
      for (int j = 0; j < i; j++) {
        int found = 0;
    for (int i = 0; i < n; i++) {
      for (int j = 0; j < i; j++) {
        int found = 0;
-      found = cgroup_cmp(&g_rdt->cgroups[j], &g_rdt->cgroups[i]);
+      found = config_cores_cmp_cgroups(&g_rdt->cores.cgroups[j],
+                                       &g_rdt->cores.cgroups[i]);
        if (found != 0) {
          rdt_free_cgroups();
          ERROR(RDT_PLUGIN ": Cannot monitor same cores in different groups.");
        if (found != 0) {
          rdt_free_cgroups();
          ERROR(RDT_PLUGIN ": Cannot monitor same cores in different groups.");
@@ -468,9 +983,9 @@ static int rdt_config_cgroups(oconfig_item_t *item) {
        }
      }
  
        }
      }
  
-    g_rdt->cgroups[i].events = events;
-    g_rdt->pgroups[i] = calloc(1, sizeof(*g_rdt->pgroups[i]));
-    if (g_rdt->pgroups[i] == NULL) {
+    g_rdt->events[i] = events;
+    g_rdt->pcgroups[i] = calloc(1, sizeof(*g_rdt->pcgroups[i]));
+    if (g_rdt->pcgroups[i] == NULL) {
        rdt_free_cgroups();
        ERROR(RDT_PLUGIN ": Failed to allocate memory for monitoring data.");
        return -ENOMEM;
        rdt_free_cgroups();
        ERROR(RDT_PLUGIN ": Failed to allocate memory for monitoring data.");
        return -ENOMEM;
@@ -501,14 +1016,34 @@ static int rdt_preinit(void) {
    struct pqos_config pqos = {.fd_log = -1,
                               .callback_log = rdt_pqos_log,
                               .context_log = NULL,
    struct pqos_config pqos = {.fd_log = -1,
                               .callback_log = rdt_pqos_log,
                               .context_log = NULL,
-                             .verbose = 0};
+                             .verbose = 0,
+#ifdef LIBPQOS2
+                             .interface = PQOS_INTER_OS_RESCTRL_MON};
+  DEBUG(RDT_PLUGIN ": Initializing PQoS with RESCTRL interface");
+#else
+                             .interface = PQOS_INTER_MSR};
+  DEBUG(RDT_PLUGIN ": Initializing PQoS with MSR interface");
+#endif
  
    ret = pqos_init(&pqos);
  
    ret = pqos_init(&pqos);
+  DEBUG(RDT_PLUGIN ": PQoS initialization result: [%d]", ret);
+
+#ifdef LIBPQOS2
+  if (ret == PQOS_RETVAL_INTER) {
+    pqos.interface = PQOS_INTER_MSR;
+    DEBUG(RDT_PLUGIN ": Initializing PQoS with MSR interface");
+    ret = pqos_init(&pqos);
+    DEBUG(RDT_PLUGIN ": PQoS initialization result: [%d]", ret);
+  }
+#endif
+
    if (ret != PQOS_RETVAL_OK) {
      ERROR(RDT_PLUGIN ": Error initializing PQoS library!");
      goto rdt_preinit_error1;
    }
  
    if (ret != PQOS_RETVAL_OK) {
      ERROR(RDT_PLUGIN ": Error initializing PQoS library!");
      goto rdt_preinit_error1;
    }
  
+  g_interface = pqos.interface;
+
    ret = pqos_cap_get(&g_rdt->pqos_cap, &g_rdt->pqos_cpu);
    if (ret != PQOS_RETVAL_OK) {
      ERROR(RDT_PLUGIN ": Error retrieving PQoS capabilities.");
    ret = pqos_cap_get(&g_rdt->pqos_cap, &g_rdt->pqos_cpu);
    if (ret != PQOS_RETVAL_OK) {
      ERROR(RDT_PLUGIN ": Error retrieving PQoS capabilities.");
@@ -537,7 +1072,6 @@ rdt_preinit_error2:
    pqos_fini();
  
  rdt_preinit_error1:
    pqos_fini();
  
  rdt_preinit_error1:
-
    sfree(g_rdt);
  
    return -1;
    sfree(g_rdt);
  
    return -1;
@@ -556,7 +1090,7 @@ static int rdt_config(oconfig_item_t *ci) {
    for (int i = 0; i < ci->children_num; i++) {
      oconfig_item_t *child = ci->children + i;
  
    for (int i = 0; i < ci->children_num; i++) {
      oconfig_item_t *child = ci->children + i;
  
-    if (strcasecmp("Cores", child->key) == 0) {
+    if (strncasecmp("Cores", child->key, (size_t)strlen("Cores")) == 0) {
        if (rdt_config_cgroups(child) != 0) {
          g_state = CONFIGURATION_ERROR;
          /* if we return -1 at this point collectd
        if (rdt_config_cgroups(child) != 0) {
          g_state = CONFIGURATION_ERROR;
          /* if we return -1 at this point collectd
@@ -569,6 +1103,38 @@ static int rdt_config(oconfig_item_t *ci) {
  #if COLLECT_DEBUG
        rdt_dump_cgroups();
  #endif /* COLLECT_DEBUG */
  #if COLLECT_DEBUG
        rdt_dump_cgroups();
  #endif /* COLLECT_DEBUG */
+    } else if (strncasecmp("Processes", child->key,
+                           (size_t)strlen("Processes")) == 0) {
+#ifdef LIBPQOS2
+      if (g_interface != PQOS_INTER_OS_RESCTRL_MON) {
+        ERROR(RDT_PLUGIN ": Configuration parameter \"%s\" not supported. "
+                         "Resctrl monitoring is needed for PIDs monitoring.",
+              child->key);
+        g_state = CONFIGURATION_ERROR;
+        /* if we return -1 at this point collectd
+           reports a failure in configuration and
+           aborts
+         */
+        return 0;
+      }
+
+      if (rdt_config_ngroups(g_rdt, child) != 0) {
+        g_state = CONFIGURATION_ERROR;
+        /* if we return -1 at this point collectd
+           reports a failure in configuration and
+           aborts
+         */
+        return 0;
+      }
+
+#if COLLECT_DEBUG
+      rdt_dump_ngroups();
+#endif /* COLLECT_DEBUG */
+#else  /* !LIBPQOS2 */
+      ERROR(RDT_PLUGIN ": Configuration parameter \"%s\" not supported, please "
+                       "recompile collectd with libpqos version 2.0 or newer.",
+            child->key);
+#endif /* LIBPQOS2 */
      } else {
        ERROR(RDT_PLUGIN ": Unknown configuration parameter \"%s\".", child->key);
      }
      } else {
        ERROR(RDT_PLUGIN ": Unknown configuration parameter \"%s\".", child->key);
      }
@@ -577,103 +1143,106 @@ static int rdt_config(oconfig_item_t *ci) {
    return 0;
  }
  
    return 0;
  }
  
-static void rdt_submit_derive(char *cgroup, char *type, char *type_instance,
-                              derive_t value) {
-  value_list_t vl = VALUE_LIST_INIT;
+static int read_cores_data() {
  
  
-  vl.values = &(value_t){.derive = value};
-  vl.values_len = 1;
+  if (0 == g_rdt->cores.num_cgroups) {
+    DEBUG(RDT_PLUGIN ": read_cores_data: not configured - Cores read skipped");
+    return 0;
+  }
+  DEBUG(RDT_PLUGIN ": read_cores_data: Cores data poll");
  
  
-  sstrncpy(vl.plugin, RDT_PLUGIN, sizeof(vl.plugin));
-  snprintf(vl.plugin_instance, sizeof(vl.plugin_instance), "%s", cgroup);
-  sstrncpy(vl.type, type, sizeof(vl.type));
-  if (type_instance)
-    sstrncpy(vl.type_instance, type_instance, sizeof(vl.type_instance));
+  int ret =
+      pqos_mon_poll(&g_rdt->pcgroups[0], (unsigned)g_rdt->cores.num_cgroups);
+  if (ret != PQOS_RETVAL_OK) {
+    ERROR(RDT_PLUGIN ": read_cores_data: Failed to poll monitoring data for "
+                     "cores. Error [%d].",
+          ret);
+    return -1;
+  }
  
  
-  plugin_dispatch_values(&vl);
-}
+  for (size_t i = 0; i < g_rdt->cores.num_cgroups; i++) {
+    core_group_t *cgroup = g_rdt->cores.cgroups + i;
+    enum pqos_mon_event mbm_events =
+        (PQOS_MON_EVENT_LMEM_BW | PQOS_MON_EVENT_TMEM_BW |
+         PQOS_MON_EVENT_RMEM_BW);
  
  
-static void rdt_submit_gauge(char *cgroup, char *type, char *type_instance,
-                             gauge_t value) {
-  value_list_t vl = VALUE_LIST_INIT;
+    const struct pqos_event_values *pv = &g_rdt->pcgroups[i]->values;
  
  
-  vl.values = &(value_t){.gauge = value};
-  vl.values_len = 1;
+    /* Submit only monitored events data */
  
  
-  sstrncpy(vl.plugin, RDT_PLUGIN, sizeof(vl.plugin));
-  snprintf(vl.plugin_instance, sizeof(vl.plugin_instance), "%s", cgroup);
-  sstrncpy(vl.type, type, sizeof(vl.type));
-  if (type_instance)
-    sstrncpy(vl.type_instance, type_instance, sizeof(vl.type_instance));
+    if (g_rdt->events[i] & PQOS_MON_EVENT_L3_OCCUP)
+      rdt_submit_gauge(cgroup->desc, "bytes", "llc", pv->llc);
  
  
-  plugin_dispatch_values(&vl);
+    if (g_rdt->events[i] & PQOS_PERF_EVENT_IPC)
+      rdt_submit_gauge(cgroup->desc, "ipc", NULL, pv->ipc);
+
+    if (g_rdt->events[i] & mbm_events) {
+      rdt_submit_derive(cgroup->desc, "memory_bandwidth", "local",
+                        pv->mbm_local_delta);
+      rdt_submit_derive(cgroup->desc, "memory_bandwidth", "remote",
+                        pv->mbm_remote_delta);
+    }
+  }
+
+#if COLLECT_DEBUG
+  rdt_dump_cores_data();
+#endif /* COLLECT_DEBUG */
+
+  return 0;
  }
  
  static int rdt_read(__attribute__((unused)) user_data_t *ud) {
  }
  
  static int rdt_read(__attribute__((unused)) user_data_t *ud) {
-  int ret;
  
    if (g_rdt == NULL) {
      ERROR(RDT_PLUGIN ": rdt_read: plugin not initialized.");
      return -EINVAL;
    }
  
  
    if (g_rdt == NULL) {
      ERROR(RDT_PLUGIN ": rdt_read: plugin not initialized.");
      return -EINVAL;
    }
  
-  ret = pqos_mon_poll(&g_rdt->pgroups[0], (unsigned)g_rdt->num_groups);
-  if (ret != PQOS_RETVAL_OK) {
-    ERROR(RDT_PLUGIN ": Failed to poll monitoring data.");
-    return -1;
-  }
+  int cores_read_result = read_cores_data();
  
  
-#if COLLECT_DEBUG
-  rdt_dump_data();
-#endif /* COLLECT_DEBUG */
+#ifdef LIBPQOS2
+  int pids_read_result = read_pids_data();
+#endif /* LIBPQOS2 */
  
  
-  for (int i = 0; i < g_rdt->num_groups; i++) {
-    enum pqos_mon_event mbm_events =
-        (PQOS_MON_EVENT_LMEM_BW | PQOS_MON_EVENT_TMEM_BW |
-         PQOS_MON_EVENT_RMEM_BW);
+  if (0 != cores_read_result)
+    return cores_read_result;
  
  
-    const struct pqos_event_values *pv = &g_rdt->pgroups[i]->values;
+#ifdef LIBPQOS2
+  if (0 != pids_read_result)
+    return pids_read_result;
+#endif /* LIBPQOS2 */
  
  
-    /* Submit only monitored events data */
+  return 0;
+}
  
  
-    if (g_rdt->cgroups[i].events & PQOS_MON_EVENT_L3_OCCUP)
-      rdt_submit_gauge(g_rdt->cgroups[i].desc, "bytes", "llc", pv->llc);
+static void rdt_init_cores_monitoring() {
+  for (size_t i = 0; i < g_rdt->cores.num_cgroups; i++) {
+    core_group_t *cg = g_rdt->cores.cgroups + i;
  
  
-    if (g_rdt->cgroups[i].events & PQOS_PERF_EVENT_IPC)
-      rdt_submit_gauge(g_rdt->cgroups[i].desc, "ipc", NULL, pv->ipc);
+    int mon_start_result =
+        pqos_mon_start(cg->num_cores, cg->cores, g_rdt->events[i],
+                       (void *)cg->desc, g_rdt->pcgroups[i]);
  
  
-    if (g_rdt->cgroups[i].events & mbm_events) {
-      rdt_submit_derive(g_rdt->cgroups[i].desc, "memory_bandwidth", "local",
-                        pv->mbm_local_delta);
-      rdt_submit_derive(g_rdt->cgroups[i].desc, "memory_bandwidth", "remote",
-                        pv->mbm_remote_delta);
-    }
+    if (mon_start_result != PQOS_RETVAL_OK)
+      ERROR(RDT_PLUGIN
+            ": Error starting cores monitoring group %s (pqos status=%d)",
+            cg->desc, mon_start_result);
    }
    }
-
-  return 0;
  }
  
  static int rdt_init(void) {
  }
  
  static int rdt_init(void) {
-  int ret;
  
    if (g_state == CONFIGURATION_ERROR)
      return -1;
  
  
    if (g_state == CONFIGURATION_ERROR)
      return -1;
  
-  ret = rdt_preinit();
-  if (ret != 0)
-    return ret;
-
-  /* Start monitoring */
-  for (int i = 0; i < g_rdt->num_groups; i++) {
-    rdt_core_group_t *cg = &g_rdt->cgroups[i];
-
-    ret = pqos_mon_start(cg->num_cores, cg->cores, cg->events, (void *)cg->desc,
-                         g_rdt->pgroups[i]);
+  int rdt_preinint_result = rdt_preinit();
+  if (rdt_preinint_result != 0)
+    return rdt_preinint_result;
  
  
-    if (ret != PQOS_RETVAL_OK)
-      ERROR(RDT_PLUGIN ": Error starting monitoring group %s (pqos status=%d)",
-            cg->desc, ret);
-  }
+  rdt_init_cores_monitoring();
+#ifdef LIBPQOS2
+  rdt_init_pids_monitoring();
+#endif /* LIBPQOS2 */
  
    return 0;
  }
  
    return 0;
  }
@@ -686,16 +1255,24 @@ static int rdt_shutdown(void) {
    if (g_rdt == NULL)
      return 0;
  
    if (g_rdt == NULL)
      return 0;
  
-  /* Stop monitoring */
-  for (int i = 0; i < g_rdt->num_groups; i++) {
-    pqos_mon_stop(g_rdt->pgroups[i]);
+  /* Stop monitoring cores */
+  for (size_t i = 0; i < g_rdt->cores.num_cgroups; i++) {
+    pqos_mon_stop(g_rdt->pcgroups[i]);
    }
  
    }
  
+/* Stop pids monitoring */
+#ifdef LIBPQOS2
+  for (size_t i = 0; i < g_rdt->num_ngroups; i++)
+    pqos_mon_stop(g_rdt->pngroups[i]);
+#endif
+
    ret = pqos_fini();
    if (ret != PQOS_RETVAL_OK)
      ERROR(RDT_PLUGIN ": Error shutting down PQoS library.");
    ret = pqos_fini();
    if (ret != PQOS_RETVAL_OK)
      ERROR(RDT_PLUGIN ": Error shutting down PQoS library.");
-
    rdt_free_cgroups();
    rdt_free_cgroups();
+#ifdef LIBPQOS2
+  rdt_free_ngroups(g_rdt);
+#endif /* LIBPQOS2 */
    sfree(g_rdt);
  
    return 0;
    sfree(g_rdt);
  
    return 0;