5102 lines
241 KiB
Diff
5102 lines
241 KiB
Diff
From e206501e56a364efa130f9a1c691f61d8cf0bd1a Mon Sep 17 00:00:00 2001
|
|
From: Rui Matos <tiagomatos@gmail.com>
|
|
Date: Thu, 31 Aug 2017 17:32:43 +0200
|
|
Subject: [PATCH] housekeeping: Add a GPU memory usage notification
|
|
|
|
Only works on supported nvidia GPUs and nvidia binary driver
|
|
combinations.
|
|
---
|
|
meson.build | 1 +
|
|
plugins/housekeeping/gsd-gpu-mem.c | 261 +
|
|
plugins/housekeeping/gsd-gpu-mem.h | 33 +
|
|
.../housekeeping/gsd-housekeeping-manager.c | 7 +
|
|
plugins/housekeeping/meson.build | 7 +-
|
|
plugins/housekeeping/nvml/include/nvml.h | 4447 +++++++++++++++++
|
|
6 files changed, 4754 insertions(+), 2 deletions(-)
|
|
create mode 100644 plugins/housekeeping/gsd-gpu-mem.c
|
|
create mode 100644 plugins/housekeeping/gsd-gpu-mem.h
|
|
create mode 100644 plugins/housekeeping/nvml/include/nvml.h
|
|
|
|
diff --git a/meson.build b/meson.build
|
|
index a352d04f..1632ea05 100644
|
|
--- a/meson.build
|
|
+++ b/meson.build
|
|
@@ -76,60 +76,61 @@ endif
|
|
|
|
# Workaround for meson's bug
|
|
# https://github.com/mesonbuild/meson/pull/1896
|
|
if get_option('b_ndebug') == true
|
|
common_flags += ['-DG_DISABLE_ASSERT']
|
|
endif
|
|
|
|
add_project_arguments(common_flags + compiler_flags, language: 'c')
|
|
|
|
glib_dep = dependency('glib-2.0', version: '>= 2.56')
|
|
colord_dep = dependency('colord', version: '>= 1.0.2')
|
|
geocode_glib_dep = dependency('geocode-glib-1.0', version: '>= 3.10.0')
|
|
gio_dep = dependency('gio-2.0', version: '>= 2.53.0')
|
|
gio_unix_dep = dependency('gio-unix-2.0')
|
|
gnome_desktop_dep = dependency('gnome-desktop-3.0', version: '>= 3.11.1')
|
|
gsettings_desktop_dep = dependency('gsettings-desktop-schemas', version: '>= 3.27.90')
|
|
gtk_dep = dependency('gtk+-3.0', version: '>= 3.15.3')
|
|
gtk_x11_dep = dependency('gtk+-x11-3.0')
|
|
gweather_dep = dependency('gweather-3.0', version: '>= 3.9.5')
|
|
lcms_dep = dependency('lcms2', version: '>= 2.2')
|
|
libcanberra_gtk_dep = dependency('libcanberra-gtk3')
|
|
libgeoclue_dep = dependency('libgeoclue-2.0', version: '>= 2.3.1')
|
|
libnotify_dep = dependency('libnotify', version: '>= 0.7.3')
|
|
libpulse_mainloop_glib_dep = dependency('libpulse-mainloop-glib', version: '>= 2.0')
|
|
pango_dep = dependency('pango', version: '>= 1.20.0')
|
|
polkit_gobject_dep = dependency('polkit-gobject-1', version: '>= 0.103')
|
|
upower_glib_dep = dependency('upower-glib', version: '>= 0.99.0')
|
|
x11_dep = dependency('x11')
|
|
|
|
m_dep = cc.find_library('m')
|
|
+dl_dep = cc.find_library('dl')
|
|
|
|
# ALSA integration (default enabled)
|
|
enable_alsa = get_option('alsa')
|
|
assert(enable_alsa or not host_is_linux, 'ALSA is not optional on Linux platforms')
|
|
|
|
libgvc = subproject(
|
|
'gvc',
|
|
default_options: [
|
|
'static=true',
|
|
'alsa=' + enable_alsa.to_string()
|
|
]
|
|
)
|
|
libgvc_dep = libgvc.get_variable('libgvc_dep')
|
|
|
|
# GUdev integration (default enabled)
|
|
enable_gudev = get_option('gudev')
|
|
if enable_gudev
|
|
gudev_dep = dependency('gudev-1.0')
|
|
endif
|
|
config_h.set10('HAVE_GUDEV', enable_gudev)
|
|
if host_is_linux
|
|
assert(enable_gudev, 'GUdev is not optional on Linux platforms')
|
|
endif
|
|
|
|
has_timerfd_create = cc.has_function('timerfd_create')
|
|
config_h.set10('HAVE_TIMERFD', has_timerfd_create)
|
|
|
|
# Check for wayland dependencies
|
|
enable_wayland = get_option('wayland')
|
|
if enable_wayland
|
|
diff --git a/plugins/housekeeping/gsd-gpu-mem.c b/plugins/housekeeping/gsd-gpu-mem.c
|
|
new file mode 100644
|
|
index 00000000..a76579b6
|
|
--- /dev/null
|
|
+++ b/plugins/housekeeping/gsd-gpu-mem.c
|
|
@@ -0,0 +1,261 @@
|
|
+/*
|
|
+ * Copyright (C) 2017 Red Hat, Inc.
|
|
+ *
|
|
+ * This program is free software; you can redistribute it and/or modify
|
|
+ * it under the terms of the GNU General Public License as published by
|
|
+ * the Free Software Foundation; either version 2 of the License, or
|
|
+ * (at your option) any later version.
|
|
+ *
|
|
+ * This program is distributed in the hope that it will be useful,
|
|
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
+ * GNU General Public License for more details.
|
|
+ *
|
|
+ * You should have received a copy of the GNU General Public License
|
|
+ * along with this program; if not, write to the Free Software
|
|
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
+ *
|
|
+ */
|
|
+
|
|
+#include <glib.h>
|
|
+#include <dlfcn.h>
|
|
+#include <math.h>
|
|
+#include "nvml/include/nvml.h"
|
|
+
|
|
+typedef nvmlReturn_t (*nvml_init_t) (void);
|
|
+static nvml_init_t nvml_init;
|
|
+typedef nvmlReturn_t (*nvml_device_get_handle_by_index_t) (unsigned int, nvmlDevice_t *);
|
|
+static nvml_device_get_handle_by_index_t nvml_device_get_handle_by_index;
|
|
+typedef nvmlReturn_t (*nvml_device_get_memory_info_t) (nvmlDevice_t, nvmlMemory_t *);
|
|
+static nvml_device_get_memory_info_t nvml_device_get_memory_info;
|
|
+typedef const char* (*nvml_error_string_t) (nvmlReturn_t);
|
|
+static nvml_error_string_t nvml_error_string;
|
|
+static void *nvml_handle = NULL;
|
|
+static gboolean nvml_loaded = FALSE;
|
|
+
|
|
+static gboolean
|
|
+nvml_load (void)
|
|
+{
|
|
+ char *error;
|
|
+
|
|
+ if (nvml_loaded)
|
|
+ goto out;
|
|
+ nvml_loaded = TRUE;
|
|
+
|
|
+ nvml_handle = dlopen ("libnvidia-ml.so", RTLD_LAZY);
|
|
+ error = dlerror();
|
|
+ if (!nvml_handle)
|
|
+ {
|
|
+ g_warning ("Loading NVML: %s", error);
|
|
+ goto out;
|
|
+ }
|
|
+
|
|
+ nvml_init = (nvml_init_t) dlsym (nvml_handle, "nvmlInit");
|
|
+ nvml_device_get_handle_by_index = (nvml_device_get_handle_by_index_t) dlsym (nvml_handle, "nvmlDeviceGetHandleByIndex");
|
|
+ nvml_device_get_memory_info = (nvml_device_get_memory_info_t) dlsym (nvml_handle, "nvmlDeviceGetMemoryInfo");
|
|
+ nvml_error_string = (nvml_error_string_t) dlsym (nvml_handle, "nvmlErrorString");
|
|
+ error = dlerror();
|
|
+ if (error)
|
|
+ {
|
|
+ g_warning ("Loading NVML: %s", error);
|
|
+ goto cleanup;
|
|
+ }
|
|
+ goto out;
|
|
+
|
|
+ cleanup:
|
|
+ dlclose (nvml_handle);
|
|
+ nvml_handle = NULL;
|
|
+ out:
|
|
+ return nvml_handle != NULL;
|
|
+}
|
|
+
|
|
+static nvmlReturn_t nvml_status = NVML_ERROR_UNINITIALIZED;
|
|
+static nvmlDevice_t nvml_device = NULL;
|
|
+
|
|
+static nvmlReturn_t
|
|
+nvml_warn (nvmlReturn_t rcode, const gchar *prefix)
|
|
+{
|
|
+ if (rcode != NVML_SUCCESS)
|
|
+ g_warning ("%s: %s", prefix, nvml_error_string (rcode));
|
|
+ return rcode;
|
|
+}
|
|
+
|
|
+static gboolean
|
|
+nvml_ready (void)
|
|
+{
|
|
+ if (!nvml_load ())
|
|
+ return FALSE;
|
|
+
|
|
+ if (nvml_status == NVML_ERROR_UNINITIALIZED)
|
|
+ {
|
|
+ nvml_status = nvml_warn (nvml_init (), "Initializing NVML");
|
|
+ if (nvml_status == NVML_SUCCESS)
|
|
+ nvml_warn (nvml_device_get_handle_by_index (0, &nvml_device), "Getting NVML device 0");
|
|
+ }
|
|
+
|
|
+ return nvml_status == NVML_SUCCESS && nvml_device != NULL;
|
|
+}
|
|
+
|
|
+static void
|
|
+nvml_read_mem_info (nvmlMemory_t *mem_info)
|
|
+{
|
|
+ if (!nvml_ready ())
|
|
+ return;
|
|
+
|
|
+ nvml_device_get_memory_info (nvml_device, mem_info);
|
|
+}
|
|
+
|
|
+
|
|
+#include <gio/gdesktopappinfo.h>
|
|
+#include <libnotify/notify.h>
|
|
+#include "gsd-gpu-mem.h"
|
|
+
|
|
+#define POLLING_INTERVAL 30
|
|
+#define MEM_USAGE_NOTIFY_THRESHOLD 0.80
|
|
+
|
|
+struct _GsdGpuMem
|
|
+{
|
|
+ GObject parent_instance;
|
|
+
|
|
+ guint timeout_id;
|
|
+
|
|
+ GDesktopAppInfo *sysmon_app_info;
|
|
+ NotifyNotification *notification;
|
|
+};
|
|
+
|
|
+G_DEFINE_TYPE (GsdGpuMem, gsd_gpu_mem, G_TYPE_OBJECT)
|
|
+
|
|
+static void
|
|
+clear_timeout (GsdGpuMem *self)
|
|
+{
|
|
+ if (self->timeout_id != 0)
|
|
+ {
|
|
+ g_source_remove (self->timeout_id);
|
|
+ self->timeout_id = 0;
|
|
+ }
|
|
+}
|
|
+
|
|
+static void
|
|
+notification_closed (GsdGpuMem *self)
|
|
+{
|
|
+ g_clear_object (&self->notification);
|
|
+}
|
|
+
|
|
+static void
|
|
+unnotify (GsdGpuMem *self)
|
|
+{
|
|
+ if (!self->notification)
|
|
+ return;
|
|
+
|
|
+ notify_notification_close (self->notification, NULL);
|
|
+}
|
|
+
|
|
+static void
|
|
+ignore_callback (NotifyNotification *n,
|
|
+ const char *a,
|
|
+ GsdGpuMem *self)
|
|
+{
|
|
+ unnotify (self);
|
|
+ clear_timeout (self);
|
|
+}
|
|
+
|
|
+static void
|
|
+examine_callback (NotifyNotification *n,
|
|
+ const char *a,
|
|
+ GsdGpuMem *self)
|
|
+
|
|
+{
|
|
+ unnotify (self);
|
|
+ g_app_info_launch (G_APP_INFO (self->sysmon_app_info), NULL, NULL, NULL);
|
|
+}
|
|
+
|
|
+static void
|
|
+notify (GsdGpuMem *self, double mem_usage)
|
|
+{
|
|
+ const gchar *summary = "Running low on GPU memory";
|
|
+ const gchar *icon_name = "utilities-system-monitor-symbolic";
|
|
+ g_autofree gchar *body = g_strdup_printf ("GPU memory usage is at %d%%. "
|
|
+ "You may free up some memory by closing some applications.",
|
|
+ (int) round (mem_usage * 100));
|
|
+ if (self->notification)
|
|
+ {
|
|
+ notify_notification_update (self->notification, summary, body, icon_name);
|
|
+ notify_notification_show (self->notification, NULL);
|
|
+ return;
|
|
+ }
|
|
+
|
|
+ self->notification = notify_notification_new (summary, body, icon_name);
|
|
+ g_signal_connect_object (self->notification, "closed",
|
|
+ G_CALLBACK (notification_closed),
|
|
+ self, G_CONNECT_SWAPPED);
|
|
+
|
|
+ notify_notification_set_app_name (self->notification, "GPU memory");
|
|
+
|
|
+ notify_notification_add_action (self->notification,
|
|
+ "ignore",
|
|
+ "Ignore",
|
|
+ (NotifyActionCallback) ignore_callback,
|
|
+ self, NULL);
|
|
+
|
|
+ if (self->sysmon_app_info)
|
|
+ notify_notification_add_action (self->notification,
|
|
+ "examine",
|
|
+ "Examine",
|
|
+ (NotifyActionCallback) examine_callback,
|
|
+ self, NULL);
|
|
+
|
|
+ notify_notification_show (self->notification, NULL);
|
|
+}
|
|
+
|
|
+static gboolean
|
|
+poll_gpu_memory (gpointer user_data)
|
|
+{
|
|
+ GsdGpuMem *self = user_data;
|
|
+ nvmlMemory_t mem_info = { 0 };
|
|
+ double mem_usage = 0.0;
|
|
+
|
|
+ nvml_read_mem_info (&mem_info);
|
|
+ if (mem_info.total > 0)
|
|
+ mem_usage = (double) mem_info.used / mem_info.total;
|
|
+
|
|
+ if (mem_usage > MEM_USAGE_NOTIFY_THRESHOLD)
|
|
+ {
|
|
+ notify (self, mem_usage);
|
|
+ }
|
|
+ else
|
|
+ {
|
|
+ unnotify (self);
|
|
+ }
|
|
+
|
|
+ return G_SOURCE_CONTINUE;
|
|
+}
|
|
+
|
|
+static void
|
|
+gsd_gpu_mem_init (GsdGpuMem *self)
|
|
+{
|
|
+ if (!nvml_ready ())
|
|
+ return;
|
|
+
|
|
+ self->timeout_id = g_timeout_add_seconds (POLLING_INTERVAL, poll_gpu_memory, self);
|
|
+ self->sysmon_app_info = g_desktop_app_info_new ("gnome-system-monitor.desktop");
|
|
+}
|
|
+
|
|
+static void
|
|
+gsd_gpu_mem_finalize (GObject *object)
|
|
+{
|
|
+ GsdGpuMem *self = GSD_GPU_MEM (object);
|
|
+
|
|
+ clear_timeout (self);
|
|
+ g_clear_object (&self->sysmon_app_info);
|
|
+ unnotify (self);
|
|
+
|
|
+ G_OBJECT_CLASS (gsd_gpu_mem_parent_class)->finalize (object);
|
|
+}
|
|
+
|
|
+static void
|
|
+gsd_gpu_mem_class_init (GsdGpuMemClass *klass)
|
|
+{
|
|
+ GObjectClass *gobject_class = G_OBJECT_CLASS (klass);
|
|
+
|
|
+ gobject_class->finalize = gsd_gpu_mem_finalize;
|
|
+}
|
|
diff --git a/plugins/housekeeping/gsd-gpu-mem.h b/plugins/housekeeping/gsd-gpu-mem.h
|
|
new file mode 100644
|
|
index 00000000..f8967879
|
|
--- /dev/null
|
|
+++ b/plugins/housekeeping/gsd-gpu-mem.h
|
|
@@ -0,0 +1,33 @@
|
|
+/*
|
|
+ * Copyright (C) 2017 Red Hat, Inc.
|
|
+ *
|
|
+ * This program is free software; you can redistribute it and/or modify
|
|
+ * it under the terms of the GNU General Public License as published by
|
|
+ * the Free Software Foundation; either version 2 of the License, or
|
|
+ * (at your option) any later version.
|
|
+ *
|
|
+ * This program is distributed in the hope that it will be useful,
|
|
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
+ * GNU General Public License for more details.
|
|
+ *
|
|
+ * You should have received a copy of the GNU General Public License
|
|
+ * along with this program; if not, write to the Free Software
|
|
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
+ *
|
|
+ */
|
|
+
|
|
+#ifndef _GSD_GPU_MEM_H
|
|
+#define _GSD_GPU_MEM_H
|
|
+
|
|
+#include <glib-object.h>
|
|
+
|
|
+G_BEGIN_DECLS
|
|
+
|
|
+#define GSD_TYPE_GPU_MEM (gsd_gpu_mem_get_type ())
|
|
+G_DECLARE_FINAL_TYPE (GsdGpuMem, gsd_gpu_mem,
|
|
+ GSD, GPU_MEM, GObject)
|
|
+
|
|
+G_END_DECLS
|
|
+
|
|
+#endif /* _GSD_GPU_MEM_H */
|
|
diff --git a/plugins/housekeeping/gsd-housekeeping-manager.c b/plugins/housekeeping/gsd-housekeeping-manager.c
|
|
index 5ace4179..1bd53061 100644
|
|
--- a/plugins/housekeeping/gsd-housekeeping-manager.c
|
|
+++ b/plugins/housekeeping/gsd-housekeeping-manager.c
|
|
@@ -1,89 +1,92 @@
|
|
/*
|
|
* Copyright (C) 2008 Michael J. Chudobiak <mjc@avtechpulse.com>
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, see <http://www.gnu.org/licenses/>.
|
|
*
|
|
*/
|
|
|
|
#include "config.h"
|
|
|
|
#include <gio/gio.h>
|
|
#include <glib/gstdio.h>
|
|
#include <string.h>
|
|
#include <libnotify/notify.h>
|
|
|
|
#include "gnome-settings-profile.h"
|
|
#include "gsd-housekeeping-manager.h"
|
|
#include "gsd-disk-space.h"
|
|
+#include "gsd-gpu-mem.h"
|
|
|
|
|
|
/* General */
|
|
#define INTERVAL_ONCE_A_DAY 24*60*60
|
|
#define INTERVAL_TWO_MINUTES 2*60
|
|
|
|
/* Thumbnail cleaner */
|
|
#define THUMB_PREFIX "org.gnome.desktop.thumbnail-cache"
|
|
|
|
#define THUMB_AGE_KEY "maximum-age"
|
|
#define THUMB_SIZE_KEY "maximum-size"
|
|
|
|
#define GSD_HOUSEKEEPING_DBUS_PATH "/org/gnome/SettingsDaemon/Housekeeping"
|
|
|
|
static const gchar introspection_xml[] =
|
|
"<node>"
|
|
" <interface name='org.gnome.SettingsDaemon.Housekeeping'>"
|
|
" <method name='EmptyTrash'/>"
|
|
" <method name='RemoveTempFiles'/>"
|
|
" </interface>"
|
|
"</node>";
|
|
|
|
struct GsdHousekeepingManagerPrivate {
|
|
GSettings *settings;
|
|
guint long_term_cb;
|
|
guint short_term_cb;
|
|
|
|
GDBusNodeInfo *introspection_data;
|
|
GDBusConnection *connection;
|
|
GCancellable *bus_cancellable;
|
|
guint name_id;
|
|
+
|
|
+ GsdGpuMem *gpu_mem_notifier;
|
|
};
|
|
|
|
#define GSD_HOUSEKEEPING_MANAGER_GET_PRIVATE(o) (G_TYPE_INSTANCE_GET_PRIVATE ((o), GSD_TYPE_HOUSEKEEPING_MANAGER, GsdHousekeepingManagerPrivate))
|
|
|
|
static void gsd_housekeeping_manager_class_init (GsdHousekeepingManagerClass *klass);
|
|
static void gsd_housekeeping_manager_init (GsdHousekeepingManager *housekeeping_manager);
|
|
|
|
G_DEFINE_TYPE (GsdHousekeepingManager, gsd_housekeeping_manager, G_TYPE_OBJECT)
|
|
|
|
static gpointer manager_object = NULL;
|
|
|
|
|
|
typedef struct {
|
|
glong now;
|
|
glong max_age;
|
|
goffset total_size;
|
|
goffset max_size;
|
|
} PurgeData;
|
|
|
|
|
|
typedef struct {
|
|
time_t mtime;
|
|
char *path;
|
|
glong size;
|
|
} ThumbData;
|
|
|
|
|
|
static void
|
|
thumb_data_free (gpointer data)
|
|
{
|
|
@@ -384,101 +387,105 @@ gsd_housekeeping_manager_start (GsdHousekeepingManager *manager,
|
|
{
|
|
gchar *dir;
|
|
|
|
g_debug ("Starting housekeeping manager");
|
|
gnome_settings_profile_start (NULL);
|
|
|
|
/* Create ~/.local/ as early as possible */
|
|
(void) g_mkdir_with_parents(g_get_user_data_dir (), 0700);
|
|
|
|
/* Create ~/.local/share/applications/, see
|
|
* https://bugzilla.gnome.org/show_bug.cgi?id=703048 */
|
|
dir = g_build_filename (g_get_user_data_dir (), "applications", NULL);
|
|
(void) g_mkdir (dir, 0700);
|
|
g_free (dir);
|
|
|
|
gsd_ldsm_setup (FALSE);
|
|
|
|
manager->priv->settings = g_settings_new (THUMB_PREFIX);
|
|
g_signal_connect (G_OBJECT (manager->priv->settings), "changed",
|
|
G_CALLBACK (settings_changed_callback), manager);
|
|
|
|
/* Clean once, a few minutes after start-up */
|
|
do_cleanup_soon (manager);
|
|
|
|
/* Clean periodically, on a daily basis. */
|
|
manager->priv->long_term_cb = g_timeout_add_seconds (INTERVAL_ONCE_A_DAY,
|
|
(GSourceFunc) do_cleanup,
|
|
manager);
|
|
g_source_set_name_by_id (manager->priv->long_term_cb, "[gnome-settings-daemon] do_cleanup");
|
|
|
|
+ manager->priv->gpu_mem_notifier = g_object_new (GSD_TYPE_GPU_MEM, NULL);
|
|
+
|
|
gnome_settings_profile_end (NULL);
|
|
|
|
return TRUE;
|
|
}
|
|
|
|
void
|
|
gsd_housekeeping_manager_stop (GsdHousekeepingManager *manager)
|
|
{
|
|
GsdHousekeepingManagerPrivate *p = manager->priv;
|
|
|
|
g_debug ("Stopping housekeeping manager");
|
|
|
|
if (manager->priv->name_id != 0) {
|
|
g_bus_unown_name (manager->priv->name_id);
|
|
manager->priv->name_id = 0;
|
|
}
|
|
|
|
g_clear_object (&p->bus_cancellable);
|
|
g_clear_pointer (&p->introspection_data, g_dbus_node_info_unref);
|
|
g_clear_object (&p->connection);
|
|
|
|
if (p->short_term_cb) {
|
|
g_source_remove (p->short_term_cb);
|
|
p->short_term_cb = 0;
|
|
}
|
|
|
|
if (p->long_term_cb) {
|
|
g_source_remove (p->long_term_cb);
|
|
p->long_term_cb = 0;
|
|
|
|
/* Do a clean-up on shutdown if and only if the size or age
|
|
limits have been set to paranoid levels (zero) */
|
|
if ((g_settings_get_int (p->settings, THUMB_AGE_KEY) == 0) ||
|
|
(g_settings_get_int (p->settings, THUMB_SIZE_KEY) == 0)) {
|
|
do_cleanup (manager);
|
|
}
|
|
|
|
}
|
|
|
|
g_clear_object (&p->settings);
|
|
gsd_ldsm_clean ();
|
|
+
|
|
+ g_clear_object (&p->gpu_mem_notifier);
|
|
}
|
|
|
|
static void
|
|
gsd_housekeeping_manager_finalize (GObject *object)
|
|
{
|
|
gsd_housekeeping_manager_stop (GSD_HOUSEKEEPING_MANAGER (object));
|
|
|
|
G_OBJECT_CLASS (gsd_housekeeping_manager_parent_class)->finalize (object);
|
|
}
|
|
|
|
static void
|
|
gsd_housekeeping_manager_class_init (GsdHousekeepingManagerClass *klass)
|
|
{
|
|
GObjectClass *object_class = G_OBJECT_CLASS (klass);
|
|
|
|
object_class->finalize = gsd_housekeeping_manager_finalize;
|
|
|
|
notify_init ("gnome-settings-daemon");
|
|
|
|
g_type_class_add_private (klass, sizeof (GsdHousekeepingManagerPrivate));
|
|
}
|
|
|
|
static void
|
|
gsd_housekeeping_manager_init (GsdHousekeepingManager *manager)
|
|
{
|
|
manager->priv = GSD_HOUSEKEEPING_MANAGER_GET_PRIVATE (manager);
|
|
}
|
|
|
|
GsdHousekeepingManager *
|
|
gsd_housekeeping_manager_new (void)
|
|
diff --git a/plugins/housekeeping/meson.build b/plugins/housekeeping/meson.build
|
|
index a0b4ca5f..0b690cdb 100644
|
|
--- a/plugins/housekeeping/meson.build
|
|
+++ b/plugins/housekeeping/meson.build
|
|
@@ -1,41 +1,44 @@
|
|
common_files = files(
|
|
'gsd-disk-space.c',
|
|
- 'gsd-disk-space-helper.c'
|
|
+ 'gsd-disk-space-helper.c',
|
|
+ 'gsd-gpu-mem.c'
|
|
)
|
|
|
|
sources = common_files + files(
|
|
'gsd-housekeeping-manager.c',
|
|
'main.c'
|
|
)
|
|
|
|
deps = plugins_deps + [
|
|
gio_unix_dep,
|
|
gtk_dep,
|
|
- libnotify_dep
|
|
+ libnotify_dep,
|
|
+ m_dep,
|
|
+ dl_dep
|
|
]
|
|
|
|
executable(
|
|
'gsd-' + plugin_name,
|
|
sources,
|
|
include_directories: [top_inc, common_inc],
|
|
dependencies: deps,
|
|
c_args: cflags,
|
|
install: true,
|
|
install_rpath: gsd_pkglibdir,
|
|
install_dir: gsd_libexecdir
|
|
)
|
|
|
|
programs = [
|
|
'gsd-disk-space-test',
|
|
'gsd-empty-trash-test',
|
|
'gsd-purge-temp-test'
|
|
]
|
|
|
|
foreach program: programs
|
|
executable(
|
|
program,
|
|
common_files + [program + '.c'],
|
|
include_directories: top_inc,
|
|
dependencies: deps
|
|
)
|
|
endforeach
|
|
diff --git a/plugins/housekeeping/nvml/include/nvml.h b/plugins/housekeeping/nvml/include/nvml.h
|
|
new file mode 100644
|
|
index 00000000..f151007e
|
|
--- /dev/null
|
|
+++ b/plugins/housekeeping/nvml/include/nvml.h
|
|
@@ -0,0 +1,4447 @@
|
|
+/*
|
|
+ * Copyright 1993-2016 NVIDIA Corporation. All rights reserved.
|
|
+ *
|
|
+ * NOTICE TO USER:
|
|
+ *
|
|
+ * This source code is subject to NVIDIA ownership rights under U.S. and
|
|
+ * international Copyright laws. Users and possessors of this source code
|
|
+ * are hereby granted a nonexclusive, royalty-free license to use this code
|
|
+ * in individual and commercial software.
|
|
+ *
|
|
+ * NVIDIA MAKES NO REPRESENTATION ABOUT THE SUITABILITY OF THIS SOURCE
|
|
+ * CODE FOR ANY PURPOSE. IT IS PROVIDED "AS IS" WITHOUT EXPRESS OR
|
|
+ * IMPLIED WARRANTY OF ANY KIND. NVIDIA DISCLAIMS ALL WARRANTIES WITH
|
|
+ * REGARD TO THIS SOURCE CODE, INCLUDING ALL IMPLIED WARRANTIES OF
|
|
+ * MERCHANTABILITY, NONINFRINGEMENT, AND FITNESS FOR A PARTICULAR PURPOSE.
|
|
+ * IN NO EVENT SHALL NVIDIA BE LIABLE FOR ANY SPECIAL, INDIRECT, INCIDENTAL,
|
|
+ * OR CONSEQUENTIAL DAMAGES, OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS
|
|
+ * OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE
|
|
+ * OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE
|
|
+ * OR PERFORMANCE OF THIS SOURCE CODE.
|
|
+ *
|
|
+ * U.S. Government End Users. This source code is a "commercial item" as
|
|
+ * that term is defined at 48 C.F.R. 2.101 (OCT 1995), consisting of
|
|
+ * "commercial computer software" and "commercial computer software
|
|
+ * documentation" as such terms are used in 48 C.F.R. 12.212 (SEPT 1995)
|
|
+ * and is provided to the U.S. Government only as a commercial end item.
|
|
+ * Consistent with 48 C.F.R.12.212 and 48 C.F.R. 227.7202-1 through
|
|
+ * 227.7202-4 (JUNE 1995), all U.S. Government End Users acquire the
|
|
+ * source code with only those rights set forth herein.
|
|
+ *
|
|
+ * Any use of this source code in individual and commercial software must
|
|
+ * include, in the user documentation and internal comments to the code,
|
|
+ * the above Disclaimer and U.S. Government End Users Notice.
|
|
+ */
|
|
+
|
|
+/*
|
|
+NVML API Reference
|
|
+
|
|
+The NVIDIA Management Library (NVML) is a C-based programmatic interface for monitoring and
|
|
+managing various states within NVIDIA Tesla &tm; GPUs. It is intended to be a platform for building
|
|
+3rd party applications, and is also the underlying library for the NVIDIA-supported nvidia-smi
|
|
+tool. NVML is thread-safe so it is safe to make simultaneous NVML calls from multiple threads.
|
|
+
|
|
+API Documentation
|
|
+
|
|
+Supported platforms:
|
|
+- Windows: Windows Server 2008 R2 64bit, Windows Server 2012 R2 64bit, Windows 7 64bit, Windows 8 64bit, Windows 10 64bit
|
|
+- Linux: 32-bit and 64-bit
|
|
+- Hypervisors: Windows Server 2008R2/2012 Hyper-V 64bit, Citrix XenServer 6.2 SP1+, VMware ESX 5.1/5.5
|
|
+
|
|
+Supported products:
|
|
+- Full Support
|
|
+ - All Tesla products, starting with the Fermi architecture
|
|
+ - All Quadro products, starting with the Fermi architecture
|
|
+ - All GRID products, starting with the Kepler architecture
|
|
+ - Selected GeForce Titan products
|
|
+- Limited Support
|
|
+ - All Geforce products, starting with the Fermi architecture
|
|
+
|
|
+The NVML library can be found at \%ProgramW6432\%\\"NVIDIA Corporation"\\NVSMI\\ on Windows. It is
|
|
+not be added to the system path by default. To dynamically link to NVML, add this path to the PATH
|
|
+environmental variable. To dynamically load NVML, call LoadLibrary with this path.
|
|
+
|
|
+On Linux the NVML library will be found on the standard library path. For 64 bit Linux, both the 32 bit
|
|
+and 64 bit NVML libraries will be installed.
|
|
+
|
|
+Online documentation for this library is available at http://docs.nvidia.com/deploy/nvml-api/index.html
|
|
+*/
|
|
+
|
|
+#ifndef __nvml_nvml_h__
|
|
+#define __nvml_nvml_h__
|
|
+
|
|
+#ifdef __cplusplus
|
|
+extern "C" {
|
|
+#endif
|
|
+
|
|
+/*
|
|
+ * On Windows, set up methods for DLL export
|
|
+ * define NVML_STATIC_IMPORT when using nvml_loader library
|
|
+ */
|
|
+#if defined _WINDOWS
|
|
+ #if !defined NVML_STATIC_IMPORT
|
|
+ #if defined NVML_LIB_EXPORT
|
|
+ #define DECLDIR __declspec(dllexport)
|
|
+ #else
|
|
+ #define DECLDIR __declspec(dllimport)
|
|
+ #endif
|
|
+ #else
|
|
+ #define DECLDIR
|
|
+ #endif
|
|
+#else
|
|
+ #define DECLDIR
|
|
+#endif
|
|
+
|
|
+/**
|
|
+ * NVML API versioning support
|
|
+ */
|
|
+#define NVML_API_VERSION 8
|
|
+#define NVML_API_VERSION_STR "8"
|
|
+#define nvmlInit nvmlInit_v2
|
|
+#define nvmlDeviceGetPciInfo nvmlDeviceGetPciInfo_v2
|
|
+#define nvmlDeviceGetCount nvmlDeviceGetCount_v2
|
|
+#define nvmlDeviceGetHandleByIndex nvmlDeviceGetHandleByIndex_v2
|
|
+#define nvmlDeviceGetHandleByPciBusId nvmlDeviceGetHandleByPciBusId_v2
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlDeviceStructs Device Structs
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Special constant that some fields take when they are not available.
|
|
+ * Used when only part of the struct is not available.
|
|
+ *
|
|
+ * Each structure explicitly states when to check for this value.
|
|
+ */
|
|
+#define NVML_VALUE_NOT_AVAILABLE (-1)
|
|
+
|
|
+typedef struct nvmlDevice_st* nvmlDevice_t;
|
|
+
|
|
+/**
|
|
+ * Buffer size guaranteed to be large enough for pci bus id
|
|
+ */
|
|
+#define NVML_DEVICE_PCI_BUS_ID_BUFFER_SIZE 16
|
|
+
|
|
+/**
|
|
+ * PCI information about a GPU device.
|
|
+ */
|
|
+typedef struct nvmlPciInfo_st
|
|
+{
|
|
+ char busId[NVML_DEVICE_PCI_BUS_ID_BUFFER_SIZE]; //!< The tuple domain:bus:device.function PCI identifier (& NULL terminator)
|
|
+ unsigned int domain; //!< The PCI domain on which the device's bus resides, 0 to 0xffff
|
|
+ unsigned int bus; //!< The bus on which the device resides, 0 to 0xff
|
|
+ unsigned int device; //!< The device's id on the bus, 0 to 31
|
|
+ unsigned int pciDeviceId; //!< The combined 16-bit device id and 16-bit vendor id
|
|
+
|
|
+ // Added in NVML 2.285 API
|
|
+ unsigned int pciSubSystemId; //!< The 32-bit Sub System Device ID
|
|
+
|
|
+ // NVIDIA reserved for internal use only
|
|
+ unsigned int reserved0;
|
|
+ unsigned int reserved1;
|
|
+ unsigned int reserved2;
|
|
+ unsigned int reserved3;
|
|
+} nvmlPciInfo_t;
|
|
+
|
|
+/**
|
|
+ * Detailed ECC error counts for a device.
|
|
+ *
|
|
+ * @deprecated Different GPU families can have different memory error counters
|
|
+ * See \ref nvmlDeviceGetMemoryErrorCounter
|
|
+ */
|
|
+typedef struct nvmlEccErrorCounts_st
|
|
+{
|
|
+ unsigned long long l1Cache; //!< L1 cache errors
|
|
+ unsigned long long l2Cache; //!< L2 cache errors
|
|
+ unsigned long long deviceMemory; //!< Device memory errors
|
|
+ unsigned long long registerFile; //!< Register file errors
|
|
+} nvmlEccErrorCounts_t;
|
|
+
|
|
+/**
|
|
+ * Utilization information for a device.
|
|
+ * Each sample period may be between 1 second and 1/6 second, depending on the product being queried.
|
|
+ */
|
|
+typedef struct nvmlUtilization_st
|
|
+{
|
|
+ unsigned int gpu; //!< Percent of time over the past sample period during which one or more kernels was executing on the GPU
|
|
+ unsigned int memory; //!< Percent of time over the past sample period during which global (device) memory was being read or written
|
|
+} nvmlUtilization_t;
|
|
+
|
|
+/**
|
|
+ * Memory allocation information for a device.
|
|
+ */
|
|
+typedef struct nvmlMemory_st
|
|
+{
|
|
+ unsigned long long total; //!< Total installed FB memory (in bytes)
|
|
+ unsigned long long free; //!< Unallocated FB memory (in bytes)
|
|
+ unsigned long long used; //!< Allocated FB memory (in bytes). Note that the driver/GPU always sets aside a small amount of memory for bookkeeping
|
|
+} nvmlMemory_t;
|
|
+
|
|
+/**
|
|
+ * BAR1 Memory allocation Information for a device
|
|
+ */
|
|
+typedef struct nvmlBAR1Memory_st
|
|
+{
|
|
+ unsigned long long bar1Total; //!< Total BAR1 Memory (in bytes)
|
|
+ unsigned long long bar1Free; //!< Unallocated BAR1 Memory (in bytes)
|
|
+ unsigned long long bar1Used; //!< Allocated Used Memory (in bytes)
|
|
+}nvmlBAR1Memory_t;
|
|
+
|
|
+/**
|
|
+ * Information about running compute processes on the GPU
|
|
+ */
|
|
+typedef struct nvmlProcessInfo_st
|
|
+{
|
|
+ unsigned int pid; //!< Process ID
|
|
+ unsigned long long usedGpuMemory; //!< Amount of used GPU memory in bytes.
|
|
+ //! Under WDDM, \ref NVML_VALUE_NOT_AVAILABLE is always reported
|
|
+ //! because Windows KMD manages all the memory and not the NVIDIA driver
|
|
+} nvmlProcessInfo_t;
|
|
+
|
|
+
|
|
+/**
|
|
+ * Enum to represent type of bridge chip
|
|
+ */
|
|
+typedef enum nvmlBridgeChipType_enum
|
|
+{
|
|
+ NVML_BRIDGE_CHIP_PLX = 0,
|
|
+ NVML_BRIDGE_CHIP_BRO4 = 1
|
|
+}nvmlBridgeChipType_t;
|
|
+
|
|
+/**
|
|
+ * Maximum number of NvLink links supported
|
|
+ */
|
|
+#define NVML_NVLINK_MAX_LINKS 4
|
|
+
|
|
+/**
|
|
+ * Enum to represent the NvLink utilization counter packet units
|
|
+ */
|
|
+typedef enum nvmlNvLinkUtilizationCountUnits_enum
|
|
+{
|
|
+ NVML_NVLINK_COUNTER_UNIT_CYCLES = 0, // count by cycles
|
|
+ NVML_NVLINK_COUNTER_UNIT_PACKETS = 1, // count by packets
|
|
+ NVML_NVLINK_COUNTER_UNIT_BYTES = 2, // count by bytes
|
|
+
|
|
+ // this must be last
|
|
+ NVML_NVLINK_COUNTER_UNIT_COUNT
|
|
+} nvmlNvLinkUtilizationCountUnits_t;
|
|
+
|
|
+/**
|
|
+ * Enum to represent the NvLink utilization counter packet types to count
|
|
+ * ** this is ONLY applicable with the units as packets or bytes
|
|
+ * ** as specified in \a nvmlNvLinkUtilizationCountUnits_t
|
|
+ * ** all packet filter descriptions are target GPU centric
|
|
+ * ** these can be "OR'd" together
|
|
+ */
|
|
+typedef enum nvmlNvLinkUtilizationCountPktTypes_enum
|
|
+{
|
|
+ NVML_NVLINK_COUNTER_PKTFILTER_NOP = 0x1, // no operation packets
|
|
+ NVML_NVLINK_COUNTER_PKTFILTER_READ = 0x2, // read packets
|
|
+ NVML_NVLINK_COUNTER_PKTFILTER_WRITE = 0x4, // write packets
|
|
+ NVML_NVLINK_COUNTER_PKTFILTER_RATOM = 0x8, // reduction atomic requests
|
|
+ NVML_NVLINK_COUNTER_PKTFILTER_NRATOM = 0x10, // non-reduction atomic requests
|
|
+ NVML_NVLINK_COUNTER_PKTFILTER_FLUSH = 0x20, // flush requests
|
|
+ NVML_NVLINK_COUNTER_PKTFILTER_RESPDATA = 0x40, // responses with data
|
|
+ NVML_NVLINK_COUNTER_PKTFILTER_RESPNODATA = 0x80, // responses without data
|
|
+ NVML_NVLINK_COUNTER_PKTFILTER_ALL = 0xFF // all packets
|
|
+} nvmlNvLinkUtilizationCountPktTypes_t;
|
|
+
|
|
+/**
|
|
+ * Struct to define the NVLINK counter controls
|
|
+ */
|
|
+typedef struct nvmlNvLinkUtilizationControl_st
|
|
+{
|
|
+ nvmlNvLinkUtilizationCountUnits_t units;
|
|
+ nvmlNvLinkUtilizationCountPktTypes_t pktfilter;
|
|
+} nvmlNvLinkUtilizationControl_t;
|
|
+
|
|
+/**
|
|
+ * Enum to represent NvLink queryable capabilities
|
|
+ */
|
|
+typedef enum nvmlNvLinkCapability_enum
|
|
+{
|
|
+ NVML_NVLINK_CAP_P2P_SUPPORTED = 0, // P2P over NVLink is supported
|
|
+ NVML_NVLINK_CAP_SYSMEM_ACCESS = 1, // Access to system memory is supported
|
|
+ NVML_NVLINK_CAP_P2P_ATOMICS = 2, // P2P atomics are supported
|
|
+ NVML_NVLINK_CAP_SYSMEM_ATOMICS= 3, // System memory atomics are supported
|
|
+ NVML_NVLINK_CAP_SLI_BRIDGE = 4, // SLI is supported over this link
|
|
+ NVML_NVLINK_CAP_VALID = 5, // Link is supported on this device
|
|
+ // should be last
|
|
+ NVML_NVLINK_CAP_COUNT
|
|
+} nvmlNvLinkCapability_t;
|
|
+
|
|
+/**
|
|
+ * Enum to represent NvLink queryable error counters
|
|
+ */
|
|
+typedef enum nvmlNvLinkErrorCounter_enum
|
|
+{
|
|
+ NVML_NVLINK_ERROR_DL_REPLAY = 0, // Data link transmit replay error counter
|
|
+ NVML_NVLINK_ERROR_DL_RECOVERY = 1, // Data link transmit recovery error counter
|
|
+ NVML_NVLINK_ERROR_DL_CRC_FLIT = 2, // Data link receive flow control digit CRC error counter
|
|
+ NVML_NVLINK_ERROR_DL_CRC_DATA = 3, // Data link receive data CRC error counter
|
|
+
|
|
+ // this must be last
|
|
+ NVML_NVLINK_ERROR_COUNT
|
|
+} nvmlNvLinkErrorCounter_t;
|
|
+
|
|
+/**
|
|
+ * Represents level relationships within a system between two GPUs
|
|
+ * The enums are spaced to allow for future relationships
|
|
+ */
|
|
+typedef enum nvmlGpuLevel_enum
|
|
+{
|
|
+ NVML_TOPOLOGY_INTERNAL = 0, // e.g. Tesla K80
|
|
+ NVML_TOPOLOGY_SINGLE = 10, // all devices that only need traverse a single PCIe switch
|
|
+ NVML_TOPOLOGY_MULTIPLE = 20, // all devices that need not traverse a host bridge
|
|
+ NVML_TOPOLOGY_HOSTBRIDGE = 30, // all devices that are connected to the same host bridge
|
|
+ NVML_TOPOLOGY_CPU = 40, // all devices that are connected to the same CPU but possibly multiple host bridges
|
|
+ NVML_TOPOLOGY_SYSTEM = 50, // all devices in the system
|
|
+
|
|
+ // there is purposefully no COUNT here because of the need for spacing above
|
|
+} nvmlGpuTopologyLevel_t;
|
|
+
|
|
+/* P2P Capability Index Status*/
|
|
+typedef enum nvmlGpuP2PStatus_enum
|
|
+{
|
|
+ NVML_P2P_STATUS_OK = 0,
|
|
+ NVML_P2P_STATUS_CHIPSET_NOT_SUPPORED,
|
|
+ NVML_P2P_STATUS_GPU_NOT_SUPPORTED,
|
|
+ NVML_P2P_STATUS_IOH_TOPOLOGY_NOT_SUPPORTED,
|
|
+ NVML_P2P_STATUS_DISABLED_BY_REGKEY,
|
|
+ NVML_P2P_STATUS_NOT_SUPPORTED,
|
|
+ NVML_P2P_STATUS_UNKNOWN
|
|
+
|
|
+} nvmlGpuP2PStatus_t;
|
|
+
|
|
+/* P2P Capability Index*/
|
|
+typedef enum nvmlGpuP2PCapsIndex_enum
|
|
+{
|
|
+ NVML_P2P_CAPS_INDEX_READ = 0,
|
|
+ NVML_P2P_CAPS_INDEX_WRITE,
|
|
+ NVML_P2P_CAPS_INDEX_NVLINK,
|
|
+ NVML_P2P_CAPS_INDEX_ATOMICS,
|
|
+ NVML_P2P_CAPS_INDEX_PROP,
|
|
+ NVML_P2P_CAPS_INDEX_UNKNOWN
|
|
+}nvmlGpuP2PCapsIndex_t;
|
|
+
|
|
+/**
|
|
+ * Maximum limit on Physical Bridges per Board
|
|
+ */
|
|
+#define NVML_MAX_PHYSICAL_BRIDGE (128)
|
|
+
|
|
+/**
|
|
+ * Information about the Bridge Chip Firmware
|
|
+ */
|
|
+typedef struct nvmlBridgeChipInfo_st
|
|
+{
|
|
+ nvmlBridgeChipType_t type; //!< Type of Bridge Chip
|
|
+ unsigned int fwVersion; //!< Firmware Version. 0=Version is unavailable
|
|
+}nvmlBridgeChipInfo_t;
|
|
+
|
|
+/**
|
|
+ * This structure stores the complete Hierarchy of the Bridge Chip within the board. The immediate
|
|
+ * bridge is stored at index 0 of bridgeInfoList, parent to immediate bridge is at index 1 and so forth.
|
|
+ */
|
|
+typedef struct nvmlBridgeChipHierarchy_st
|
|
+{
|
|
+ unsigned char bridgeCount; //!< Number of Bridge Chips on the Board
|
|
+ nvmlBridgeChipInfo_t bridgeChipInfo[NVML_MAX_PHYSICAL_BRIDGE]; //!< Hierarchy of Bridge Chips on the board
|
|
+}nvmlBridgeChipHierarchy_t;
|
|
+
|
|
+/**
|
|
+ * Represents Type of Sampling Event
|
|
+ */
|
|
+typedef enum nvmlSamplingType_enum
|
|
+{
|
|
+ NVML_TOTAL_POWER_SAMPLES = 0, //!< To represent total power drawn by GPU
|
|
+ NVML_GPU_UTILIZATION_SAMPLES = 1, //!< To represent percent of time during which one or more kernels was executing on the GPU
|
|
+ NVML_MEMORY_UTILIZATION_SAMPLES = 2, //!< To represent percent of time during which global (device) memory was being read or written
|
|
+ NVML_ENC_UTILIZATION_SAMPLES = 3, //!< To represent percent of time during which NVENC remains busy
|
|
+ NVML_DEC_UTILIZATION_SAMPLES = 4, //!< To represent percent of time during which NVDEC remains busy
|
|
+ NVML_PROCESSOR_CLK_SAMPLES = 5, //!< To represent processor clock samples
|
|
+ NVML_MEMORY_CLK_SAMPLES = 6, //!< To represent memory clock samples
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_SAMPLINGTYPE_COUNT
|
|
+}nvmlSamplingType_t;
|
|
+
|
|
+/**
|
|
+ * Represents the queryable PCIe utilization counters
|
|
+ */
|
|
+typedef enum nvmlPcieUtilCounter_enum
|
|
+{
|
|
+ NVML_PCIE_UTIL_TX_BYTES = 0, // 1KB granularity
|
|
+ NVML_PCIE_UTIL_RX_BYTES = 1, // 1KB granularity
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_PCIE_UTIL_COUNT
|
|
+} nvmlPcieUtilCounter_t;
|
|
+
|
|
+/**
|
|
+ * Represents the type for sample value returned
|
|
+ */
|
|
+typedef enum nvmlValueType_enum
|
|
+{
|
|
+ NVML_VALUE_TYPE_DOUBLE = 0,
|
|
+ NVML_VALUE_TYPE_UNSIGNED_INT = 1,
|
|
+ NVML_VALUE_TYPE_UNSIGNED_LONG = 2,
|
|
+ NVML_VALUE_TYPE_UNSIGNED_LONG_LONG = 3,
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_VALUE_TYPE_COUNT
|
|
+}nvmlValueType_t;
|
|
+
|
|
+
|
|
+/**
|
|
+ * Union to represent different types of Value
|
|
+ */
|
|
+typedef union nvmlValue_st
|
|
+{
|
|
+ double dVal; //!< If the value is double
|
|
+ unsigned int uiVal; //!< If the value is unsigned int
|
|
+ unsigned long ulVal; //!< If the value is unsigned long
|
|
+ unsigned long long ullVal; //!< If the value is unsigned long long
|
|
+}nvmlValue_t;
|
|
+
|
|
+/**
|
|
+ * Information for Sample
|
|
+ */
|
|
+typedef struct nvmlSample_st
|
|
+{
|
|
+ unsigned long long timeStamp; //!< CPU Timestamp in microseconds
|
|
+ nvmlValue_t sampleValue; //!< Sample Value
|
|
+}nvmlSample_t;
|
|
+
|
|
+/**
|
|
+ * Represents type of perf policy for which violation times can be queried
|
|
+ */
|
|
+typedef enum nvmlPerfPolicyType_enum
|
|
+{
|
|
+ NVML_PERF_POLICY_POWER = 0,
|
|
+ NVML_PERF_POLICY_THERMAL = 1,
|
|
+ NVML_PERF_POLICY_SYNC_BOOST = 2,
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_PERF_POLICY_COUNT
|
|
+}nvmlPerfPolicyType_t;
|
|
+
|
|
+/**
|
|
+ * Struct to hold perf policy violation status data
|
|
+ */
|
|
+typedef struct nvmlViolationTime_st
|
|
+{
|
|
+ unsigned long long referenceTime; //!< referenceTime represents CPU timestamp in microseconds
|
|
+ unsigned long long violationTime; //!< violationTime in Nanoseconds
|
|
+}nvmlViolationTime_t;
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlDeviceEnumvs Device Enums
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Generic enable/disable enum.
|
|
+ */
|
|
+typedef enum nvmlEnableState_enum
|
|
+{
|
|
+ NVML_FEATURE_DISABLED = 0, //!< Feature disabled
|
|
+ NVML_FEATURE_ENABLED = 1 //!< Feature enabled
|
|
+} nvmlEnableState_t;
|
|
+
|
|
+//! Generic flag used to specify the default behavior of some functions. See description of particular functions for details.
|
|
+#define nvmlFlagDefault 0x00
|
|
+//! Generic flag used to force some behavior. See description of particular functions for details.
|
|
+#define nvmlFlagForce 0x01
|
|
+
|
|
+/**
|
|
+ * * The Brand of the GPU
|
|
+ * */
|
|
+typedef enum nvmlBrandType_enum
|
|
+{
|
|
+ NVML_BRAND_UNKNOWN = 0,
|
|
+ NVML_BRAND_QUADRO = 1,
|
|
+ NVML_BRAND_TESLA = 2,
|
|
+ NVML_BRAND_NVS = 3,
|
|
+ NVML_BRAND_GRID = 4,
|
|
+ NVML_BRAND_GEFORCE = 5,
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_BRAND_COUNT
|
|
+} nvmlBrandType_t;
|
|
+
|
|
+/**
|
|
+ * Temperature thresholds.
|
|
+ */
|
|
+typedef enum nvmlTemperatureThresholds_enum
|
|
+{
|
|
+ NVML_TEMPERATURE_THRESHOLD_SHUTDOWN = 0, // Temperature at which the GPU will shut down
|
|
+ // for HW protection
|
|
+ NVML_TEMPERATURE_THRESHOLD_SLOWDOWN = 1, // Temperature at which the GPU will begin slowdown
|
|
+ // Keep this last
|
|
+ NVML_TEMPERATURE_THRESHOLD_COUNT
|
|
+} nvmlTemperatureThresholds_t;
|
|
+
|
|
+/**
|
|
+ * Temperature sensors.
|
|
+ */
|
|
+typedef enum nvmlTemperatureSensors_enum
|
|
+{
|
|
+ NVML_TEMPERATURE_GPU = 0, //!< Temperature sensor for the GPU die
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_TEMPERATURE_COUNT
|
|
+} nvmlTemperatureSensors_t;
|
|
+
|
|
+/**
|
|
+ * Compute mode.
|
|
+ *
|
|
+ * NVML_COMPUTEMODE_EXCLUSIVE_PROCESS was added in CUDA 4.0.
|
|
+ * Earlier CUDA versions supported a single exclusive mode,
|
|
+ * which is equivalent to NVML_COMPUTEMODE_EXCLUSIVE_THREAD in CUDA 4.0 and beyond.
|
|
+ */
|
|
+typedef enum nvmlComputeMode_enum
|
|
+{
|
|
+ NVML_COMPUTEMODE_DEFAULT = 0, //!< Default compute mode -- multiple contexts per device
|
|
+ NVML_COMPUTEMODE_EXCLUSIVE_THREAD = 1, //!< Support Removed
|
|
+ NVML_COMPUTEMODE_PROHIBITED = 2, //!< Compute-prohibited mode -- no contexts per device
|
|
+ NVML_COMPUTEMODE_EXCLUSIVE_PROCESS = 3, //!< Compute-exclusive-process mode -- only one context per device, usable from multiple threads at a time
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_COMPUTEMODE_COUNT
|
|
+} nvmlComputeMode_t;
|
|
+
|
|
+/**
|
|
+ * ECC bit types.
|
|
+ *
|
|
+ * @deprecated See \ref nvmlMemoryErrorType_t for a more flexible type
|
|
+ */
|
|
+#define nvmlEccBitType_t nvmlMemoryErrorType_t
|
|
+
|
|
+/**
|
|
+ * Single bit ECC errors
|
|
+ *
|
|
+ * @deprecated Mapped to \ref NVML_MEMORY_ERROR_TYPE_CORRECTED
|
|
+ */
|
|
+#define NVML_SINGLE_BIT_ECC NVML_MEMORY_ERROR_TYPE_CORRECTED
|
|
+
|
|
+/**
|
|
+ * Double bit ECC errors
|
|
+ *
|
|
+ * @deprecated Mapped to \ref NVML_MEMORY_ERROR_TYPE_UNCORRECTED
|
|
+ */
|
|
+#define NVML_DOUBLE_BIT_ECC NVML_MEMORY_ERROR_TYPE_UNCORRECTED
|
|
+
|
|
+/**
|
|
+ * Memory error types
|
|
+ */
|
|
+typedef enum nvmlMemoryErrorType_enum
|
|
+{
|
|
+ /**
|
|
+ * A memory error that was corrected
|
|
+ *
|
|
+ * For ECC errors, these are single bit errors
|
|
+ * For Texture memory, these are errors fixed by resend
|
|
+ */
|
|
+ NVML_MEMORY_ERROR_TYPE_CORRECTED = 0,
|
|
+ /**
|
|
+ * A memory error that was not corrected
|
|
+ *
|
|
+ * For ECC errors, these are double bit errors
|
|
+ * For Texture memory, these are errors where the resend fails
|
|
+ */
|
|
+ NVML_MEMORY_ERROR_TYPE_UNCORRECTED = 1,
|
|
+
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_MEMORY_ERROR_TYPE_COUNT //!< Count of memory error types
|
|
+
|
|
+} nvmlMemoryErrorType_t;
|
|
+
|
|
+/**
|
|
+ * ECC counter types.
|
|
+ *
|
|
+ * Note: Volatile counts are reset each time the driver loads. On Windows this is once per boot. On Linux this can be more frequent.
|
|
+ * On Linux the driver unloads when no active clients exist. If persistence mode is enabled or there is always a driver
|
|
+ * client active (e.g. X11), then Linux also sees per-boot behavior. If not, volatile counts are reset each time a compute app
|
|
+ * is run.
|
|
+ */
|
|
+typedef enum nvmlEccCounterType_enum
|
|
+{
|
|
+ NVML_VOLATILE_ECC = 0, //!< Volatile counts are reset each time the driver loads.
|
|
+ NVML_AGGREGATE_ECC = 1, //!< Aggregate counts persist across reboots (i.e. for the lifetime of the device)
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_ECC_COUNTER_TYPE_COUNT //!< Count of memory counter types
|
|
+} nvmlEccCounterType_t;
|
|
+
|
|
+/**
|
|
+ * Clock types.
|
|
+ *
|
|
+ * All speeds are in Mhz.
|
|
+ */
|
|
+typedef enum nvmlClockType_enum
|
|
+{
|
|
+ NVML_CLOCK_GRAPHICS = 0, //!< Graphics clock domain
|
|
+ NVML_CLOCK_SM = 1, //!< SM clock domain
|
|
+ NVML_CLOCK_MEM = 2, //!< Memory clock domain
|
|
+ NVML_CLOCK_VIDEO = 3, //!< Video encoder/decoder clock domain
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_CLOCK_COUNT //<! Count of clock types
|
|
+} nvmlClockType_t;
|
|
+
|
|
+/**
|
|
+ * Clock Ids. These are used in combination with nvmlClockType_t
|
|
+ * to specify a single clock value.
|
|
+ */
|
|
+typedef enum nvmlClockId_enum
|
|
+{
|
|
+ NVML_CLOCK_ID_CURRENT = 0, //!< Current actual clock value
|
|
+ NVML_CLOCK_ID_APP_CLOCK_TARGET = 1, //!< Target application clock
|
|
+ NVML_CLOCK_ID_APP_CLOCK_DEFAULT = 2, //!< Default application clock target
|
|
+ NVML_CLOCK_ID_CUSTOMER_BOOST_MAX = 3, //!< OEM-defined maximum clock rate
|
|
+
|
|
+ //Keep this last
|
|
+ NVML_CLOCK_ID_COUNT //<! Count of Clock Ids.
|
|
+} nvmlClockId_t;
|
|
+
|
|
+/**
|
|
+ * Driver models.
|
|
+ *
|
|
+ * Windows only.
|
|
+ */
|
|
+typedef enum nvmlDriverModel_enum
|
|
+{
|
|
+ NVML_DRIVER_WDDM = 0, //!< WDDM driver model -- GPU treated as a display device
|
|
+ NVML_DRIVER_WDM = 1 //!< WDM (TCC) model (recommended) -- GPU treated as a generic device
|
|
+} nvmlDriverModel_t;
|
|
+
|
|
+/**
|
|
+ * Allowed PStates.
|
|
+ */
|
|
+typedef enum nvmlPStates_enum
|
|
+{
|
|
+ NVML_PSTATE_0 = 0, //!< Performance state 0 -- Maximum Performance
|
|
+ NVML_PSTATE_1 = 1, //!< Performance state 1
|
|
+ NVML_PSTATE_2 = 2, //!< Performance state 2
|
|
+ NVML_PSTATE_3 = 3, //!< Performance state 3
|
|
+ NVML_PSTATE_4 = 4, //!< Performance state 4
|
|
+ NVML_PSTATE_5 = 5, //!< Performance state 5
|
|
+ NVML_PSTATE_6 = 6, //!< Performance state 6
|
|
+ NVML_PSTATE_7 = 7, //!< Performance state 7
|
|
+ NVML_PSTATE_8 = 8, //!< Performance state 8
|
|
+ NVML_PSTATE_9 = 9, //!< Performance state 9
|
|
+ NVML_PSTATE_10 = 10, //!< Performance state 10
|
|
+ NVML_PSTATE_11 = 11, //!< Performance state 11
|
|
+ NVML_PSTATE_12 = 12, //!< Performance state 12
|
|
+ NVML_PSTATE_13 = 13, //!< Performance state 13
|
|
+ NVML_PSTATE_14 = 14, //!< Performance state 14
|
|
+ NVML_PSTATE_15 = 15, //!< Performance state 15 -- Minimum Performance
|
|
+ NVML_PSTATE_UNKNOWN = 32 //!< Unknown performance state
|
|
+} nvmlPstates_t;
|
|
+
|
|
+/**
|
|
+ * GPU Operation Mode
|
|
+ *
|
|
+ * GOM allows to reduce power usage and optimize GPU throughput by disabling GPU features.
|
|
+ *
|
|
+ * Each GOM is designed to meet specific user needs.
|
|
+ */
|
|
+typedef enum nvmlGom_enum
|
|
+{
|
|
+ NVML_GOM_ALL_ON = 0, //!< Everything is enabled and running at full speed
|
|
+
|
|
+ NVML_GOM_COMPUTE = 1, //!< Designed for running only compute tasks. Graphics operations
|
|
+ //!< are not allowed
|
|
+
|
|
+ NVML_GOM_LOW_DP = 2 //!< Designed for running graphics applications that don't require
|
|
+ //!< high bandwidth double precision
|
|
+} nvmlGpuOperationMode_t;
|
|
+
|
|
+/**
|
|
+ * Available infoROM objects.
|
|
+ */
|
|
+typedef enum nvmlInforomObject_enum
|
|
+{
|
|
+ NVML_INFOROM_OEM = 0, //!< An object defined by OEM
|
|
+ NVML_INFOROM_ECC = 1, //!< The ECC object determining the level of ECC support
|
|
+ NVML_INFOROM_POWER = 2, //!< The power management object
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_INFOROM_COUNT //!< This counts the number of infoROM objects the driver knows about
|
|
+} nvmlInforomObject_t;
|
|
+
|
|
+/**
|
|
+ * Return values for NVML API calls.
|
|
+ */
|
|
+typedef enum nvmlReturn_enum
|
|
+{
|
|
+ NVML_SUCCESS = 0, //!< The operation was successful
|
|
+ NVML_ERROR_UNINITIALIZED = 1, //!< NVML was not first initialized with nvmlInit()
|
|
+ NVML_ERROR_INVALID_ARGUMENT = 2, //!< A supplied argument is invalid
|
|
+ NVML_ERROR_NOT_SUPPORTED = 3, //!< The requested operation is not available on target device
|
|
+ NVML_ERROR_NO_PERMISSION = 4, //!< The current user does not have permission for operation
|
|
+ NVML_ERROR_ALREADY_INITIALIZED = 5, //!< Deprecated: Multiple initializations are now allowed through ref counting
|
|
+ NVML_ERROR_NOT_FOUND = 6, //!< A query to find an object was unsuccessful
|
|
+ NVML_ERROR_INSUFFICIENT_SIZE = 7, //!< An input argument is not large enough
|
|
+ NVML_ERROR_INSUFFICIENT_POWER = 8, //!< A device's external power cables are not properly attached
|
|
+ NVML_ERROR_DRIVER_NOT_LOADED = 9, //!< NVIDIA driver is not loaded
|
|
+ NVML_ERROR_TIMEOUT = 10, //!< User provided timeout passed
|
|
+ NVML_ERROR_IRQ_ISSUE = 11, //!< NVIDIA Kernel detected an interrupt issue with a GPU
|
|
+ NVML_ERROR_LIBRARY_NOT_FOUND = 12, //!< NVML Shared Library couldn't be found or loaded
|
|
+ NVML_ERROR_FUNCTION_NOT_FOUND = 13, //!< Local version of NVML doesn't implement this function
|
|
+ NVML_ERROR_CORRUPTED_INFOROM = 14, //!< infoROM is corrupted
|
|
+ NVML_ERROR_GPU_IS_LOST = 15, //!< The GPU has fallen off the bus or has otherwise become inaccessible
|
|
+ NVML_ERROR_RESET_REQUIRED = 16, //!< The GPU requires a reset before it can be used again
|
|
+ NVML_ERROR_OPERATING_SYSTEM = 17, //!< The GPU control device has been blocked by the operating system/cgroups
|
|
+ NVML_ERROR_LIB_RM_VERSION_MISMATCH = 18, //!< RM detects a driver/library version mismatch
|
|
+ NVML_ERROR_IN_USE = 19, //!< An operation cannot be performed because the GPU is currently in use
|
|
+ NVML_ERROR_NO_DATA = 20, //!< No data
|
|
+ NVML_ERROR_UNKNOWN = 999 //!< An internal driver error occurred
|
|
+} nvmlReturn_t;
|
|
+
|
|
+/**
|
|
+ * Memory locations
|
|
+ *
|
|
+ * See \ref nvmlDeviceGetMemoryErrorCounter
|
|
+ */
|
|
+typedef enum nvmlMemoryLocation_enum
|
|
+{
|
|
+ NVML_MEMORY_LOCATION_L1_CACHE = 0, //!< GPU L1 Cache
|
|
+ NVML_MEMORY_LOCATION_L2_CACHE = 1, //!< GPU L2 Cache
|
|
+ NVML_MEMORY_LOCATION_DEVICE_MEMORY = 2, //!< GPU Device Memory
|
|
+ NVML_MEMORY_LOCATION_REGISTER_FILE = 3, //!< GPU Register File
|
|
+ NVML_MEMORY_LOCATION_TEXTURE_MEMORY = 4, //!< GPU Texture Memory
|
|
+ NVML_MEMORY_LOCATION_TEXTURE_SHM = 5, //!< Shared memory
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_MEMORY_LOCATION_COUNT //!< This counts the number of memory locations the driver knows about
|
|
+} nvmlMemoryLocation_t;
|
|
+
|
|
+/**
|
|
+ * Causes for page retirement
|
|
+ */
|
|
+typedef enum nvmlPageRetirementCause_enum
|
|
+{
|
|
+ NVML_PAGE_RETIREMENT_CAUSE_MULTIPLE_SINGLE_BIT_ECC_ERRORS = 0, //!< Page was retired due to multiple single bit ECC error
|
|
+ NVML_PAGE_RETIREMENT_CAUSE_DOUBLE_BIT_ECC_ERROR = 1, //!< Page was retired due to double bit ECC error
|
|
+
|
|
+ // Keep this last
|
|
+ NVML_PAGE_RETIREMENT_CAUSE_COUNT
|
|
+} nvmlPageRetirementCause_t;
|
|
+
|
|
+/**
|
|
+ * API types that allow changes to default permission restrictions
|
|
+ */
|
|
+typedef enum nvmlRestrictedAPI_enum
|
|
+{
|
|
+ NVML_RESTRICTED_API_SET_APPLICATION_CLOCKS = 0, //!< APIs that change application clocks, see nvmlDeviceSetApplicationsClocks
|
|
+ //!< and see nvmlDeviceResetApplicationsClocks
|
|
+ NVML_RESTRICTED_API_SET_AUTO_BOOSTED_CLOCKS = 1, //!< APIs that enable/disable Auto Boosted clocks
|
|
+ //!< see nvmlDeviceSetAutoBoostedClocksEnabled
|
|
+ // Keep this last
|
|
+ NVML_RESTRICTED_API_COUNT
|
|
+} nvmlRestrictedAPI_t;
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlUnitStructs Unit Structs
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+typedef struct nvmlUnit_st* nvmlUnit_t;
|
|
+
|
|
+/**
|
|
+ * Description of HWBC entry
|
|
+ */
|
|
+typedef struct nvmlHwbcEntry_st
|
|
+{
|
|
+ unsigned int hwbcId;
|
|
+ char firmwareVersion[32];
|
|
+} nvmlHwbcEntry_t;
|
|
+
|
|
+/**
|
|
+ * Fan state enum.
|
|
+ */
|
|
+typedef enum nvmlFanState_enum
|
|
+{
|
|
+ NVML_FAN_NORMAL = 0, //!< Fan is working properly
|
|
+ NVML_FAN_FAILED = 1 //!< Fan has failed
|
|
+} nvmlFanState_t;
|
|
+
|
|
+/**
|
|
+ * Led color enum.
|
|
+ */
|
|
+typedef enum nvmlLedColor_enum
|
|
+{
|
|
+ NVML_LED_COLOR_GREEN = 0, //!< GREEN, indicates good health
|
|
+ NVML_LED_COLOR_AMBER = 1 //!< AMBER, indicates problem
|
|
+} nvmlLedColor_t;
|
|
+
|
|
+
|
|
+/**
|
|
+ * LED states for an S-class unit.
|
|
+ */
|
|
+typedef struct nvmlLedState_st
|
|
+{
|
|
+ char cause[256]; //!< If amber, a text description of the cause
|
|
+ nvmlLedColor_t color; //!< GREEN or AMBER
|
|
+} nvmlLedState_t;
|
|
+
|
|
+/**
|
|
+ * Static S-class unit info.
|
|
+ */
|
|
+typedef struct nvmlUnitInfo_st
|
|
+{
|
|
+ char name[96]; //!< Product name
|
|
+ char id[96]; //!< Product identifier
|
|
+ char serial[96]; //!< Product serial number
|
|
+ char firmwareVersion[96]; //!< Firmware version
|
|
+} nvmlUnitInfo_t;
|
|
+
|
|
+/**
|
|
+ * Power usage information for an S-class unit.
|
|
+ * The power supply state is a human readable string that equals "Normal" or contains
|
|
+ * a combination of "Abnormal" plus one or more of the following:
|
|
+ *
|
|
+ * - High voltage
|
|
+ * - Fan failure
|
|
+ * - Heatsink temperature
|
|
+ * - Current limit
|
|
+ * - Voltage below UV alarm threshold
|
|
+ * - Low-voltage
|
|
+ * - SI2C remote off command
|
|
+ * - MOD_DISABLE input
|
|
+ * - Short pin transition
|
|
+*/
|
|
+typedef struct nvmlPSUInfo_st
|
|
+{
|
|
+ char state[256]; //!< The power supply state
|
|
+ unsigned int current; //!< PSU current (A)
|
|
+ unsigned int voltage; //!< PSU voltage (V)
|
|
+ unsigned int power; //!< PSU power draw (W)
|
|
+} nvmlPSUInfo_t;
|
|
+
|
|
+/**
|
|
+ * Fan speed reading for a single fan in an S-class unit.
|
|
+ */
|
|
+typedef struct nvmlUnitFanInfo_st
|
|
+{
|
|
+ unsigned int speed; //!< Fan speed (RPM)
|
|
+ nvmlFanState_t state; //!< Flag that indicates whether fan is working properly
|
|
+} nvmlUnitFanInfo_t;
|
|
+
|
|
+/**
|
|
+ * Fan speed readings for an entire S-class unit.
|
|
+ */
|
|
+typedef struct nvmlUnitFanSpeeds_st
|
|
+{
|
|
+ nvmlUnitFanInfo_t fans[24]; //!< Fan speed data for each fan
|
|
+ unsigned int count; //!< Number of fans in unit
|
|
+} nvmlUnitFanSpeeds_t;
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @addtogroup nvmlEvents
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Handle to an event set
|
|
+ */
|
|
+typedef struct nvmlEventSet_st* nvmlEventSet_t;
|
|
+
|
|
+/** @defgroup nvmlEventType Event Types
|
|
+ * @{
|
|
+ * Event Types which user can be notified about.
|
|
+ * See description of particular functions for details.
|
|
+ *
|
|
+ * See \ref nvmlDeviceRegisterEvents and \ref nvmlDeviceGetSupportedEventTypes to check which devices
|
|
+ * support each event.
|
|
+ *
|
|
+ * Types can be combined with bitwise or operator '|' when passed to \ref nvmlDeviceRegisterEvents
|
|
+ */
|
|
+//! Event about single bit ECC errors
|
|
+/**
|
|
+ * \note A corrected texture memory error is not an ECC error, so it does not generate a single bit event
|
|
+ */
|
|
+#define nvmlEventTypeSingleBitEccError 0x0000000000000001LL
|
|
+
|
|
+//! Event about double bit ECC errors
|
|
+/**
|
|
+ * \note An uncorrected texture memory error is not an ECC error, so it does not generate a double bit event
|
|
+ */
|
|
+#define nvmlEventTypeDoubleBitEccError 0x0000000000000002LL
|
|
+
|
|
+//! Event about PState changes
|
|
+/**
|
|
+ * \note On Fermi architecture PState changes are also an indicator that GPU is throttling down due to
|
|
+ * no work being executed on the GPU, power capping or thermal capping. In a typical situation,
|
|
+ * Fermi-based GPU should stay in P0 for the duration of the execution of the compute process.
|
|
+ */
|
|
+#define nvmlEventTypePState 0x0000000000000004LL
|
|
+
|
|
+//! Event that Xid critical error occurred
|
|
+#define nvmlEventTypeXidCriticalError 0x0000000000000008LL
|
|
+
|
|
+//! Event about clock changes
|
|
+/**
|
|
+ * Kepler only
|
|
+ */
|
|
+#define nvmlEventTypeClock 0x0000000000000010LL
|
|
+
|
|
+//! Mask with no events
|
|
+#define nvmlEventTypeNone 0x0000000000000000LL
|
|
+//! Mask of all events
|
|
+#define nvmlEventTypeAll (nvmlEventTypeNone \
|
|
+ | nvmlEventTypeSingleBitEccError \
|
|
+ | nvmlEventTypeDoubleBitEccError \
|
|
+ | nvmlEventTypePState \
|
|
+ | nvmlEventTypeClock \
|
|
+ | nvmlEventTypeXidCriticalError \
|
|
+ )
|
|
+/** @} */
|
|
+
|
|
+/**
|
|
+ * Information about occurred event
|
|
+ */
|
|
+typedef struct nvmlEventData_st
|
|
+{
|
|
+ nvmlDevice_t device; //!< Specific device where the event occurred
|
|
+ unsigned long long eventType; //!< Information about what specific event occurred
|
|
+ unsigned long long eventData; //!< Stores last XID error for the device in the event of nvmlEventTypeXidCriticalError,
|
|
+ // eventData is 0 for any other event. eventData is set as 999 for unknown xid error.
|
|
+} nvmlEventData_t;
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @addtogroup nvmlClocksThrottleReasons
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/** Nothing is running on the GPU and the clocks are dropping to Idle state
|
|
+ * \note This limiter may be removed in a later release
|
|
+ */
|
|
+#define nvmlClocksThrottleReasonGpuIdle 0x0000000000000001LL
|
|
+
|
|
+/** GPU clocks are limited by current setting of applications clocks
|
|
+ *
|
|
+ * @see nvmlDeviceSetApplicationsClocks
|
|
+ * @see nvmlDeviceGetApplicationsClock
|
|
+ */
|
|
+#define nvmlClocksThrottleReasonApplicationsClocksSetting 0x0000000000000002LL
|
|
+
|
|
+/**
|
|
+ * @deprecated Renamed to \ref nvmlClocksThrottleReasonApplicationsClocksSetting
|
|
+ * as the name describes the situation more accurately.
|
|
+ */
|
|
+#define nvmlClocksThrottleReasonUserDefinedClocks nvmlClocksThrottleReasonApplicationsClocksSetting
|
|
+
|
|
+/** SW Power Scaling algorithm is reducing the clocks below requested clocks
|
|
+ *
|
|
+ * @see nvmlDeviceGetPowerUsage
|
|
+ * @see nvmlDeviceSetPowerManagementLimit
|
|
+ * @see nvmlDeviceGetPowerManagementLimit
|
|
+ */
|
|
+#define nvmlClocksThrottleReasonSwPowerCap 0x0000000000000004LL
|
|
+
|
|
+/** HW Slowdown (reducing the core clocks by a factor of 2 or more) is engaged
|
|
+ *
|
|
+ * This is an indicator of:
|
|
+ * - temperature being too high
|
|
+ * - External Power Brake Assertion is triggered (e.g. by the system power supply)
|
|
+ * - Power draw is too high and Fast Trigger protection is reducing the clocks
|
|
+ * - May be also reported during PState or clock change
|
|
+ * - This behavior may be removed in a later release.
|
|
+ *
|
|
+ * @see nvmlDeviceGetTemperature
|
|
+ * @see nvmlDeviceGetTemperatureThreshold
|
|
+ * @see nvmlDeviceGetPowerUsage
|
|
+ */
|
|
+#define nvmlClocksThrottleReasonHwSlowdown 0x0000000000000008LL
|
|
+
|
|
+/** Sync Boost
|
|
+ *
|
|
+ * This GPU has been added to a Sync boost group with nvidia-smi or DCGM in
|
|
+ * order to maximize performance per watt. All GPUs in the sync boost group
|
|
+ * will boost to the minimum possible clocks across the entire group. Look at
|
|
+ * the throttle reasons for other GPUs in the system to see why those GPUs are
|
|
+ * holding this one at lower clocks.
|
|
+ *
|
|
+ */
|
|
+#define nvmlClocksThrottleReasonSyncBoost 0x0000000000000010LL
|
|
+
|
|
+/** Some other unspecified factor is reducing the clocks */
|
|
+#define nvmlClocksThrottleReasonUnknown 0x8000000000000000LL
|
|
+
|
|
+/** Bit mask representing no clocks throttling
|
|
+ *
|
|
+ * Clocks are as high as possible.
|
|
+ * */
|
|
+#define nvmlClocksThrottleReasonNone 0x0000000000000000LL
|
|
+
|
|
+/** Bit mask representing all supported clocks throttling reasons
|
|
+ * New reasons might be added to this list in the future
|
|
+ */
|
|
+#define nvmlClocksThrottleReasonAll (nvmlClocksThrottleReasonNone \
|
|
+ | nvmlClocksThrottleReasonGpuIdle \
|
|
+ | nvmlClocksThrottleReasonApplicationsClocksSetting \
|
|
+ | nvmlClocksThrottleReasonSwPowerCap \
|
|
+ | nvmlClocksThrottleReasonHwSlowdown \
|
|
+ | nvmlClocksThrottleReasonSyncBoost \
|
|
+ | nvmlClocksThrottleReasonUnknown \
|
|
+ )
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlAccountingStats Accounting Statistics
|
|
+ * @{
|
|
+ *
|
|
+ * Set of APIs designed to provide per process information about usage of GPU.
|
|
+ *
|
|
+ * @note All accounting statistics and accounting mode live in nvidia driver and reset
|
|
+ * to default (Disabled) when driver unloads.
|
|
+ * It is advised to run with persistence mode enabled.
|
|
+ *
|
|
+ * @note Enabling accounting mode has no negative impact on the GPU performance.
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Describes accounting statistics of a process.
|
|
+ */
|
|
+typedef struct nvmlAccountingStats_st {
|
|
+ unsigned int gpuUtilization; //!< Percent of time over the process's lifetime during which one or more kernels was executing on the GPU.
|
|
+ //! Utilization stats just like returned by \ref nvmlDeviceGetUtilizationRates but for the life time of a
|
|
+ //! process (not just the last sample period).
|
|
+ //! Set to NVML_VALUE_NOT_AVAILABLE if nvmlDeviceGetUtilizationRates is not supported
|
|
+
|
|
+ unsigned int memoryUtilization; //!< Percent of time over the process's lifetime during which global (device) memory was being read or written.
|
|
+ //! Set to NVML_VALUE_NOT_AVAILABLE if nvmlDeviceGetUtilizationRates is not supported
|
|
+
|
|
+ unsigned long long maxMemoryUsage; //!< Maximum total memory in bytes that was ever allocated by the process.
|
|
+ //! Set to NVML_VALUE_NOT_AVAILABLE if nvmlProcessInfo_t->usedGpuMemory is not supported
|
|
+
|
|
+
|
|
+ unsigned long long time; //!< Amount of time in ms during which the compute context was active. The time is reported as 0 if
|
|
+ //!< the process is not terminated
|
|
+
|
|
+ unsigned long long startTime; //!< CPU Timestamp in usec representing start time for the process
|
|
+
|
|
+ unsigned int isRunning; //!< Flag to represent if the process is running (1 for running, 0 for terminated)
|
|
+
|
|
+ unsigned int reserved[5]; //!< Reserved for future use
|
|
+} nvmlAccountingStats_t;
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlInitializationAndCleanup Initialization and Cleanup
|
|
+ * This chapter describes the methods that handle NVML initialization and cleanup.
|
|
+ * It is the user's responsibility to call \ref nvmlInit() before calling any other methods, and
|
|
+ * nvmlShutdown() once NVML is no longer being used.
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Initialize NVML, but don't initialize any GPUs yet.
|
|
+ *
|
|
+ * \note In NVML 5.319 new nvmlInit_v2 has replaced nvmlInit"_v1" (default in NVML 4.304 and older) that
|
|
+ * did initialize all GPU devices in the system.
|
|
+ *
|
|
+ * This allows NVML to communicate with a GPU
|
|
+ * when other GPUs in the system are unstable or in a bad state. When using this API, GPUs are
|
|
+ * discovered and initialized in nvmlDeviceGetHandleBy* functions instead.
|
|
+ *
|
|
+ * \note To contrast nvmlInit_v2 with nvmlInit"_v1", NVML 4.304 nvmlInit"_v1" will fail when any detected GPU is in
|
|
+ * a bad or unstable state.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * This method, should be called once before invoking any other methods in the library.
|
|
+ * A reference count of the number of initializations is maintained. Shutdown only occurs
|
|
+ * when the reference count reaches zero.
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if NVML has been properly initialized
|
|
+ * - \ref NVML_ERROR_DRIVER_NOT_LOADED if NVIDIA driver is not running
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if NVML does not have permission to talk to the driver
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlInit(void);
|
|
+
|
|
+/**
|
|
+ * Shut down NVML by releasing all GPU resources previously allocated with \ref nvmlInit().
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * This method should be called after NVML work is done, once for each call to \ref nvmlInit()
|
|
+ * A reference count of the number of initializations is maintained. Shutdown only occurs
|
|
+ * when the reference count reaches zero. For backwards compatibility, no error is reported if
|
|
+ * nvmlShutdown() is called more times than nvmlInit().
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if NVML has been properly shut down
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlShutdown(void);
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlErrorReporting Error reporting
|
|
+ * This chapter describes helper functions for error reporting routines.
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Helper method for converting NVML error codes into readable strings.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * @param result NVML error code to convert
|
|
+ *
|
|
+ * @return String representation of the error.
|
|
+ *
|
|
+ */
|
|
+const DECLDIR char* nvmlErrorString(nvmlReturn_t result);
|
|
+/** @} */
|
|
+
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlConstants Constants
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Buffer size guaranteed to be large enough for \ref nvmlDeviceGetInforomVersion and \ref nvmlDeviceGetInforomImageVersion
|
|
+ */
|
|
+#define NVML_DEVICE_INFOROM_VERSION_BUFFER_SIZE 16
|
|
+
|
|
+/**
|
|
+ * Buffer size guaranteed to be large enough for \ref nvmlDeviceGetUUID
|
|
+ */
|
|
+#define NVML_DEVICE_UUID_BUFFER_SIZE 80
|
|
+
|
|
+/**
|
|
+ * Buffer size guaranteed to be large enough for \ref nvmlDeviceGetBoardPartNumber
|
|
+ */
|
|
+#define NVML_DEVICE_PART_NUMBER_BUFFER_SIZE 80
|
|
+
|
|
+/**
|
|
+ * Buffer size guaranteed to be large enough for \ref nvmlSystemGetDriverVersion
|
|
+ */
|
|
+#define NVML_SYSTEM_DRIVER_VERSION_BUFFER_SIZE 80
|
|
+
|
|
+/**
|
|
+ * Buffer size guaranteed to be large enough for \ref nvmlSystemGetNVMLVersion
|
|
+ */
|
|
+#define NVML_SYSTEM_NVML_VERSION_BUFFER_SIZE 80
|
|
+
|
|
+/**
|
|
+ * Buffer size guaranteed to be large enough for \ref nvmlDeviceGetName
|
|
+ */
|
|
+#define NVML_DEVICE_NAME_BUFFER_SIZE 64
|
|
+
|
|
+/**
|
|
+ * Buffer size guaranteed to be large enough for \ref nvmlDeviceGetSerial
|
|
+ */
|
|
+#define NVML_DEVICE_SERIAL_BUFFER_SIZE 30
|
|
+
|
|
+/**
|
|
+ * Buffer size guaranteed to be large enough for \ref nvmlDeviceGetVbiosVersion
|
|
+ */
|
|
+#define NVML_DEVICE_VBIOS_VERSION_BUFFER_SIZE 32
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlSystemQueries System Queries
|
|
+ * This chapter describes the queries that NVML can perform against the local system. These queries
|
|
+ * are not device-specific.
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Retrieves the version of the system's graphics driver.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * The version identifier is an alphanumeric string. It will not exceed 80 characters in length
|
|
+ * (including the NULL terminator). See \ref nvmlConstants::NVML_SYSTEM_DRIVER_VERSION_BUFFER_SIZE.
|
|
+ *
|
|
+ * @param version Reference in which to return the version identifier
|
|
+ * @param length The maximum allowed length of the string returned in \a version
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a version has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a version is NULL
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a length is too small
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlSystemGetDriverVersion(char *version, unsigned int length);
|
|
+
|
|
+/**
|
|
+ * Retrieves the version of the NVML library.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * The version identifier is an alphanumeric string. It will not exceed 80 characters in length
|
|
+ * (including the NULL terminator). See \ref nvmlConstants::NVML_SYSTEM_NVML_VERSION_BUFFER_SIZE.
|
|
+ *
|
|
+ * @param version Reference in which to return the version identifier
|
|
+ * @param length The maximum allowed length of the string returned in \a version
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a version has been set
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a version is NULL
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a length is too small
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlSystemGetNVMLVersion(char *version, unsigned int length);
|
|
+
|
|
+/**
|
|
+ * Gets name of the process with provided process id
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * Returned process name is cropped to provided length.
|
|
+ * name string is encoded in ANSI.
|
|
+ *
|
|
+ * @param pid The identifier of the process
|
|
+ * @param name Reference in which to return the process name
|
|
+ * @param length The maximum allowed length of the string returned in \a name
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a name has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a name is NULL or \a length is 0.
|
|
+ * - \ref NVML_ERROR_NOT_FOUND if process doesn't exists
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlSystemGetProcessName(unsigned int pid, char *name, unsigned int length);
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlUnitQueries Unit Queries
|
|
+ * This chapter describes that queries that NVML can perform against each unit. For S-class systems only.
|
|
+ * In each case the device is identified with an nvmlUnit_t handle. This handle is obtained by
|
|
+ * calling \ref nvmlUnitGetHandleByIndex().
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+ /**
|
|
+ * Retrieves the number of units in the system.
|
|
+ *
|
|
+ * For S-class products.
|
|
+ *
|
|
+ * @param unitCount Reference in which to return the number of units
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a unitCount has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a unitCount is NULL
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlUnitGetCount(unsigned int *unitCount);
|
|
+
|
|
+/**
|
|
+ * Acquire the handle for a particular unit, based on its index.
|
|
+ *
|
|
+ * For S-class products.
|
|
+ *
|
|
+ * Valid indices are derived from the \a unitCount returned by \ref nvmlUnitGetCount().
|
|
+ * For example, if \a unitCount is 2 the valid indices are 0 and 1, corresponding to UNIT 0 and UNIT 1.
|
|
+ *
|
|
+ * The order in which NVML enumerates units has no guarantees of consistency between reboots.
|
|
+ *
|
|
+ * @param index The index of the target unit, >= 0 and < \a unitCount
|
|
+ * @param unit Reference in which to return the unit handle
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a unit has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a index is invalid or \a unit is NULL
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlUnitGetHandleByIndex(unsigned int index, nvmlUnit_t *unit);
|
|
+
|
|
+/**
|
|
+ * Retrieves the static information associated with a unit.
|
|
+ *
|
|
+ * For S-class products.
|
|
+ *
|
|
+ * See \ref nvmlUnitInfo_t for details on available unit info.
|
|
+ *
|
|
+ * @param unit The identifier of the target unit
|
|
+ * @param info Reference in which to return the unit information
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a info has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a unit is invalid or \a info is NULL
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlUnitGetUnitInfo(nvmlUnit_t unit, nvmlUnitInfo_t *info);
|
|
+
|
|
+/**
|
|
+ * Retrieves the LED state associated with this unit.
|
|
+ *
|
|
+ * For S-class products.
|
|
+ *
|
|
+ * See \ref nvmlLedState_t for details on allowed states.
|
|
+ *
|
|
+ * @param unit The identifier of the target unit
|
|
+ * @param state Reference in which to return the current LED state
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a state has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a unit is invalid or \a state is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if this is not an S-class product
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlUnitSetLedState()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlUnitGetLedState(nvmlUnit_t unit, nvmlLedState_t *state);
|
|
+
|
|
+/**
|
|
+ * Retrieves the PSU stats for the unit.
|
|
+ *
|
|
+ * For S-class products.
|
|
+ *
|
|
+ * See \ref nvmlPSUInfo_t for details on available PSU info.
|
|
+ *
|
|
+ * @param unit The identifier of the target unit
|
|
+ * @param psu Reference in which to return the PSU information
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a psu has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a unit is invalid or \a psu is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if this is not an S-class product
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlUnitGetPsuInfo(nvmlUnit_t unit, nvmlPSUInfo_t *psu);
|
|
+
|
|
+/**
|
|
+ * Retrieves the temperature readings for the unit, in degrees C.
|
|
+ *
|
|
+ * For S-class products.
|
|
+ *
|
|
+ * Depending on the product, readings may be available for intake (type=0),
|
|
+ * exhaust (type=1) and board (type=2).
|
|
+ *
|
|
+ * @param unit The identifier of the target unit
|
|
+ * @param type The type of reading to take
|
|
+ * @param temp Reference in which to return the intake temperature
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a temp has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a unit or \a type is invalid or \a temp is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if this is not an S-class product
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlUnitGetTemperature(nvmlUnit_t unit, unsigned int type, unsigned int *temp);
|
|
+
|
|
+/**
|
|
+ * Retrieves the fan speed readings for the unit.
|
|
+ *
|
|
+ * For S-class products.
|
|
+ *
|
|
+ * See \ref nvmlUnitFanSpeeds_t for details on available fan speed info.
|
|
+ *
|
|
+ * @param unit The identifier of the target unit
|
|
+ * @param fanSpeeds Reference in which to return the fan speed information
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a fanSpeeds has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a unit is invalid or \a fanSpeeds is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if this is not an S-class product
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlUnitGetFanSpeedInfo(nvmlUnit_t unit, nvmlUnitFanSpeeds_t *fanSpeeds);
|
|
+
|
|
+/**
|
|
+ * Retrieves the set of GPU devices that are attached to the specified unit.
|
|
+ *
|
|
+ * For S-class products.
|
|
+ *
|
|
+ * The \a deviceCount argument is expected to be set to the size of the input \a devices array.
|
|
+ *
|
|
+ * @param unit The identifier of the target unit
|
|
+ * @param deviceCount Reference in which to provide the \a devices array size, and
|
|
+ * to return the number of attached GPU devices
|
|
+ * @param devices Reference in which to return the references to the attached GPU devices
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a deviceCount and \a devices have been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a deviceCount indicates that the \a devices array is too small
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a unit is invalid, either of \a deviceCount or \a devices is NULL
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlUnitGetDevices(nvmlUnit_t unit, unsigned int *deviceCount, nvmlDevice_t *devices);
|
|
+
|
|
+/**
|
|
+ * Retrieves the IDs and firmware versions for any Host Interface Cards (HICs) in the system.
|
|
+ *
|
|
+ * For S-class products.
|
|
+ *
|
|
+ * The \a hwbcCount argument is expected to be set to the size of the input \a hwbcEntries array.
|
|
+ * The HIC must be connected to an S-class system for it to be reported by this function.
|
|
+ *
|
|
+ * @param hwbcCount Size of hwbcEntries array
|
|
+ * @param hwbcEntries Array holding information about hwbc
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a hwbcCount and \a hwbcEntries have been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if either \a hwbcCount or \a hwbcEntries is NULL
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a hwbcCount indicates that the \a hwbcEntries array is too small
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlSystemGetHicVersion(unsigned int *hwbcCount, nvmlHwbcEntry_t *hwbcEntries);
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlDeviceQueries Device Queries
|
|
+ * This chapter describes that queries that NVML can perform against each device.
|
|
+ * In each case the device is identified with an nvmlDevice_t handle. This handle is obtained by
|
|
+ * calling one of \ref nvmlDeviceGetHandleByIndex(), \ref nvmlDeviceGetHandleBySerial(),
|
|
+ * \ref nvmlDeviceGetHandleByPciBusId(). or \ref nvmlDeviceGetHandleByUUID().
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+ /**
|
|
+ * Retrieves the number of compute devices in the system. A compute device is a single GPU.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * Note: New nvmlDeviceGetCount_v2 (default in NVML 5.319) returns count of all devices in the system
|
|
+ * even if nvmlDeviceGetHandleByIndex_v2 returns NVML_ERROR_NO_PERMISSION for such device.
|
|
+ * Update your code to handle this error, or use NVML 4.304 or older nvml header file.
|
|
+ * For backward binary compatibility reasons _v1 version of the API is still present in the shared
|
|
+ * library.
|
|
+ * Old _v1 version of nvmlDeviceGetCount doesn't count devices that NVML has no permission to talk to.
|
|
+ *
|
|
+ * @param deviceCount Reference in which to return the number of accessible devices
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a deviceCount has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a deviceCount is NULL
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetCount(unsigned int *deviceCount);
|
|
+
|
|
+/**
|
|
+ * Acquire the handle for a particular device, based on its index.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * Valid indices are derived from the \a accessibleDevices count returned by
|
|
+ * \ref nvmlDeviceGetCount(). For example, if \a accessibleDevices is 2 the valid indices
|
|
+ * are 0 and 1, corresponding to GPU 0 and GPU 1.
|
|
+ *
|
|
+ * The order in which NVML enumerates devices has no guarantees of consistency between reboots. For that reason it
|
|
+ * is recommended that devices be looked up by their PCI ids or UUID. See
|
|
+ * \ref nvmlDeviceGetHandleByUUID() and \ref nvmlDeviceGetHandleByPciBusId().
|
|
+ *
|
|
+ * Note: The NVML index may not correlate with other APIs, such as the CUDA device index.
|
|
+ *
|
|
+ * Starting from NVML 5, this API causes NVML to initialize the target GPU
|
|
+ * NVML may initialize additional GPUs if:
|
|
+ * - The target GPU is an SLI slave
|
|
+ *
|
|
+ * Note: New nvmlDeviceGetCount_v2 (default in NVML 5.319) returns count of all devices in the system
|
|
+ * even if nvmlDeviceGetHandleByIndex_v2 returns NVML_ERROR_NO_PERMISSION for such device.
|
|
+ * Update your code to handle this error, or use NVML 4.304 or older nvml header file.
|
|
+ * For backward binary compatibility reasons _v1 version of the API is still present in the shared
|
|
+ * library.
|
|
+ * Old _v1 version of nvmlDeviceGetCount doesn't count devices that NVML has no permission to talk to.
|
|
+ *
|
|
+ * This means that nvmlDeviceGetHandleByIndex_v2 and _v1 can return different devices for the same index.
|
|
+ * If you don't touch macros that map old (_v1) versions to _v2 versions at the top of the file you don't
|
|
+ * need to worry about that.
|
|
+ *
|
|
+ * @param index The index of the target GPU, >= 0 and < \a accessibleDevices
|
|
+ * @param device Reference in which to return the device handle
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a device has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a index is invalid or \a device is NULL
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_POWER if any attached devices have improperly attached external power cables
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to talk to this device
|
|
+ * - \ref NVML_ERROR_IRQ_ISSUE if NVIDIA kernel detected an interrupt issue with the attached GPUs
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetIndex
|
|
+ * @see nvmlDeviceGetCount
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetHandleByIndex(unsigned int index, nvmlDevice_t *device);
|
|
+
|
|
+/**
|
|
+ * Acquire the handle for a particular device, based on its board serial number.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * This number corresponds to the value printed directly on the board, and to the value returned by
|
|
+ * \ref nvmlDeviceGetSerial().
|
|
+ *
|
|
+ * @deprecated Since more than one GPU can exist on a single board this function is deprecated in favor
|
|
+ * of \ref nvmlDeviceGetHandleByUUID.
|
|
+ * For dual GPU boards this function will return NVML_ERROR_INVALID_ARGUMENT.
|
|
+ *
|
|
+ * Starting from NVML 5, this API causes NVML to initialize the target GPU
|
|
+ * NVML may initialize additional GPUs as it searches for the target GPU
|
|
+ *
|
|
+ * @param serial The board serial number of the target GPU
|
|
+ * @param device Reference in which to return the device handle
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a device has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a serial is invalid, \a device is NULL or more than one
|
|
+ * device has the same serial (dual GPU boards)
|
|
+ * - \ref NVML_ERROR_NOT_FOUND if \a serial does not match a valid device on the system
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_POWER if any attached devices have improperly attached external power cables
|
|
+ * - \ref NVML_ERROR_IRQ_ISSUE if NVIDIA kernel detected an interrupt issue with the attached GPUs
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if any GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetSerial
|
|
+ * @see nvmlDeviceGetHandleByUUID
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetHandleBySerial(const char *serial, nvmlDevice_t *device);
|
|
+
|
|
+/**
|
|
+ * Acquire the handle for a particular device, based on its globally unique immutable UUID associated with each device.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * @param uuid The UUID of the target GPU
|
|
+ * @param device Reference in which to return the device handle
|
|
+ *
|
|
+ * Starting from NVML 5, this API causes NVML to initialize the target GPU
|
|
+ * NVML may initialize additional GPUs as it searches for the target GPU
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a device has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a uuid is invalid or \a device is null
|
|
+ * - \ref NVML_ERROR_NOT_FOUND if \a uuid does not match a valid device on the system
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_POWER if any attached devices have improperly attached external power cables
|
|
+ * - \ref NVML_ERROR_IRQ_ISSUE if NVIDIA kernel detected an interrupt issue with the attached GPUs
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if any GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetUUID
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetHandleByUUID(const char *uuid, nvmlDevice_t *device);
|
|
+
|
|
+/**
|
|
+ * Acquire the handle for a particular device, based on its PCI bus id.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * This value corresponds to the nvmlPciInfo_t::busId returned by \ref nvmlDeviceGetPciInfo().
|
|
+ *
|
|
+ * Starting from NVML 5, this API causes NVML to initialize the target GPU
|
|
+ * NVML may initialize additional GPUs if:
|
|
+ * - The target GPU is an SLI slave
|
|
+ *
|
|
+ * \note NVML 4.304 and older version of nvmlDeviceGetHandleByPciBusId"_v1" returns NVML_ERROR_NOT_FOUND
|
|
+ * instead of NVML_ERROR_NO_PERMISSION.
|
|
+ *
|
|
+ * @param pciBusId The PCI bus id of the target GPU
|
|
+ * @param device Reference in which to return the device handle
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a device has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a pciBusId is invalid or \a device is NULL
|
|
+ * - \ref NVML_ERROR_NOT_FOUND if \a pciBusId does not match a valid device on the system
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_POWER if the attached device has improperly attached external power cables
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to talk to this device
|
|
+ * - \ref NVML_ERROR_IRQ_ISSUE if NVIDIA kernel detected an interrupt issue with the attached GPUs
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetHandleByPciBusId(const char *pciBusId, nvmlDevice_t *device);
|
|
+
|
|
+/**
|
|
+ * Retrieves the name of this device.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * The name is an alphanumeric string that denotes a particular product, e.g. Tesla &tm; C2070. It will not
|
|
+ * exceed 64 characters in length (including the NULL terminator). See \ref
|
|
+ * nvmlConstants::NVML_DEVICE_NAME_BUFFER_SIZE.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param name Reference in which to return the product name
|
|
+ * @param length The maximum allowed length of the string returned in \a name
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a name has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, or \a name is NULL
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a length is too small
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetName(nvmlDevice_t device, char *name, unsigned int length);
|
|
+
|
|
+/**
|
|
+ * Retrieves the brand of this device.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * The type is a member of \ref nvmlBrandType_t defined above.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param type Reference in which to return the product brand type
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a name has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, or \a type is NULL
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetBrand(nvmlDevice_t device, nvmlBrandType_t *type);
|
|
+
|
|
+/**
|
|
+ * Retrieves the NVML index of this device.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * Valid indices are derived from the \a accessibleDevices count returned by
|
|
+ * \ref nvmlDeviceGetCount(). For example, if \a accessibleDevices is 2 the valid indices
|
|
+ * are 0 and 1, corresponding to GPU 0 and GPU 1.
|
|
+ *
|
|
+ * The order in which NVML enumerates devices has no guarantees of consistency between reboots. For that reason it
|
|
+ * is recommended that devices be looked up by their PCI ids or GPU UUID. See
|
|
+ * \ref nvmlDeviceGetHandleByPciBusId() and \ref nvmlDeviceGetHandleByUUID().
|
|
+ *
|
|
+ * Note: The NVML index may not correlate with other APIs, such as the CUDA device index.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param index Reference in which to return the NVML index of the device
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a index has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, or \a index is NULL
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetHandleByIndex()
|
|
+ * @see nvmlDeviceGetCount()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetIndex(nvmlDevice_t device, unsigned int *index);
|
|
+
|
|
+/**
|
|
+ * Retrieves the globally unique board serial number associated with this device's board.
|
|
+ *
|
|
+ * For all products with an inforom.
|
|
+ *
|
|
+ * The serial number is an alphanumeric string that will not exceed 30 characters (including the NULL terminator).
|
|
+ * This number matches the serial number tag that is physically attached to the board. See \ref
|
|
+ * nvmlConstants::NVML_DEVICE_SERIAL_BUFFER_SIZE.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param serial Reference in which to return the board/module serial number
|
|
+ * @param length The maximum allowed length of the string returned in \a serial
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a serial has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, or \a serial is NULL
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a length is too small
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetSerial(nvmlDevice_t device, char *serial, unsigned int length);
|
|
+
|
|
+/**
|
|
+ * Retrieves an array of unsigned ints (sized to cpuSetSize) of bitmasks with the ideal CPU affinity for the device
|
|
+ * For example, if processors 0, 1, 32, and 33 are ideal for the device and cpuSetSize == 2,
|
|
+ * result[0] = 0x3, result[1] = 0x3
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ * Supported on Linux only.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param cpuSetSize The size of the cpuSet array that is safe to access
|
|
+ * @param cpuSet Array reference in which to return a bitmask of CPUs, 64 CPUs per
|
|
+ * unsigned long on 64-bit machines, 32 on 32-bit machines
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a cpuAffinity has been filled
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, cpuSetSize == 0, or cpuSet is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetCpuAffinity(nvmlDevice_t device, unsigned int cpuSetSize, unsigned long *cpuSet);
|
|
+
|
|
+/**
|
|
+ * Sets the ideal affinity for the calling thread and device using the guidelines
|
|
+ * given in nvmlDeviceGetCpuAffinity(). Note, this is a change as of version 8.0.
|
|
+ * Older versions set the affinity for a calling process and all children.
|
|
+ * Currently supports up to 64 processors.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ * Supported on Linux only.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the calling process has been successfully bound
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetCpuAffinity(nvmlDevice_t device);
|
|
+
|
|
+/**
|
|
+ * Clear all affinity bindings for the calling thread. Note, this is a change as of version
|
|
+ * 8.0 as older versions cleared the affinity for a calling process and all children.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ * Supported on Linux only.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the calling process has been successfully unbound
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceClearCpuAffinity(nvmlDevice_t device);
|
|
+
|
|
+/**
|
|
+ * Retrieve the common ancestor for two devices
|
|
+ * For all products.
|
|
+ * Supported on Linux only.
|
|
+ *
|
|
+ * @param device1 The identifier of the first device
|
|
+ * @param device2 The identifier of the second device
|
|
+ * @param pathInfo A \ref nvmlGpuTopologyLevel_t that gives the path type
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a pathInfo has been set
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device1, or \a device2 is invalid, or \a pathInfo is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device or OS does not support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN an error has occurred in underlying topology discovery
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetTopologyCommonAncestor(nvmlDevice_t device1, nvmlDevice_t device2, nvmlGpuTopologyLevel_t *pathInfo);
|
|
+
|
|
+/**
|
|
+ * Retrieve the set of GPUs that are nearest to a given device at a specific interconnectivity level
|
|
+ * For all products.
|
|
+ * Supported on Linux only.
|
|
+ *
|
|
+ * @param device The identifier of the first device
|
|
+ * @param level The \ref nvmlGpuTopologyLevel_t level to search for other GPUs
|
|
+ * @param count When zero, is set to the number of matching GPUs such that \a deviceArray
|
|
+ * can be malloc'd. When non-zero, \a deviceArray will be filled with \a count
|
|
+ * number of device handles.
|
|
+ * @param deviceArray An array of device handles for GPUs found at \a level
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a deviceArray or \a count (if initially zero) has been set
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device, \a level, or \a count is invalid, or \a deviceArray is NULL with a non-zero \a count
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device or OS does not support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN an error has occurred in underlying topology discovery
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetTopologyNearestGpus(nvmlDevice_t device, nvmlGpuTopologyLevel_t level, unsigned int *count, nvmlDevice_t *deviceArray);
|
|
+
|
|
+/**
|
|
+ * Retrieve the set of GPUs that have a CPU affinity with the given CPU number
|
|
+ * For all products.
|
|
+ * Supported on Linux only.
|
|
+ *
|
|
+ * @param cpuNumber The CPU number
|
|
+ * @param count When zero, is set to the number of matching GPUs such that \a deviceArray
|
|
+ * can be malloc'd. When non-zero, \a deviceArray will be filled with \a count
|
|
+ * number of device handles.
|
|
+ * @param deviceArray An array of device handles for GPUs found with affinity to \a cpuNumber
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a deviceArray or \a count (if initially zero) has been set
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a cpuNumber, or \a count is invalid, or \a deviceArray is NULL with a non-zero \a count
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device or OS does not support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN an error has occurred in underlying topology discovery
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlSystemGetTopologyGpuSet(unsigned int cpuNumber, unsigned int *count, nvmlDevice_t *deviceArray);
|
|
+
|
|
+/**
|
|
+ * Retrieve the status for a given p2p capability index between a given pair of GPU
|
|
+ *
|
|
+ * @param device1 The first device
|
|
+ * @param device2 The second device
|
|
+ * @param p2pIndex p2p Capability Index being looked for between \a device1 and \a device2
|
|
+ * @param p2pStatus Reference in which to return the status of the \a p2pIndex
|
|
+ * between \a device1 and \a device2
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a p2pStatus has been populated
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device1 or \a device2 or \a p2pIndex is invalid or \a p2pStatus is NULL
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetP2PStatus(nvmlDevice_t device1, nvmlDevice_t device2, nvmlGpuP2PCapsIndex_t p2pIndex,nvmlGpuP2PStatus_t *p2pStatus);
|
|
+
|
|
+
|
|
+/**
|
|
+ * Retrieves the globally unique immutable UUID associated with this device, as a 5 part hexadecimal string,
|
|
+ * that augments the immutable, board serial identifier.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * The UUID is a globally unique identifier. It is the only available identifier for pre-Fermi-architecture products.
|
|
+ * It does NOT correspond to any identifier printed on the board. It will not exceed 80 characters in length
|
|
+ * (including the NULL terminator). See \ref nvmlConstants::NVML_DEVICE_UUID_BUFFER_SIZE.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param uuid Reference in which to return the GPU UUID
|
|
+ * @param length The maximum allowed length of the string returned in \a uuid
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a uuid has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, or \a uuid is NULL
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a length is too small
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetUUID(nvmlDevice_t device, char *uuid, unsigned int length);
|
|
+
|
|
+/**
|
|
+ * Retrieves minor number for the device. The minor number for the device is such that the Nvidia device node file for
|
|
+ * each GPU will have the form /dev/nvidia[minor number].
|
|
+ *
|
|
+ * For all products.
|
|
+ * Supported only for Linux
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param minorNumber Reference in which to return the minor number for the device
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the minor number is successfully retrieved
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a minorNumber is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if this query is not supported by the device
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetMinorNumber(nvmlDevice_t device, unsigned int *minorNumber);
|
|
+
|
|
+/**
|
|
+ * Retrieves the the device board part number which is programmed into the board's InfoROM
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * @param device Identifier of the target device
|
|
+ * @param partNumber Reference to the buffer to return
|
|
+ * @param length Length of the buffer reference
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a partNumber has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the needed VBIOS fields have not been filled
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a serial is NULL
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetBoardPartNumber(nvmlDevice_t device, char* partNumber, unsigned int length);
|
|
+
|
|
+/**
|
|
+ * Retrieves the version information for the device's infoROM object.
|
|
+ *
|
|
+ * For all products with an inforom.
|
|
+ *
|
|
+ * Fermi and higher parts have non-volatile on-board memory for persisting device info, such as aggregate
|
|
+ * ECC counts. The version of the data structures in this memory may change from time to time. It will not
|
|
+ * exceed 16 characters in length (including the NULL terminator).
|
|
+ * See \ref nvmlConstants::NVML_DEVICE_INFOROM_VERSION_BUFFER_SIZE.
|
|
+ *
|
|
+ * See \ref nvmlInforomObject_t for details on the available infoROM objects.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param object The target infoROM object
|
|
+ * @param version Reference in which to return the infoROM version
|
|
+ * @param length The maximum allowed length of the string returned in \a version
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a version has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a version is NULL
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a length is too small
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not have an infoROM
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetInforomImageVersion
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetInforomVersion(nvmlDevice_t device, nvmlInforomObject_t object, char *version, unsigned int length);
|
|
+
|
|
+/**
|
|
+ * Retrieves the global infoROM image version
|
|
+ *
|
|
+ * For all products with an inforom.
|
|
+ *
|
|
+ * Image version just like VBIOS version uniquely describes the exact version of the infoROM flashed on the board
|
|
+ * in contrast to infoROM object version which is only an indicator of supported features.
|
|
+ * Version string will not exceed 16 characters in length (including the NULL terminator).
|
|
+ * See \ref nvmlConstants::NVML_DEVICE_INFOROM_VERSION_BUFFER_SIZE.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param version Reference in which to return the infoROM image version
|
|
+ * @param length The maximum allowed length of the string returned in \a version
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a version has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a version is NULL
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a length is too small
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not have an infoROM
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetInforomVersion
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetInforomImageVersion(nvmlDevice_t device, char *version, unsigned int length);
|
|
+
|
|
+/**
|
|
+ * Retrieves the checksum of the configuration stored in the device's infoROM.
|
|
+ *
|
|
+ * For all products with an inforom.
|
|
+ *
|
|
+ * Can be used to make sure that two GPUs have the exact same configuration.
|
|
+ * Current checksum takes into account configuration stored in PWR and ECC infoROM objects.
|
|
+ * Checksum can change between driver releases or when user changes configuration (e.g. disable/enable ECC)
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param checksum Reference in which to return the infoROM configuration checksum
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a checksum has been set
|
|
+ * - \ref NVML_ERROR_CORRUPTED_INFOROM if the device's checksum couldn't be retrieved due to infoROM corruption
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a checksum is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetInforomConfigurationChecksum(nvmlDevice_t device, unsigned int *checksum);
|
|
+
|
|
+/**
|
|
+ * Reads the infoROM from the flash and verifies the checksums.
|
|
+ *
|
|
+ * For all products with an inforom.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if infoROM is not corrupted
|
|
+ * - \ref NVML_ERROR_CORRUPTED_INFOROM if the device's infoROM is corrupted
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceValidateInforom(nvmlDevice_t device);
|
|
+
|
|
+/**
|
|
+ * Retrieves the display mode for the device.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * This method indicates whether a physical display (e.g. monitor) is currently connected to
|
|
+ * any of the device's connectors.
|
|
+ *
|
|
+ * See \ref nvmlEnableState_t for details on allowed modes.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param display Reference in which to return the display mode
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a display has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a display is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetDisplayMode(nvmlDevice_t device, nvmlEnableState_t *display);
|
|
+
|
|
+/**
|
|
+ * Retrieves the display active state for the device.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * This method indicates whether a display is initialized on the device.
|
|
+ * For example whether X Server is attached to this device and has allocated memory for the screen.
|
|
+ *
|
|
+ * Display can be active even when no monitor is physically attached.
|
|
+ *
|
|
+ * See \ref nvmlEnableState_t for details on allowed modes.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param isActive Reference in which to return the display active state
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a isActive has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a isActive is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetDisplayActive(nvmlDevice_t device, nvmlEnableState_t *isActive);
|
|
+
|
|
+/**
|
|
+ * Retrieves the persistence mode associated with this device.
|
|
+ *
|
|
+ * For all products.
|
|
+ * For Linux only.
|
|
+ *
|
|
+ * When driver persistence mode is enabled the driver software state is not torn down when the last
|
|
+ * client disconnects. By default this feature is disabled.
|
|
+ *
|
|
+ * See \ref nvmlEnableState_t for details on allowed modes.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param mode Reference in which to return the current driver persistence mode
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a mode has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a mode is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceSetPersistenceMode()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetPersistenceMode(nvmlDevice_t device, nvmlEnableState_t *mode);
|
|
+
|
|
+/**
|
|
+ * Retrieves the PCI attributes of this device.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * See \ref nvmlPciInfo_t for details on the available PCI info.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param pci Reference in which to return the PCI info
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a pci has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a pci is NULL
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetPciInfo(nvmlDevice_t device, nvmlPciInfo_t *pci);
|
|
+
|
|
+/**
|
|
+ * Retrieves the maximum PCIe link generation possible with this device and system
|
|
+ *
|
|
+ * I.E. for a generation 2 PCIe device attached to a generation 1 PCIe bus the max link generation this function will
|
|
+ * report is generation 1.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param maxLinkGen Reference in which to return the max PCIe link generation
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a maxLinkGen has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a maxLinkGen is null
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if PCIe link information is not available
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetMaxPcieLinkGeneration(nvmlDevice_t device, unsigned int *maxLinkGen);
|
|
+
|
|
+/**
|
|
+ * Retrieves the maximum PCIe link width possible with this device and system
|
|
+ *
|
|
+ * I.E. for a device with a 16x PCIe bus width attached to a 8x PCIe system bus this function will report
|
|
+ * a max link width of 8.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param maxLinkWidth Reference in which to return the max PCIe link generation
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a maxLinkWidth has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a maxLinkWidth is null
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if PCIe link information is not available
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetMaxPcieLinkWidth(nvmlDevice_t device, unsigned int *maxLinkWidth);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current PCIe link generation
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param currLinkGen Reference in which to return the current PCIe link generation
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a currLinkGen has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a currLinkGen is null
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if PCIe link information is not available
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetCurrPcieLinkGeneration(nvmlDevice_t device, unsigned int *currLinkGen);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current PCIe link width
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param currLinkWidth Reference in which to return the current PCIe link generation
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a currLinkWidth has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a currLinkWidth is null
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if PCIe link information is not available
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetCurrPcieLinkWidth(nvmlDevice_t device, unsigned int *currLinkWidth);
|
|
+
|
|
+/**
|
|
+ * Retrieve PCIe utilization information.
|
|
+ * This function is querying a byte counter over a 20ms interval and thus is the
|
|
+ * PCIe throughput over that interval.
|
|
+ *
|
|
+ * For Maxwell &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * This method is not supported on virtualized GPU environments.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param counter The specific counter that should be queried \ref nvmlPcieUtilCounter_t
|
|
+ * @param value Reference in which to return throughput in KB/s
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a value has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device or \a counter is invalid, or \a value is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetPcieThroughput(nvmlDevice_t device, nvmlPcieUtilCounter_t counter, unsigned int *value);
|
|
+
|
|
+/**
|
|
+ * Retrieve the PCIe replay counter.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param value Reference in which to return the counter's value
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a value and \a rollover have been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, or \a value or \a rollover are NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetPcieReplayCounter(nvmlDevice_t device, unsigned int *value);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current clock speeds for the device.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * See \ref nvmlClockType_t for details on available clock information.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param type Identify which clock domain to query
|
|
+ * @param clock Reference in which to return the clock speed in MHz
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a clock has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a clock is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device cannot report the specified clock
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetClockInfo(nvmlDevice_t device, nvmlClockType_t type, unsigned int *clock);
|
|
+
|
|
+/**
|
|
+ * Retrieves the maximum clock speeds for the device.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * See \ref nvmlClockType_t for details on available clock information.
|
|
+ *
|
|
+ * \note On GPUs from Fermi family current P0 clocks (reported by \ref nvmlDeviceGetClockInfo) can differ from max clocks
|
|
+ * by few MHz.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param type Identify which clock domain to query
|
|
+ * @param clock Reference in which to return the clock speed in MHz
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a clock has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a clock is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device cannot report the specified clock
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetMaxClockInfo(nvmlDevice_t device, nvmlClockType_t type, unsigned int *clock);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current setting of a clock that applications will use unless an overspec situation occurs.
|
|
+ * Can be changed using \ref nvmlDeviceSetApplicationsClocks.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param clockType Identify which clock domain to query
|
|
+ * @param clockMHz Reference in which to return the clock in MHz
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a clockMHz has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a clockMHz is NULL or \a clockType is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetApplicationsClock(nvmlDevice_t device, nvmlClockType_t clockType, unsigned int *clockMHz);
|
|
+
|
|
+/**
|
|
+ * Retrieves the default applications clock that GPU boots with or
|
|
+ * defaults to after \ref nvmlDeviceResetApplicationsClocks call.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param clockType Identify which clock domain to query
|
|
+ * @param clockMHz Reference in which to return the default clock in MHz
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a clockMHz has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a clockMHz is NULL or \a clockType is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * \see nvmlDeviceGetApplicationsClock
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetDefaultApplicationsClock(nvmlDevice_t device, nvmlClockType_t clockType, unsigned int *clockMHz);
|
|
+
|
|
+/**
|
|
+ * Resets the application clock to the default value
|
|
+ *
|
|
+ * This is the applications clock that will be used after system reboot or driver reload.
|
|
+ * Default value is constant, but the current value an be changed using \ref nvmlDeviceSetApplicationsClocks.
|
|
+ *
|
|
+ * On Pascal and newer hardware, if clocks were previously locked with \ref nvmlDeviceSetApplicationsClocks,
|
|
+ * this call will unlock clocks. This returns clocks their default behavior ofautomatically boosting above
|
|
+ * base clocks as thermal limits allow.
|
|
+ *
|
|
+ * @see nvmlDeviceGetApplicationsClock
|
|
+ * @see nvmlDeviceSetApplicationsClocks
|
|
+ *
|
|
+ * For Fermi &tm; or newer non-GeForce fully supported devices and Maxwell or newer GeForce devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if new settings were successfully set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceResetApplicationsClocks(nvmlDevice_t device);
|
|
+
|
|
+/**
|
|
+ * Retrieves the clock speed for the clock specified by the clock type and clock ID.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param clockType Identify which clock domain to query
|
|
+ * @param clockId Identify which clock in the domain to query
|
|
+ * @param clockMHz Reference in which to return the clock in MHz
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a clockMHz has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a clockMHz is NULL or \a clockType is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetClock(nvmlDevice_t device, nvmlClockType_t clockType, nvmlClockId_t clockId, unsigned int *clockMHz);
|
|
+
|
|
+/**
|
|
+ * Retrieves the customer defined maximum boost clock speed specified by the given clock type.
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param clockType Identify which clock domain to query
|
|
+ * @param clockMHz Reference in which to return the clock in MHz
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a clockMHz has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a clockMHz is NULL or \a clockType is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device or the \a clockType on this device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetMaxCustomerBoostClock(nvmlDevice_t device, nvmlClockType_t clockType, unsigned int *clockMHz);
|
|
+
|
|
+/**
|
|
+ * Retrieves the list of possible memory clocks that can be used as an argument for \ref nvmlDeviceSetApplicationsClocks.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param count Reference in which to provide the \a clocksMHz array size, and
|
|
+ * to return the number of elements
|
|
+ * @param clocksMHz Reference in which to return the clock in MHz
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a count and \a clocksMHz have been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a count is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a count is too small (\a count is set to the number of
|
|
+ * required elements)
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceSetApplicationsClocks
|
|
+ * @see nvmlDeviceGetSupportedGraphicsClocks
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetSupportedMemoryClocks(nvmlDevice_t device, unsigned int *count, unsigned int *clocksMHz);
|
|
+
|
|
+/**
|
|
+ * Retrieves the list of possible graphics clocks that can be used as an argument for \ref nvmlDeviceSetApplicationsClocks.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param memoryClockMHz Memory clock for which to return possible graphics clocks
|
|
+ * @param count Reference in which to provide the \a clocksMHz array size, and
|
|
+ * to return the number of elements
|
|
+ * @param clocksMHz Reference in which to return the clocks in MHz
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a count and \a clocksMHz have been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_NOT_FOUND if the specified \a memoryClockMHz is not a supported frequency
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a clock is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a count is too small
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceSetApplicationsClocks
|
|
+ * @see nvmlDeviceGetSupportedMemoryClocks
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetSupportedGraphicsClocks(nvmlDevice_t device, unsigned int memoryClockMHz, unsigned int *count, unsigned int *clocksMHz);
|
|
+
|
|
+/**
|
|
+ * Retrieve the current state of Auto Boosted clocks on a device and store it in \a isEnabled
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * Auto Boosted clocks are enabled by default on some hardware, allowing the GPU to run at higher clock rates
|
|
+ * to maximize performance as thermal limits allow.
|
|
+ *
|
|
+ * On Pascal and newer hardware, Auto Aoosted clocks are controlled through application clocks.
|
|
+ * Use \ref nvmlDeviceSetApplicationsClocks and \ref nvmlDeviceResetApplicationsClocks to control Auto Boost
|
|
+ * behavior.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param isEnabled Where to store the current state of Auto Boosted clocks of the target device
|
|
+ * @param defaultIsEnabled Where to store the default Auto Boosted clocks behavior of the target device that the device will
|
|
+ * revert to when no applications are using the GPU
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS If \a isEnabled has been been set with the Auto Boosted clocks state of \a device
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a isEnabled is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support Auto Boosted clocks
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetAutoBoostedClocksEnabled(nvmlDevice_t device, nvmlEnableState_t *isEnabled, nvmlEnableState_t *defaultIsEnabled);
|
|
+
|
|
+/**
|
|
+ * Try to set the current state of Auto Boosted clocks on a device.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * Auto Boosted clocks are enabled by default on some hardware, allowing the GPU to run at higher clock rates
|
|
+ * to maximize performance as thermal limits allow. Auto Boosted clocks should be disabled if fixed clock
|
|
+ * rates are desired.
|
|
+ *
|
|
+ * Non-root users may use this API by default but can be restricted by root from using this API by calling
|
|
+ * \ref nvmlDeviceSetAPIRestriction with apiType=NVML_RESTRICTED_API_SET_AUTO_BOOSTED_CLOCKS.
|
|
+ * Note: Persistence Mode is required to modify current Auto Boost settings, therefore, it must be enabled.
|
|
+ *
|
|
+ * On Pascal and newer hardware, Auto Boosted clocks are controlled through application clocks.
|
|
+ * Use \ref nvmlDeviceSetApplicationsClocks and \ref nvmlDeviceResetApplicationsClocks to control Auto Boost
|
|
+ * behavior.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param enabled What state to try to set Auto Boosted clocks of the target device to
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS If the Auto Boosted clocks were successfully set to the state specified by \a enabled
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support Auto Boosted clocks
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetAutoBoostedClocksEnabled(nvmlDevice_t device, nvmlEnableState_t enabled);
|
|
+
|
|
+/**
|
|
+ * Try to set the default state of Auto Boosted clocks on a device. This is the default state that Auto Boosted clocks will
|
|
+ * return to when no compute running processes (e.g. CUDA application which have an active context) are running
|
|
+ *
|
|
+ * For Kepler &tm; or newer non-GeForce fully supported devices and Maxwell or newer GeForce devices.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * Auto Boosted clocks are enabled by default on some hardware, allowing the GPU to run at higher clock rates
|
|
+ * to maximize performance as thermal limits allow. Auto Boosted clocks should be disabled if fixed clock
|
|
+ * rates are desired.
|
|
+ *
|
|
+ * On Pascal and newer hardware, Auto Boosted clocks are controlled through application clocks.
|
|
+ * Use \ref nvmlDeviceSetApplicationsClocks and \ref nvmlDeviceResetApplicationsClocks to control Auto Boost
|
|
+ * behavior.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param enabled What state to try to set default Auto Boosted clocks of the target device to
|
|
+ * @param flags Flags that change the default behavior. Currently Unused.
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS If the Auto Boosted clock's default state was successfully set to the state specified by \a enabled
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION If the calling user does not have permission to change Auto Boosted clock's default state.
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support Auto Boosted clocks
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetDefaultAutoBoostedClocksEnabled(nvmlDevice_t device, nvmlEnableState_t enabled, unsigned int flags);
|
|
+
|
|
+
|
|
+/**
|
|
+ * Retrieves the intended operating speed of the device's fan.
|
|
+ *
|
|
+ * Note: The reported speed is the intended fan speed. If the fan is physically blocked and unable to spin, the
|
|
+ * output will not match the actual fan speed.
|
|
+ *
|
|
+ * For all discrete products with dedicated fans.
|
|
+ *
|
|
+ * The fan speed is expressed as a percent of the maximum, i.e. full speed is 100%.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param speed Reference in which to return the fan speed percentage
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a speed has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a speed is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not have a fan
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetFanSpeed(nvmlDevice_t device, unsigned int *speed);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current temperature readings for the device, in degrees C.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * See \ref nvmlTemperatureSensors_t for details on available temperature sensors.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param sensorType Flag that indicates which sensor reading to retrieve
|
|
+ * @param temp Reference in which to return the temperature reading
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a temp has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, \a sensorType is invalid or \a temp is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not have the specified sensor
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetTemperature(nvmlDevice_t device, nvmlTemperatureSensors_t sensorType, unsigned int *temp);
|
|
+
|
|
+/**
|
|
+ * Retrieves the temperature threshold for the GPU with the specified threshold type in degrees C.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * See \ref nvmlTemperatureThresholds_t for details on available temperature thresholds.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param thresholdType The type of threshold value queried
|
|
+ * @param temp Reference in which to return the temperature reading
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a temp has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, \a thresholdType is invalid or \a temp is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not have a temperature sensor or is unsupported
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetTemperatureThreshold(nvmlDevice_t device, nvmlTemperatureThresholds_t thresholdType, unsigned int *temp);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current performance state for the device.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * See \ref nvmlPstates_t for details on allowed performance states.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param pState Reference in which to return the performance state reading
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a pState has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a pState is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetPerformanceState(nvmlDevice_t device, nvmlPstates_t *pState);
|
|
+
|
|
+/**
|
|
+ * Retrieves current clocks throttling reasons.
|
|
+ *
|
|
+ * For all fully supported products.
|
|
+ *
|
|
+ * \note More than one bit can be enabled at the same time. Multiple reasons can be affecting clocks at once.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param clocksThrottleReasons Reference in which to return bitmask of active clocks throttle
|
|
+ * reasons
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a clocksThrottleReasons has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a clocksThrottleReasons is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlClocksThrottleReasons
|
|
+ * @see nvmlDeviceGetSupportedClocksThrottleReasons
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetCurrentClocksThrottleReasons(nvmlDevice_t device, unsigned long long *clocksThrottleReasons);
|
|
+
|
|
+/**
|
|
+ * Retrieves bitmask of supported clocks throttle reasons that can be returned by
|
|
+ * \ref nvmlDeviceGetCurrentClocksThrottleReasons
|
|
+ *
|
|
+ * For all fully supported products.
|
|
+ *
|
|
+ * This method is not supported on virtualized GPU environments.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param supportedClocksThrottleReasons Reference in which to return bitmask of supported
|
|
+ * clocks throttle reasons
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a supportedClocksThrottleReasons has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a supportedClocksThrottleReasons is NULL
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlClocksThrottleReasons
|
|
+ * @see nvmlDeviceGetCurrentClocksThrottleReasons
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetSupportedClocksThrottleReasons(nvmlDevice_t device, unsigned long long *supportedClocksThrottleReasons);
|
|
+
|
|
+/**
|
|
+ * Deprecated: Use \ref nvmlDeviceGetPerformanceState. This function exposes an incorrect generalization.
|
|
+ *
|
|
+ * Retrieve the current performance state for the device.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * See \ref nvmlPstates_t for details on allowed performance states.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param pState Reference in which to return the performance state reading
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a pState has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a pState is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetPowerState(nvmlDevice_t device, nvmlPstates_t *pState);
|
|
+
|
|
+/**
|
|
+ * This API has been deprecated.
|
|
+ *
|
|
+ * Retrieves the power management mode associated with this device.
|
|
+ *
|
|
+ * For products from the Fermi family.
|
|
+ * - Requires \a NVML_INFOROM_POWER version 3.0 or higher.
|
|
+ *
|
|
+ * For from the Kepler or newer families.
|
|
+ * - Does not require \a NVML_INFOROM_POWER object.
|
|
+ *
|
|
+ * This flag indicates whether any power management algorithm is currently active on the device. An
|
|
+ * enabled state does not necessarily mean the device is being actively throttled -- only that
|
|
+ * that the driver will do so if the appropriate conditions are met.
|
|
+ *
|
|
+ * See \ref nvmlEnableState_t for details on allowed modes.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param mode Reference in which to return the current power management mode
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a mode has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a mode is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetPowerManagementMode(nvmlDevice_t device, nvmlEnableState_t *mode);
|
|
+
|
|
+/**
|
|
+ * Retrieves the power management limit associated with this device.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * The power limit defines the upper boundary for the card's power draw. If
|
|
+ * the card's total power draw reaches this limit the power management algorithm kicks in.
|
|
+ *
|
|
+ * This reading is only available if power management mode is supported.
|
|
+ * See \ref nvmlDeviceGetPowerManagementMode.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param limit Reference in which to return the power management limit in milliwatts
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a limit has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a limit is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetPowerManagementLimit(nvmlDevice_t device, unsigned int *limit);
|
|
+
|
|
+/**
|
|
+ * Retrieves information about possible values of power management limits on this device.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param minLimit Reference in which to return the minimum power management limit in milliwatts
|
|
+ * @param maxLimit Reference in which to return the maximum power management limit in milliwatts
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a minLimit and \a maxLimit have been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a minLimit or \a maxLimit is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceSetPowerManagementLimit
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetPowerManagementLimitConstraints(nvmlDevice_t device, unsigned int *minLimit, unsigned int *maxLimit);
|
|
+
|
|
+/**
|
|
+ * Retrieves default power management limit on this device, in milliwatts.
|
|
+ * Default power management limit is a power management limit that the device boots with.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param defaultLimit Reference in which to return the default power management limit in milliwatts
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a defaultLimit has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a defaultLimit is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetPowerManagementDefaultLimit(nvmlDevice_t device, unsigned int *defaultLimit);
|
|
+
|
|
+/**
|
|
+ * Retrieves power usage for this GPU in milliwatts and its associated circuitry (e.g. memory)
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * On Fermi and Kepler GPUs the reading is accurate to within +/- 5% of current power draw.
|
|
+ *
|
|
+ * It is only available if power management mode is supported. See \ref nvmlDeviceGetPowerManagementMode.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param power Reference in which to return the power usage information
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a power has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a power is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support power readings
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetPowerUsage(nvmlDevice_t device, unsigned int *power);
|
|
+
|
|
+/**
|
|
+ * Get the effective power limit that the driver enforces after taking into account all limiters
|
|
+ *
|
|
+ * Note: This can be different from the \ref nvmlDeviceGetPowerManagementLimit if other limits are set elsewhere
|
|
+ * This includes the out of band power limit interface
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The device to communicate with
|
|
+ * @param limit Reference in which to return the power management limit in milliwatts
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a limit has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a limit is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetEnforcedPowerLimit(nvmlDevice_t device, unsigned int *limit);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current GOM and pending GOM (the one that GPU will switch to after reboot).
|
|
+ *
|
|
+ * For GK110 M-class and X-class Tesla &tm; products from the Kepler family.
|
|
+ * Modes \ref NVML_GOM_LOW_DP and \ref NVML_GOM_ALL_ON are supported on fully supported GeForce products.
|
|
+ * Not supported on Quadro ® and Tesla &tm; C-class products.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param current Reference in which to return the current GOM
|
|
+ * @param pending Reference in which to return the pending GOM
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a mode has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a current or \a pending is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlGpuOperationMode_t
|
|
+ * @see nvmlDeviceSetGpuOperationMode
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetGpuOperationMode(nvmlDevice_t device, nvmlGpuOperationMode_t *current, nvmlGpuOperationMode_t *pending);
|
|
+
|
|
+/**
|
|
+ * Retrieves the amount of used, free and total memory available on the device, in bytes.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * Enabling ECC reduces the amount of total available memory, due to the extra required parity bits.
|
|
+ * Under WDDM most device memory is allocated and managed on startup by Windows.
|
|
+ *
|
|
+ * Under Linux and Windows TCC, the reported amount of used memory is equal to the sum of memory allocated
|
|
+ * by all active channels on the device.
|
|
+ *
|
|
+ * See \ref nvmlMemory_t for details on available memory info.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param memory Reference in which to return the memory information
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a memory has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a memory is NULL
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetMemoryInfo(nvmlDevice_t device, nvmlMemory_t *memory);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current compute mode for the device.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * See \ref nvmlComputeMode_t for details on allowed compute modes.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param mode Reference in which to return the current compute mode
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a mode has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a mode is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceSetComputeMode()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetComputeMode(nvmlDevice_t device, nvmlComputeMode_t *mode);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current and pending ECC modes for the device.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ * Only applicable to devices with ECC.
|
|
+ * Requires \a NVML_INFOROM_ECC version 1.0 or higher.
|
|
+ *
|
|
+ * Changing ECC modes requires a reboot. The "pending" ECC mode refers to the target mode following
|
|
+ * the next reboot.
|
|
+ *
|
|
+ * See \ref nvmlEnableState_t for details on allowed modes.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param current Reference in which to return the current ECC mode
|
|
+ * @param pending Reference in which to return the pending ECC mode
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a current and \a pending have been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or either \a current or \a pending is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceSetEccMode()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetEccMode(nvmlDevice_t device, nvmlEnableState_t *current, nvmlEnableState_t *pending);
|
|
+
|
|
+/**
|
|
+ * Retrieves the device boardId from 0-N.
|
|
+ * Devices with the same boardId indicate GPUs connected to the same PLX. Use in conjunction with
|
|
+ * \ref nvmlDeviceGetMultiGpuBoard() to decide if they are on the same board as well.
|
|
+ * The boardId returned is a unique ID for the current configuration. Uniqueness and ordering across
|
|
+ * reboots and system configurations is not guaranteed (i.e. if a Tesla K40c returns 0x100 and
|
|
+ * the two GPUs on a Tesla K10 in the same system returns 0x200 it is not guaranteed they will
|
|
+ * always return those values but they will always be different from each other).
|
|
+ *
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param boardId Reference in which to return the device's board ID
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a boardId has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a boardId is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetBoardId(nvmlDevice_t device, unsigned int *boardId);
|
|
+
|
|
+/**
|
|
+ * Retrieves whether the device is on a Multi-GPU Board
|
|
+ * Devices that are on multi-GPU boards will set \a multiGpuBool to a non-zero value.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param multiGpuBool Reference in which to return a zero or non-zero value
|
|
+ * to indicate whether the device is on a multi GPU board
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a multiGpuBool has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a multiGpuBool is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetMultiGpuBoard(nvmlDevice_t device, unsigned int *multiGpuBool);
|
|
+
|
|
+/**
|
|
+ * Retrieves the total ECC error counts for the device.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ * Only applicable to devices with ECC.
|
|
+ * Requires \a NVML_INFOROM_ECC version 1.0 or higher.
|
|
+ * Requires ECC Mode to be enabled.
|
|
+ *
|
|
+ * The total error count is the sum of errors across each of the separate memory systems, i.e. the total set of
|
|
+ * errors across the entire device.
|
|
+ *
|
|
+ * See \ref nvmlMemoryErrorType_t for a description of available error types.\n
|
|
+ * See \ref nvmlEccCounterType_t for a description of available counter types.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param errorType Flag that specifies the type of the errors.
|
|
+ * @param counterType Flag that specifies the counter-type of the errors.
|
|
+ * @param eccCounts Reference in which to return the specified ECC errors
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a eccCounts has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device, \a errorType or \a counterType is invalid, or \a eccCounts is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceClearEccErrorCounts()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetTotalEccErrors(nvmlDevice_t device, nvmlMemoryErrorType_t errorType, nvmlEccCounterType_t counterType, unsigned long long *eccCounts);
|
|
+
|
|
+/**
|
|
+ * Retrieves the detailed ECC error counts for the device.
|
|
+ *
|
|
+ * @deprecated This API supports only a fixed set of ECC error locations
|
|
+ * On different GPU architectures different locations are supported
|
|
+ * See \ref nvmlDeviceGetMemoryErrorCounter
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ * Only applicable to devices with ECC.
|
|
+ * Requires \a NVML_INFOROM_ECC version 2.0 or higher to report aggregate location-based ECC counts.
|
|
+ * Requires \a NVML_INFOROM_ECC version 1.0 or higher to report all other ECC counts.
|
|
+ * Requires ECC Mode to be enabled.
|
|
+ *
|
|
+ * Detailed errors provide separate ECC counts for specific parts of the memory system.
|
|
+ *
|
|
+ * Reports zero for unsupported ECC error counters when a subset of ECC error counters are supported.
|
|
+ *
|
|
+ * See \ref nvmlMemoryErrorType_t for a description of available bit types.\n
|
|
+ * See \ref nvmlEccCounterType_t for a description of available counter types.\n
|
|
+ * See \ref nvmlEccErrorCounts_t for a description of provided detailed ECC counts.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param errorType Flag that specifies the type of the errors.
|
|
+ * @param counterType Flag that specifies the counter-type of the errors.
|
|
+ * @param eccCounts Reference in which to return the specified ECC errors
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a eccCounts has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device, \a errorType or \a counterType is invalid, or \a eccCounts is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceClearEccErrorCounts()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetDetailedEccErrors(nvmlDevice_t device, nvmlMemoryErrorType_t errorType, nvmlEccCounterType_t counterType, nvmlEccErrorCounts_t *eccCounts);
|
|
+
|
|
+/**
|
|
+ * Retrieves the requested memory error counter for the device.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ * Requires \a NVML_INFOROM_ECC version 2.0 or higher to report aggregate location-based memory error counts.
|
|
+ * Requires \a NVML_INFOROM_ECC version 1.0 or higher to report all other memory error counts.
|
|
+ *
|
|
+ * Only applicable to devices with ECC.
|
|
+ *
|
|
+ * Requires ECC Mode to be enabled.
|
|
+ *
|
|
+ * See \ref nvmlMemoryErrorType_t for a description of available memory error types.\n
|
|
+ * See \ref nvmlEccCounterType_t for a description of available counter types.\n
|
|
+ * See \ref nvmlMemoryLocation_t for a description of available counter locations.\n
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param errorType Flag that specifies the type of error.
|
|
+ * @param counterType Flag that specifies the counter-type of the errors.
|
|
+ * @param locationType Specifies the location of the counter.
|
|
+ * @param count Reference in which to return the ECC counter
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a count has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device, \a bitTyp,e \a counterType or \a locationType is
|
|
+ * invalid, or \a count is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support ECC error reporting in the specified memory
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetMemoryErrorCounter(nvmlDevice_t device, nvmlMemoryErrorType_t errorType,
|
|
+ nvmlEccCounterType_t counterType,
|
|
+ nvmlMemoryLocation_t locationType, unsigned long long *count);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current utilization rates for the device's major subsystems.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * See \ref nvmlUtilization_t for details on available utilization rates.
|
|
+ *
|
|
+ * \note During driver initialization when ECC is enabled one can see high GPU and Memory Utilization readings.
|
|
+ * This is caused by ECC Memory Scrubbing mechanism that is performed during driver initialization.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param utilization Reference in which to return the utilization information
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a utilization has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a utilization is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetUtilizationRates(nvmlDevice_t device, nvmlUtilization_t *utilization);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current utilization and sampling size in microseconds for the Encoder
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param utilization Reference to an unsigned int for encoder utilization info
|
|
+ * @param samplingPeriodUs Reference to an unsigned int for the sampling period in US
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a utilization has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, \a utilization is NULL, or \a samplingPeriodUs is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetEncoderUtilization(nvmlDevice_t device, unsigned int *utilization, unsigned int *samplingPeriodUs);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current utilization and sampling size in microseconds for the Decoder
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param utilization Reference to an unsigned int for decoder utilization info
|
|
+ * @param samplingPeriodUs Reference to an unsigned int for the sampling period in US
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a utilization has been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, \a utilization is NULL, or \a samplingPeriodUs is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetDecoderUtilization(nvmlDevice_t device, unsigned int *utilization, unsigned int *samplingPeriodUs);
|
|
+
|
|
+/**
|
|
+ * Retrieves the current and pending driver model for the device.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ * For windows only.
|
|
+ *
|
|
+ * On Windows platforms the device driver can run in either WDDM or WDM (TCC) mode. If a display is attached
|
|
+ * to the device it must run in WDDM mode. TCC mode is preferred if a display is not attached.
|
|
+ *
|
|
+ * See \ref nvmlDriverModel_t for details on available driver models.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param current Reference in which to return the current driver model
|
|
+ * @param pending Reference in which to return the pending driver model
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if either \a current and/or \a pending have been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or both \a current and \a pending are NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the platform is not windows
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceSetDriverModel()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetDriverModel(nvmlDevice_t device, nvmlDriverModel_t *current, nvmlDriverModel_t *pending);
|
|
+
|
|
+/**
|
|
+ * Get VBIOS version of the device.
|
|
+ *
|
|
+ * For all products.
|
|
+ *
|
|
+ * The VBIOS version may change from time to time. It will not exceed 32 characters in length
|
|
+ * (including the NULL terminator). See \ref nvmlConstants::NVML_DEVICE_VBIOS_VERSION_BUFFER_SIZE.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param version Reference to which to return the VBIOS version
|
|
+ * @param length The maximum allowed length of the string returned in \a version
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a version has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, or \a version is NULL
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a length is too small
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetVbiosVersion(nvmlDevice_t device, char *version, unsigned int length);
|
|
+
|
|
+/**
|
|
+ * Get Bridge Chip Information for all the bridge chips on the board.
|
|
+ *
|
|
+ * For all fully supported products.
|
|
+ * Only applicable to multi-GPU products.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param bridgeHierarchy Reference to the returned bridge chip Hierarchy
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if bridge chip exists
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, or \a bridgeInfo is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if bridge chip not supported on the device
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetBridgeChipInfo(nvmlDevice_t device, nvmlBridgeChipHierarchy_t *bridgeHierarchy);
|
|
+
|
|
+/**
|
|
+ * Get information about processes with a compute context on a device
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * This function returns information only about compute running processes (e.g. CUDA application which have
|
|
+ * active context). Any graphics applications (e.g. using OpenGL, DirectX) won't be listed by this function.
|
|
+ *
|
|
+ * To query the current number of running compute processes, call this function with *infoCount = 0. The
|
|
+ * return code will be NVML_ERROR_INSUFFICIENT_SIZE, or NVML_SUCCESS if none are running. For this call
|
|
+ * \a infos is allowed to be NULL.
|
|
+ *
|
|
+ * The usedGpuMemory field returned is all of the memory used by the application.
|
|
+ *
|
|
+ * Keep in mind that information returned by this call is dynamic and the number of elements might change in
|
|
+ * time. Allocate more space for \a infos table in case new compute processes are spawned.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param infoCount Reference in which to provide the \a infos array size, and
|
|
+ * to return the number of returned elements
|
|
+ * @param infos Reference in which to return the process information
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a infoCount and \a infos have been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a infoCount indicates that the \a infos array is too small
|
|
+ * \a infoCount will contain minimal amount of space necessary for
|
|
+ * the call to complete
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, either of \a infoCount or \a infos is NULL
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see \ref nvmlSystemGetProcessName
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetComputeRunningProcesses(nvmlDevice_t device, unsigned int *infoCount, nvmlProcessInfo_t *infos);
|
|
+
|
|
+/**
|
|
+ * Get information about processes with a graphics context on a device
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * This function returns information only about graphics based processes
|
|
+ * (eg. applications using OpenGL, DirectX)
|
|
+ *
|
|
+ * To query the current number of running graphics processes, call this function with *infoCount = 0. The
|
|
+ * return code will be NVML_ERROR_INSUFFICIENT_SIZE, or NVML_SUCCESS if none are running. For this call
|
|
+ * \a infos is allowed to be NULL.
|
|
+ *
|
|
+ * The usedGpuMemory field returned is all of the memory used by the application.
|
|
+ *
|
|
+ * Keep in mind that information returned by this call is dynamic and the number of elements might change in
|
|
+ * time. Allocate more space for \a infos table in case new graphics processes are spawned.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param infoCount Reference in which to provide the \a infos array size, and
|
|
+ * to return the number of returned elements
|
|
+ * @param infos Reference in which to return the process information
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a infoCount and \a infos have been populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a infoCount indicates that the \a infos array is too small
|
|
+ * \a infoCount will contain minimal amount of space necessary for
|
|
+ * the call to complete
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, either of \a infoCount or \a infos is NULL
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see \ref nvmlSystemGetProcessName
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetGraphicsRunningProcesses(nvmlDevice_t device, unsigned int *infoCount, nvmlProcessInfo_t *infos);
|
|
+
|
|
+/**
|
|
+ * Check if the GPU devices are on the same physical board.
|
|
+ *
|
|
+ * For all fully supported products.
|
|
+ *
|
|
+ * @param device1 The first GPU device
|
|
+ * @param device2 The second GPU device
|
|
+ * @param onSameBoard Reference in which to return the status.
|
|
+ * Non-zero indicates that the GPUs are on the same board.
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a onSameBoard has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a dev1 or \a dev2 are invalid or \a onSameBoard is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if this check is not supported by the device
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the either GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceOnSameBoard(nvmlDevice_t device1, nvmlDevice_t device2, int *onSameBoard);
|
|
+
|
|
+/**
|
|
+ * Retrieves the root/admin permissions on the target API. See \a nvmlRestrictedAPI_t for the list of supported APIs.
|
|
+ * If an API is restricted only root users can call that API. See \a nvmlDeviceSetAPIRestriction to change current permissions.
|
|
+ *
|
|
+ * For all fully supported products.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param apiType Target API type for this operation
|
|
+ * @param isRestricted Reference in which to return the current restriction
|
|
+ * NVML_FEATURE_ENABLED indicates that the API is root-only
|
|
+ * NVML_FEATURE_DISABLED indicates that the API is accessible to all users
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a isRestricted has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, \a apiType incorrect or \a isRestricted is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if this query is not supported by the device or the device does not support
|
|
+ * the feature that is being queried (E.G. Enabling/disabling Auto Boosted clocks is
|
|
+ * not supported by the device)
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlRestrictedAPI_t
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetAPIRestriction(nvmlDevice_t device, nvmlRestrictedAPI_t apiType, nvmlEnableState_t *isRestricted);
|
|
+
|
|
+/**
|
|
+ * Gets recent samples for the GPU.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * Based on type, this method can be used to fetch the power, utilization or clock samples maintained in the buffer by
|
|
+ * the driver.
|
|
+ *
|
|
+ * Power, Utilization and Clock samples are returned as type "unsigned int" for the union nvmlValue_t.
|
|
+ *
|
|
+ * To get the size of samples that user needs to allocate, the method is invoked with samples set to NULL.
|
|
+ * The returned samplesCount will provide the number of samples that can be queried. The user needs to
|
|
+ * allocate the buffer with size as samplesCount * sizeof(nvmlSample_t).
|
|
+ *
|
|
+ * lastSeenTimeStamp represents CPU timestamp in microseconds. Set it to 0 to fetch all the samples maintained by the
|
|
+ * underlying buffer. Set lastSeenTimeStamp to one of the timeStamps retrieved from the date of the previous query
|
|
+ * to get more recent samples.
|
|
+ *
|
|
+ * This method fetches the number of entries which can be accommodated in the provided samples array, and the
|
|
+ * reference samplesCount is updated to indicate how many samples were actually retrieved. The advantage of using this
|
|
+ * method for samples in contrast to polling via existing methods is to get get higher frequency data at lower polling cost.
|
|
+ *
|
|
+ * @param device The identifier for the target device
|
|
+ * @param type Type of sampling event
|
|
+ * @param lastSeenTimeStamp Return only samples with timestamp greater than lastSeenTimeStamp.
|
|
+ * @param sampleValType Output parameter to represent the type of sample value as described in nvmlSampleVal_t
|
|
+ * @param sampleCount Reference to provide the number of elements which can be queried in samples array
|
|
+ * @param samples Reference in which samples are returned
|
|
+
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if samples are successfully retrieved
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, \a samplesCount is NULL or
|
|
+ * reference to \a sampleCount is 0 for non null \a samples
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if this query is not supported by the device
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_NOT_FOUND if sample entries are not found
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetSamples(nvmlDevice_t device, nvmlSamplingType_t type, unsigned long long lastSeenTimeStamp,
|
|
+ nvmlValueType_t *sampleValType, unsigned int *sampleCount, nvmlSample_t *samples);
|
|
+
|
|
+/**
|
|
+ * Gets Total, Available and Used size of BAR1 memory.
|
|
+ *
|
|
+ * BAR1 is used to map the FB (device memory) so that it can be directly accessed by the CPU or by 3rd party
|
|
+ * devices (peer-to-peer on the PCIE bus).
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param bar1Memory Reference in which BAR1 memory
|
|
+ * information is returned.
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if BAR1 memory is successfully retrieved
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, \a bar1Memory is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if this query is not supported by the device
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetBAR1MemoryInfo(nvmlDevice_t device, nvmlBAR1Memory_t *bar1Memory);
|
|
+
|
|
+
|
|
+/**
|
|
+ * Gets the duration of time during which the device was throttled (lower than requested clocks) due to power
|
|
+ * or thermal constraints.
|
|
+ *
|
|
+ * The method is important to users who are tying to understand if their GPUs throttle at any point during their applications. The
|
|
+ * difference in violation times at two different reference times gives the indication of GPU throttling event.
|
|
+ *
|
|
+ * Violation for thermal capping is not supported at this time.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param perfPolicyType Represents Performance policy which can trigger GPU throttling
|
|
+ * @param violTime Reference to which violation time related information is returned
|
|
+ *
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if violation time is successfully retrieved
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, \a perfPolicyType is invalid, or \a violTime is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if this query is not supported by the device
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ *
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetViolationStatus(nvmlDevice_t device, nvmlPerfPolicyType_t perfPolicyType, nvmlViolationTime_t *violTime);
|
|
+
|
|
+/**
|
|
+ * @}
|
|
+ */
|
|
+
|
|
+/** @addtogroup nvmlAccountingStats
|
|
+ * @{
|
|
+ */
|
|
+
|
|
+/**
|
|
+ * Queries the state of per process accounting mode.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * See \ref nvmlDeviceGetAccountingStats for more details.
|
|
+ * See \ref nvmlDeviceSetAccountingMode
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param mode Reference in which to return the current accounting mode
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the mode has been successfully retrieved
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a mode are NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetAccountingMode(nvmlDevice_t device, nvmlEnableState_t *mode);
|
|
+
|
|
+/**
|
|
+ * Queries process's accounting stats.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * Accounting stats capture GPU utilization and other statistics across the lifetime of a process.
|
|
+ * Accounting stats can be queried during life time of the process and after its termination.
|
|
+ * The time field in \ref nvmlAccountingStats_t is reported as 0 during the lifetime of the process and
|
|
+ * updated to actual running time after its termination.
|
|
+ * Accounting stats are kept in a circular buffer, newly created processes overwrite information about old
|
|
+ * processes.
|
|
+ *
|
|
+ * See \ref nvmlAccountingStats_t for description of each returned metric.
|
|
+ * List of processes that can be queried can be retrieved from \ref nvmlDeviceGetAccountingPids.
|
|
+ *
|
|
+ * @note Accounting Mode needs to be on. See \ref nvmlDeviceGetAccountingMode.
|
|
+ * @note Only compute and graphics applications stats can be queried. Monitoring applications stats can't be
|
|
+ * queried since they don't contribute to GPU utilization.
|
|
+ * @note In case of pid collision stats of only the latest process (that terminated last) will be reported
|
|
+ *
|
|
+ * @warning On Kepler devices per process statistics are accurate only if there's one process running on a GPU.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param pid Process Id of the target process to query stats for
|
|
+ * @param stats Reference in which to return the process's accounting stats
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if stats have been successfully retrieved
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a stats are NULL
|
|
+ * - \ref NVML_ERROR_NOT_FOUND if process stats were not found
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature or accounting mode is disabled
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetAccountingBufferSize
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetAccountingStats(nvmlDevice_t device, unsigned int pid, nvmlAccountingStats_t *stats);
|
|
+
|
|
+/**
|
|
+ * Queries list of processes that can be queried for accounting stats. The list of processes returned
|
|
+ * can be in running or terminated state.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * To just query the number of processes ready to be queried, call this function with *count = 0 and
|
|
+ * pids=NULL. The return code will be NVML_ERROR_INSUFFICIENT_SIZE, or NVML_SUCCESS if list is empty.
|
|
+ *
|
|
+ * For more details see \ref nvmlDeviceGetAccountingStats.
|
|
+ *
|
|
+ * @note In case of PID collision some processes might not be accessible before the circular buffer is full.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param count Reference in which to provide the \a pids array size, and
|
|
+ * to return the number of elements ready to be queried
|
|
+ * @param pids Reference in which to return list of process ids
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if pids were successfully retrieved
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a count is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature or accounting mode is disabled
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a count is too small (\a count is set to
|
|
+ * expected value)
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetAccountingBufferSize
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetAccountingPids(nvmlDevice_t device, unsigned int *count, unsigned int *pids);
|
|
+
|
|
+/**
|
|
+ * Returns the number of processes that the circular buffer with accounting pids can hold.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * This is the maximum number of processes that accounting information will be stored for before information
|
|
+ * about oldest processes will get overwritten by information about new processes.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param bufferSize Reference in which to provide the size (in number of elements)
|
|
+ * of the circular buffer for accounting stats.
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if buffer size was successfully retrieved
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a bufferSize is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature or accounting mode is disabled
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetAccountingStats
|
|
+ * @see nvmlDeviceGetAccountingPids
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetAccountingBufferSize(nvmlDevice_t device, unsigned int *bufferSize);
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/** @addtogroup nvmlDeviceQueries
|
|
+ * @{
|
|
+ */
|
|
+
|
|
+/**
|
|
+ * Returns the list of retired pages by source, including pages that are pending retirement
|
|
+ * The address information provided from this API is the hardware address of the page that was retired. Note
|
|
+ * that this does not match the virtual address used in CUDA, but will match the address information in XID 63
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param cause Filter page addresses by cause of retirement
|
|
+ * @param pageCount Reference in which to provide the \a addresses buffer size, and
|
|
+ * to return the number of retired pages that match \a cause
|
|
+ * Set to 0 to query the size without allocating an \a addresses buffer
|
|
+ * @param addresses Buffer to write the page addresses into
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a pageCount was populated and \a addresses was filled
|
|
+ * - \ref NVML_ERROR_INSUFFICIENT_SIZE if \a pageCount indicates the buffer is not large enough to store all the
|
|
+ * matching page addresses. \a pageCount is set to the needed size.
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid, \a pageCount is NULL, \a cause is invalid, or
|
|
+ * \a addresses is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetRetiredPages(nvmlDevice_t device, nvmlPageRetirementCause_t cause,
|
|
+ unsigned int *pageCount, unsigned long long *addresses);
|
|
+
|
|
+/**
|
|
+ * Check if any pages are pending retirement and need a reboot to fully retire.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param isPending Reference in which to return the pending status
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a isPending was populated
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a isPending is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetRetiredPagesPendingStatus(nvmlDevice_t device, nvmlEnableState_t *isPending);
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlUnitCommands Unit Commands
|
|
+ * This chapter describes NVML operations that change the state of the unit. For S-class products.
|
|
+ * Each of these requires root/admin access. Non-admin users will see an NVML_ERROR_NO_PERMISSION
|
|
+ * error code when invoking any of these methods.
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Set the LED state for the unit. The LED can be either green (0) or amber (1).
|
|
+ *
|
|
+ * For S-class products.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * This operation takes effect immediately.
|
|
+ *
|
|
+ *
|
|
+ * <b>Current S-Class products don't provide unique LEDs for each unit. As such, both front
|
|
+ * and back LEDs will be toggled in unison regardless of which unit is specified with this command.</b>
|
|
+ *
|
|
+ * See \ref nvmlLedColor_t for available colors.
|
|
+ *
|
|
+ * @param unit The identifier of the target unit
|
|
+ * @param color The target LED color
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the LED color has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a unit or \a color is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if this is not an S-class product
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlUnitGetLedState()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlUnitSetLedState(nvmlUnit_t unit, nvmlLedColor_t color);
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlDeviceCommands Device Commands
|
|
+ * This chapter describes NVML operations that change the state of the device.
|
|
+ * Each of these requires root/admin access. Non-admin users will see an NVML_ERROR_NO_PERMISSION
|
|
+ * error code when invoking any of these methods.
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Set the persistence mode for the device.
|
|
+ *
|
|
+ * For all products.
|
|
+ * For Linux only.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * The persistence mode determines whether the GPU driver software is torn down after the last client
|
|
+ * exits.
|
|
+ *
|
|
+ * This operation takes effect immediately. It is not persistent across reboots. After each reboot the
|
|
+ * persistence mode is reset to "Disabled".
|
|
+ *
|
|
+ * See \ref nvmlEnableState_t for available modes.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param mode The target persistence mode
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the persistence mode was set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a mode is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetPersistenceMode()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetPersistenceMode(nvmlDevice_t device, nvmlEnableState_t mode);
|
|
+
|
|
+/**
|
|
+ * Set the compute mode for the device.
|
|
+ *
|
|
+ * For all products.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * The compute mode determines whether a GPU can be used for compute operations and whether it can
|
|
+ * be shared across contexts.
|
|
+ *
|
|
+ * This operation takes effect immediately. Under Linux it is not persistent across reboots and
|
|
+ * always resets to "Default". Under windows it is persistent.
|
|
+ *
|
|
+ * Under windows compute mode may only be set to DEFAULT when running in WDDM
|
|
+ *
|
|
+ * See \ref nvmlComputeMode_t for details on available compute modes.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param mode The target compute mode
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the compute mode was set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a mode is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetComputeMode()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetComputeMode(nvmlDevice_t device, nvmlComputeMode_t mode);
|
|
+
|
|
+/**
|
|
+ * Set the ECC mode for the device.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ * Only applicable to devices with ECC.
|
|
+ * Requires \a NVML_INFOROM_ECC version 1.0 or higher.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * The ECC mode determines whether the GPU enables its ECC support.
|
|
+ *
|
|
+ * This operation takes effect after the next reboot.
|
|
+ *
|
|
+ * See \ref nvmlEnableState_t for details on available modes.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param ecc The target ECC mode
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the ECC mode was set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a ecc is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetEccMode()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetEccMode(nvmlDevice_t device, nvmlEnableState_t ecc);
|
|
+
|
|
+/**
|
|
+ * Clear the ECC error and other memory error counts for the device.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ * Only applicable to devices with ECC.
|
|
+ * Requires \a NVML_INFOROM_ECC version 2.0 or higher to clear aggregate location-based ECC counts.
|
|
+ * Requires \a NVML_INFOROM_ECC version 1.0 or higher to clear all other ECC counts.
|
|
+ * Requires root/admin permissions.
|
|
+ * Requires ECC Mode to be enabled.
|
|
+ *
|
|
+ * Sets all of the specified ECC counters to 0, including both detailed and total counts.
|
|
+ *
|
|
+ * This operation takes effect immediately.
|
|
+ *
|
|
+ * See \ref nvmlMemoryErrorType_t for details on available counter types.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param counterType Flag that indicates which type of errors should be cleared.
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the error counts were cleared
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a counterType is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see
|
|
+ * - nvmlDeviceGetDetailedEccErrors()
|
|
+ * - nvmlDeviceGetTotalEccErrors()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceClearEccErrorCounts(nvmlDevice_t device, nvmlEccCounterType_t counterType);
|
|
+
|
|
+/**
|
|
+ * Set the driver model for the device.
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ * For windows only.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * On Windows platforms the device driver can run in either WDDM or WDM (TCC) mode. If a display is attached
|
|
+ * to the device it must run in WDDM mode.
|
|
+ *
|
|
+ * It is possible to force the change to WDM (TCC) while the display is still attached with a force flag (nvmlFlagForce).
|
|
+ * This should only be done if the host is subsequently powered down and the display is detached from the device
|
|
+ * before the next reboot.
|
|
+ *
|
|
+ * This operation takes effect after the next reboot.
|
|
+ *
|
|
+ * Windows driver model may only be set to WDDM when running in DEFAULT compute mode.
|
|
+ *
|
|
+ * Change driver model to WDDM is not supported when GPU doesn't support graphics acceleration or
|
|
+ * will not support it after reboot. See \ref nvmlDeviceSetGpuOperationMode.
|
|
+ *
|
|
+ * See \ref nvmlDriverModel_t for details on available driver models.
|
|
+ * See \ref nvmlFlagDefault and \ref nvmlFlagForce
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param driverModel The target driver model
|
|
+ * @param flags Flags that change the default behavior
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the driver model has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a driverModel is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the platform is not windows or the device does not support this feature
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetDriverModel()
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetDriverModel(nvmlDevice_t device, nvmlDriverModel_t driverModel, unsigned int flags);
|
|
+
|
|
+/**
|
|
+ * Set clocks that applications will lock to.
|
|
+ *
|
|
+ * Sets the clocks that compute and graphics applications will be running at.
|
|
+ * e.g. CUDA driver requests these clocks during context creation which means this property
|
|
+ * defines clocks at which CUDA applications will be running unless some overspec event
|
|
+ * occurs (e.g. over power, over thermal or external HW brake).
|
|
+ *
|
|
+ * Can be used as a setting to request constant performance.
|
|
+ *
|
|
+ * On Pascal and newer hardware, this will automatically disable automatic boosting of clocks.
|
|
+ *
|
|
+ * On K80 and newer Kepler and Maxwell GPUs, users desiring fixed performance should also call
|
|
+ * \ref nvmlDeviceSetAutoBoostedClocksEnabled to prevent clocks from automatically boosting
|
|
+ * above the clock value being set.
|
|
+ *
|
|
+ * For Kepler &tm; or newer non-GeForce fully supported devices and Maxwell or newer GeForce devices.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * See \ref nvmlDeviceGetSupportedMemoryClocks and \ref nvmlDeviceGetSupportedGraphicsClocks
|
|
+ * for details on how to list available clocks combinations.
|
|
+ *
|
|
+ * After system reboot or driver reload applications clocks go back to their default value.
|
|
+ * See \ref nvmlDeviceResetApplicationsClocks.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param memClockMHz Requested memory clock in MHz
|
|
+ * @param graphicsClockMHz Requested graphics clock in MHz
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if new settings were successfully set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a memClockMHz and \a graphicsClockMHz
|
|
+ * is not a valid clock combination
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetApplicationsClocks(nvmlDevice_t device, unsigned int memClockMHz, unsigned int graphicsClockMHz);
|
|
+
|
|
+/**
|
|
+ * Set new power limit of this device.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * See \ref nvmlDeviceGetPowerManagementLimitConstraints to check the allowed ranges of values.
|
|
+ *
|
|
+ * \note Limit is not persistent across reboots or driver unloads.
|
|
+ * Enable persistent mode to prevent driver from unloading when no application is using the device.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param limit Power management limit in milliwatts to set
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a limit has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a defaultLimit is out of range
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support this feature
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceGetPowerManagementLimitConstraints
|
|
+ * @see nvmlDeviceGetPowerManagementDefaultLimit
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetPowerManagementLimit(nvmlDevice_t device, unsigned int limit);
|
|
+
|
|
+/**
|
|
+ * Sets new GOM. See \a nvmlGpuOperationMode_t for details.
|
|
+ *
|
|
+ * For GK110 M-class and X-class Tesla &tm; products from the Kepler family.
|
|
+ * Modes \ref NVML_GOM_LOW_DP and \ref NVML_GOM_ALL_ON are supported on fully supported GeForce products.
|
|
+ * Not supported on Quadro ® and Tesla &tm; C-class products.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * Changing GOMs requires a reboot.
|
|
+ * The reboot requirement might be removed in the future.
|
|
+ *
|
|
+ * Compute only GOMs don't support graphics acceleration. Under windows switching to these GOMs when
|
|
+ * pending driver model is WDDM is not supported. See \ref nvmlDeviceSetDriverModel.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param mode Target GOM
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a mode has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a mode incorrect
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support GOM or specific mode
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlGpuOperationMode_t
|
|
+ * @see nvmlDeviceGetGpuOperationMode
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetGpuOperationMode(nvmlDevice_t device, nvmlGpuOperationMode_t mode);
|
|
+
|
|
+/**
|
|
+ * Changes the root/admin restructions on certain APIs. See \a nvmlRestrictedAPI_t for the list of supported APIs.
|
|
+ * This method can be used by a root/admin user to give non-root/admin access to certain otherwise-restricted APIs.
|
|
+ * The new setting lasts for the lifetime of the NVIDIA driver; it is not persistent. See \a nvmlDeviceGetAPIRestriction
|
|
+ * to query the current restriction settings.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param apiType Target API type for this operation
|
|
+ * @param isRestricted The target restriction
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a isRestricted has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device is invalid or \a apiType incorrect
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device does not support changing API restrictions or the device does not support
|
|
+ * the feature that api restrictions are being set for (E.G. Enabling/disabling auto
|
|
+ * boosted clocks is not supported by the device)
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlRestrictedAPI_t
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetAPIRestriction(nvmlDevice_t device, nvmlRestrictedAPI_t apiType, nvmlEnableState_t isRestricted);
|
|
+
|
|
+/**
|
|
+ * @}
|
|
+ */
|
|
+
|
|
+/** @addtogroup nvmlAccountingStats
|
|
+ * @{
|
|
+ */
|
|
+
|
|
+/**
|
|
+ * Enables or disables per process accounting.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * @note This setting is not persistent and will default to disabled after driver unloads.
|
|
+ * Enable persistence mode to be sure the setting doesn't switch off to disabled.
|
|
+ *
|
|
+ * @note Enabling accounting mode has no negative impact on the GPU performance.
|
|
+ *
|
|
+ * @note Disabling accounting clears all accounting pids information.
|
|
+ *
|
|
+ * See \ref nvmlDeviceGetAccountingMode
|
|
+ * See \ref nvmlDeviceGetAccountingStats
|
|
+ * See \ref nvmlDeviceClearAccountingPids
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param mode The target accounting mode
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the new mode has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device or \a mode are invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetAccountingMode(nvmlDevice_t device, nvmlEnableState_t mode);
|
|
+
|
|
+/**
|
|
+ * Clears accounting information about all processes that have already terminated.
|
|
+ *
|
|
+ * For Kepler &tm; or newer fully supported devices.
|
|
+ * Requires root/admin permissions.
|
|
+ *
|
|
+ * See \ref nvmlDeviceGetAccountingMode
|
|
+ * See \ref nvmlDeviceGetAccountingStats
|
|
+ * See \ref nvmlDeviceSetAccountingMode
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if accounting information has been cleared
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device are invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the user doesn't have permission to perform this operation
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceClearAccountingPids(nvmlDevice_t device);
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup NvLink NvLink Methods
|
|
+ * This chapter describes methods that NVML can perform on NVLINK enabled devices.
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Retrieves the state of the device's NvLink for the link specified
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param link Specifies the NvLink link to be queried
|
|
+ * @param isActive \a nvmlEnableState_t where NVML_FEATURE_ENABLED indicates that
|
|
+ * the link is active and NVML_FEATURE_DISABLED indicates it
|
|
+ * is inactive
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a isActive has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device or \a link is invalid or \a isActive is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetNvLinkState(nvmlDevice_t device, unsigned int link, nvmlEnableState_t *isActive);
|
|
+
|
|
+/**
|
|
+ * Retrieves the version of the device's NvLink for the link specified
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param link Specifies the NvLink link to be queried
|
|
+ * @param version Requested NvLink version
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a version has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device or \a link is invalid or \a version is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetNvLinkVersion(nvmlDevice_t device, unsigned int link, unsigned int *version);
|
|
+
|
|
+/**
|
|
+ * Retrieves the requested capability from the device's NvLink for the link specified
|
|
+ * Please refer to the \a nvmlNvLinkCapability_t structure for the specific caps that can be queried
|
|
+ * The return value should be treated as a boolean.
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param link Specifies the NvLink link to be queried
|
|
+ * @param capability Specifies the \a nvmlNvLinkCapability_t to be queried
|
|
+ * @param capResult A boolean for the queried capability indicating that feature is available
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a capResult has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device, \a link, or \a capability is invalid or \a capResult is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetNvLinkCapability(nvmlDevice_t device, unsigned int link,
|
|
+ nvmlNvLinkCapability_t capability, unsigned int *capResult);
|
|
+
|
|
+/**
|
|
+ * Retrieves the PCI information for the remote node on a NvLink link
|
|
+ * Note: pciSubSystemId is not filled in this function and is indeterminate
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param link Specifies the NvLink link to be queried
|
|
+ * @param pci \a nvmlPciInfo_t of the remote node for the specified link
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a pci has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device or \a link is invalid or \a pci is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetNvLinkRemotePciInfo(nvmlDevice_t device, unsigned int link, nvmlPciInfo_t *pci);
|
|
+
|
|
+/**
|
|
+ * Retrieves the specified error counter value
|
|
+ * Please refer to \a nvmlNvLinkErrorCounter_t for error counters that are available
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param link Specifies the NvLink link to be queried
|
|
+ * @param counter Specifies the NvLink counter to be queried
|
|
+ * @param counterValue Returned counter value
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a counter has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device, \a link, or \a counter is invalid or \a counterValue is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetNvLinkErrorCounter(nvmlDevice_t device, unsigned int link,
|
|
+ nvmlNvLinkErrorCounter_t counter, unsigned long long *counterValue);
|
|
+
|
|
+/**
|
|
+ * Resets all error counters to zero
|
|
+ * Please refer to \a nvmlNvLinkErrorCounter_t for the list of error counters that are reset
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param link Specifies the NvLink link to be queried
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the reset is successful
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device or \a link is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceResetNvLinkErrorCounters(nvmlDevice_t device, unsigned int link);
|
|
+
|
|
+/**
|
|
+ * Set the NVLINK utilization counter control information for the specified counter, 0 or 1.
|
|
+ * Please refer to \a nvmlNvLinkUtilizationControl_t for the structure definition. Performs a reset
|
|
+ * of the counters if the reset parameter is non-zero.
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param counter Specifies the counter that should be set (0 or 1).
|
|
+ * @param link Specifies the NvLink link to be queried
|
|
+ * @param control A reference to the \a nvmlNvLinkUtilizationControl_t to set
|
|
+ * @param reset Resets the counters on set if non-zero
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the control has been set successfully
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device, \a counter, \a link, or \a control is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceSetNvLinkUtilizationControl(nvmlDevice_t device, unsigned int link, unsigned int counter,
|
|
+ nvmlNvLinkUtilizationControl_t *control, unsigned int reset);
|
|
+
|
|
+/**
|
|
+ * Get the NVLINK utilization counter control information for the specified counter, 0 or 1.
|
|
+ * Please refer to \a nvmlNvLinkUtilizationControl_t for the structure definition
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param counter Specifies the counter that should be set (0 or 1).
|
|
+ * @param link Specifies the NvLink link to be queried
|
|
+ * @param control A reference to the \a nvmlNvLinkUtilizationControl_t to place information
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the control has been set successfully
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device, \a counter, \a link, or \a control is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetNvLinkUtilizationControl(nvmlDevice_t device, unsigned int link, unsigned int counter,
|
|
+ nvmlNvLinkUtilizationControl_t *control);
|
|
+
|
|
+
|
|
+/**
|
|
+ * Retrieve the NVLINK utilization counter based on the current control for a specified counter.
|
|
+ * In general it is good practice to use \a nvmlDeviceSetNvLinkUtilizationControl
|
|
+ * before reading the utilization counters as they have no default state
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param link Specifies the NvLink link to be queried
|
|
+ * @param counter Specifies the counter that should be read (0 or 1).
|
|
+ * @param rxcounter Receive counter return value
|
|
+ * @param txcounter Transmit counter return value
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if \a rxcounter and \a txcounter have been successfully set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device, \a counter, or \a link is invalid or \a rxcounter or \a txcounter are NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetNvLinkUtilizationCounter(nvmlDevice_t device, unsigned int link, unsigned int counter,
|
|
+ unsigned long long *rxcounter, unsigned long long *txcounter);
|
|
+
|
|
+/**
|
|
+ * Freeze the NVLINK utilization counters
|
|
+ * Both the receive and transmit counters are operated on by this function
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param link Specifies the NvLink link to be queried
|
|
+ * @param counter Specifies the counter that should be frozen (0 or 1).
|
|
+ * @param freeze NVML_FEATURE_ENABLED = freeze the receive and transmit counters
|
|
+ * NVML_FEATURE_DISABLED = unfreeze the receive and transmit counters
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if counters were successfully frozen or unfrozen
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device, \a link, \a counter, or \a freeze is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceFreezeNvLinkUtilizationCounter (nvmlDevice_t device, unsigned int link,
|
|
+ unsigned int counter, nvmlEnableState_t freeze);
|
|
+
|
|
+/**
|
|
+ * Reset the NVLINK utilization counters
|
|
+ * Both the receive and transmit counters are operated on by this function
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param link Specifies the NvLink link to be reset
|
|
+ * @param counter Specifies the counter that should be reset (0 or 1)
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if counters were successfully reset
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a device, \a link, or \a counter is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceResetNvLinkUtilizationCounter (nvmlDevice_t device, unsigned int link, unsigned int counter);
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlEvents Event Handling Methods
|
|
+ * This chapter describes methods that NVML can perform against each device to register and wait for
|
|
+ * some event to occur.
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Create an empty set of events.
|
|
+ * Event set should be freed by \ref nvmlEventSetFree
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ * @param set Reference in which to return the event handle
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the event has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a set is NULL
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlEventSetFree
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlEventSetCreate(nvmlEventSet_t *set);
|
|
+
|
|
+/**
|
|
+ * Starts recording of events on a specified devices and add the events to specified \ref nvmlEventSet_t
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ * Ecc events are available only on ECC enabled devices (see \ref nvmlDeviceGetTotalEccErrors)
|
|
+ * Power capping events are available only on Power Management enabled devices (see \ref nvmlDeviceGetPowerManagementMode)
|
|
+ *
|
|
+ * For Linux only.
|
|
+ *
|
|
+ * \b IMPORTANT: Operations on \a set are not thread safe
|
|
+ *
|
|
+ * This call starts recording of events on specific device.
|
|
+ * All events that occurred before this call are not recorded.
|
|
+ * Checking if some event occurred can be done with \ref nvmlEventSetWait
|
|
+ *
|
|
+ * If function reports NVML_ERROR_UNKNOWN, event set is in undefined state and should be freed.
|
|
+ * If function reports NVML_ERROR_NOT_SUPPORTED, event set can still be used. None of the requested eventTypes
|
|
+ * are registered in that case.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param eventTypes Bitmask of \ref nvmlEventType to record
|
|
+ * @param set Set to which add new event types
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the event has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a eventTypes is invalid or \a set is NULL
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the platform does not support this feature or some of requested event types
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlEventType
|
|
+ * @see nvmlDeviceGetSupportedEventTypes
|
|
+ * @see nvmlEventSetWait
|
|
+ * @see nvmlEventSetFree
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceRegisterEvents(nvmlDevice_t device, unsigned long long eventTypes, nvmlEventSet_t set);
|
|
+
|
|
+/**
|
|
+ * Returns information about events supported on device
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * Events are not supported on Windows. So this function returns an empty mask in \a eventTypes on Windows.
|
|
+ *
|
|
+ * @param device The identifier of the target device
|
|
+ * @param eventTypes Reference in which to return bitmask of supported events
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the eventTypes has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a eventType is NULL
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if the target GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlEventType
|
|
+ * @see nvmlDeviceRegisterEvents
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceGetSupportedEventTypes(nvmlDevice_t device, unsigned long long *eventTypes);
|
|
+
|
|
+/**
|
|
+ * Waits on events and delivers events
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * If some events are ready to be delivered at the time of the call, function returns immediately.
|
|
+ * If there are no events ready to be delivered, function sleeps till event arrives
|
|
+ * but not longer than specified timeout. This function in certain conditions can return before
|
|
+ * specified timeout passes (e.g. when interrupt arrives)
|
|
+ *
|
|
+ * In case of xid error, the function returns the most recent xid error type seen by the system. If there are multiple
|
|
+ * xid errors generated before nvmlEventSetWait is invoked then the last seen xid error type is returned for all
|
|
+ * xid error events.
|
|
+ *
|
|
+ * @param set Reference to set of events to wait on
|
|
+ * @param data Reference in which to return event data
|
|
+ * @param timeoutms Maximum amount of wait time in milliseconds for registered event
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the data has been set
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a data is NULL
|
|
+ * - \ref NVML_ERROR_TIMEOUT if no event arrived in specified timeout or interrupt arrived
|
|
+ * - \ref NVML_ERROR_GPU_IS_LOST if a GPU has fallen off the bus or is otherwise inaccessible
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlEventType
|
|
+ * @see nvmlDeviceRegisterEvents
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlEventSetWait(nvmlEventSet_t set, nvmlEventData_t * data, unsigned int timeoutms);
|
|
+
|
|
+/**
|
|
+ * Releases events in the set
|
|
+ *
|
|
+ * For Fermi &tm; or newer fully supported devices.
|
|
+ *
|
|
+ * @param set Reference to events to be released
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if the event has been successfully released
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ *
|
|
+ * @see nvmlDeviceRegisterEvents
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlEventSetFree(nvmlEventSet_t set);
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/***************************************************************************************************/
|
|
+/** @defgroup nvmlZPI Drain states
|
|
+ * This chapter describes methods that NVML can perform against each device to control their drain state
|
|
+ * and recognition by NVML and NVIDIA kernel driver. These methods can be used with out-of-band tools to
|
|
+ * power on/off GPUs, enable robust reset scenarios, etc.
|
|
+ * @{
|
|
+ */
|
|
+/***************************************************************************************************/
|
|
+
|
|
+/**
|
|
+ * Modify the drain state of a GPU. This method forces a GPU to no longer accept new incoming requests.
|
|
+ * Any new NVML process will no longer see this GPU. Persistence mode for this GPU must be turned off before
|
|
+ * this call is made.
|
|
+ * Must be called as administrator.
|
|
+ * For Linux only.
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ * Some Kepler devices supported.
|
|
+ *
|
|
+ * @param pciInfo The PCI address of the GPU drain state to be modified
|
|
+ * @param newState The drain state that should be entered, see \ref nvmlEnableState_t
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if counters were successfully reset
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a nvmlIndex or \a newState is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the calling process has insufficient permissions to perform operation
|
|
+ * - \ref NVML_ERROR_IN_USE if the device has persistence mode turned on
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceModifyDrainState (nvmlPciInfo_t *pciInfo, nvmlEnableState_t newState);
|
|
+
|
|
+/**
|
|
+ * Query the drain state of a GPU. This method is used to check if a GPU is in a currently draining
|
|
+ * state.
|
|
+ * For Linux only.
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ * Some Kepler devices supported.
|
|
+ *
|
|
+ * @param pciInfo The PCI address of the GPU drain state to be queried
|
|
+ * @param currentState The current drain state for this GPU, see \ref nvmlEnableState_t
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if counters were successfully reset
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a nvmlIndex or \a currentState is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceQueryDrainState (nvmlPciInfo_t *pciInfo, nvmlEnableState_t *currentState);
|
|
+
|
|
+/**
|
|
+ * This method will remove the specified GPU from the view of both NVML and the NVIDIA kernel driver
|
|
+ * as long as no other processes are attached. If other processes are attached, this call will return
|
|
+ * NVML_ERROR_IN_USE and the GPU will be returned to its original "draining" state. Note: the
|
|
+ * only situation where a process can still be attached after nvmlDeviceModifyDrainState() is called
|
|
+ * to initiate the draining state is if that process was using, and is still using, a GPU before the
|
|
+ * call was made. Also note, persistence mode counts as an attachment to the GPU thus it must be disabled
|
|
+ * prior to this call.
|
|
+ *
|
|
+ * For long-running NVML processes please note that this will change the enumeration of current GPUs.
|
|
+ * For example, if there are four GPUs present and GPU1 is removed, the new enumeration will be 0-2.
|
|
+ * Also, device handles after the removed GPU will not be valid and must be re-established.
|
|
+ * Must be run as administrator.
|
|
+ * For Linux only.
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ * Some Kepler devices supported.
|
|
+ *
|
|
+ * @param pciInfo The PCI address of the GPU to be removed
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if counters were successfully reset
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a nvmlIndex is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the device doesn't support this feature
|
|
+ * - \ref NVML_ERROR_IN_USE if the device is still in use and cannot be removed
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceRemoveGpu (nvmlPciInfo_t *pciInfo);
|
|
+
|
|
+/**
|
|
+ * Request the OS and the NVIDIA kernel driver to rediscover a portion of the PCI subsystem looking for GPUs that
|
|
+ * were previously removed. The portion of the PCI tree can be narrowed by specifying a domain, bus, and device.
|
|
+ * If all are zeroes then the entire PCI tree will be searched. Please note that for long-running NVML processes
|
|
+ * the enumeration will change based on how many GPUs are discovered and where they are inserted in bus order.
|
|
+ *
|
|
+ * In addition, all newly discovered GPUs will be initialized and their ECC scrubbed which may take several seconds
|
|
+ * per GPU. Also, all device handles are no longer guaranteed to be valid post discovery.
|
|
+ *
|
|
+ * Must be run as administrator.
|
|
+ * For Linux only.
|
|
+ *
|
|
+ * For newer than Maxwell &tm; fully supported devices.
|
|
+ * Some Kepler devices supported.
|
|
+ *
|
|
+ * @param pciInfo The PCI tree to be searched. Only the domain, bus, and device
|
|
+ * fields are used in this call.
|
|
+ *
|
|
+ * @return
|
|
+ * - \ref NVML_SUCCESS if counters were successfully reset
|
|
+ * - \ref NVML_ERROR_UNINITIALIZED if the library has not been successfully initialized
|
|
+ * - \ref NVML_ERROR_INVALID_ARGUMENT if \a pciInfo is invalid
|
|
+ * - \ref NVML_ERROR_NOT_SUPPORTED if the operating system does not support this feature
|
|
+ * - \ref NVML_ERROR_OPERATING_SYSTEM if the operating system is denying this feature
|
|
+ * - \ref NVML_ERROR_NO_PERMISSION if the calling process has insufficient permissions to perform operation
|
|
+ * - \ref NVML_ERROR_UNKNOWN on any unexpected error
|
|
+ */
|
|
+nvmlReturn_t DECLDIR nvmlDeviceDiscoverGpus (nvmlPciInfo_t *pciInfo);
|
|
+
|
|
+/** @} */
|
|
+
|
|
+/**
|
|
+ * NVML API versioning support
|
|
+ */
|
|
+#if defined(__NVML_API_VERSION_INTERNAL)
|
|
+#undef nvmlDeviceGetPciInfo
|
|
+#undef nvmlDeviceGetCount
|
|
+#undef nvmlDeviceGetHandleByIndex
|
|
+#undef nvmlDeviceGetHandleByPciBusId
|
|
+#undef nvmlInit
|
|
+#endif
|
|
+
|
|
+#ifdef __cplusplus
|
|
+}
|
|
+#endif
|
|
+
|
|
+#endif
|
|
--
|
|
2.21.0
|
|
|