gpu: nvgpu: add interface to power on-off gpu

The power rail of dGPU is managed with help of a set of GPIOs. Using those GPIOs add an interface to power off and power on dGPU. Before dGPU is powered off, new work is blocked by setting NVGPU_DRIVER_IS_DYING and current jobs are allowed to finish by waiting for gpu to be idle. The tegra PCIe controller driver provided APIs tegra_pcie_attach_controller() and tegra_pcie_detach_controller() are used to manage PCIe link shutdown, PCIe refclk management and PCIe rescan. JIRA NVGPU-1100 Change-Id: Ifae5b81535f40dceca5292a987d3daf6984f3210 Signed-off-by: Nitin Kumbhar <nkumbhar@nvidia.com> Reviewed-on: https://git-master.nvidia.com/r/1749847 Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com> Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
2025-12-22 09:12:24 +03:00 · 2018-06-14 17:27:47 +05:30
parent 334f5869c9
commit 237af3ef86
7 changed files with 603 additions and 1 deletions
--- a/drivers/gpu/nvgpu/Makefile
+++ b/drivers/gpu/nvgpu/Makefile
@@ -153,6 +153,7 @@ endif

 nvgpu-$(CONFIG_GK20A_PCI) += \
 	os/linux/pci.o \
+	os/linux/pci_power.o \
 	os/linux/pci_usermode.o

 nvgpu-$(CONFIG_TEGRA_GK20A_NVHOST) += \
--- a/drivers/gpu/nvgpu/os/linux/module.c
+++ b/drivers/gpu/nvgpu/os/linux/module.c
@@ -1100,6 +1100,38 @@ static int gk20a_pm_deinit(struct device *dev)
 	return 0;
 }

+/*
+ * Stop new work from being submitted to the gpu.
+ *
+ * Sets NVGPU_DRIVER_IS_DYING while busy_lock is held for writing.
+ * Always returns 0.
+ */
+int nvgpu_start_gpu_idle(struct gk20a *g)
+{
+	struct nvgpu_os_linux *os_linux = nvgpu_os_linux_from_gk20a(g);
+
+	down_write(&os_linux->busy_lock);
+	/* With this flag set the gpu is no longer marked busy for new work. */
+	__nvgpu_set_enabled(g, NVGPU_DRIVER_IS_DYING, true);
+	up_write(&os_linux->busy_lock);
+
+	return 0;
+}
+
+/*
+ * Wait until the gpu is idle, then wait for deferred interrupts.
+ *
+ * Returns 0 on success, or the error from gk20a_wait_for_idle(); in the
+ * error case deferred interrupts are not waited for.
+ */
+int nvgpu_wait_for_gpu_idle(struct gk20a *g)
+{
+	int err = gk20a_wait_for_idle(g);
+
+	if (err) {
+		nvgpu_err(g, "failed in wait for idle");
+		return err;
+	}
+
+	nvgpu_wait_for_deferred_interrupts(g);
+	return 0;
+}
+
 /*
 * Start the process for unloading the driver. Set NVGPU_DRIVER_IS_DYING.
 */
--- a/drivers/gpu/nvgpu/os/linux/module.h
+++ b/drivers/gpu/nvgpu/os/linux/module.h
@@ -23,6 +23,8 @@ void gk20a_remove_support(struct gk20a *g);
 void gk20a_driver_start_unload(struct gk20a *g);
 int nvgpu_quiesce(struct gk20a *g);
 int nvgpu_remove(struct device *dev, struct class *class);
+int nvgpu_start_gpu_idle(struct gk20a *g);
+int nvgpu_wait_for_gpu_idle(struct gk20a *g);
 void nvgpu_free_irq(struct gk20a *g);
 struct device_node *nvgpu_get_node(struct gk20a *g);
 void __iomem *nvgpu_devm_ioremap_resource(struct platform_device *dev, int i,
--- a/drivers/gpu/nvgpu/os/linux/pci.c
+++ b/drivers/gpu/nvgpu/os/linux/pci.c
@@ -39,6 +39,7 @@
 #include "platform_gk20a.h"

 #include "pci.h"
+#include "pci_power.h"
 #include "pci_usermode.h"

 #include "driver_common.h"
@@ -806,6 +807,12 @@ static int nvgpu_pci_probe(struct pci_dev *pdev,
 		}
 	}

+	err = nvgpu_pci_add_pci_power(pdev);
+	if (err) {
+		nvgpu_err(g, "add pci power failed (%d).", err);
+		goto err_free_irq;
+	}
+
 	return 0;

 err_free_irq:
@@ -832,6 +839,9 @@ static void nvgpu_pci_remove(struct pci_dev *pdev)
 	if (gk20a_gpu_is_virtual(dev))
 		return;

+	err = nvgpu_pci_clear_pci_power(dev_name(dev));
+	WARN(err, "gpu failed to clear pci power");
+
 	err = nvgpu_nvlink_deinit(g);
 	WARN(err, "gpu failed to remove nvlink");

@@ -882,11 +892,27 @@ int __init nvgpu_pci_init(void)
 	if (ret)
 		return ret;

-	return pci_register_driver(&nvgpu_pci_driver);
+	ret = pci_register_driver(&nvgpu_pci_driver);
+	if (ret)
+		goto driver_fail;
+
+	ret = nvgpu_pci_power_init(&nvgpu_pci_driver);
+	if (ret)
+		goto power_init_fail;
+
+	return 0;
+
+power_init_fail:
+	pci_unregister_driver(&nvgpu_pci_driver);
+driver_fail:
+	class_unregister(&nvgpu_pci_class);
+	return ret;
 }

 void __exit nvgpu_pci_exit(void)
 {
+	nvgpu_pci_power_exit(&nvgpu_pci_driver);
 	pci_unregister_driver(&nvgpu_pci_driver);
 	class_unregister(&nvgpu_pci_class);
+	nvgpu_pci_power_cleanup();
 }
--- a/drivers/gpu/nvgpu/os/linux/pci_power.c
+++ b/drivers/gpu/nvgpu/os/linux/pci_power.c
@@ -0,0 +1,486 @@
+/*
+ * Copyright (c) 2018, NVIDIA CORPORATION. All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
+ * more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#include <linux/delay.h>
+#include <linux/list.h>
+#include <linux/pci.h>
+#include <linux/platform_device.h>
+#include <linux/of_gpio.h>
+#include <linux/gpio/consumer.h>
+
+#include <nvgpu/lock.h>
+
+#include "module.h"
+#include "platform_gk20a.h"
+#include "pci_power.h"
+
+#define PCI_DEV_NAME_MAX	64
+
+/* Power bookkeeping for one dGPU, kept on the nvgpu_pci_power_devs list. */
+struct nvgpu_pci_power {
+	/* Link in nvgpu_pci_power_devs. */
+	struct list_head list;
+	/* Held across the power on and power off sequences. */
+	struct nvgpu_mutex mutex;
+	/* Power gpios; requested on the first power on/off. */
+	struct nvgpu_pci_gpios gpios;
+	/* Device recorded by nvgpu_pci_add_pci_power(); NULL once cleared. */
+	struct pci_dev *pci_dev;
+	/* Copy of the PCI device name, used as the lookup key. */
+	char pci_dev_name[PCI_DEV_NAME_MAX];
+	/* Handle from tegra_pcie_detach_controller(), used to re-attach. */
+	void *pci_cookie;
+};
+
+/* All struct nvgpu_pci_power entries created by nvgpu_pci_add_pci_power(). */
+static LIST_HEAD(nvgpu_pci_power_devs);
+
+/*
+ * Look up the power entry whose stored PCI device name equals @dev_name.
+ *
+ * Returns the first matching entry, or NULL when none matches.
+ */
+static struct nvgpu_pci_power *nvgpu_pci_get_pci_power(const char *dev_name)
+{
+	struct nvgpu_pci_power *entry;
+
+	/* Nothing is unlinked during the walk, so the plain iterator is enough. */
+	list_for_each_entry(entry, &nvgpu_pci_power_devs, list) {
+		if (strcmp(dev_name, entry->pci_dev_name) == 0)
+			return entry;
+	}
+
+	return NULL;
+}
+
+/*
+ * Record @pdev in the power bookkeeping list.
+ *
+ * If an entry with the same device name already exists it is reused and
+ * only its pci_dev pointer is refreshed; otherwise a new entry is allocated,
+ * initialised and added to nvgpu_pci_power_devs.
+ *
+ * Returns 0 on success, -EINVAL for a NULL @pdev, -ENOMEM when the entry
+ * cannot be allocated.
+ */
+int nvgpu_pci_add_pci_power(struct pci_dev *pdev)
+{
+	struct nvgpu_pci_power *entry;
+	const char *name;
+
+	if (pdev == NULL)
+		return -EINVAL;
+
+	name = dev_name(&pdev->dev);
+
+	entry = nvgpu_pci_get_pci_power(name);
+	if (entry == NULL) {
+		entry = kzalloc(sizeof(*entry), GFP_KERNEL);
+		if (entry == NULL)
+			return -ENOMEM;
+
+		nvgpu_mutex_init(&entry->mutex);
+		strlcpy(entry->pci_dev_name, name, PCI_DEV_NAME_MAX);
+		list_add(&entry->list, &nvgpu_pci_power_devs);
+	}
+
+	entry->pci_dev = pdev;
+	return 0;
+}
+
+/* Defined further down; needed here to release an entry's gpios. */
+static void nvgpu_free_pci_gpios(struct nvgpu_pci_gpios *pgpios);
+
+/*
+ * Unlink @pp from nvgpu_pci_power_devs, release any gpios it holds and free
+ * the entry itself. @pp must not be used afterwards. Always returns 0.
+ */
+static int nvgpu_pci_remove_pci_power(struct nvgpu_pci_power *pp)
+{
+	struct nvgpu_pci_gpios *held = &pp->gpios;
+
+	list_del(&pp->list);
+	nvgpu_free_pci_gpios(held);
+	kfree(pp);
+
+	return 0;
+}
+
+/*
+ * sysfs show handler for the driver attribute "probed_gpus".
+ *
+ * Emits one line per tracked GPU: "pci-<name>\tPoweredOn" while a pci_dev is
+ * recorded for the entry, "pci-<name>\tPoweredOff" otherwise.
+ *
+ * Every line is appended at buf + count. Formatting each entry at the start
+ * of buf would leave only the last entry in the buffer while the returned
+ * length still covered all of them. scnprintf() returns the number of bytes
+ * actually stored, so count never runs past the PAGE_SIZE buffer.
+ *
+ * Returns the number of bytes written to @buf.
+ */
+static ssize_t probed_gpus_show(struct device_driver *drv, char *buf)
+{
+	struct nvgpu_pci_power *pp;
+	ssize_t count = 0;
+
+	list_for_each_entry(pp, &nvgpu_pci_power_devs, list) {
+		count += scnprintf(buf + count, PAGE_SIZE - count,
+				   "pci-%s\t%s\n",
+				   pp->pci_dev_name,
+				   pp->pci_dev ? "PoweredOn" : "PoweredOff");
+	}
+	return count;
+}
+
+static DRIVER_ATTR_RO(probed_gpus);
+
+/*
+ * Forget the pci_dev recorded for the entry named @dev_name. The entry
+ * itself stays on the list.
+ *
+ * Returns 0 on success, -ENODEV when no entry has that name.
+ */
+int nvgpu_pci_clear_pci_power(const char *dev_name)
+{
+	struct nvgpu_pci_power *entry = nvgpu_pci_get_pci_power(dev_name);
+
+	if (entry == NULL)
+		return -ENODEV;
+
+	entry->pci_dev = NULL;
+	return 0;
+}
+
+/*
+ * Map a PCI_GPIO_* index to a printable name for the debug dump.
+ * Any value outside the known indices yields "INVALID_PCI_GPIO".
+ */
+static char *nvgpu_pci_gpio_name(int g)
+{
+	static char * const names[PCI_GPIO_MAX] = {
+		[PCI_GPIO_VBAT_PWR_ON]	= "PCI_GPIO_VBAT_PWR_ON",
+		[PCI_GPIO_PRSNT2]	= "PCI_GPIO_PRSNT2*",
+		[PCI_GPIO_PRSNT1]	= "PCI_GPIO_PRSNT1*",
+		[PCI_GPIO_PWR_ON]	= "PCI_GPIO_PWR_ON",
+		[PCI_GPIO_PG]		= "PCI_GPIO_PG",
+	};
+
+	if (g < 0 || g >= PCI_GPIO_MAX)
+		return "INVALID_PCI_GPIO";
+
+	return names[g];
+}
+
+/*
+ * Log, at debug level, the state of every power gpio in @pgpios.
+ *
+ * @f is printed as the name of the calling function. For each index the
+ * dump shows either "gpio not requested" (stored number is 0), "invalid
+ * gpio desc" (no descriptor for the number), or the gpio number with its
+ * direction and current value.
+ */
+static void nvgpu_dump_pci_gpios(struct nvgpu_pci_gpios *pgpios, const char *f)
+{
+	int idx;
+
+	pr_debug("nvgpu gpio status in %s:\n", f);
+
+	for (idx = 0; idx < PCI_GPIO_MAX; idx++) {
+		int gpio = pgpios->gpios[idx];
+		struct gpio_desc *desc;
+		const char *level_str;
+		int dir, level;
+
+		if (gpio == 0) {
+			pr_debug("%d. %-25s: gpio not requested\n",
+				 idx, nvgpu_pci_gpio_name(idx));
+			continue;
+		}
+
+		desc = gpio_to_desc(gpio);
+		if (!desc) {
+			pr_debug("%d. %-25s invalid gpio desc\n",
+				 idx, nvgpu_pci_gpio_name(idx));
+			continue;
+		}
+
+		dir = gpiod_get_direction(desc);
+		level = gpiod_get_value_cansleep(desc);
+
+		/* A negative value means the read failed. */
+		if (level < 0)
+			level_str = "?  ";
+		else if (level != 0)
+			level_str = "hi";
+		else
+			level_str = "lo";
+
+		pr_debug("%d. %-25s gpio-%-3d dir=%s val=%s\n",
+			 idx, nvgpu_pci_gpio_name(idx), gpio,
+			 dir ? "in " : "out", level_str);
+	}
+}
+
+/*
+ * Release every gpio currently recorded in @pgpios and reset its slot to 0,
+ * the value this file uses for "not requested".
+ */
+static void nvgpu_free_pci_gpios(struct nvgpu_pci_gpios *pgpios)
+{
+	int idx;
+
+	for (idx = 0; idx < PCI_GPIO_MAX; idx++) {
+		int gpio = pgpios->gpios[idx];
+
+		if (gpio == 0)
+			continue;
+
+		gpio_free(gpio);
+		pgpios->gpios[idx] = 0;
+	}
+}
+
+/*
+ * Request the power gpios listed in the "nvgpu-pci-gpios" property of the
+ * device-tree node named "nvgpu" and store their numbers in @pgpios.
+ *
+ * A non-zero first slot is taken to mean the gpios were already requested,
+ * in which case nothing is done. On any failure every gpio requested so far
+ * is released again.
+ *
+ * Returns 0 on success, -ENOENT when the node is missing, otherwise the
+ * error from of_get_named_gpio() or gpio_request().
+ */
+static int nvgpu_request_pci_gpios(struct nvgpu_pci_gpios *pgpios)
+{
+	struct device_node *node;
+	int idx, gpio;
+	int ret = 0;
+
+	if (pgpios->gpios[0])
+		return 0;
+
+	node = of_find_node_by_name(NULL, "nvgpu");
+	if (!node) {
+		ret = -ENOENT;
+		goto done;
+	}
+
+	for (idx = 0; idx < PCI_GPIO_MAX; idx++) {
+		gpio = of_get_named_gpio(node, "nvgpu-pci-gpios", idx);
+		if (gpio < 0) {
+			ret = gpio;
+			goto done;
+		}
+
+		ret = gpio_request(gpio, "pci-gpio");
+		if (ret)
+			goto done;
+
+		pgpios->gpios[idx] = gpio;
+	}
+
+	nvgpu_dump_pci_gpios(pgpios, __func__);
+
+done:
+	of_node_put(node);
+	if (ret)
+		nvgpu_free_pci_gpios(pgpios);
+	return ret;
+}
+
+/*
+ * Drive the PCI_GPIO_VBAT_PWR_ON gpio low, then wait
+ * PCI_VBAR_PWR_ON_DELAY_MS milliseconds.
+ *
+ * The wait sleeps instead of busy-looping: the power off path calls this
+ * with pp->mutex held, next to other calls that may sleep, so there is no
+ * reason to spin the CPU for the whole delay. Always returns 0.
+ */
+static int nvgpu_disable_pci_rail(struct nvgpu_pci_gpios *pgpios)
+{
+	int pci_vbat_pwr_on_gpio = pgpios->gpios[PCI_GPIO_VBAT_PWR_ON];
+
+	gpio_set_value(pci_vbat_pwr_on_gpio, 0);
+
+	/* msleep() waits at least the requested time. */
+	msleep(PCI_VBAR_PWR_ON_DELAY_MS);
+	return 0;
+}
+
+/*
+ * Read the PCI_GPIO_PG gpio.
+ *
+ * Returns 0 when it reads exactly 1, -EINVAL for any other value.
+ */
+static int nvgpu_check_pci_power_good(struct nvgpu_pci_gpios *pgpios)
+{
+	int level = gpio_get_value(pgpios->gpios[PCI_GPIO_PG]);
+
+	if (level == 1)
+		return 0;
+
+	return -EINVAL;
+}
+
+/*
+ * Drive the PCI_GPIO_VBAT_PWR_ON gpio high, then wait
+ * PCI_VBAR_PWR_ON_DELAY_MS milliseconds.
+ *
+ * The wait sleeps instead of busy-looping: the power on path calls this
+ * with pp->mutex held, next to other calls that may sleep, so there is no
+ * reason to spin the CPU for the whole delay. Always returns 0.
+ */
+static int nvgpu_enable_pci_rail(struct nvgpu_pci_gpios *pgpios)
+{
+	int pci_vbat_pwr_on_gpio = pgpios->gpios[PCI_GPIO_VBAT_PWR_ON];
+
+	gpio_set_value(pci_vbat_pwr_on_gpio, 1);
+
+	/* msleep() waits at least the requested time. */
+	msleep(PCI_VBAR_PWR_ON_DELAY_MS);
+	return 0;
+}
+
+/*
+ * Drive the PCI_GPIO_PWR_ON gpio low, then wait PCI_PWR_ON_DELAY_MS
+ * milliseconds.
+ *
+ * The wait sleeps instead of busy-looping: the power off path calls this
+ * with pp->mutex held, next to other calls that may sleep, and a busy-wait
+ * of this length would occupy a CPU for no benefit. Always returns 0.
+ */
+static int nvgpu_deassert_pci_pwr_on(struct nvgpu_pci_gpios *pgpios)
+{
+	int pci_pwr_on = pgpios->gpios[PCI_GPIO_PWR_ON];
+
+	gpio_set_value(pci_pwr_on, 0);
+
+	/* msleep() waits at least the requested time. */
+	msleep(PCI_PWR_ON_DELAY_MS);
+	return 0;
+}
+
+/*
+ * Drive the PCI_GPIO_PWR_ON gpio high, then wait PCI_PWR_ON_DELAY_MS
+ * milliseconds.
+ *
+ * The wait sleeps instead of busy-looping: the power on path calls this
+ * with pp->mutex held, next to other calls that may sleep, and a busy-wait
+ * of this length would occupy a CPU for no benefit. Always returns 0.
+ */
+static int nvgpu_assert_pci_pwr_on(struct nvgpu_pci_gpios *pgpios)
+{
+	int pci_pwr_on = pgpios->gpios[PCI_GPIO_PWR_ON];
+
+	gpio_set_value(pci_pwr_on, 1);
+
+	/* msleep() waits at least the requested time. */
+	msleep(PCI_PWR_ON_DELAY_MS);
+	return 0;
+}
+
+/*
+ * Fallback definitions used when any of the three conditions below holds.
+ * They only log an error and report failure.
+ */
+#if !IS_ENABLED(CONFIG_PCIE_TEGRA_DW) ||		\
+	!IS_ENABLED(CONFIG_ARCH_TEGRA_19x_SOC) ||	\
+	LINUX_VERSION_CODE < KERNEL_VERSION(4, 9, 0)
+/* Fallback: nothing is detached and no cookie is produced (NULL). */
+void *tegra_pcie_detach_controller(struct pci_dev *pdev)
+{
+	pr_err("nvgpu: detach pci controller not available\n");
+	return NULL;
+}
+
+/* Fallback: attaching is never possible, so this always fails. */
+int tegra_pcie_attach_controller(void *cookie)
+{
+	pr_err("nvgpu: attach pci controller not available\n");
+	return -EINVAL;
+}
+#endif
+
+/*
+ * Detach the PCIe controller for the device recorded in @pp and remember
+ * the returned cookie in pp->pci_cookie for a later attach.
+ *
+ * Returns 0 on success, or the error encoded in the returned pointer.
+ */
+static int nvgpu_detach_pci_gpu(struct nvgpu_pci_power *pp)
+{
+	void *cookie = tegra_pcie_detach_controller(pp->pci_dev);
+
+	if (IS_ERR(cookie)) {
+		int err = PTR_ERR(cookie);
+
+		pr_err("nvgpu: detaching PCIe controller failed (%d)\n", err);
+		return err;
+	}
+
+	pp->pci_cookie = cookie;
+	return 0;
+}
+
+/*
+ * Re-attach the PCIe controller using the cookie saved by a previous detach.
+ *
+ * Returns 0 on success, -EINVAL when no cookie is stored, otherwise the
+ * error from tegra_pcie_attach_controller().
+ */
+static int nvgpu_attach_pci_gpu(struct nvgpu_pci_power *pp)
+{
+	int err;
+
+	if (!pp->pci_cookie) {
+		pr_err("nvgpu: Invalid pci cookie\n");
+		return -EINVAL;
+	}
+
+	err = tegra_pcie_attach_controller(pp->pci_cookie);
+	if (err)
+		pr_err("nvgpu: attaching PCIe controller failed (%d)\n", err);
+
+	return err;
+}
+
+/*
+ * Power on the dGPU identified by @dev_name.
+ *
+ * With pp->mutex held: make sure the power gpios are requested, enable the
+ * rail, assert PWR_ON, check the power-good gpio and finally re-attach the
+ * PCIe controller. The first failing step aborts the sequence.
+ *
+ * Returns 0 on success, -ENODEV when no entry matches @dev_name, otherwise
+ * the error of the step that failed.
+ */
+static int nvgpu_pci_gpu_power_on(char *dev_name)
+{
+	struct nvgpu_pci_power *pp = nvgpu_pci_get_pci_power(dev_name);
+	struct nvgpu_pci_gpios *pgpios;
+	int ret;
+
+	if (!pp) {
+		pr_err("nvgpu: no pci dev by name: %s\n", dev_name);
+		return -ENODEV;
+	}
+
+	nvgpu_mutex_acquire(&pp->mutex);
+
+	pgpios = &pp->gpios;
+
+	ret = nvgpu_request_pci_gpios(pgpios);
+	if (ret) {
+		pr_err("nvgpu: request pci gpios failed\n");
+		goto unlock;
+	}
+
+	ret = nvgpu_enable_pci_rail(pgpios);
+	if (ret) {
+		pr_err("nvgpu: enable pci rail failed\n");
+		goto unlock;
+	}
+
+	ret = nvgpu_assert_pci_pwr_on(pgpios);
+	if (ret) {
+		pr_err("nvgpu: assert pci pwr on failed\n");
+		goto unlock;
+	}
+
+	ret = nvgpu_check_pci_power_good(pgpios);
+	if (ret) {
+		pr_err("nvgpu: pci power is no good\n");
+		goto unlock;
+	}
+
+	ret = nvgpu_attach_pci_gpu(pp);
+	if (ret) {
+		pr_err("nvgpu: attach pci gpu failed\n");
+		goto unlock;
+	}
+
+	/* Only reached on success; ret is 0 here. */
+	nvgpu_dump_pci_gpios(pgpios, __func__);
+
+unlock:
+	nvgpu_mutex_release(&pp->mutex);
+	return ret;
+}
+
+/*
+ * Power off the dGPU identified by @dev_name.
+ *
+ * With pp->mutex held:
+ *   1. block new work and wait for the gpu to become idle,
+ *   2. make sure the power gpios are requested,
+ *   3. detach the PCIe controller (the cookie is kept for power on),
+ *   4. deassert PWR_ON, then disable the rail.
+ * The first failing step aborts the sequence.
+ *
+ * Returns 0 on success; -ENODEV when no entry matches @dev_name or when the
+ * entry currently has no pci_dev recorded; otherwise the error of the step
+ * that failed.
+ */
+static int nvgpu_pci_gpu_power_off(char *dev_name)
+{
+	struct nvgpu_pci_power *pp;
+	struct nvgpu_pci_gpios *pgpios;
+	struct gk20a *g;
+	int ret;
+
+	pp = nvgpu_pci_get_pci_power(dev_name);
+	if (!pp) {
+		pr_err("nvgpu: no pci dev by name: %s\n", dev_name);
+		return -ENODEV;
+	}
+
+	nvgpu_mutex_acquire(&pp->mutex);
+
+	/*
+	 * nvgpu_pci_clear_pci_power() resets pci_dev to NULL while the entry
+	 * stays on the list, so the pointer must be checked before it is
+	 * dereferenced.
+	 */
+	if (!pp->pci_dev) {
+		pr_err("nvgpu: pci dev %s has no device attached\n", dev_name);
+		ret = -ENODEV;
+		goto out;
+	}
+
+	g = get_gk20a(&pp->pci_dev->dev);
+	pgpios = &pp->gpios;
+
+	ret = nvgpu_start_gpu_idle(g);
+	if (ret) {
+		pr_err("nvgpu: start gpu idle failed\n");
+		goto out;
+	}
+
+	ret = nvgpu_wait_for_gpu_idle(g);
+	if (ret) {
+		pr_err("nvgpu: wait for gpu idle failed\n");
+		goto out;
+	}
+
+	ret = nvgpu_request_pci_gpios(pgpios);
+	if (ret) {
+		pr_err("nvgpu: request pci gpios failed\n");
+		goto out;
+	}
+
+	ret = nvgpu_detach_pci_gpu(pp);
+	if (ret) {
+		pr_err("nvgpu: detach pci gpu failed\n");
+		goto out;
+	}
+
+	ret = nvgpu_deassert_pci_pwr_on(pgpios);
+	if (ret) {
+		pr_err("nvgpu: deassert pci pwr on failed\n");
+		goto out;
+	}
+
+	ret = nvgpu_disable_pci_rail(pgpios);
+	if (ret) {
+		pr_err("nvgpu: disable pci rail failed\n");
+		goto out;
+	}
+
+	/* Only reached on success; ret is 0 here. */
+	nvgpu_dump_pci_gpios(pgpios, __func__);
+
+out:
+	nvgpu_mutex_release(&pp->mutex);
+	return ret;
+}
+
+/*
+ * Switch the dGPU named @dev_name to the requested power state.
+ *
+ * @powerstate is NVGPU_POWER_ON or NVGPU_POWER_OFF; any other value is
+ * rejected with -EINVAL. Otherwise returns the result of the power on or
+ * power off sequence.
+ */
+int nvgpu_pci_set_powerstate(char *dev_name, int powerstate)
+{
+	if (powerstate == NVGPU_POWER_ON)
+		return nvgpu_pci_gpu_power_on(dev_name);
+
+	if (powerstate == NVGPU_POWER_OFF)
+		return nvgpu_pci_gpu_power_off(dev_name);
+
+	return -EINVAL;
+}
+
+
+/*
+ * Create the "probed_gpus" attribute file on the given PCI driver.
+ *
+ * Returns 0 on success or the error from driver_create_file().
+ */
+int __init nvgpu_pci_power_init(struct pci_driver *nvgpu_pci_driver)
+{
+	return driver_create_file(&nvgpu_pci_driver->driver,
+				  &driver_attr_probed_gpus);
+}
+
+/* Remove the "probed_gpus" attribute file from the given PCI driver. */
+void __exit nvgpu_pci_power_exit(struct pci_driver *nvgpu_pci_driver)
+{
+	driver_remove_file(&nvgpu_pci_driver->driver,
+			   &driver_attr_probed_gpus);
+}
+
+/* Unlink and free every entry on nvgpu_pci_power_devs. */
+void __exit nvgpu_pci_power_cleanup(void)
+{
+	struct nvgpu_pci_power *entry, *next;
+
+	/* Entries are freed inside the loop, hence the _safe iterator. */
+	list_for_each_entry_safe(entry, next, &nvgpu_pci_power_devs, list) {
+		nvgpu_pci_remove_pci_power(entry);
+	}
+}
--- a/drivers/gpu/nvgpu/os/linux/pci_power.h
+++ b/drivers/gpu/nvgpu/os/linux/pci_power.h
@@ -0,0 +1,38 @@
+/*
+ * Copyright (c) 2018, NVIDIA CORPORATION. All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
+ * more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#ifndef NVGPU_PCI_POWER_H
+#define NVGPU_PCI_POWER_H
+
+#include <linux/version.h>
+#include <linux/pci.h>
+
+#define NVGPU_POWER_OFF		0
+#define NVGPU_POWER_ON		1
+
+int nvgpu_pci_set_powerstate(char *dev_name, int powerstate);
+
+int nvgpu_pci_add_pci_power(struct pci_dev *pdev);
+int nvgpu_pci_clear_pci_power(const char *dev_name);
+
+void *tegra_pcie_detach_controller(struct pci_dev *pdev);
+int tegra_pcie_attach_controller(void *cookie);
+
+int __init nvgpu_pci_power_init(struct pci_driver *nvgpu_pci_driver);
+void __exit nvgpu_pci_power_exit(struct pci_driver *nvgpu_pci_driver);
+void __exit nvgpu_pci_power_cleanup(void);
+
+#endif
--- a/drivers/gpu/nvgpu/os/linux/platform_gk20a.h
+++ b/drivers/gpu/nvgpu/os/linux/platform_gk20a.h
@@ -35,6 +35,23 @@ struct secure_page_buffer {
 	size_t used;
 };

+/*
+ * Indices into struct nvgpu_pci_gpios. PCI_GPIO_MAX is the number of
+ * gpios, not a gpio itself.
+ */
+enum {
+	PCI_GPIO_VBAT_PWR_ON = 0,
+	PCI_GPIO_PRSNT2,
+	PCI_GPIO_PRSNT1,
+	PCI_GPIO_PWR_ON,
+	PCI_GPIO_PG,
+	PCI_GPIO_MAX,
+};
+
+/* Gpio numbers used for dGPU power control, one slot per PCI_GPIO_* index. */
+struct nvgpu_pci_gpios {
+	int gpios[PCI_GPIO_MAX];
+};
+
+/* delays in milliseconds (ms) */
+#define PCI_VBAR_PWR_ON_DELAY_MS	15
+#define PCI_PWR_ON_DELAY_MS		150
+
 struct gk20a_platform {
 	/* Populated by the gk20a driver before probing the platform. */
 	struct gk20a *g;