15ca02815Sjsg /*
25ca02815Sjsg * Copyright 2021 Advanced Micro Devices, Inc.
35ca02815Sjsg *
45ca02815Sjsg * Permission is hereby granted, free of charge, to any person obtaining a
55ca02815Sjsg * copy of this software and associated documentation files (the "Software"),
65ca02815Sjsg * to deal in the Software without restriction, including without limitation
75ca02815Sjsg * the rights to use, copy, modify, merge, publish, distribute, sublicense,
85ca02815Sjsg * and/or sell copies of the Software, and to permit persons to whom the
95ca02815Sjsg * Software is furnished to do so, subject to the following conditions:
105ca02815Sjsg *
115ca02815Sjsg * The above copyright notice and this permission notice shall be included in
125ca02815Sjsg * all copies or substantial portions of the Software.
135ca02815Sjsg *
145ca02815Sjsg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
155ca02815Sjsg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
165ca02815Sjsg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
175ca02815Sjsg * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
185ca02815Sjsg * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
195ca02815Sjsg * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
205ca02815Sjsg * OTHER DEALINGS IN THE SOFTWARE.
215ca02815Sjsg *
225ca02815Sjsg */
235ca02815Sjsg
245ca02815Sjsg #include "amdgpu_reset.h"
255ca02815Sjsg #include "aldebaran.h"
261bb76ff1Sjsg #include "sienna_cichlid.h"
27*f005ef32Sjsg #include "smu_v13_0_10.h"
285ca02815Sjsg
amdgpu_reset_add_handler(struct amdgpu_reset_control * reset_ctl,struct amdgpu_reset_handler * handler)295ca02815Sjsg int amdgpu_reset_add_handler(struct amdgpu_reset_control *reset_ctl,
305ca02815Sjsg struct amdgpu_reset_handler *handler)
315ca02815Sjsg {
325ca02815Sjsg /* TODO: Check if handler exists? */
335ca02815Sjsg list_add_tail(&handler->handler_list, &reset_ctl->reset_handlers);
345ca02815Sjsg return 0;
355ca02815Sjsg }
365ca02815Sjsg
amdgpu_reset_init(struct amdgpu_device * adev)375ca02815Sjsg int amdgpu_reset_init(struct amdgpu_device *adev)
385ca02815Sjsg {
395ca02815Sjsg int ret = 0;
405ca02815Sjsg
411bb76ff1Sjsg switch (adev->ip_versions[MP1_HWIP][0]) {
421bb76ff1Sjsg case IP_VERSION(13, 0, 2):
43*f005ef32Sjsg case IP_VERSION(13, 0, 6):
445ca02815Sjsg ret = aldebaran_reset_init(adev);
455ca02815Sjsg break;
461bb76ff1Sjsg case IP_VERSION(11, 0, 7):
471bb76ff1Sjsg ret = sienna_cichlid_reset_init(adev);
481bb76ff1Sjsg break;
49*f005ef32Sjsg case IP_VERSION(13, 0, 10):
50*f005ef32Sjsg ret = smu_v13_0_10_reset_init(adev);
51*f005ef32Sjsg break;
525ca02815Sjsg default:
535ca02815Sjsg break;
545ca02815Sjsg }
555ca02815Sjsg
565ca02815Sjsg return ret;
575ca02815Sjsg }
585ca02815Sjsg
amdgpu_reset_fini(struct amdgpu_device * adev)595ca02815Sjsg int amdgpu_reset_fini(struct amdgpu_device *adev)
605ca02815Sjsg {
615ca02815Sjsg int ret = 0;
625ca02815Sjsg
631bb76ff1Sjsg switch (adev->ip_versions[MP1_HWIP][0]) {
641bb76ff1Sjsg case IP_VERSION(13, 0, 2):
65*f005ef32Sjsg case IP_VERSION(13, 0, 6):
665ca02815Sjsg ret = aldebaran_reset_fini(adev);
675ca02815Sjsg break;
681bb76ff1Sjsg case IP_VERSION(11, 0, 7):
691bb76ff1Sjsg ret = sienna_cichlid_reset_fini(adev);
701bb76ff1Sjsg break;
71*f005ef32Sjsg case IP_VERSION(13, 0, 10):
72*f005ef32Sjsg ret = smu_v13_0_10_reset_fini(adev);
73*f005ef32Sjsg break;
745ca02815Sjsg default:
755ca02815Sjsg break;
765ca02815Sjsg }
775ca02815Sjsg
785ca02815Sjsg return ret;
795ca02815Sjsg }
805ca02815Sjsg
amdgpu_reset_prepare_hwcontext(struct amdgpu_device * adev,struct amdgpu_reset_context * reset_context)815ca02815Sjsg int amdgpu_reset_prepare_hwcontext(struct amdgpu_device *adev,
825ca02815Sjsg struct amdgpu_reset_context *reset_context)
835ca02815Sjsg {
845ca02815Sjsg struct amdgpu_reset_handler *reset_handler = NULL;
855ca02815Sjsg
865ca02815Sjsg if (adev->reset_cntl && adev->reset_cntl->get_reset_handler)
875ca02815Sjsg reset_handler = adev->reset_cntl->get_reset_handler(
885ca02815Sjsg adev->reset_cntl, reset_context);
895ca02815Sjsg if (!reset_handler)
90*f005ef32Sjsg return -EOPNOTSUPP;
915ca02815Sjsg
925ca02815Sjsg return reset_handler->prepare_hwcontext(adev->reset_cntl,
935ca02815Sjsg reset_context);
945ca02815Sjsg }
955ca02815Sjsg
amdgpu_reset_perform_reset(struct amdgpu_device * adev,struct amdgpu_reset_context * reset_context)965ca02815Sjsg int amdgpu_reset_perform_reset(struct amdgpu_device *adev,
975ca02815Sjsg struct amdgpu_reset_context *reset_context)
985ca02815Sjsg {
995ca02815Sjsg int ret;
1005ca02815Sjsg struct amdgpu_reset_handler *reset_handler = NULL;
1015ca02815Sjsg
1025ca02815Sjsg if (adev->reset_cntl)
1035ca02815Sjsg reset_handler = adev->reset_cntl->get_reset_handler(
1045ca02815Sjsg adev->reset_cntl, reset_context);
1055ca02815Sjsg if (!reset_handler)
106*f005ef32Sjsg return -EOPNOTSUPP;
1075ca02815Sjsg
1085ca02815Sjsg ret = reset_handler->perform_reset(adev->reset_cntl, reset_context);
1095ca02815Sjsg if (ret)
1105ca02815Sjsg return ret;
1115ca02815Sjsg
1125ca02815Sjsg return reset_handler->restore_hwcontext(adev->reset_cntl,
1135ca02815Sjsg reset_context);
1145ca02815Sjsg }
1151bb76ff1Sjsg
1161bb76ff1Sjsg
amdgpu_reset_destroy_reset_domain(struct kref * ref)1171bb76ff1Sjsg void amdgpu_reset_destroy_reset_domain(struct kref *ref)
1181bb76ff1Sjsg {
1191bb76ff1Sjsg struct amdgpu_reset_domain *reset_domain = container_of(ref,
1201bb76ff1Sjsg struct amdgpu_reset_domain,
1211bb76ff1Sjsg refcount);
1221bb76ff1Sjsg if (reset_domain->wq)
1231bb76ff1Sjsg destroy_workqueue(reset_domain->wq);
1241bb76ff1Sjsg
1251bb76ff1Sjsg kvfree(reset_domain);
1261bb76ff1Sjsg }
1271bb76ff1Sjsg
amdgpu_reset_create_reset_domain(enum amdgpu_reset_domain_type type,char * wq_name)1281bb76ff1Sjsg struct amdgpu_reset_domain *amdgpu_reset_create_reset_domain(enum amdgpu_reset_domain_type type,
1291bb76ff1Sjsg char *wq_name)
1301bb76ff1Sjsg {
1311bb76ff1Sjsg struct amdgpu_reset_domain *reset_domain;
1321bb76ff1Sjsg
1331bb76ff1Sjsg reset_domain = kvzalloc(sizeof(struct amdgpu_reset_domain), GFP_KERNEL);
1341bb76ff1Sjsg if (!reset_domain) {
1351bb76ff1Sjsg DRM_ERROR("Failed to allocate amdgpu_reset_domain!");
1361bb76ff1Sjsg return NULL;
1371bb76ff1Sjsg }
1381bb76ff1Sjsg
1391bb76ff1Sjsg reset_domain->type = type;
1401bb76ff1Sjsg kref_init(&reset_domain->refcount);
1411bb76ff1Sjsg
1421bb76ff1Sjsg reset_domain->wq = create_singlethread_workqueue(wq_name);
1431bb76ff1Sjsg if (!reset_domain->wq) {
1441bb76ff1Sjsg DRM_ERROR("Failed to allocate wq for amdgpu_reset_domain!");
1451bb76ff1Sjsg amdgpu_reset_put_reset_domain(reset_domain);
1461bb76ff1Sjsg return NULL;
1471bb76ff1Sjsg
1481bb76ff1Sjsg }
1491bb76ff1Sjsg
1501bb76ff1Sjsg atomic_set(&reset_domain->in_gpu_reset, 0);
1511bb76ff1Sjsg atomic_set(&reset_domain->reset_res, 0);
1521bb76ff1Sjsg rw_init(&reset_domain->sem, "agrs");
1531bb76ff1Sjsg
1541bb76ff1Sjsg return reset_domain;
1551bb76ff1Sjsg }
1561bb76ff1Sjsg
amdgpu_device_lock_reset_domain(struct amdgpu_reset_domain * reset_domain)1571bb76ff1Sjsg void amdgpu_device_lock_reset_domain(struct amdgpu_reset_domain *reset_domain)
1581bb76ff1Sjsg {
1591bb76ff1Sjsg atomic_set(&reset_domain->in_gpu_reset, 1);
1601bb76ff1Sjsg down_write(&reset_domain->sem);
1611bb76ff1Sjsg }
1621bb76ff1Sjsg
1631bb76ff1Sjsg
amdgpu_device_unlock_reset_domain(struct amdgpu_reset_domain * reset_domain)1641bb76ff1Sjsg void amdgpu_device_unlock_reset_domain(struct amdgpu_reset_domain *reset_domain)
1651bb76ff1Sjsg {
1661bb76ff1Sjsg atomic_set(&reset_domain->in_gpu_reset, 0);
1671bb76ff1Sjsg up_write(&reset_domain->sem);
1681bb76ff1Sjsg }
1691bb76ff1Sjsg
1701bb76ff1Sjsg
1711bb76ff1Sjsg
172