You are not logged in.
Pages: 1
Hello, my GPU disconnects whenever I run a graphically intensive game on it. This issue started around 4 months ago; before that, heavy games weren't an issue. I am using a GTX 1650 (TU117M) with the standard Linux kernel (linux) and the nvidia-open drivers. After checking dmesg, I see the following repeatedly:
[11932.168106] NVRM: nvAssertFailedNoLog: Assertion failed: (status == NV_OK) || (status == NV_ERR_GPU_IN_FULLCHIP_RESET) @ rs_server.c:1375
[11933.185932] NVRM: GPU0 nvAssertFailedNoLog: Assertion failed: (status == NV_OK) || (status == NV_ERR_GPU_IN_FULLCHIP_RESET) @ mem.c:178
[11933.186119] NVRM: GPU0 nvAssertFailedNoLog: Assertion failed: (status == NV_OK) || (status == NV_ERR_GPU_IN_FULLCHIP_RESET) @ mem.c:178
[11933.186263] NVRM: GPU0 nvAssertFailedNoLog: Assertion failed: (status == NV_OK) || (status == NV_ERR_GPU_IN_FULLCHIP_RESET) @ vaspace_api.c:573
[11933.186281] NVRM: GPU0 nvAssertFailedNoLog: Assertion failed: (status == NV_OK) || (status == NV_ERR_GPU_IN_FULLCHIP_RESET) @ mem.c:178
[11933.186375] NVRM: GPU0 nvAssertFailedNoLog: Assertion failed: (status == NV_OK) || (status == NV_ERR_GPU_IN_FULLCHIP_RESET) @ rs_client.c:844
[11933.186382] NVRM: nvAssertFailedNoLog: Assertion failed: (status == NV_OK) || (status == NV_ERR_GPU_IN_FULLCHIP_RESET) @ rs_server.c:259
[11933.186387] NVRM: nvAssertFailedNoLog: Assertion failed: (status == NV_OK) || (status == NV_ERR_GPU_IN_FULLCHIP_RESET) @ rs_server.c:1375
[11933.186672] NVRM: GPU0 nvAssertFailedNoLog: Assertion failed: (status == NV_OK) || (status == NV_ERR_GPU_IN_FULLCHIP_RESET) @ mem.c:178
[11933.186687] NVRM: GPU0 nvAssertFailedNoLog: Assertion failed: (status == NV_OK) || (status == NV_ERR_GPU_IN_FULLCHIP_RESET) @ vaspace_api.c:573
[11933.186989] ------------[ cut here ]------------
[11933.186992] WARNING: CPU: 6 PID: 11060 at nvidia/nv.c:5213 nvidia_dev_put+0xa4/0xb0 [nvidia]
[11933.187302] Modules linked in: ccm snd_seq_dummy snd_hrtimer rfcomm snd_seq snd_seq_device uhid cmac algif_hash algif_skcipher af_alg snd_ctl_led snd_soc_skl_hda_dsp snd_soc_intel_sof_board_helpers snd_soc_intel_hda_dsp_common snd_sof_probes snd_hda_codec_intelhdmi bnep snd_soc_dmic snd_hda_codec_alc269 snd_hda_intel snd_hda_scodec_component snd_hda_codec_realtek_lib snd_hda_codec_generic snd_sof_pci_intel_tgl snd_sof_pci_intel_cnl xe snd_sof_intel_hda_generic soundwire_intel snd_sof_intel_hda_sdw_bpt snd_sof_intel_hda_common snd_soc_hdac_hda snd_sof_intel_hda_mlink snd_sof_intel_hda snd_hda_codec_hdmi drm_gpuvm drm_gpusvm_helper soundwire_cadence gpu_sched snd_sof_pci snd_sof_xtensa_dsp drm_exec drm_suballoc_helper snd_sof snd_sof_utils snd_soc_acpi_intel_match snd_soc_acpi_intel_sdca_quirks soundwire_generic_allocation snd_soc_acpi soundwire_bus intel_uncore_frequency snd_soc_sdca intel_uncore_frequency_common crc8 snd_soc_avs uvcvideo snd_soc_hda_codec x86_pkg_temp_thermal snd_hda_ext_core intel_powerclamp
[11933.187387] videobuf2_vmalloc btusb uvc iwlmvm coretemp snd_hda_codec btmtk videobuf2_memops videobuf2_v4l2 mousedev btrtl snd_hda_core videobuf2_common mac80211 btbcm snd_intel_dspcfg iTCO_wdt kvm_intel videodev btintel snd_intel_sdw_acpi vfat intel_pmc_bxt ptp bluetooth joydev mc fat hid_multitouch intel_rapl_msr mei_hdcp mei_pxp ee1004 iTCO_vendor_support snd_hwdep kvm i915 pps_core snd_soc_core processor_thermal_device_pci_legacy libarc4 irqbypass processor_thermal_device snd_compress polyval_clmulni processor_thermal_wt_hint ac97_bus ghash_clmulni_intel platform_temperature_control lenovo_wmi_gamezone processor_thermal_soc_slider snd_pcm_dmaengine aesni_intel lenovo_wmi_other r8169 lenovo_wmi_helpers processor_thermal_rfim iwlwifi realtek processor_thermal_rapl lenovo_wmi_capdata01 snd_pcm drm_buddy spi_nor intel_rapl_common mdio_devres rapl i2c_algo_bit intel_cstate snd_timer libphy lenovo_wmi_events intel_uncore firmware_attributes_class lenovo_wmi_hotkey_utilities mtd wmi_bmof processor_thermal_wt_req pcspkr
[11933.187477] mei_me i2c_i801 i2c_hid_acpi drm_display_helper mdio_bus i2c_smbus snd processor_thermal_power_floor cfg80211 i2c_hid processor_thermal_mbox cec soundcore mei i2c_mux intel_gtt intel_soc_dts_iosf igen6_edac intel_pmc_core elants_i2c ideapad_laptop pmt_telemetry platform_profile pmt_discovery intel_oc_wdt rfkill pmt_class intel_pmc_ssram_telemetry int3400_thermal intel_hid int3403_thermal acpi_thermal_rel intel_vsec sparse_keymap pinctrl_tigerlake int340x_thermal_zone acpi_pad mac_hid ip6t_REJECT nf_reject_ipv6 xt_hl ip6t_rt ipt_REJECT nf_reject_ipv4 xt_LOG nf_log_syslog xt_multiport xt_recent xt_comment xt_limit xt_addrtype xt_tcpudp xt_conntrack nf_conntrack nf_defrag_ipv6 nf_defrag_ipv4 ip6table_filter ip6_tables iptable_filter ip_tables x_tables sg i2c_dev ntsync crypto_user nfnetlink nvidia_drm(OE) nvme nvme_core nvidia_modeset(OE) nvidia_uvm(OE) intel_lpss_pci nvme_keyring intel_lpss spi_intel_pci nvme_auth spi_intel hkdf idma64 serio_raw nvidia(OE) video drm_ttm_helper wmi ttm acpi_call(OE)
[11933.187570] CPU: 6 UID: 1000 PID: 11060 Comm: explorer.exe Tainted: G W OE 6.18.9-arch1-2 #1 PREEMPT(full) acc0345693780c55f83aaf9a0c9efd10d8da358f
[11933.187578] Tainted: [W]=WARN, [O]=OOT_MODULE, [E]=UNSIGNED_MODULE
[11933.187580] Hardware name: LENOVO 82K1/LNVNB161216, BIOS H4CN37WW(V2.06) 06/18/2024
[11933.187583] RIP: 0010:nvidia_dev_put+0xa4/0xb0 [nvidia]
[11933.187821] Code: 89 de 4c 89 e7 e8 2c bd 14 00 85 c0 75 1c 5b 48 89 ef 5d 41 5c e9 dc fa 9b da 5b 48 c7 c7 c0 85 83 c0 5d 41 5c e9 cc fa 9b da <0f> 0b eb e0 0f 1f 84 00 00 00 00 00 90 90 90 90 90 90 90 90 90 90
[11933.187824] RSP: 0018:ffffcf6a46cabc88 EFLAGS: 00010202
[11933.187829] RAX: 0000000000000026 RBX: ffff8db612128000 RCX: 0000000000000000
[11933.187831] RDX: ffffcf6a46cabc08 RSI: 0000000000000296 RDI: ffffcf6a46cabbc8
[11933.187834] RBP: ffff8db612128720 R08: 0000000000000000 R09: 0000000000000000
[11933.187836] R10: ffffcf6a46cabc30 R11: ffff8db600042200 R12: 0000000000000000
[11933.187838] R13: ffffffffc0838720 R14: ffff8db600697f00 R15: 0000000000000000
[11933.187840] FS: 00007fb6c10cbb80(0000) GS:ffff8dba02a6f000(0000) knlGS:000000007ffc0000
[11933.187844] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[11933.187846] CR2: 00007fb6be1b8000 CR3: 0000000266bdc005 CR4: 0000000000f72ef0
[11933.187849] PKRU: 55555554
[11933.187851] Call Trace:
[11933.187855] <TASK>
[11933.187859] nvidia_close+0x182/0x270 [nvidia c668d9d83bb24b5e78745b61fca0ad75dbe168ac]
[11933.188080] __fput+0xe6/0x2a0
[11933.188088] __x64_sys_close+0x3d/0x80
[11933.188092] do_syscall_64+0x81/0x7f0
[11933.188098] ? __slab_free+0xe4/0x310
[11933.188104] ? kmem_cache_free+0x521/0x5d0
[11933.188108] ? __x64_sys_close+0x3d/0x80
[11933.188111] ? __x64_sys_close+0x3d/0x80
[11933.188114] ? do_syscall_64+0x81/0x7f0
[11933.188117] ? kmem_cache_free+0x521/0x5d0
[11933.188120] ? __x64_sys_close+0x3d/0x80
[11933.188123] ? __x64_sys_close+0x3d/0x80
[11933.188125] ? do_syscall_64+0x81/0x7f0
[11933.188128] ? clear_bhb_loop+0x50/0xa0
[11933.188134] ? clear_bhb_loop+0x50/0xa0
[11933.188137] ? clear_bhb_loop+0x50/0xa0
[11933.188141] entry_SYSCALL_64_after_hwframe+0x76/0x7e
[11933.188145] RIP: 0033:0x7fb6c116bf32
[11933.188191] Code: 08 0f 85 c1 43 ff ff 49 89 fb 48 89 f0 48 89 d7 48 89 ce 4c 89 c2 4d 89 ca 4c 8b 44 24 08 4c 8b 4c 24 10 4c 89 5c 24 08 0f 05 <c3> 66 2e 0f 1f 84 00 00 00 00 00 0f 1f 00 f3 0f 1e fa 55 bf 01 00
[11933.188194] RSP: 002b:00000001000fefc8 EFLAGS: 00000246 ORIG_RAX: 0000000000000003
[11933.188199] RAX: ffffffffffffffda RBX: 0000555588f43970 RCX: 00007fb6c116bf32
[11933.188201] RDX: 0000000000000000 RSI: 0000000000000000 RDI: 0000000000000011
[11933.188203] RBP: 00000001000feff0 R08: 0000000000000000 R09: 0000000000000000
[11933.188205] R10: 0000000000000000 R11: 0000000000000246 R12: 0000555588fcccc8
[11933.188207] R13: 0000000000002b34 R14: 00007fb6be079cf0 R15: 00007fb6bc843770
[11933.188213] </TASK>
[11933.188214] ---[ end trace 0000000000000000 ]---
[11933.188346] NVRM: GPU0 nvAssertFailedNoLog: Assertion failed: (status == NV_OK) || (status == NV_ERR_GPU_IN_FULLCHIP_RESET) @ vaspace_api.c:573
[11933.190887] ------------[ cut here ]------------
[11933.190890] WARNING: CPU: 6 PID: 11060 at nvidia/nv.c:5213 nvidia_dev_put+0xa4/0xb0 [nvidia]
[11933.191031] Modules linked in: ccm snd_seq_dummy snd_hrtimer rfcomm snd_seq snd_seq_device uhid cmac algif_hash algif_skcipher af_alg snd_ctl_led snd_soc_skl_hda_dsp snd_soc_intel_sof_board_helpers snd_soc_intel_hda_dsp_common snd_sof_probes snd_hda_codec_intelhdmi bnep snd_soc_dmic snd_hda_codec_alc269 snd_hda_intel snd_hda_scodec_component snd_hda_codec_realtek_lib snd_hda_codec_generic snd_sof_pci_intel_tgl snd_sof_pci_intel_cnl xe snd_sof_intel_hda_generic soundwire_intel snd_sof_intel_hda_sdw_bpt snd_sof_intel_hda_common snd_soc_hdac_hda snd_sof_intel_hda_mlink snd_sof_intel_hda snd_hda_codec_hdmi drm_gpuvm drm_gpusvm_helper soundwire_cadence gpu_sched snd_sof_pci snd_sof_xtensa_dsp drm_exec drm_suballoc_helper snd_sof snd_sof_utils snd_soc_acpi_intel_match snd_soc_acpi_intel_sdca_quirks soundwire_generic_allocation snd_soc_acpi soundwire_bus intel_uncore_frequency snd_soc_sdca intel_uncore_frequency_common crc8 snd_soc_avs uvcvideo snd_soc_hda_codec x86_pkg_temp_thermal snd_hda_ext_core intel_powerclamp
[11933.191063] videobuf2_vmalloc btusb uvc iwlmvm coretemp snd_hda_codec btmtk videobuf2_memops videobuf2_v4l2 mousedev btrtl snd_hda_core videobuf2_common mac80211 btbcm snd_intel_dspcfg iTCO_wdt kvm_intel videodev btintel snd_intel_sdw_acpi vfat intel_pmc_bxt ptp bluetooth joydev mc fat hid_multitouch intel_rapl_msr mei_hdcp mei_pxp ee1004 iTCO_vendor_support snd_hwdep kvm i915 pps_core snd_soc_core processor_thermal_device_pci_legacy libarc4 irqbypass processor_thermal_device snd_compress polyval_clmulni processor_thermal_wt_hint ac97_bus ghash_clmulni_intel platform_temperature_control lenovo_wmi_gamezone processor_thermal_soc_slider snd_pcm_dmaengine aesni_intel lenovo_wmi_other r8169 lenovo_wmi_helpers processor_thermal_rfim iwlwifi realtek processor_thermal_rapl lenovo_wmi_capdata01 snd_pcm drm_buddy spi_nor intel_rapl_common mdio_devres rapl i2c_algo_bit intel_cstate snd_timer libphy lenovo_wmi_events intel_uncore firmware_attributes_class lenovo_wmi_hotkey_utilities mtd wmi_bmof processor_thermal_wt_req pcspkr
[11933.191107] mei_me i2c_i801 i2c_hid_acpi drm_display_helper mdio_bus i2c_smbus snd processor_thermal_power_floor cfg80211 i2c_hid processor_thermal_mbox cec soundcore mei i2c_mux intel_gtt intel_soc_dts_iosf igen6_edac intel_pmc_core elants_i2c ideapad_laptop pmt_telemetry platform_profile pmt_discovery intel_oc_wdt rfkill pmt_class intel_pmc_ssram_telemetry int3400_thermal intel_hid int3403_thermal acpi_thermal_rel intel_vsec sparse_keymap pinctrl_tigerlake int340x_thermal_zone acpi_pad mac_hid ip6t_REJECT nf_reject_ipv6 xt_hl ip6t_rt ipt_REJECT nf_reject_ipv4 xt_LOG nf_log_syslog xt_multiport xt_recent xt_comment xt_limit xt_addrtype xt_tcpudp xt_conntrack nf_conntrack nf_defrag_ipv6 nf_defrag_ipv4 ip6table_filter ip6_tables iptable_filter ip_tables x_tables sg i2c_dev ntsync crypto_user nfnetlink nvidia_drm(OE) nvme nvme_core nvidia_modeset(OE) nvidia_uvm(OE) intel_lpss_pci nvme_keyring intel_lpss spi_intel_pci nvme_auth spi_intel hkdf idma64 serio_raw nvidia(OE) video drm_ttm_helper wmi ttm acpi_call(OE)
[11933.191154] CPU: 6 UID: 1000 PID: 11060 Comm: explorer.exe Tainted: G W OE 6.18.9-arch1-2 #1 PREEMPT(full) acc0345693780c55f83aaf9a0c9efd10d8da358f
[11933.191158] Tainted: [W]=WARN, [O]=OOT_MODULE, [E]=UNSIGNED_MODULE
[11933.191159] Hardware name: LENOVO 82K1/LNVNB161216, BIOS H4CN37WW(V2.06) 06/18/2024
[11933.191160] RIP: 0010:nvidia_dev_put+0xa4/0xb0 [nvidia]
[11933.191274] Code: 89 de 4c 89 e7 e8 2c bd 14 00 85 c0 75 1c 5b 48 89 ef 5d 41 5c e9 dc fa 9b da 5b 48 c7 c7 c0 85 83 c0 5d 41 5c e9 cc fa 9b da <0f> 0b eb e0 0f 1f 84 00 00 00 00 00 90 90 90 90 90 90 90 90 90 90
[11933.191275] RSP: 0018:ffffcf6a46cabcc0 EFLAGS: 00010202
[11933.191277] RAX: 0000000000000026 RBX: ffff8db612128000 RCX: 0000000000000000
[11933.191278] RDX: ffffcf6a46cabc40 RSI: 0000000000000282 RDI: ffffcf6a46cabc00
[11933.191279] RBP: ffff8db612128720 R08: 0000000000000000 R09: 0000000000000000
[11933.191280] R10: ffffcf6a46cabc68 R11: ffff8db600042200 R12: 0000000000000000
[11933.191281] R13: ffffffffc0838720 R14: ffff8db600697f00 R15: 0000000000000000
[11933.191282] FS: 0000000000000000(0000) GS:ffff8dba02a6f000(0000) knlGS:0000000000000000
[11933.191284] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[11933.191285] CR2: 00007fb6c0788fc8 CR3: 000000010414b006 CR4: 0000000000f72ef0
[11933.191286] PKRU: 55555554
[11933.191287] Call Trace:
[11933.191289] <TASK>
[11933.191291] nvidia_close+0x182/0x270 [nvidia c668d9d83bb24b5e78745b61fca0ad75dbe168ac]
[11933.191413] __fput+0xe6/0x2a0
[11933.191417] task_work_run+0x5d/0x90
[11933.191422] do_exit+0x299/0xa90
[11933.191427] do_group_exit+0x2d/0xc0
[11933.191430] __x64_sys_exit_group+0x18/0x20
[11933.191433] x64_sys_call+0x14fa/0x1500
[11933.191437] do_syscall_64+0x81/0x7f0
[11933.191440] ? count_memcg_events+0xc2/0x190
[11933.191444] ? handle_mm_fault+0x1d7/0x2d0
[11933.191447] ? do_user_addr_fault+0x21a/0x690
[11933.191451] ? clear_bhb_loop+0x50/0xa0
[11933.191454] ? clear_bhb_loop+0x50/0xa0
[11933.191455] ? clear_bhb_loop+0x50/0xa0
[11933.191457] entry_SYSCALL_64_after_hwframe+0x76/0x7e
[11933.191460] RIP: 0033:0x7fb6c11b1928
[11933.191486] Code: Unable to access opcode bytes at 0x7fb6c11b18fe.
[11933.191487] RSP: 002b:00000001000ff468 EFLAGS: 00000202 ORIG_RAX: 00000000000000e7
[11933.191489] RAX: ffffffffffffffda RBX: 00007fb6c12b5f88 RCX: 00007fb6c11b1928
[11933.191490] RDX: 00007fb6c10cbe88 RSI: ffffffffffffffb0 RDI: 0000000000000000
[11933.191491] RBP: 00000001000ff4c0 R08: 0000000000000000 R09: 0000000000000000
[11933.191492] R10: 0000000000000008 R11: 0000000000000202 R12: 0000000000000a29
[11933.191493] R13: 0000000000000000 R14: 00007fb6c12b4680 R15: 00007fb6c12b5fa0
[11933.191495] </TASK>
[11933.191496] ---[ end trace 0000000000000000 ]---
Looking at lspci -k, I can see:
02:00.0 3D controller: NVIDIA Corporation TU117M [GeForce GTX 1650 Mobile / Max-Q] (rev a1)
Subsystem: Lenovo Device 3a5b
Kernel driver in use: nvidia
Kernel modules: nouveau, nvidia_drm, nvidia
These are my current modprobe parameters (I got them from DeepSeek while trying to fix the issue):
# Disable GSP firmware (fixes most VA space issues on Turing)
options nvidia NVreg_EnableGpuFirmware=0
# Improve VA space management
options nvidia NVreg_UsePageTableDirectories=1
# Increase VA space allocation size
options nvidia NVreg_RegistryDwords="RMUsePageTableDirectories=1; RMUseFbForMappings=0x2"
# Stabilize PCIe communication
options nvidia NVreg_EnablePCIeGen3=0
# Prevent power management from disrupting mappings
options nvidia NVreg_DynamicPowerManagement=0x00
# UVM specific tweaks
options nvidia_uvm uvm_perf_mode=1 uvm_enable_faults=0
Last edited by obkt (2026-02-22 22:04:15)
Offline
Pages: 1