Re: [Intel-gfx] [PATCH v2] drm/i915: dell wyse 3040 shutdown fix
From: Alexey Lukyachuk
Date: Mon Jan 02 2023 - 09:03:35 EST
On Tue, 27 Dec 2022 20:40:03 +0300
Alexey Lukyachuk <skif@xxxxxxxxxxx> wrote:
> On Tue, 27 Dec 2022 11:39:25 -0500
> Rodrigo Vivi <rodrigo.vivi@xxxxxxxxx> wrote:
>
> > On Sun, Dec 25, 2022 at 09:55:08PM +0300, Alexey Lukyanchuk wrote:
> > > > Dell Wyse 3040 doesn't perform poweroff properly, but instead remains in
> > > > the powered-on state.
> >
> > okay, the motivation is explained in the commit msg..
> >
> > > > The additional mutex_lock and
> > > > intel_crtc_wait_for_next_vblank
> > > > calls from the 6.2 kernel resolve this problem.
> >
> > but this why is not very clear... seems that by magic it was found,
> > without explaining what race we are really protecting here.
> >
> > but even worse is:
> > what about those many random vblank waits in the code? what's the
> > reasoning?
> >
> > >
> > > cc: stable@xxxxxxxxxxxxxxx
> > > original commit Link: https://patchwork.freedesktop.org/patch/508926/
> > > fixes: fe0f1e3bfdfeb53e18f1206aea4f40b9bd1f291c
> > > Signed-off-by: Alexey Lukyanchuk <skif@xxxxxxxxxxx>
> > > ---
> > > I got some troubles with this device (dell wyse 3040) since kernel 5.11
> > > started to use i915_driver_shutdown function. I found solution here:
> > >
> > > https://lore.kernel.org/dri-devel/Y1wd6ZJ8LdJpCfZL@xxxxxxxxx/#r
> > >
> > > ---
> > > drivers/gpu/drm/i915/display/intel_audio.c | 37 +++++++++++++++-------
> > > 1 file changed, 25 insertions(+), 12 deletions(-)
> > >
> > > diff --git a/drivers/gpu/drm/i915/display/intel_audio.c b/drivers/gpu/drm/i915/display/intel_audio.c
> > > index aacbc6da8..44344ecdf 100644
> > > --- a/drivers/gpu/drm/i915/display/intel_audio.c
> > > +++ b/drivers/gpu/drm/i915/display/intel_audio.c
> > > @@ -336,6 +336,7 @@ static void g4x_audio_codec_disable(struct intel_encoder *encoder,
> > > const struct drm_connector_state *old_conn_state)
> > > {
> > > struct drm_i915_private *dev_priv = to_i915(encoder->base.dev);
> > > + struct intel_crtc *crtc = to_intel_crtc(old_crtc_state->uapi.crtc);
> > > u32 eldv, tmp;
> > >
> > > tmp = intel_de_read(dev_priv, G4X_AUD_VID_DID);
> > > @@ -348,6 +349,9 @@ static void g4x_audio_codec_disable(struct intel_encoder *encoder,
> > > tmp = intel_de_read(dev_priv, G4X_AUD_CNTL_ST);
> > > tmp &= ~eldv;
> > > intel_de_write(dev_priv, G4X_AUD_CNTL_ST, tmp);
> > > +
> > > + intel_crtc_wait_for_next_vblank(crtc);
> > > + intel_crtc_wait_for_next_vblank(crtc);
> > > }
> > >
> > > static void g4x_audio_codec_enable(struct intel_encoder *encoder,
> > > @@ -355,12 +359,15 @@ static void g4x_audio_codec_enable(struct intel_encoder *encoder,
> > > const struct drm_connector_state *conn_state)
> > > {
> > > struct drm_i915_private *dev_priv = to_i915(encoder->base.dev);
> > > + struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
> > > struct drm_connector *connector = conn_state->connector;
> > > const u8 *eld = connector->eld;
> > > u32 eldv;
> > > u32 tmp;
> > > int len, i;
> > >
> > > + intel_crtc_wait_for_next_vblank(crtc);
> > > +
> > > tmp = intel_de_read(dev_priv, G4X_AUD_VID_DID);
> > > if (tmp == INTEL_AUDIO_DEVBLC || tmp == INTEL_AUDIO_DEVCL)
> > > eldv = G4X_ELDV_DEVCL_DEVBLC;
> > > @@ -493,6 +500,7 @@ static void hsw_audio_codec_disable(struct intel_encoder *encoder,
> > > const struct drm_connector_state *old_conn_state)
> > > {
> > > struct drm_i915_private *dev_priv = to_i915(encoder->base.dev);
> > > + struct intel_crtc *crtc = to_intel_crtc(old_crtc_state->uapi.crtc);
> > > enum transcoder cpu_transcoder = old_crtc_state->cpu_transcoder;
> > > u32 tmp;
> > >
> > > @@ -508,6 +516,10 @@ static void hsw_audio_codec_disable(struct intel_encoder *encoder,
> > > tmp |= AUD_CONFIG_N_VALUE_INDEX;
> > > intel_de_write(dev_priv, HSW_AUD_CFG(cpu_transcoder), tmp);
> > >
> > > +
> > > + intel_crtc_wait_for_next_vblank(crtc);
> > > + intel_crtc_wait_for_next_vblank(crtc);
> > > +
> > > /* Invalidate ELD */
> > > tmp = intel_de_read(dev_priv, HSW_AUD_PIN_ELD_CP_VLD);
> > > tmp &= ~AUDIO_ELD_VALID(cpu_transcoder);
> > > @@ -633,6 +645,7 @@ static void hsw_audio_codec_enable(struct intel_encoder *encoder,
> > > const struct drm_connector_state *conn_state)
> > > {
> > > struct drm_i915_private *dev_priv = to_i915(encoder->base.dev);
> > > + struct intel_crtc *crtc = to_intel_crtc(crtc_state->uapi.crtc);
> > > struct drm_connector *connector = conn_state->connector;
> > > enum transcoder cpu_transcoder = crtc_state->cpu_transcoder;
> > > const u8 *eld = connector->eld;
> > > @@ -651,12 +664,7 @@ static void hsw_audio_codec_enable(struct intel_encoder *encoder,
> > > tmp &= ~AUDIO_ELD_VALID(cpu_transcoder);
> > > intel_de_write(dev_priv, HSW_AUD_PIN_ELD_CP_VLD, tmp);
> > >
> > > - /*
> > > - * FIXME: We're supposed to wait for vblank here, but we have vblanks
> > > - * disabled during the mode set. The proper fix would be to push the
> > > - * rest of the setup into a vblank work item, queued here, but the
> > > - * infrastructure is not there yet.
> > > - */
> > > + intel_crtc_wait_for_next_vblank(crtc);
> > >
> > > /* Reset ELD write address */
> > > tmp = intel_de_read(dev_priv, HSW_AUD_DIP_ELD_CTRL(cpu_transcoder));
> > > @@ -705,6 +713,8 @@ static void ilk_audio_codec_disable(struct intel_encoder *encoder,
> > > aud_cntrl_st2 = CPT_AUD_CNTRL_ST2;
> > > }
> > >
> > > + mutex_lock(&dev_priv->display.audio.mutex);
> > > +
> > > /* Disable timestamps */
> > > tmp = intel_de_read(dev_priv, aud_config);
> > > tmp &= ~AUD_CONFIG_N_VALUE_INDEX;
> > > @@ -721,6 +731,10 @@ static void ilk_audio_codec_disable(struct intel_encoder *encoder,
> > > tmp = intel_de_read(dev_priv, aud_cntrl_st2);
> > > tmp &= ~eldv;
> > > intel_de_write(dev_priv, aud_cntrl_st2, tmp);
> > > + mutex_unlock(&dev_priv->display.audio.mutex);
> > > +
> > > + intel_crtc_wait_for_next_vblank(crtc);
> > > + intel_crtc_wait_for_next_vblank(crtc);
> > > }
> > >
> > > static void ilk_audio_codec_enable(struct intel_encoder *encoder,
> > > @@ -740,12 +754,7 @@ static void ilk_audio_codec_enable(struct intel_encoder *encoder,
> > > if (drm_WARN_ON(&dev_priv->drm, port == PORT_A))
> > > return;
> > >
> > > - /*
> > > - * FIXME: We're supposed to wait for vblank here, but we have vblanks
> > > - * disabled during the mode set. The proper fix would be to push the
> > > - * rest of the setup into a vblank work item, queued here, but the
> > > - * infrastructure is not there yet.
> > > - */
> > > + intel_crtc_wait_for_next_vblank(crtc);
> > >
> > > if (HAS_PCH_IBX(dev_priv)) {
> > > hdmiw_hdmiedid = IBX_HDMIW_HDMIEDID(pipe);
> > > @@ -767,6 +776,8 @@ static void ilk_audio_codec_enable(struct intel_encoder *encoder,
> > >
> > > eldv = IBX_ELD_VALID(port);
> > >
> > > + mutex_lock(&dev_priv->display.audio.mutex);
> > > +
> > > /* Invalidate ELD */
> > > tmp = intel_de_read(dev_priv, aud_cntrl_st2);
> > > tmp &= ~eldv;
> > > @@ -798,6 +809,8 @@ static void ilk_audio_codec_enable(struct intel_encoder *encoder,
> > > else
> > > tmp |= audio_config_hdmi_pixel_clock(crtc_state);
> > > intel_de_write(dev_priv, aud_config, tmp);
> > > +
> > > + mutex_unlock(&dev_priv->display.audio.mutex);
> > > }
> > >
> > > /**
> > > --
> > > 2.25.1
> > >
>
>
> I would like to point out that this solution was found in the drm-tip repository:
> link: git://anongit.freedesktop.org/drm-tip
> I will quote the original commit message from Ville Syrjälä
> <ville.syrjala@xxxxxxxxxxxxxxx>: "The spec tells us to do a bunch of
> vblank waits in the audio enable/disable sequences. Make it so."
> So it's just a backport of an accepted patch,
> which I want to propagate to the stable versions.
Yes, I have checked 6.2-rc2 and everything works fine. I want to backport
this commit to 6.0 and 6.1 because my company is going to use these versions.
It may also be useful for 5.15, since companies and vendors care a lot about
LTS kernels (I am ready to make a special version of this patch for 5.15,
because hunk 3 will fail to apply there).
I fully agree with you that the trouble is in the timing/locking changes.
Early in the debugging process I added some sleeps, and they helped, but not reliably.
Regarding your question about fdo gitlab: I started to file a bug there. In the process
("Before filing the bug, please try to reproduce your issue with the latest
kernel. Use the latest drm-tip branch") I found that the trouble is resolved.
Using bisect and tests, I found the commit that fixes it.
I am also attaching a log (captured via netconsole) from the 5.15 kernel:
[ 60.031680] ------------[ cut here ]------------
[ 60.031709] i915 0000:00:02.0: drm_WARN_ON(!intel_irqs_enabled(dev_priv))
[ 60.031766] WARNING: CPU: 1 PID: 1964 at drivers/gpu/drm/i915/i915_irq.c:527 i915_enable_pipestat+0x1b9/0x230 [i915]
[ 60.032016] Modules linked in: snd_soc_sst_cht_bsw_rt5672 snd_hdmi_lpe_audio mei_hdcp intel_rapl_msr intel_powerclamp coretemp kvm_intel kvm punit_atom_debug crct10dif_pclmul ghash_clmulni_intel joydev input_leds aesni_intel crypto_simd cryptd snd_sof_acpi_intel_byt intel_cstate snd_sof_intel_ipc snd_sof_acpi snd_sof_intel_atom dell_wmi snd_sof_xtensa_dsp snd_sof dell_smbios ledtrig_audio dcdbas snd_intel_sst_acpi nls_iso8859_1 snd_soc_acpi_intel_match sparse_keymap snd_soc_acpi i915 efi_pstore snd_intel_sst_core wmi_bmof dell_wmi_descriptor snd_soc_sst_atom_hifi2_platform snd_soc_rt5670 snd_intel_dspcfg intel_chtdc_ti_pwrbtn snd_soc_rl6231 snd_intel_sdw_acpi ttm drm_kms_helper snd_soc_core cec snd_compress ac97_bus rc_core processor_thermal_device_pci_legacy snd_pcm_dmaengine i2c_algo_bit processor_thermal_device fb_sys_fops processor_thermal_rfim snd_pcm snd_seq_midi syscopyarea processor_thermal_mbox sysfillrect processor_thermal_rapl intel_rapl_common mei_txe intel_soc_dts_iosf
[ 60.032231] snd_seq_midi_event mei intel_xhci_usb_role_switch sysimgblt snd_rawmidi snd_seq snd_seq_device snd_timer snd soundcore 8250_dw int3406_thermal mac_hid int3403_thermal int340x_thermal_zone int3400_thermal acpi_pad intel_int0002_vgpio acpi_thermal_rel sch_fq_codel ipmi_devintf ipmi_msghandler msr parport_pc ppdev lp parport drm ip_tables x_tables autofs4 overlay hid_logitech_hidpp hid_logitech_dj hid_generic usbhid hid netconsole mmc_block crc32_pclmul r8169 realtek lpc_ich sdhci_pci xhci_pci cqhci xhci_pci_renesas dw_dmac wmi sdhci_acpi video dw_dmac_core intel_soc_pmic_chtdc_ti sdhci
[ 60.032427] CPU: 1 PID: 1964 Comm: plymouthd Not tainted 5.15.0-57-generic #63~20.04.1-Ubuntu
[ 60.032440] Hardware name: Dell Inc. Wyse 3040 Thin Client/0G56C0, BIOS 1.2.4 01/18/2018
[ 60.032450] RIP: 0010:i915_enable_pipestat+0x1b9/0x230 [i915]
[ 60.032669] Code: 89 55 cc 44 89 5d d0 44 89 4d d4 e8 c1 15 ae d8 48 8b 55 c0 48 c7 c1 a8 72 b5 c0 48 c7 c7 54 b5 b8 c0 48 89 c6 e8 0e 21 f5 d8 <0f> 0b 44 8b 55 cc 44 8b 5d d0 44 8b 4d d4 e9 9d fe ff ff 4c 89 f6
[ 60.032682] RSP: 0018:ffffaaa50070b878 EFLAGS: 00010086
[ 60.032694] RAX: 0000000000000000 RBX: ffff980ec8080000 RCX: ffffffff9ab7a748
[ 60.032703] RDX: 00000000ffffdfff RSI: ffffaaa50070b6b8 RDI: 0000000000000001
[ 60.032713] RBP: ffffaaa50070b8c0 R08: 0000000000000003 R09: 0000000000000001
[ 60.032721] R10: ffffffff9b21f3b6 R11: 000000009b21f38a R12: 0000000000000004
[ 60.032730] R13: 0000000000000000 R14: 0000000000000000 R15: ffff980ec8080000
[ 60.032740] FS: 00007f0967eec740(0000) GS:ffff980f34280000(0000) knlGS:0000000000000000
[ 60.032752] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[ 60.032762] CR2: 00007f7f5f21eaa4 CR3: 000000000a34a000 CR4: 00000000001006e0
[ 60.032772] Call Trace:
[ 60.032781] <TASK>
[ 60.032793] ? drm_crtc_vblank_helper_get_vblank_timestamp_internal+0xe0/0x370 [drm]
[ 60.032899] i965_enable_vblank+0x3d/0x60 [i915]
[ 60.033139] drm_vblank_enable+0xfd/0x1a0 [drm]
[ 60.033240] drm_vblank_get+0xaf/0x100 [drm]
[ 60.033335] drm_crtc_vblank_get+0x17/0x20 [drm]
[ 60.033426] intel_pipe_update_start+0x128/0x2f0 [i915]
[ 60.033689] ? wait_woken+0x60/0x60
[ 60.033710] intel_update_crtc+0xd2/0x420 [i915]
[ 60.033969] intel_commit_modeset_enables+0x74/0xa0 [i915]
[ 60.034228] intel_atomic_commit_tail+0x587/0x14e0 [i915]
[ 60.034488] intel_atomic_commit+0x3a6/0x410 [i915]
[ 60.034746] drm_atomic_commit+0x4a/0x60 [drm]
[ 60.034849] drm_atomic_helper_set_config+0x80/0xc0 [drm_kms_helper]
[ 60.034921] drm_mode_setcrtc+0x1ff/0x7d0 [drm]
[ 60.035011] ? drm_mode_getcrtc+0x1e0/0x1e0 [drm]
[ 60.035098] drm_ioctl_kernel+0xb2/0x100 [drm]
[ 60.035182] drm_ioctl+0x275/0x4a0 [drm]
[ 60.035265] ? drm_mode_getcrtc+0x1e0/0x1e0 [drm]
[ 60.035354] __x64_sys_ioctl+0x95/0xd0
[ 60.035372] do_syscall_64+0x5c/0xc0
[ 60.035388] ? exit_to_user_mode_prepare+0x3d/0x1c0
[ 60.035404] ? syscall_exit_to_user_mode+0x27/0x50
[ 60.035418] ? do_syscall_64+0x69/0xc0
[ 60.035431] ? syscall_exit_to_user_mode+0x27/0x50
[ 60.035445] ? do_syscall_64+0x69/0xc0
[ 60.035459] ? syscall_exit_to_user_mode+0x27/0x50
[ 60.035474] ? do_syscall_64+0x69/0xc0
[ 60.035487] ? do_syscall_64+0x69/0xc0
[ 60.035501] ? do_syscall_64+0x69/0xc0
[ 60.035514] entry_SYSCALL_64_after_hwframe+0x61/0xcb
[ 60.035528] RIP: 0033:0x7f09681aa3ab
[ 60.035542] Code: 0f 1e fa 48 8b 05 e5 7a 0d 00 64 c7 00 26 00 00 00 48 c7 c0 ff ff ff ff c3 66 0f 1f 44 00 00 f3 0f 1e fa b8 10 00 00 00 0f 05 <48> 3d 01 f0 ff ff 73 01 c3 48 8b 0d b5 7a 0d 00 f7 d8 64 89 01 48
[ 60.035554] RSP: 002b:00007fff40931638 EFLAGS: 00000246 ORIG_RAX: 0000000000000010
[ 60.035567] RAX: ffffffffffffffda RBX: 00007fff40931670 RCX: 00007f09681aa3ab
[ 60.035576] RDX: 00007fff40931670 RSI: 00000000c06864a2 RDI: 0000000000000009
[ 60.035584] RBP: 00000000c06864a2 R08: 0000000000000000 R09: 00005560dd410090
[ 60.035592] R10: 0000000000000000 R11: 0000000000000246 R12: 000000000000007f
[ 60.035601] R13: 0000000000000009 R14: 00005560dd40ffe0 R15: 00005560dd410020
[ 60.035613] </TASK>
[ 60.035622] ---[ end trace a700e85625cc752d ]---