Skip site navigation (1)Skip section navigation (2)
Date:      Wed, 1 Sep 2010 21:11:31 +0400
From:      pluknet <pluknet@gmail.com>
To:        John Baldwin <jhb@freebsd.org>
Cc:        freebsd-stable@freebsd.org
Subject:   Re: page fault in e1000_clear_hw_cntrs_base_generic() during SIOCAIFADDR
Message-ID:  <AANLkTimD6K0UKu80Xf3hu6Mx5MEth2Gaqr-Dxm44fqSi@mail.gmail.com>
In-Reply-To: <201009011206.15494.jhb@freebsd.org>
References:  <AANLkTi=cQF0Ta5scpMBZ6Ba_uj_Zqxu9=2qUv2g=14fp@mail.gmail.com> <201009011206.15494.jhb@freebsd.org>

next in thread | previous in thread | raw e-mail | index | archive | help
On 1 September 2010 20:06, John Baldwin <jhb@freebsd.org> wrote:
> On Wednesday, September 01, 2010 11:53:09 am pluknet wrote:
>> Hi.
>>
>> This is reproducible from time to time on boot when
>> handling SIOCAIFADDR called from ifconfig on igb
>> on fresh (and not so fresh) 8-STABLE.
>>
>> How can I help with debugging?
>>
>> Kernel page fault with the following non-sleepable locks held:
>> exclusive sleep mutex igb0 (IGB Core Lock) r =3D 0 (0xc2655534) locked @
>> /usr/src/sys/modules/igb/../../dev/e1000/if_igb.c:965
>> KDB: stack backtrace:
>> db_trace_self_wrapper(c08b5055,cce577b8,c060db15,3c5,0,...) at
>> db_trace_self_wrapper+0x26
>> kdb_backtrace(3c5,0,ffffffff,c0a94864,cce577f0,...) at kdb_backtrace+0x2=
9
>> _witness_debugger(c08b74fe,cce57804,4,1,0,...) at _witness_debugger+0x25
>> witness_warn(5,0,c08e3140,cce5782c,c2956000,...) at witness_warn+0x1fe
>> trap(cce57890) at trap+0x195
>> calltrap() at calltrap+0x6
>> --- trap 0xc, eip =3D 0xc3192477, esp =3D 0xcce578d0, ebp =3D 0xcce578e0=
 ---
>> e1000_clear_hw_cntrs_base_generic(c2651004,64,c3185850,c2651000,0,...)
>> at e1000_clear_hw_cntrs_base_generic+0x3e7
>
> Can you use gdb on your kernel.debug to map this to a source file and lin=
e?
>

Here it is (btw, it took about 10-15 reboots to reproduce after adding
swap and dumpon setup).
Hmm.. don't see where it might access an invalid pointer.

#0  doadump () at pcpu.h:231
#1  0xc04a3679 in db_fncall (dummy1=3D1, dummy2=3D0, dummy3=3D-1062122144,
    dummy4=3D0xcce636a8 "") at /usr/src/sys/ddb/db_command.c:548
#2  0xc04a3a71 in db_command (last_cmdp=3D0xc093d19c, cmd_table=3D0x0, dopa=
ger=3D1)
    at /usr/src/sys/ddb/db_command.c:445
#3  0xc04a3bca in db_command_loop () at /usr/src/sys/ddb/db_command.c:498
#4  0xc04a5aed in db_trap (type=3D12, code=3D0) at /usr/src/sys/ddb/db_main=
.c:229
#5  0xc05fa64e in kdb_trap (type=3D12, code=3D0, tf=3D0xcce63890)
    at /usr/src/sys/kern/subr_kdb.c:535
#6  0xc084dcdf in trap_fatal (frame=3D0xcce63890, eva=3D3428511744)
    at /usr/src/sys/i386/i386/trap.c:929
#7  0xc084e553 in trap (frame=3D0xcce63890) at /usr/src/sys/i386/i386/trap.=
c:328
#8  0xc082f66c in calltrap () at /usr/src/sys/i386/i386/exception.s:166
#9  0xc318c477 in e1000_clear_hw_cntrs_base_generic (hw=3D0xc2655004)
    at /usr/src/sys/modules/igb/../../dev/e1000/e1000_mac.c:643
#10 0xc317ec82 in igb_init_locked (adapter=3D0xc2655000)
    at /usr/src/sys/modules/igb/../../dev/e1000/if_igb.c:1202
#11 0xc31801e5 in igb_ioctl (ifp=3D0xc2943c00, command=3D2149607692,
    data=3D0xc29db600 "=E2=95=A2=E2=95=A4\235=D0=B1=D0=B4=E2=95=A4\235=D0=
=B1=D1=82=E2=95=A4\235=D0=B1")
    at /usr/src/sys/modules/igb/../../dev/e1000/if_igb.c:966
#12 0xc0696c4e in in_ifinit (ifp=3D0xc2943c00, ia=3D0xc29db600,
sin=3DVariable "sin" is not available.
)
    at /usr/src/sys/netinet/in.c:848
#13 0xc06980cb in in_control (so=3D0xc2a5d9a8, cmd=3D2151704858,
    data=3D0xc2649400 "igb0", ifp=3D0xc2943c00, td=3D0xc29b8280)
---Type <return> to continue, or q <return> to quit---
    at /usr/src/sys/netinet/in.c:563
#14 0xc067c860 in ifioctl (so=3D0xc2a5d9a8, cmd=3D2151704858,
    data=3D0xc2649400 "igb0", td=3D0xc29b8280) at /usr/src/sys/net/if.c:252=
3
#15 0xc0617395 in soo_ioctl (fp=3D0xc29ce310, cmd=3D2151704858, data=3D0xc2=
649400,
    active_cred=3D0xc254b100, td=3D0xc29b8280)
    at /usr/src/sys/kern/sys_socket.c:212
#16 0xc06113dd in kern_ioctl (td=3D0xc29b8280, fd=3D3, com=3D2151704858,
    data=3D0xc2649400 "igb0") at file.h:262
#17 0xc0611564 in ioctl (td=3D0xc29b8280, uap=3D0xcce63cf8)
    at /usr/src/sys/kern/sys_generic.c:678
#18 0xc084e160 in syscall (frame=3D0xcce63d38)
    at /usr/src/sys/i386/i386/trap.c:1111
#19 0xc082f6d1 in Xint0x80_syscall ()
    at /usr/src/sys/i386/i386/exception.s:264
#20 0x00000033 in ?? ()
Previous frame inner to this frame (corrupt stack?)

(kgdb) f 9
#9  0xc318c477 in e1000_clear_hw_cntrs_base_generic (hw=3D0xc2655004)
    at /usr/src/sys/modules/igb/../../dev/e1000/e1000_mac.c:643
643             E1000_READ_REG(hw, E1000_SYMERRS);
(kgdb) list
638     void e1000_clear_hw_cntrs_base_generic(struct e1000_hw *hw)
639     {
640             DEBUGFUNC("e1000_clear_hw_cntrs_base_generic");
641
642             E1000_READ_REG(hw, E1000_CRCERRS);
643             E1000_READ_REG(hw, E1000_SYMERRS);
644             E1000_READ_REG(hw, E1000_MPC);
645             E1000_READ_REG(hw, E1000_SCC);
646             E1000_READ_REG(hw, E1000_ECOL);
647             E1000_READ_REG(hw, E1000_MCC);

(kgdb) p *(struct e1000_osdep *)hw->back
$6 =3D {mem_bus_space_tag =3D 1, mem_bus_space_handle =3D 3428495360,
  io_bus_space_tag =3D 0, io_bus_space_handle =3D 0, flash_bus_space_tag =
=3D 0,
  flash_bus_space_handle =3D 0, dev =3D 0xc261a600}

(kgdb) p *hw
[...]
      power_down =3D 0xc3186340 <e1000_null_phy_generic>}, type =3D e1000_p=
hy_vf,
[...]

(kgdb) p (struct e1000_mac_info *)hw->mac.type
$8 =3D (struct e1000_mac_info *) 0x1a

(kgdb) p *(struct e1000_mac_info *)hw->mac
$10 =3D {ops =3D {init_params =3D 0x8be58955, id_led_init =3D 0x80c70845,
    blink_led =3D 0x390, check_for_link =3D 0, check_mng_mode =3D 0x2d480c7=
,
    cleanup_led =3D 0, clear_hw_cntrs =3D 0x80c70000, clear_vfta =3D 0x2d0,
    get_bus_info =3D 0, set_lan_id =3D 0x2c880c7, get_link_up_info =3D 0,
    led_on =3D 0xc7660000, led_off =3D 0xbe80, update_mc_addr_list =3D 0x66=
008000,
    reset_hw =3D 0x2c480c7, init_hw =3D 0x10000, shutdown_serdes =3D 0xf058=
40c7,
    power_up_serdes =3D 0xc7c31a4f, setup_link =3D 0x50003040,
    setup_physical_interface =3D 0x40c7c31a, setup_led =3D 0x1a539048,
    write_vfta =3D 0x4c40c7c3,
    config_collision_dist =3D 0xc31a5360 <e1000_init_hw_vf>,
    rar_set =3D 0x901c40c7, read_mac_addr =3D 0xc7c31a55,
    validate_mdi_setting =3D 0x55103840, mng_host_if_write =3D 0x40c7c31a,
    mng_write_cmd_header =3D 0x1a502044, mng_enable_host_if =3D 0x6c40c7c3,
    wait_autoneg =3D 0xc31a52a0 <e1000_rar_set_vf>}, addr =3D "=D0=B3@p@R\0=
32",
  perm_addr =3D "=D1=861=D1=8E]=D1=86\215", type =3D 182, collision_delta =
=3D 666668288,
  ledctl_default =3D 0, ledctl_mode1 =3D 2347075925, ledctl_mode2 =3D 10867=
85605,
  mc_filter_type =3D 441389072, tx_packet_delta =3D 3095447491,
  txcw =3D 3758096387, current_ifs_val =3D 6734, ifs_max_val =3D 51139,
  ifs_min_val =3D 5248, ifs_ratio =3D 3, ifs_step_size =3D 45056,
  mta_reg_count =3D 6734, uta_reg_count =3D 51139, mta_shadow =3D {18790481=
96,
    1573067352, 7769539, 4294883413, 3851026431, 3062743901, 0, 1575323989,
    645172675, 666668288, 0, 2311074133, 2311282149, 666668534, 0,
    2347075925, 2160527429, 1016, 4, 66879687, 393216, 3224436736,
    4136223581, 1474660693, 3968029526, 209554260, 504397187, 1170701942,
---Type <return> to continue, or q <return> to quit---
    503317428, 273008384, 30, 3339212171, 45125, 3071213568, 48770, 9861555=
2,
    838817933, 4294672841, 3187671040, 8, 3526433396, 2298593923, 340092924=
0,
    4282247379, 1962934272, 573167, 3458793472, 88585743, 72857103,
    4052345043, 3490314963, 565204363, 4280641240, 1149855247, 1301002325,
    29524752, 967857545, 2199679946, 2817197767, 3239069067, 3364032736,
    3024455939, 2232436107, 2038763456, 2348810239, 1166870613, 608487348,
    12, 608487168, 4104, 608471296, 605325572, 68719359, 3296919552,
    1600019284, 3029189469, 38, 666668288, 0, 2212858197, 1300961516,
    1169624848, 139823884, 83379655, 2231369728, 4232415689, 1170671476,
    16778488, 4165307648, 203703495, 0, 136594631, 2, 69485705, 4280554633,
    268434, 2311309568, 666668534, 0, 2212858197, 3071219948, 1166740565,
    4165322504, 5, 203703495, 0, 2382124425, 1153955925, 133156, 1418264576=
,
    76088356, 412155684, 3372220420, 649366979, 0, 2212858197, 1435180268,
    4166879500, 2299026827, 1170734197, 1780, 33194752, 812861556,
    3354686861, 795716, 3338665984, 17310788, 2298478592},
  rar_entry_count =3D 9332, forced_speed_duplex =3D 4 '\004',
  adaptive_ifs =3D -1811995620, has_fwsm =3D 1048,
  arc_subsystem_valid =3D 745848965, asf_firmware_present =3D -1946657397,
  autoneg =3D -326501259, autoneg_failed =3D -158743715,
  get_link_status =3D 1946352259, in_ifs_mode =3D 66749261,
  report_tx_early =3D -1096, serdes_link_state =3D 3353703935,
  serdes_has_link =3D 455749, tx_pkt_filtering =3D 1300299778}

(kgdb) p *hw
$13 =3D {back =3D 0xc2659498, hw_addr =3D 0xc265949c "", flash_address =3D =
0x0,
  io_base =3D 0, mac =3D {ops =3D {
      init_params =3D 0xc31a4f10 <e1000_init_mac_params_vf>, id_led_init =
=3D 0,
      blink_led =3D 0xc318b140 <e1000_null_ops_generic>,
      check_for_link =3D 0xc31a5590 <e1000_check_for_link_vf>,
      check_mng_mode =3D 0xc318b170 <e1000_null_mng_mode>,
      cleanup_led =3D 0xc318b140 <e1000_null_ops_generic>,
      clear_hw_cntrs =3D 0xc318b150 <e1000_null_mac_generic>,
      clear_vfta =3D 0xc318b150 <e1000_null_mac_generic>,
      get_bus_info =3D 0xc31a5000 <e1000_get_bus_info_pcie_vf>,
      set_lan_id =3D 0xc318b9f0 <e1000_set_lan_id_multi_port_pcie>,
      get_link_up_info =3D 0xc31a5510 <e1000_get_link_up_info_vf>,
      led_on =3D 0xc318b140 <e1000_null_ops_generic>,
      led_off =3D 0xc318b140 <e1000_null_ops_generic>,
      update_mc_addr_list =3D 0xc31a5020 <e1000_update_mc_addr_list_vf>,
      reset_hw =3D 0xc31a5390 <e1000_reset_hw_vf>,
      init_hw =3D 0xc31a5360 <e1000_init_hw_vf>, shutdown_serdes =3D 0,
      power_up_serdes =3D 0, setup_link =3D 0xc31a4ff0 <e1000_setup_link_vf=
>,
      setup_physical_interface =3D 0xc318b140 <e1000_null_ops_generic>,
      setup_led =3D 0xc318b140 <e1000_null_ops_generic>,
      write_vfta =3D 0xc318b190 <e1000_null_write_vfta>,
      config_collision_dist =3D 0xc318dbf0
<e1000_config_collision_dist_generic>, rar_set =3D 0xc31a52a0
<e1000_rar_set_vf>,
      read_mac_addr =3D 0xc31a5240 <e1000_read_mac_addr_vf>,
---Type <return> to continue, or q <return> to quit---
      validate_mdi_setting =3D 0xc318b490 <e1000_validate_mdi_setting_gener=
ic>,
      mng_host_if_write =3D 0xc318ed90 <e1000_mng_host_if_write_generic>,
      mng_write_cmd_header =3D 0xc318f070 <e1000_mng_write_cmd_header_gener=
ic>,
      mng_enable_host_if =3D 0xc318e880 <e1000_mng_enable_host_if_generic>,
      wait_autoneg =3D 0xc3187a20 <e1000_wait_autoneg_generic>},
    addr =3D "&\177=D0=92h=E2=95=91\221", perm_addr =3D "&\177=D0=92h=E2=95=
=91\221", type =3D e1000_vfadapt,
    collision_delta =3D 0, ledctl_default =3D 0, ledctl_mode1 =3D 0,
    ledctl_mode2 =3D 0, mc_filter_type =3D 0, tx_packet_delta =3D 0, txcw =
=3D 0,
    current_ifs_val =3D 0, ifs_max_val =3D 0, ifs_min_val =3D 0, ifs_ratio =
=3D 0,
    ifs_step_size =3D 0, mta_reg_count =3D 128, uta_reg_count =3D 0, mta_sh=
adow =3D {
      0 <repeats 128 times>}, rar_entry_count =3D 1,
    forced_speed_duplex =3D 0 '\0', adaptive_ifs =3D 0, has_fwsm =3D 0,
    arc_subsystem_valid =3D 0, asf_firmware_present =3D 0, autoneg =3D 1,
    autoneg_failed =3D 0, get_link_status =3D 0, in_ifs_mode =3D 0,
    report_tx_early =3D 0, serdes_link_state =3D e1000_serdes_link_down,
    serdes_has_link =3D 0, tx_pkt_filtering =3D 0}, fc =3D {high_water =3D =
58976,
    low_water =3D 58960, pause_time =3D 1664, refresh_time =3D 0, send_xon =
=3D 1,
    strict_ieee =3D 0, current_mode =3D e1000_fc_full,
    requested_mode =3D e1000_fc_full}, phy =3D {ops =3D {
      init_params =3D 0xc31a4eb0 <e1000_init_phy_params_vf>,
      acquire =3D 0xc31a4fd0 <e1000_acquire_vf>,
      cfg_on_link_up =3D 0xc318b140 <e1000_null_ops_generic>,
      check_polarity =3D 0xc318b140 <e1000_null_ops_generic>,
      check_reset_block =3D 0xc318b140 <e1000_null_ops_generic>,
---Type <return> to continue, or q <return> to quit---
      commit =3D 0xc318b140 <e1000_null_ops_generic>,
      force_speed_duplex =3D 0xc318b140 <e1000_null_ops_generic>,
      get_cfg_done =3D 0xc318b140 <e1000_null_ops_generic>,
      get_cable_length =3D 0xc318b140 <e1000_null_ops_generic>,
      get_info =3D 0xc318b140 <e1000_null_ops_generic>,
      read_reg =3D 0xc3186330 <e1000_null_read_reg>,
      read_reg_locked =3D 0xc3186330 <e1000_null_read_reg>,
      release =3D 0xc31a4fe0 <e1000_release_vf>,
      reset =3D 0xc318b140 <e1000_null_ops_generic>,
      set_d0_lplu_state =3D 0xc3186350 <e1000_null_lplu_state>,
      set_d3_lplu_state =3D 0xc3186350 <e1000_null_lplu_state>,
      write_reg =3D 0xc3186360 <e1000_null_write_reg>,
      write_reg_locked =3D 0xc3186360 <e1000_null_write_reg>,
      power_up =3D 0xc3186340 <e1000_null_phy_generic>,
      power_down =3D 0xc3186340 <e1000_null_phy_generic>}, type =3D e1000_p=
hy_vf,
    local_rx =3D e1000_1000t_rx_status_not_ok,
    remote_rx =3D e1000_1000t_rx_status_not_ok, ms_type =3D e1000_ms_hw_def=
ault,
    original_ms_type =3D e1000_ms_hw_default,
    cable_polarity =3D e1000_rev_polarity_normal,
    smart_speed =3D e1000_smart_speed_default, addr =3D 0, id =3D 0,
    reset_delay_us =3D 0, revision =3D 0, media_type =3D e1000_media_type_u=
nknown,
    autoneg_advertised =3D 47, autoneg_mask =3D 0, cable_length =3D 0,
    max_cable_length =3D 0, min_cable_length =3D 0, mdix =3D 0 '\0',
    disable_polarity_correction =3D 0, is_mdix =3D 0, polarity_correction =
=3D 0,
---Type <return> to continue, or q <return> to quit---
    reset_disable =3D 0, speed_downgraded =3D 0, autoneg_wait_to_complete =
=3D 0},
  nvm =3D {ops =3D {init_params =3D 0xc31a4ee0 <e1000_init_nvm_params_vf>,
      acquire =3D 0xc31a4fd0 <e1000_acquire_vf>,
      read =3D 0xc3189970 <e1000_null_read_nvm>,
      release =3D 0xc31a4fe0 <e1000_release_vf>,
      reload =3D 0xc318ada0 <e1000_reload_nvm_generic>,
      update =3D 0xc318b140 <e1000_null_ops_generic>,
      valid_led_default =3D 0xc3189990 <e1000_null_led_default>,
      validate =3D 0xc318b140 <e1000_null_ops_generic>,
      write =3D 0xc31899a0 <e1000_null_write_nvm>}, type =3D e1000_nvm_none=
,
    override =3D e1000_nvm_override_none, flash_bank_size =3D 0,
    flash_base_addr =3D 0, word_size =3D 0, delay_usec =3D 0, address_bits =
=3D 0,
    opcode_bits =3D 0, page_size =3D 0}, bus =3D {type =3D e1000_bus_type_r=
eserved,
    speed =3D e1000_bus_speed_2500, width =3D e1000_bus_width_unknown, func=
 =3D 0,
    pci_cmd_word =3D 7}, mbx =3D {ops =3D {
      init_params =3D 0xc31a5870 <e1000_init_mbx_params_vf>,
      read =3D 0xc31a60d0 <e1000_read_mbx_vf>,
      write =3D 0xc31a5e80 <e1000_write_mbx_vf>,
      read_posted =3D 0xc31a5dd0 <e1000_read_posted_mbx>,
      write_posted =3D 0xc31a5d00 <e1000_write_posted_mbx>,
      check_for_msg =3D 0xc31a5cd0 <e1000_check_for_msg_vf>,
      check_for_ack =3D 0xc31a5ca0 <e1000_check_for_ack_vf>,
      check_for_rst =3D 0xc31a5c70 <e1000_check_for_rst_vf>}, stats =3D {
      msgs_tx =3D 8, msgs_rx =3D 8, acks =3D 8, reqs =3D 8, rsts =3D 0},
---Type <return> to continue, or q <return> to quit---
    timeout =3D 2000, usec_delay =3D 500, size =3D 16}, mng_cookie =3D {
    signature =3D 0, status =3D 0 '\0', reserved0 =3D 0 '\0', vlan_id =3D 0=
,
    reserved1 =3D 0, reserved2 =3D 0, reserved3 =3D 0 '\0', checksum =3D 0 =
'\0'},
  dev_spec =3D {_82541 =3D {dsp_config =3D e1000_dsp_config_disabled,
      ffe_config =3D e1000_ffe_config_enabled, spd_default =3D 0,
      phy_init_script =3D 0}, _82542 =3D {dma_fairness =3D 0}, _82543 =3D {
      tbi_compatibility =3D 0, dma_fairness =3D 0, init_phy_disabled =3D 0}=
,
    _82571 =3D {laa_is_present =3D 0, smb_counter =3D 0}, _80003es2lan =3D =
{
      mdic_wa_enable =3D 0}, ich8lan =3D {kmrn_lock_loss_workaround_enabled=
 =3D 0,
      shadow_ram =3D {{value =3D 0, modified =3D 0} <repeats 2048 times>},
      nvm_mutex =3D {lock_object =3D {lo_name =3D 0x0, lo_flags =3D 0, lo_d=
ata =3D 0,
          lo_witness =3D 0x0}, mtx_lock =3D 0}, swflag_mutex =3D {lock_obje=
ct =3D {
          lo_name =3D 0x0, lo_flags =3D 0, lo_data =3D 0, lo_witness =3D 0x=
0},
        mtx_lock =3D 0}, nvm_k1_enabled =3D 0}, _82575 =3D {sgmii_active =
=3D 0,
      global_device_reset =3D 0}, vf =3D {vf_number =3D 0, v2p_mailbox =3D =
0}},
  device_id =3D 4298, subsystem_vendor_id =3D 32902, subsystem_device_id =
=3D 41020,
  vendor_id =3D 32902, revision_id =3D 1 '\001'}

--=20
wbr,
pluknet



Want to link to this message? Use this URL: <https://mail-archive.FreeBSD.org/cgi/mid.cgi?AANLkTimD6K0UKu80Xf3hu6Mx5MEth2Gaqr-Dxm44fqSi>