Closed ma3252788 closed 3 years ago
sipl@sipl-4Xp:~$ lxc info config: images.auto_update_interval: "0" api_extensions: - storage_zfs_remove_snapshots - container_host_shutdown_timeout - container_stop_priority - container_syscall_filtering - auth_pki - container_last_used_at - etag - patch - usb_devices - https_allowed_credentials - image_compression_algorithm - directory_manipulation - container_cpu_time - storage_zfs_use_refquota - storage_lvm_mount_options - network - profile_usedby - container_push - container_exec_recording - certificate_update - container_exec_signal_handling - gpu_devices - container_image_properties - migration_progress - id_map - network_firewall_filtering - network_routes - storage - file_delete - file_append - network_dhcp_expiry - storage_lvm_vg_rename - storage_lvm_thinpool_rename - network_vlan - image_create_aliases - container_stateless_copy - container_only_migration - storage_zfs_clone_copy - unix_device_rename - storage_lvm_use_thinpool - storage_rsync_bwlimit - network_vxlan_interface - storage_btrfs_mount_options - entity_description - image_force_refresh - storage_lvm_lv_resizing - id_map_base - file_symlinks - container_push_target - network_vlan_physical - storage_images_delete - container_edit_metadata - container_snapshot_stateful_migration - storage_driver_ceph - storage_ceph_user_name - resource_limits - storage_volatile_initial_source - storage_ceph_force_osd_reuse - storage_block_filesystem_btrfs - resources - kernel_limits - storage_api_volume_rename - macaroon_authentication - network_sriov - console - restrict_devlxd - migration_pre_copy - infiniband - maas_network - devlxd_events - proxy - network_dhcp_gateway - file_get_symlink - network_leases - unix_device_hotplug - storage_api_local_volume_handling - operation_description - clustering - event_lifecycle - storage_api_remote_volume_handling - nvidia_runtime - candid_authentication - candid_config - candid_config_key - usb_optional_vendorid api_status: stable api_version: "1.0" auth: trusted public: 
false auth_methods: - tls environment: addresses: [] architectures: - x86_64 - i686 certificate: | -----BEGIN CERTIFICATE----- MIIFajCCA1KgAwIBAgIQOq+mN5s5ojifgPe/CpFALDANBgkqhkiG9w0BAQsFADA2 MRwwGgYDVQQKExNsaW51eGNvbnRhaW5lcnMub3JnMRYwFAYDVQQDDA1yb290QHNp cGwtNFhwMB4XDTE4MDQyNDE1MTQ1OFoXDTI4MDQyMTE1MTQ1OFowNjEcMBoGA1UE ChMTbGludXhjb250YWluZXJzLm9yZzEWMBQGA1UEAwwNcm9vdEBzaXBsLTRYcDCC AiIwDQYJKoZIhvcNAQEBBQADggIPADCCAgoCggIBAODIy12JEIgSwi6XvttM4AXT A+ZK9x7fgI6zC57Yj5TEaCIpSl8n+ZwvL6m4m2Mk82YLHWgQ0tJuYsythN5bXj5c MG/Clp9Cj0+Hfo2zRvYu0EON1YUiBSj+4lEpH5oh9nQA2z/b54eca+dQb10xbVV1 7Igp+4vfdAyPsEkyJtX5Btdy22CpWCQbF5m3t3uMHT2eKXxiu94UjOxb6SBPSELm n1H0ozT6Qr1OMN1LpjMBhCpYKSklKVfb2+sV5S3YBQ6WJCuATJMwwtdSYTzaPmSa eKECmjIA0SDzMEXo2LYHmqX9n/xiBLWKljub1upBf8CuKSC/NRJJ47U1B4BsYC26 3RGcLDoJoKH8BkBx/Vo72UlEM8IyfRs/uo6Q2Hrrkmg1x4wvBT26Nz3KsbTI4aA9 Yf6fsb6wkJ76UPnpeX/TxhNCaXaeoNWuU2333uiPmyUIhpPT89kfhblNiq/+zO9u x+KxlY9NEVAi4gzTzvRz2Rct5dUio8wFr3KTKtyEdQNP1hzG1cpU3bY0p3bL0NtH Wz5NUz8+J7vfneSMvC0yRtAC1GsiLK7d7JtFOiOEbc/pdoQEry6OJ9tAkCMHpSZV hzNVWUiSsxLGSS+Q0oFhoOWr55y/RWs+onr1mZwN1xBTr6cpcbrEDGx+2+NwVCN0 kutZKH8kTz27LWhbPUnBAgMBAAGjdDByMA4GA1UdDwEB/wQEAwIFoDATBgNVHSUE DDAKBggrBgEFBQcDATAMBgNVHRMBAf8EAjAAMD0GA1UdEQQ2MDSCCHNpcGwtNFhw hwSsGRGqhxAgAQ2oAhYlEcgOmG3bMMM4hxAgAQ2oAhYlEZJmtWN3DyLCMA0GCSqG SIb3DQEBCwUAA4ICAQDRMn1cpIWn8arDjsSiFp16+zaBunmJsnwYlhqcS3JUn+Lp wZbok4p9YgqKasUW34DSkEm9cHg6KBNWom0/bclTWJUbvejD8qTHWbti6IsCxfZO ziCEvIcz+KuyeRmsm57IINvUJXNmcmft75AEPOtiXjiReHoJUVIPQ5fZ7ml4q1mX jJZBxAfl9jfhRvFYetaoSKOjL6pZ2+u7p1pOW0TCO/+tohExgM+PwUBek9iYqtuE Xq2TmudFXbFUNZmOJN6xsw6yDNFwYA++QwwtGtiCP3Ml1saHkqMf8VNPGMgAGkvS JQqMHDkg8VoY3kopdshbeI7dv/H9FpU5xNmLIT7eun6urBK9BpiIFPdaioGRegjH WfI4eU1AUzSpTTGc9FYW6TFlpgQFv5/0aQNiJbrC0zvYKD9jnqDfVlF8NG8Qnyl0 zA9cC1QkYrfaRJmTRDWpayIWwpGPtgS0pz9RA3KR0+mVnEZGgQhixToKLPMfO29m /9SRzica4ARELOUuFpocVSBtQZunej8ZmQBOoe+ZwWLoGacXfQVyBMAUbeCT+cxW Zxd9qXts/QZiGiVJtCBFzielMjQe8Yuhj1DMn4T/GhV4vxk4+BnzyE2enFpoqhvI 
AaDEDFf+NhnfVMXOMz2ab73i0wnyDcfTKMBJDjEh9GitWKNCwIpBcMJvzA1C7A== -----END CERTIFICATE----- certificate_fingerprint: 20fe4f60860b908ac17b2fc3560c13ef61199af8c3bb0b7cbb2db13b02a4db46 driver: lxc driver_version: 3.0.3 kernel: Linux kernel_architecture: x86_64 kernel_version: 4.4.248-0404248-generic server: lxd server_pid: 4115 server_version: 3.0.3 storage: zfs storage_version: 0.6.5.6-0ubuntu28 server_clustered: false server_name: sipl-4Xp project: ""
I have not assigned any GPUs to the container, but all of the host's GPUs are still visible inside it when I run:
lxc exec xxx bash
nvidia-smi
- [ ] Any relevant kernel output (`dmesg`)
dmesg
[ 10.646552] EDAC sbridge: ECC is disabled. Aborting [ 10.646568] EDAC sbridge: Couldn't find mci handler [ 10.647470] bridge: automatic filtering via arp/ip/ip6tables has been deprecated. Update your scripts to load br_netfilter if you need this. [ 10.651073] device enp14s0 entered promiscuous mode [ 10.656992] snd_hda_codec_realtek hdaudioC0D0: ALC1150: SKU not ready 0x00000000 [ 10.657499] snd_hda_codec_realtek hdaudioC0D0: autoconfig for ALC1150: line_outs=3 (0x14/0x15/0x16/0x0/0x0) type:line [ 10.657502] snd_hda_codec_realtek hdaudioC0D0: speaker_outs=0 (0x0/0x0/0x0/0x0/0x0) [ 10.657503] snd_hda_codec_realtek hdaudioC0D0: hp_outs=1 (0x1b/0x0/0x0/0x0/0x0) [ 10.657504] snd_hda_codec_realtek hdaudioC0D0: mono: mono_out=0x0 [ 10.657505] snd_hda_codec_realtek hdaudioC0D0: dig-out=0x11/0x1e [ 10.657506] snd_hda_codec_realtek hdaudioC0D0: inputs: [ 10.657508] snd_hda_codec_realtek hdaudioC0D0: Front Mic=0x19 [ 10.657509] snd_hda_codec_realtek hdaudioC0D0: Rear Mic=0x18 [ 10.657511] snd_hda_codec_realtek hdaudioC0D0: Line=0x1a [ 10.668593] usb 3-9.2: New USB device found, idVendor=05e3, idProduct=0607 [ 10.668598] usb 3-9.2: New USB device strings: Mfr=0, Product=1, SerialNumber=0 [ 10.668600] usb 3-9.2: Product: USB2.0 Hub [ 10.669445] hub 3-9.2:1.0: USB hub found [ 10.669697] hub 3-9.2:1.0: 4 ports detected [ 10.669953] AVX2 version of gcm_enc/dec engaged. 
[ 10.669955] AES CTR mode by8 optimization enabled [ 10.670282] input: HDA Intel PCH Front Mic as /devices/pci0000:00/0000:00:1b.0/sound/card0/input5 [ 10.670341] input: HDA Intel PCH Rear Mic as /devices/pci0000:00/0000:00:1b.0/sound/card0/input6 [ 10.670415] input: HDA Intel PCH Line as /devices/pci0000:00/0000:00:1b.0/sound/card0/input7 [ 10.670466] input: HDA Intel PCH Line Out Front as /devices/pci0000:00/0000:00:1b.0/sound/card0/input8 [ 10.670515] input: HDA Intel PCH Line Out Surround as /devices/pci0000:00/0000:00:1b.0/sound/card0/input9 [ 10.670561] input: HDA Intel PCH Line Out CLFE as /devices/pci0000:00/0000:00:1b.0/sound/card0/input10 [ 10.670609] input: HDA Intel PCH Front Headphone as /devices/pci0000:00/0000:00:1b.0/sound/card0/input11 [ 10.685797] kvm: disabled by bios [ 10.719729] asus_wmi: ASUS WMI generic driver loaded [ 10.721518] asus_wmi: Initialization: 0x0 [ 10.721539] asus_wmi: BIOS WMI version: 0.9 [ 10.721578] asus_wmi: SFUN value: 0x0 [ 10.721944] input: Eee PC WMI hotkeys as /devices/platform/eeepc-wmi/input/input12 [ 10.722033] asus_wmi: Number of fans: 1 [ 10.722526] hidraw: raw HID events driver (C) Jiri Kosina [ 10.726508] usbcore: registered new interface driver usbhid [ 10.726510] usbhid: USB HID core driver [ 10.737891] input: PixArt HP X500 USB Optical Mouse as /devices/pci0000:00/0000:00:14.0/usb3/3-9/3-9.1/3-9.1:1.0/0003:03F0:0941.0001/input/input13 [ 10.737986] hid-generic 0003:03F0:0941.0001: input,hidraw0: USB HID v1.11 Mouse [PixArt HP X500 USB Optical Mouse] on usb-0000:00:14.0-9.1/input0 [ 10.775255] nvidia: loading out-of-tree module taints kernel. [ 10.775260] Spectre V2 : System may be vulnerable to spectre v2 [ 10.775285] nvidia: loading module not compiled with retpoline compiler. [ 10.775288] nvidia: module license 'NVIDIA' taints kernel. 
[ 10.775289] Disabling lock debugging due to kernel taint [ 10.779239] Spectre V2 : System may be vulnerable to spectre v2 [ 10.779260] nvidia: loading module not compiled with retpoline compiler. [ 10.780629] nvidia: module verification failed: signature and/or required key missing - tainting kernel [ 10.788317] nvidia-nvlink: Nvlink Core is being initialized, major device number 243 [ 10.788590] nvidia 0000:09:00.0: enabling device (0100 -> 0103) [ 10.788673] vgaarb: device changed decodes: PCI:0000:09:00.0,olddecodes=io+mem,decodes=none:owns=none [ 10.790063] Spectre V2 : System may be vulnerable to spectre v2 [ 10.790081] nvidia: loading module not compiled with retpoline compiler. [ 10.790102] IPv6: ADDRCONF(NETDEV_UP): enp14s0: link is not ready [ 10.888133] clocksource: Switched to clocksource tsc [ 10.888189] nvidia 0000:06:00.0: enabling device (0100 -> 0103) [ 10.888276] vgaarb: device changed decodes: PCI:0000:06:00.0,olddecodes=io+mem,decodes=none:owns=none [ 10.947333] usb 3-9.2.1: new low-speed USB device number 6 using xhci_hcd [ 10.987838] vgaarb: device changed decodes: PCI:0000:05:00.0,olddecodes=io+mem,decodes=none:owns=io+mem [ 11.019336] usb 3-9.2.1: device descriptor read/64, error -32 [ 11.087279] NVRM: loading NVIDIA UNIX x86_64 Kernel Module 450.66 Wed Aug 12 19:42:48 UTC 2020 [ 11.092421] kvm: disabled by bios [ 11.094822] intel_rapl: Found RAPL domain package [ 11.099336] Spectre V2 : System may be vulnerable to spectre v2 [ 11.099353] nvidia_modeset: loading module not compiled with retpoline compiler. [ 11.099375] Spectre V2 : System may be vulnerable to spectre v2 [ 11.099398] nvidia_modeset: loading module not compiled with retpoline compiler. [ 11.099940] Spectre V2 : System may be vulnerable to spectre v2 [ 11.099955] nvidia_modeset: loading module not compiled with retpoline compiler. 
[ 11.100303] nvidia-modeset: Loading NVIDIA Kernel Mode Setting Driver for UNIX platforms 450.66 Wed Aug 12 19:37:58 UTC 2020 [ 11.100920] Spectre V2 : System may be vulnerable to spectre v2 [ 11.100924] Spectre V2 : System may be vulnerable to spectre v2 [ 11.100925] nvidia_drm: loading module not compiled with retpoline compiler. [ 11.100947] nvidia_drm: loading module not compiled with retpoline compiler. [ 11.101162] Spectre V2 : System may be vulnerable to spectre v2 [ 11.101186] nvidia_drm: loading module not compiled with retpoline compiler. [ 11.101774] [drm] [nvidia-drm] [GPU ID 0x00000900] Loading driver [ 11.101853] [drm] [nvidia-drm] [GPU ID 0x00000600] Loading driver [ 11.101909] [drm] [nvidia-drm] [GPU ID 0x00000500] Loading driver [ 11.106674] Adding 134125564k swap on /dev/nvme0n1p3. Priority:-1 extents:1 across:134125564k SSFS [ 11.140342] kvm: disabled by bios [ 11.184331] kvm: disabled by bios [ 11.199303] usb 3-9.2.1: device descriptor read/64, error -32 [ 11.220131] kvm: disabled by bios [ 11.260104] kvm: disabled by bios [ 11.296085] kvm: disabled by bios [ 11.324121] kvm: disabled by bios [ 11.364086] kvm: disabled by bios [ 11.375291] usb 3-9.2.1: new low-speed USB device number 7 using xhci_hcd [ 11.412072] kvm: disabled by bios [ 11.447294] usb 3-9.2.1: device descriptor read/64, error -32 [ 11.456091] kvm: disabled by bios [ 11.496148] kvm: disabled by bios [ 11.572454] Spectre V2 : System may be vulnerable to spectre v2 [ 11.572471] zavl: loading module not compiled with retpoline compiler. [ 11.573786] Spectre V2 : System may be vulnerable to spectre v2 [ 11.573800] spl: loading module not compiled with retpoline compiler. [ 11.576399] SPL: Loaded module v0.6.5.6-0ubuntu4 [ 11.577088] Spectre V2 : System may be vulnerable to spectre v2 [ 11.577103] znvpair: loading module not compiled with retpoline compiler. 
[ 11.579471] Spectre V2 : System may be vulnerable to spectre v2 [ 11.579485] zcommon: loading module not compiled with retpoline compiler. [ 11.581836] Spectre V2 : System may be vulnerable to spectre v2 [ 11.581850] zunicode: loading module not compiled with retpoline compiler. [ 11.592030] Spectre V2 : System may be vulnerable to spectre v2 [ 11.592044] zfs: loading module not compiled with retpoline compiler. [ 11.623345] usb 3-9.2.1: device descriptor read/64, error -32 [ 11.628104] ZFS: Loaded module v0.6.5.6-0ubuntu28, ZFS pool version 5000, ZFS filesystem version 5 [ 11.727479] usb 3-9.2-port1: attempt power cycle [ 11.908202] SPL: using hostid 0x007f0100 [ 11.959808] input: HDA NVidia HDMI/DP,pcm=3 as /devices/pci0000:00/0000:00:03.0/0000:03:00.0/0000:04:08.0/0000:06:00.1/sound/card2/input14 [ 11.959855] input: HDA NVidia HDMI/DP,pcm=7 as /devices/pci0000:00/0000:00:03.0/0000:03:00.0/0000:04:08.0/0000:06:00.1/sound/card2/input15 [ 11.959899] input: HDA NVidia HDMI/DP,pcm=8 as /devices/pci0000:00/0000:00:03.0/0000:03:00.0/0000:04:08.0/0000:06:00.1/sound/card2/input16 [ 11.959951] input: HDA NVidia HDMI/DP,pcm=9 as /devices/pci0000:00/0000:00:03.0/0000:03:00.0/0000:04:08.0/0000:06:00.1/sound/card2/input17 [ 11.960056] input: HDA NVidia HDMI/DP,pcm=3 as /devices/pci0000:00/0000:00:03.0/0000:03:00.0/0000:04:10.0/0000:05:00.1/sound/card3/input22 [ 11.960097] input: HDA NVidia HDMI/DP,pcm=7 as /devices/pci0000:00/0000:00:03.0/0000:03:00.0/0000:04:10.0/0000:05:00.1/sound/card3/input23 [ 11.960148] input: HDA NVidia HDMI/DP,pcm=8 as /devices/pci0000:00/0000:00:03.0/0000:03:00.0/0000:04:10.0/0000:05:00.1/sound/card3/input24 [ 11.960196] input: HDA NVidia HDMI/DP,pcm=9 as /devices/pci0000:00/0000:00:03.0/0000:03:00.0/0000:04:10.0/0000:05:00.1/sound/card3/input25 [ 11.960313] input: HDA NVidia HDMI/DP,pcm=3 as /devices/pci0000:00/0000:00:02.0/0000:07:00.0/0000:08:10.0/0000:09:00.1/sound/card1/input18 [ 11.960353] input: HDA NVidia HDMI/DP,pcm=7 as 
/devices/pci0000:00/0000:00:02.0/0000:07:00.0/0000:08:10.0/0000:09:00.1/sound/card1/input19 [ 11.960404] input: HDA NVidia HDMI/DP,pcm=8 as /devices/pci0000:00/0000:00:02.0/0000:07:00.0/0000:08:10.0/0000:09:00.1/sound/card1/input20 [ 11.960443] input: HDA NVidia HDMI/DP,pcm=9 as /devices/pci0000:00/0000:00:02.0/0000:07:00.0/0000:08:10.0/0000:09:00.1/sound/card1/input21 [ 12.311305] usb 3-9.2.1: new low-speed USB device number 8 using xhci_hcd [ 12.311740] usb 3-9.2.1: Device not responding to setup address. [ 12.348636] igb 0000:0e:00.0 enp14s0: igb: enp14s0 NIC Link is Up 100 Mbps Full Duplex, Flow Control: RX/TX [ 12.348951] IPv6: ADDRCONF(NETDEV_CHANGE): enp14s0: link becomes ready [ 12.515724] usb 3-9.2.1: Device not responding to setup address. [ 12.719282] usb 3-9.2.1: device not accepting address 8, error -71 [ 12.791263] usb 3-9.2.1: new low-speed USB device number 9 using xhci_hcd [ 12.791676] usb 3-9.2.1: Device not responding to setup address. [ 12.995662] usb 3-9.2.1: Device not responding to setup address. 
[ 13.199250] usb 3-9.2.1: device not accepting address 9, error -71 [ 13.199453] usb 3-9.2-port1: unable to enumerate USB device [ 13.271299] usb 3-9.2.3: new low-speed USB device number 10 using xhci_hcd [ 13.365976] usb 3-9.2.3: New USB device found, idVendor=046d, idProduct=c22a [ 13.365978] usb 3-9.2.3: New USB device strings: Mfr=0, Product=2, SerialNumber=0 [ 13.365980] usb 3-9.2.3: Product: Gaming Keyboard G110 [ 13.366086] usb 3-9.2.3: ep 0x81 - rounding interval to 128 microframes, ep desc says 192 microframes [ 13.366090] usb 3-9.2.3: ep 0x82 - rounding interval to 128 microframes, ep desc says 192 microframes [ 13.369609] input: Gaming Keyboard G110 as /devices/pci0000:00/0000:00:14.0/usb3/3-9/3-9.2/3-9.2.3/3-9.2.3:1.0/0003:046D:C22A.0002/input/input26 [ 13.423343] hid-generic 0003:046D:C22A.0002: input,hidraw1: USB HID v1.10 Keyboard [Gaming Keyboard G110] on usb-0000:00:14.0-9.2.3/input0 [ 13.428812] input: Gaming Keyboard G110 as /devices/pci0000:00/0000:00:14.0/usb3/3-9/3-9.2/3-9.2.3/3-9.2.3:1.1/0003:046D:C22A.0003/input/input27 [ 13.483359] hid-generic 0003:046D:C22A.0003: input,hiddev0,hidraw2: USB HID v1.10 Device [Gaming Keyboard G110] on usb-0000:00:14.0-9.2.3/input1 [ 17.005967] audit: type=1400 audit(1608541456.477:2): apparmor="STATUS" operation="profile_load" name="/usr/bin/ubuntu-core-launcher" pid=3174 comm="apparmor_parser" [ 17.006161] audit: type=1400 audit(1608541456.477:3): apparmor="STATUS" operation="profile_load" name="/usr/bin/lxc-start" pid=3173 comm="apparmor_parser" [ 17.006173] audit: type=1400 audit(1608541456.477:4): apparmor="STATUS" operation="profile_load" name="/usr/sbin/ippusbxd" pid=3180 comm="apparmor_parser" [ 17.007219] audit: type=1400 audit(1608541456.481:5): apparmor="STATUS" operation="profile_load" name="/usr/lib/snapd/snap-confine" pid=3176 comm="apparmor_parser" [ 17.007222] audit: type=1400 audit(1608541456.481:6): apparmor="STATUS" operation="profile_load" name="mount-namespace-capture-helper" pid=3176 
comm="apparmor_parser" [ 17.007611] audit: type=1400 audit(1608541456.481:7): apparmor="STATUS" operation="profile_load" name="/usr/sbin/tcpdump" pid=3182 comm="apparmor_parser" [ 17.007691] audit: type=1400 audit(1608541456.481:8): apparmor="STATUS" operation="profile_load" name="/usr/sbin/cups-browsed" pid=3177 comm="apparmor_parser" [ 17.008009] audit: type=1400 audit(1608541456.481:9): apparmor="STATUS" operation="profile_load" name="/sbin/dhclient" pid=3170 comm="apparmor_parser" [ 17.008012] audit: type=1400 audit(1608541456.481:10): apparmor="STATUS" operation="profile_load" name="/usr/lib/NetworkManager/nm-dhcp-client.action" pid=3170 comm="apparmor_parser" [ 17.008015] audit: type=1400 audit(1608541456.481:11): apparmor="STATUS" operation="profile_load" name="/usr/lib/NetworkManager/nm-dhcp-helper" pid=3170 comm="apparmor_parser" [ 17.022583] br0: port 1(enp14s0) entered forwarding state [ 17.022591] br0: port 1(enp14s0) entered forwarding state [ 17.029712] cgroup: new mount options do not match the existing superblock, will be ignored [ 17.128591] IPv6: ADDRCONF(NETDEV_UP): eno1: link is not ready [ 17.327992] pcieport 0000:00:03.0: AER: Corrected error received: id=0018 [ 17.327999] pcieport 0000:00:03.0: PCIe Bus Error: severity=Corrected, type=Data Link Layer, id=0018(Transmitter ID) [ 17.328001] pcieport 0000:00:03.0: device [8086:6f08] error status/mask=00001000/00002000 [ 17.328003] pcieport 0000:00:03.0: [12] Replay Timer Timeout [ 17.359287] IPv6: ADDRCONF(NETDEV_UP): eno1: link is not ready [ 20.779567] pcieport 0000:00:03.0: AER: Corrected error received: id=0018 [ 20.779575] pcieport 0000:00:03.0: PCIe Bus Error: severity=Corrected, type=Data Link Layer, id=0018(Receiver ID) [ 20.779577] pcieport 0000:00:03.0: device [8086:6f08] error status/mask=00000040/00002000 [ 20.779579] pcieport 0000:00:03.0: [ 6] Bad TLP [ 22.544761] pcieport 0000:00:01.1: AER: Multiple Corrected error received: id=0009 [ 22.544769] pcieport 0000:00:01.1: PCIe Bus 
Error: severity=Corrected, type=Data Link Layer, id=0009(Receiver ID) [ 22.544771] pcieport 0000:00:01.1: device [8086:6f03] error status/mask=00000040/00002000 [ 22.544773] pcieport 0000:00:01.1: [ 6] Bad TLP [ 31.217836] pcieport 0000:00:03.0: AER: Corrected error received: id=0018 [ 31.217844] pcieport 0000:00:03.0: PCIe Bus Error: severity=Corrected, type=Data Link Layer, id=0018(Receiver ID) [ 31.217846] pcieport 0000:00:03.0: device [8086:6f08] error status/mask=00000040/00002000 [ 31.217848] pcieport 0000:00:03.0: [ 6] Bad TLP [ 32.042856] br0: port 1(enp14s0) entered forwarding state [ 35.590978] Spectre V2 : System may be vulnerable to spectre v2 [ 35.590982] nvidia_uvm: loading module not compiled with retpoline compiler. [ 35.593493] nvidia-uvm: Loaded the UVM driver, major device number 241. [ 63.970039] Ebtables v2.0 registered [ 64.378791] audit_printk_skb: 51 callbacks suppressed [ 64.378793] audit: type=1400 audit(1608541503.853:29): apparmor="STATUS" operation="profile_load" name="lxd-tianjimiao_</var/lib/lxd>" pid=4454 comm="apparmor_parser" [ 64.388165] device vethAFV8T8 entered promiscuous mode [ 64.388211] IPv6: ADDRCONF(NETDEV_UP): vethAFV8T8: link is not ready [ 64.454558] eth0: renamed from vethD75TH2 [ 64.466339] IPv6: ADDRCONF(NETDEV_CHANGE): vethAFV8T8: link becomes ready [ 64.466358] br0: port 2(vethAFV8T8) entered forwarding state [ 64.466365] br0: port 2(vethAFV8T8) entered forwarding state [ 79.497758] br0: port 2(vethAFV8T8) entered forwarding state [ 117.241731] Loading iSCSI transport class v2.0-870. [ 299.884789] mce: [Hardware Error]: Machine check events logged
- [ ] Container log (`lxc info NAME --show-log`)
sipl@sipl-4Xp:~$ lxc info tianjimiao --show-log Name: tianjimiao Remote: unix:// Architecture: x86_64 Created: 2019/11/19 07:43 UTC Status: Running Type: persistent Profiles: default Pid: 4464 Ips: eth0: inet 172.25.17.60 vethAFV8T8 eth0: inet6 2001:da8:216:2511:216:3eff:fede:3b86 vethAFV8T8 eth0: inet6 fe80::216:3eff:fede:3b86 vethAFV8T8 lo: inet 127.0.0.1 lo: inet6 ::1 Resources: Processes: 259 Disk usage: root: 899.06GB CPU usage: CPU usage (in seconds): 258 Memory usage: Memory (current): 1.87GB Memory (peak): 1.94GB Network usage: eth0: Bytes received: 1.81MB Bytes sent: 5.30MB Packets received: 11873 Packets sent: 7105 lo: Bytes received: 19.43kB Bytes sent: 19.43kB Packets received: 38 Packets sent: 38
Log:
lxc tianjimiao 20201221090504.400 WARN conf - conf.c:lxc_setup_devpts:1616 - Invalid argument - Failed to unmount old devpts instance lxc tianjimiao 20201221090504.400 WARN apparmor - lsm/apparmor.c:apparmor_process_label_set:221 - Incomplete AppArmor support in your kernel
- [ ] Container configuration (`lxc config show NAME --expanded`)
sipl@sipl-4Xp:~$ lxc config show tianjimiao --expanded architecture: x86_64 config: image.architecture: x86_64 image.description: Ubuntu 16.04 LTS server (20180424) image.os: ubuntu image.release: xenial raw.lxc: lxc.apparmor.allow_incomplete=1 security.privileged: "true" volatile.base_image: 55c06c2c9b9e47fbb89537134395c12d221e1536d26788c07ee042d07b34dd07 volatile.eth0.hwaddr: 00:16:3e:de:3b:86 volatile.eth0.name: eth0 volatile.idmap.base: "0" volatile.idmap.next: '[]' volatile.last_state.idmap: '[]' volatile.last_state.power: RUNNING devices: A-Pool: path: /A-pool source: /A-pool type: disk eth0: nictype: bridged parent: br0 type: nic nvidia-uvm: path: /dev/nvidia-uvm type: unix-char root: path: / pool: default type: disk ephemeral: false profiles:
default stateful: false description: ""
- [ ] Main daemon log (at /var/log/lxd/lxd.log or /var/snap/lxd/common/lxd/logs/lxd.log)
t=2020-12-21T15:17:24+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-18T19:22:54+0800 t=2020-12-21T15:17:28+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:17:29+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-18T19:22:54+0800 t=2020-12-21T15:17:30+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-18T19:22:54+0800 t=2020-12-21T15:30:07+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:17:29+0800 t=2020-12-21T15:30:08+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:30:10+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:17:29+0800 t=2020-12-21T15:30:10+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:17:29+0800 t=2020-12-21T15:45:58+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:30:10+0800 t=2020-12-21T15:45:58+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:46:00+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:30:10+0800 t=2020-12-21T15:46:00+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:30:10+0800 
t=2020-12-21T15:48:30+0800 lvl=info msg="Asked to shutdown by API, shutting down containers" t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=allenzsy t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=anxin t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=dln t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=houfeng t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml2 t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=liubin t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=lx t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe2 t=2020-12-21T15:48:30+0800 lvl=info msg="Shutting down container" action=shutdown created=2018-08-23T16:42:37+0800 ephemeral=false name=mcj timeout=30s used=2020-12-18T19:20:41+0800 t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj2 t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=momo t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=pytorch t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=sunliangliang t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tessss t=2020-12-21T15:48:31+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T15:46:00+0800 t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" 
name=wangke t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wangke2 t=2020-12-21T15:48:31+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia timeout=30s used=2020-12-18T19:23:21+0800 t=2020-12-21T15:48:36+0800 lvl=info msg="Shut down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T15:46:00+0800 t=2020-12-21T15:48:36+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:48:37+0800 lvl=info msg="Shut down container" action=shutdown created=2018-08-23T16:42:37+0800 ephemeral=false name=mcj timeout=30s used=2020-12-18T19:20:41+0800 t=2020-12-21T15:48:37+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj t=2020-12-21T15:48:39+0800 lvl=info msg="Shut down container" action=shutdown created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia timeout=30s used=2020-12-18T19:23:21+0800 t=2020-12-21T15:48:39+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T15:48:39+0800 lvl=info msg="Starting shutdown sequence" t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:48:39+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/unix.socket t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:48:39+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T15:48:39+0800 lvl=info msg="Closing the database" t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:48:39+0800 lvl=info msg="Unmounting temporary filesystems" t=2020-12-21T15:48:39+0800 lvl=info msg="Done unmounting 
temporary filesystems" t=2020-12-21T15:48:39+0800 lvl=info msg="Saving simplestreams cache" t=2020-12-21T15:48:39+0800 lvl=info msg="Saved simplestreams cache" t=2020-12-21T15:49:29+0800 lvl=info msg="LXD 3.0.3 is starting in normal mode" path=/var/lib/lxd t=2020-12-21T15:49:29+0800 lvl=info msg="Kernel uid/gid map:" t=2020-12-21T15:49:29+0800 lvl=info msg=" - u 0 0 4294967295" t=2020-12-21T15:49:29+0800 lvl=info msg=" - g 0 0 4294967295" t=2020-12-21T15:49:29+0800 lvl=info msg="Configured LXD uid/gid map:" t=2020-12-21T15:49:29+0800 lvl=info msg=" - u 0 165536 65536" t=2020-12-21T15:49:29+0800 lvl=info msg=" - g 0 165536 65536" t=2020-12-21T15:49:29+0800 lvl=warn msg="CGroup memory swap accounting is disabled, swap limits will be ignored." t=2020-12-21T15:49:29+0800 lvl=info msg="Kernel features:" t=2020-12-21T15:49:29+0800 lvl=info msg=" - netnsid-based network retrieval: no" t=2020-12-21T15:49:29+0800 lvl=info msg=" - unprivileged file capabilities: no" t=2020-12-21T15:49:29+0800 lvl=info msg="Initializing local database" t=2020-12-21T15:49:29+0800 lvl=info msg="Starting /dev/lxd handler:" t=2020-12-21T15:49:29+0800 lvl=info msg=" - binding devlxd socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T15:49:29+0800 lvl=info msg="REST API daemon:" t=2020-12-21T15:49:29+0800 lvl=info msg=" - binding Unix socket" inherited=true socket=/var/lib/lxd/unix.socket t=2020-12-21T15:49:29+0800 lvl=info msg="Initializing global database" t=2020-12-21T15:49:29+0800 lvl=info msg="Initializing storage pools" t=2020-12-21T15:49:29+0800 lvl=info msg="Initializing networks" t=2020-12-21T15:49:29+0800 lvl=info msg="Pruning leftover image files" t=2020-12-21T15:49:29+0800 lvl=info msg="Done pruning leftover image files" t=2020-12-21T15:49:29+0800 lvl=info msg="Loading daemon configuration" t=2020-12-21T15:49:29+0800 lvl=info msg="Pruning expired images" t=2020-12-21T15:49:29+0800 lvl=info msg="Done pruning expired images" t=2020-12-21T15:49:29+0800 lvl=info msg="Updating instance 
types" t=2020-12-21T15:49:29+0800 lvl=info msg="Done updating instance types" t=2020-12-21T15:49:29+0800 lvl=info msg="Expiring log files" t=2020-12-21T15:49:29+0800 lvl=info msg="Done expiring log files" t=2020-12-21T15:49:29+0800 lvl=eror msg="Failed to start container 'mcj': Common start logic: Missing source '/dev/nvidia-uvm' for device 'nvidia-uvm'" t=2020-12-21T15:49:29+0800 lvl=eror msg="Failed to start container 'tianjimiao': Common start logic: Missing source '/dev/nvidia-uvm' for device 'nvidia-uvm'" t=2020-12-21T15:49:29+0800 lvl=eror msg="Failed to start container 'wuxinjia': Common start logic: Missing source '/dev/nvidia-uvm' for device 'nvidia-uvm'" t=2020-12-21T15:50:12+0800 lvl=warn msg="Failed to update instance types: Get https://images.linuxcontainers.org/meta/instance-types/.yaml: Unable to connect to: images.linuxcontainers.org:443" t=2020-12-21T15:50:29+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:50:29+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:46:00+0800 t=2020-12-21T15:50:30+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:46:00+0800 t=2020-12-21T15:52:10+0800 lvl=info msg="Asked to shutdown by API, shutting down containers" t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=allenzsy t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=anxin t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=dln t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=houfeng t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml2 
t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=liubin t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=lx t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe2 t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj2 t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=momo t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=pytorch t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=sunliangliang t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tessss t=2020-12-21T15:52:10+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T15:50:29+0800 t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wangke t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wangke2 t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T15:52:16+0800 lvl=info msg="Shut down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T15:50:29+0800 t=2020-12-21T15:52:16+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:52:16+0800 lvl=info msg="Starting shutdown sequence" t=2020-12-21T15:52:16+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:52:16+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/unix.socket t=2020-12-21T15:52:16+0800 
lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:52:16+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T15:52:16+0800 lvl=info msg="Closing the database" t=2020-12-21T15:52:16+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:52:16+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:52:16+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:52:16+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:52:16+0800 lvl=info msg="Unmounting temporary filesystems" t=2020-12-21T15:52:16+0800 lvl=info msg="Done unmounting temporary filesystems" t=2020-12-21T15:52:16+0800 lvl=info msg="Saving simplestreams cache" t=2020-12-21T15:52:16+0800 lvl=info msg="Saved simplestreams cache" t=2020-12-21T15:53:03+0800 lvl=info msg="LXD 3.0.3 is starting in normal mode" path=/var/lib/lxd t=2020-12-21T15:53:03+0800 lvl=info msg="Kernel uid/gid map:" t=2020-12-21T15:53:03+0800 lvl=info msg=" - u 0 0 4294967295" t=2020-12-21T15:53:03+0800 lvl=info msg=" - g 0 0 4294967295" t=2020-12-21T15:53:03+0800 lvl=info msg="Configured LXD uid/gid map:" t=2020-12-21T15:53:03+0800 lvl=info msg=" - u 0 165536 65536" t=2020-12-21T15:53:03+0800 lvl=info msg=" - g 0 165536 65536" t=2020-12-21T15:53:03+0800 lvl=warn msg="CGroup memory swap accounting is disabled, swap limits will be ignored." 
t=2020-12-21T15:53:03+0800 lvl=info msg="Kernel features:" t=2020-12-21T15:53:03+0800 lvl=info msg=" - netnsid-based network retrieval: no" t=2020-12-21T15:53:03+0800 lvl=info msg=" - unprivileged file capabilities: no" t=2020-12-21T15:53:03+0800 lvl=info msg="Initializing local database" t=2020-12-21T15:53:03+0800 lvl=info msg="Starting /dev/lxd handler:" t=2020-12-21T15:53:03+0800 lvl=info msg=" - binding devlxd socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T15:53:03+0800 lvl=info msg="REST API daemon:" t=2020-12-21T15:53:03+0800 lvl=info msg=" - binding Unix socket" inherited=true socket=/var/lib/lxd/unix.socket t=2020-12-21T15:53:03+0800 lvl=info msg="Initializing global database" t=2020-12-21T15:53:03+0800 lvl=info msg="Initializing storage pools" t=2020-12-21T15:53:03+0800 lvl=info msg="Initializing networks" t=2020-12-21T15:53:03+0800 lvl=info msg="Pruning leftover image files" t=2020-12-21T15:53:03+0800 lvl=info msg="Done pruning leftover image files" t=2020-12-21T15:53:03+0800 lvl=info msg="Loading daemon configuration" t=2020-12-21T15:53:03+0800 lvl=info msg="Pruning expired images" t=2020-12-21T15:53:03+0800 lvl=info msg="Done pruning expired images" t=2020-12-21T15:53:03+0800 lvl=info msg="Expiring log files" t=2020-12-21T15:53:03+0800 lvl=info msg="Done expiring log files" t=2020-12-21T15:53:03+0800 lvl=info msg="Updating instance types" t=2020-12-21T15:53:03+0800 lvl=info msg="Done updating instance types" t=2020-12-21T15:53:03+0800 lvl=eror msg="Failed to start container 'tianjimiao': Common start logic: Missing source '/dev/nvidia-uvm' for device 'nvidia-uvm'" t=2020-12-21T15:53:43+0800 lvl=warn msg="Failed to update instance types: Get https://images.linuxcontainers.org/meta/instance-types/.yaml: Unable to connect to: images.linuxcontainers.org:443" t=2020-12-21T16:11:42+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T16:11:43+0800 lvl=info msg="Starting container" action=start 
created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:50:29+0800 t=2020-12-21T16:11:44+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:50:29+0800 t=2020-12-21T16:21:29+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T16:11:43+0800 t=2020-12-21T16:21:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T16:21:30+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T16:11:43+0800 t=2020-12-21T16:21:30+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T16:11:43+0800 t=2020-12-21T16:30:24+0800 lvl=warn msg="Detected poll(POLLNVAL) event." 
t=2020-12-21T16:32:34+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T16:32:34+0800 lvl=info msg="Starting container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-18T19:23:21+0800 t=2020-12-21T16:32:37+0800 lvl=info msg="Started container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-18T19:23:21+0800 t=2020-12-21T16:48:32+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:32:34+0800 t=2020-12-21T16:48:33+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T16:48:33+0800 lvl=info msg="Starting container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:32:34+0800 t=2020-12-21T16:48:34+0800 lvl=info msg="Started container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:32:34+0800 t=2020-12-21T16:56:22+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:48:33+0800 t=2020-12-21T16:56:23+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T16:56:24+0800 lvl=info msg="Starting container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:48:33+0800 t=2020-12-21T16:56:24+0800 lvl=info msg="Started container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:48:33+0800 t=2020-12-21T17:01:22+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=-1s used=2020-12-21T16:21:30+0800 t=2020-12-21T17:01:29+0800 lvl=info msg="Shut 
down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=-1s used=2020-12-21T16:21:30+0800 t=2020-12-21T17:01:35+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia timeout=-1s used=2020-12-21T16:56:24+0800 t=2020-12-21T17:01:42+0800 lvl=info msg="Shut down container" action=shutdown created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia timeout=-1s used=2020-12-21T16:56:24+0800 t=2020-12-21T17:01:54+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:01:56+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:02:36+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:02:44+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:02:44+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T16:21:30+0800 t=2020-12-21T17:02:45+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T16:21:30+0800 t=2020-12-21T17:03:32+0800 lvl=info msg="Asked to shutdown by API, shutting down containers" t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=allenzsy t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=anxin t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=dln t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=houfeng t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml2 t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update 
backup.yaml at this time" name=liubin t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=lx t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe2 t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj2 t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=momo t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=pytorch t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=sunliangliang t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tessss t=2020-12-21T17:03:32+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T17:02:44+0800 t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wangke t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wangke2 t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T17:03:35+0800 lvl=info msg="Shut down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T17:02:44+0800 t=2020-12-21T17:03:35+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:03:35+0800 lvl=info msg="Starting shutdown sequence" t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T17:03:35+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/unix.socket t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping /dev/lxd handler" 
t=2020-12-21T17:03:35+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T17:03:35+0800 lvl=info msg="Closing the database" t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T17:03:35+0800 lvl=info msg="Unmounting temporary filesystems" t=2020-12-21T17:03:35+0800 lvl=info msg="Done unmounting temporary filesystems" t=2020-12-21T17:03:35+0800 lvl=info msg="Saving simplestreams cache" t=2020-12-21T17:03:35+0800 lvl=info msg="Saved simplestreams cache" t=2020-12-21T17:04:22+0800 lvl=info msg="LXD 3.0.3 is starting in normal mode" path=/var/lib/lxd t=2020-12-21T17:04:22+0800 lvl=info msg="Kernel uid/gid map:" t=2020-12-21T17:04:22+0800 lvl=info msg=" - u 0 0 4294967295" t=2020-12-21T17:04:22+0800 lvl=info msg=" - g 0 0 4294967295" t=2020-12-21T17:04:22+0800 lvl=info msg="Configured LXD uid/gid map:" t=2020-12-21T17:04:22+0800 lvl=info msg=" - u 0 165536 65536" t=2020-12-21T17:04:22+0800 lvl=info msg=" - g 0 165536 65536" t=2020-12-21T17:04:22+0800 lvl=warn msg="CGroup memory swap accounting is disabled, swap limits will be ignored." 
t=2020-12-21T17:04:22+0800 lvl=info msg="Kernel features:" t=2020-12-21T17:04:22+0800 lvl=info msg=" - netnsid-based network retrieval: no" t=2020-12-21T17:04:22+0800 lvl=info msg=" - unprivileged file capabilities: no" t=2020-12-21T17:04:22+0800 lvl=info msg="Initializing local database" t=2020-12-21T17:04:22+0800 lvl=info msg="Starting /dev/lxd handler:" t=2020-12-21T17:04:22+0800 lvl=info msg=" - binding devlxd socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T17:04:22+0800 lvl=info msg="REST API daemon:" t=2020-12-21T17:04:22+0800 lvl=info msg=" - binding Unix socket" inherited=true socket=/var/lib/lxd/unix.socket t=2020-12-21T17:04:22+0800 lvl=info msg="Initializing global database" t=2020-12-21T17:04:22+0800 lvl=info msg="Initializing storage pools" t=2020-12-21T17:04:22+0800 lvl=info msg="Initializing networks" t=2020-12-21T17:04:22+0800 lvl=info msg="Pruning leftover image files" t=2020-12-21T17:04:22+0800 lvl=info msg="Done pruning leftover image files" t=2020-12-21T17:04:22+0800 lvl=info msg="Loading daemon configuration" t=2020-12-21T17:04:22+0800 lvl=info msg="Pruning expired images" t=2020-12-21T17:04:22+0800 lvl=info msg="Done pruning expired images" t=2020-12-21T17:04:22+0800 lvl=info msg="Updating instance types" t=2020-12-21T17:04:22+0800 lvl=info msg="Done updating instance types" t=2020-12-21T17:04:22+0800 lvl=info msg="Expiring log files" t=2020-12-21T17:04:22+0800 lvl=info msg="Done expiring log files" t=2020-12-21T17:04:22+0800 lvl=eror msg="Failed to start container 'tianjimiao': Common start logic: Missing source '/dev/nvidia-uvm' for device 'nvidia-uvm'" t=2020-12-21T17:04:54+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:05:03+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:05:03+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T17:02:44+0800 
t=2020-12-21T17:05:03+0800 lvl=warn msg="Failed to update instance types: Get https://images.linuxcontainers.org/meta/instance-types/.yaml: Unable to connect to: images.linuxcontainers.org:443" t=2020-12-21T17:05:04+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T17:02:44+0800
- [ ] Output of the client with --debug
- [ ] Output of the daemon with --debug (alternatively output of `lxc monitor` while reproducing the issue)
Your config shows you're passing /dev/nvidia-uvm to the container. What happens if you remove that device?
Also, please show the output of `find /dev` run inside the container.
Required information
Issue description
I don't assign GPUs to the container, but all GPUs are displayed in the container
Steps to reproduce
lxc exec xxx bash
nvidia-smi
Information to attach
- [ ] Any relevant kernel output (`dmesg`)
- [ ] Container log (`lxc info NAME --show-log`)
Log:
lxc tianjimiao 20201221090504.400 WARN conf - conf.c:lxc_setup_devpts:1616 - Invalid argument - Failed to unmount old devpts instance lxc tianjimiao 20201221090504.400 WARN apparmor - lsm/apparmor.c:apparmor_process_label_set:221 - Incomplete AppArmor support in your kernel
sipl@sipl-4Xp:~$ lxc config show tianjimiao --expanded architecture: x86_64 config: image.architecture: x86_64 image.description: Ubuntu 16.04 LTS server (20180424) image.os: ubuntu image.release: xenial raw.lxc: lxc.apparmor.allow_incomplete=1 security.privileged: "true" volatile.base_image: 55c06c2c9b9e47fbb89537134395c12d221e1536d26788c07ee042d07b34dd07 volatile.eth0.hwaddr: 00:16:3e:de:3b:86 volatile.eth0.name: eth0 volatile.idmap.base: "0" volatile.idmap.next: '[]' volatile.last_state.idmap: '[]' volatile.last_state.power: RUNNING devices: A-Pool: path: /A-pool source: /A-pool type: disk eth0: nictype: bridged parent: br0 type: nic nvidia-uvm: path: /dev/nvidia-uvm type: unix-char root: path: / pool: default type: disk ephemeral: false profiles:
default stateful: false description: ""
t=2020-12-21T15:17:24+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-18T19:22:54+0800 t=2020-12-21T15:17:28+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:17:29+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-18T19:22:54+0800 t=2020-12-21T15:17:30+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-18T19:22:54+0800 t=2020-12-21T15:30:07+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:17:29+0800 t=2020-12-21T15:30:08+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:30:10+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:17:29+0800 t=2020-12-21T15:30:10+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:17:29+0800 t=2020-12-21T15:45:58+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:30:10+0800 t=2020-12-21T15:45:58+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:46:00+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:30:10+0800 t=2020-12-21T15:46:00+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:30:10+0800 
t=2020-12-21T15:48:30+0800 lvl=info msg="Asked to shutdown by API, shutting down containers" t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=allenzsy t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=anxin t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=dln t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=houfeng t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml2 t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=liubin t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=lx t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe2 t=2020-12-21T15:48:30+0800 lvl=info msg="Shutting down container" action=shutdown created=2018-08-23T16:42:37+0800 ephemeral=false name=mcj timeout=30s used=2020-12-18T19:20:41+0800 t=2020-12-21T15:48:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj2 t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=momo t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=pytorch t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=sunliangliang t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tessss t=2020-12-21T15:48:31+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T15:46:00+0800 t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" 
name=wangke t=2020-12-21T15:48:31+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wangke2 t=2020-12-21T15:48:31+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia timeout=30s used=2020-12-18T19:23:21+0800 t=2020-12-21T15:48:36+0800 lvl=info msg="Shut down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T15:46:00+0800 t=2020-12-21T15:48:36+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:48:37+0800 lvl=info msg="Shut down container" action=shutdown created=2018-08-23T16:42:37+0800 ephemeral=false name=mcj timeout=30s used=2020-12-18T19:20:41+0800 t=2020-12-21T15:48:37+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj t=2020-12-21T15:48:39+0800 lvl=info msg="Shut down container" action=shutdown created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia timeout=30s used=2020-12-18T19:23:21+0800 t=2020-12-21T15:48:39+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T15:48:39+0800 lvl=info msg="Starting shutdown sequence" t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:48:39+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/unix.socket t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:48:39+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T15:48:39+0800 lvl=info msg="Closing the database" t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:48:39+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:48:39+0800 lvl=info msg="Unmounting temporary filesystems" t=2020-12-21T15:48:39+0800 lvl=info msg="Done unmounting 
temporary filesystems" t=2020-12-21T15:48:39+0800 lvl=info msg="Saving simplestreams cache" t=2020-12-21T15:48:39+0800 lvl=info msg="Saved simplestreams cache" t=2020-12-21T15:49:29+0800 lvl=info msg="LXD 3.0.3 is starting in normal mode" path=/var/lib/lxd t=2020-12-21T15:49:29+0800 lvl=info msg="Kernel uid/gid map:" t=2020-12-21T15:49:29+0800 lvl=info msg=" - u 0 0 4294967295" t=2020-12-21T15:49:29+0800 lvl=info msg=" - g 0 0 4294967295" t=2020-12-21T15:49:29+0800 lvl=info msg="Configured LXD uid/gid map:" t=2020-12-21T15:49:29+0800 lvl=info msg=" - u 0 165536 65536" t=2020-12-21T15:49:29+0800 lvl=info msg=" - g 0 165536 65536" t=2020-12-21T15:49:29+0800 lvl=warn msg="CGroup memory swap accounting is disabled, swap limits will be ignored." t=2020-12-21T15:49:29+0800 lvl=info msg="Kernel features:" t=2020-12-21T15:49:29+0800 lvl=info msg=" - netnsid-based network retrieval: no" t=2020-12-21T15:49:29+0800 lvl=info msg=" - unprivileged file capabilities: no" t=2020-12-21T15:49:29+0800 lvl=info msg="Initializing local database" t=2020-12-21T15:49:29+0800 lvl=info msg="Starting /dev/lxd handler:" t=2020-12-21T15:49:29+0800 lvl=info msg=" - binding devlxd socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T15:49:29+0800 lvl=info msg="REST API daemon:" t=2020-12-21T15:49:29+0800 lvl=info msg=" - binding Unix socket" inherited=true socket=/var/lib/lxd/unix.socket t=2020-12-21T15:49:29+0800 lvl=info msg="Initializing global database" t=2020-12-21T15:49:29+0800 lvl=info msg="Initializing storage pools" t=2020-12-21T15:49:29+0800 lvl=info msg="Initializing networks" t=2020-12-21T15:49:29+0800 lvl=info msg="Pruning leftover image files" t=2020-12-21T15:49:29+0800 lvl=info msg="Done pruning leftover image files" t=2020-12-21T15:49:29+0800 lvl=info msg="Loading daemon configuration" t=2020-12-21T15:49:29+0800 lvl=info msg="Pruning expired images" t=2020-12-21T15:49:29+0800 lvl=info msg="Done pruning expired images" t=2020-12-21T15:49:29+0800 lvl=info msg="Updating instance 
types" t=2020-12-21T15:49:29+0800 lvl=info msg="Done updating instance types" t=2020-12-21T15:49:29+0800 lvl=info msg="Expiring log files" t=2020-12-21T15:49:29+0800 lvl=info msg="Done expiring log files" t=2020-12-21T15:49:29+0800 lvl=eror msg="Failed to start container 'mcj': Common start logic: Missing source '/dev/nvidia-uvm' for device 'nvidia-uvm'" t=2020-12-21T15:49:29+0800 lvl=eror msg="Failed to start container 'tianjimiao': Common start logic: Missing source '/dev/nvidia-uvm' for device 'nvidia-uvm'" t=2020-12-21T15:49:29+0800 lvl=eror msg="Failed to start container 'wuxinjia': Common start logic: Missing source '/dev/nvidia-uvm' for device 'nvidia-uvm'" t=2020-12-21T15:50:12+0800 lvl=warn msg="Failed to update instance types: Get https://images.linuxcontainers.org/meta/instance-types/.yaml: Unable to connect to: images.linuxcontainers.org:443" t=2020-12-21T15:50:29+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:50:29+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:46:00+0800 t=2020-12-21T15:50:30+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:46:00+0800 t=2020-12-21T15:52:10+0800 lvl=info msg="Asked to shutdown by API, shutting down containers" t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=allenzsy t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=anxin t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=dln t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=houfeng t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml2 
t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=liubin t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=lx t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe2 t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj2 t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=momo t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=pytorch t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=sunliangliang t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tessss t=2020-12-21T15:52:10+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T15:50:29+0800 t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wangke t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wangke2 t=2020-12-21T15:52:10+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T15:52:16+0800 lvl=info msg="Shut down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T15:50:29+0800 t=2020-12-21T15:52:16+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T15:52:16+0800 lvl=info msg="Starting shutdown sequence" t=2020-12-21T15:52:16+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:52:16+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/unix.socket t=2020-12-21T15:52:16+0800 
lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:52:16+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T15:52:16+0800 lvl=info msg="Closing the database" t=2020-12-21T15:52:16+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:52:16+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:52:16+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T15:52:16+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T15:52:16+0800 lvl=info msg="Unmounting temporary filesystems" t=2020-12-21T15:52:16+0800 lvl=info msg="Done unmounting temporary filesystems" t=2020-12-21T15:52:16+0800 lvl=info msg="Saving simplestreams cache" t=2020-12-21T15:52:16+0800 lvl=info msg="Saved simplestreams cache" t=2020-12-21T15:53:03+0800 lvl=info msg="LXD 3.0.3 is starting in normal mode" path=/var/lib/lxd t=2020-12-21T15:53:03+0800 lvl=info msg="Kernel uid/gid map:" t=2020-12-21T15:53:03+0800 lvl=info msg=" - u 0 0 4294967295" t=2020-12-21T15:53:03+0800 lvl=info msg=" - g 0 0 4294967295" t=2020-12-21T15:53:03+0800 lvl=info msg="Configured LXD uid/gid map:" t=2020-12-21T15:53:03+0800 lvl=info msg=" - u 0 165536 65536" t=2020-12-21T15:53:03+0800 lvl=info msg=" - g 0 165536 65536" t=2020-12-21T15:53:03+0800 lvl=warn msg="CGroup memory swap accounting is disabled, swap limits will be ignored." 
t=2020-12-21T15:53:03+0800 lvl=info msg="Kernel features:" t=2020-12-21T15:53:03+0800 lvl=info msg=" - netnsid-based network retrieval: no" t=2020-12-21T15:53:03+0800 lvl=info msg=" - unprivileged file capabilities: no" t=2020-12-21T15:53:03+0800 lvl=info msg="Initializing local database" t=2020-12-21T15:53:03+0800 lvl=info msg="Starting /dev/lxd handler:" t=2020-12-21T15:53:03+0800 lvl=info msg=" - binding devlxd socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T15:53:03+0800 lvl=info msg="REST API daemon:" t=2020-12-21T15:53:03+0800 lvl=info msg=" - binding Unix socket" inherited=true socket=/var/lib/lxd/unix.socket t=2020-12-21T15:53:03+0800 lvl=info msg="Initializing global database" t=2020-12-21T15:53:03+0800 lvl=info msg="Initializing storage pools" t=2020-12-21T15:53:03+0800 lvl=info msg="Initializing networks" t=2020-12-21T15:53:03+0800 lvl=info msg="Pruning leftover image files" t=2020-12-21T15:53:03+0800 lvl=info msg="Done pruning leftover image files" t=2020-12-21T15:53:03+0800 lvl=info msg="Loading daemon configuration" t=2020-12-21T15:53:03+0800 lvl=info msg="Pruning expired images" t=2020-12-21T15:53:03+0800 lvl=info msg="Done pruning expired images" t=2020-12-21T15:53:03+0800 lvl=info msg="Expiring log files" t=2020-12-21T15:53:03+0800 lvl=info msg="Done expiring log files" t=2020-12-21T15:53:03+0800 lvl=info msg="Updating instance types" t=2020-12-21T15:53:03+0800 lvl=info msg="Done updating instance types" t=2020-12-21T15:53:03+0800 lvl=eror msg="Failed to start container 'tianjimiao': Common start logic: Missing source '/dev/nvidia-uvm' for device 'nvidia-uvm'" t=2020-12-21T15:53:43+0800 lvl=warn msg="Failed to update instance types: Get https://images.linuxcontainers.org/meta/instance-types/.yaml: Unable to connect to: images.linuxcontainers.org:443" t=2020-12-21T16:11:42+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T16:11:43+0800 lvl=info msg="Starting container" action=start 
created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:50:29+0800 t=2020-12-21T16:11:44+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T15:50:29+0800 t=2020-12-21T16:21:29+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T16:11:43+0800 t=2020-12-21T16:21:30+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T16:21:30+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T16:11:43+0800 t=2020-12-21T16:21:30+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T16:11:43+0800 t=2020-12-21T16:30:24+0800 lvl=warn msg="Detected poll(POLLNVAL) event." 
t=2020-12-21T16:32:34+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T16:32:34+0800 lvl=info msg="Starting container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-18T19:23:21+0800 t=2020-12-21T16:32:37+0800 lvl=info msg="Started container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-18T19:23:21+0800 t=2020-12-21T16:48:32+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:32:34+0800 t=2020-12-21T16:48:33+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T16:48:33+0800 lvl=info msg="Starting container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:32:34+0800 t=2020-12-21T16:48:34+0800 lvl=info msg="Started container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:32:34+0800 t=2020-12-21T16:56:22+0800 lvl=info msg="Container initiated reboot" action=reboot created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:48:33+0800 t=2020-12-21T16:56:23+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T16:56:24+0800 lvl=info msg="Starting container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:48:33+0800 t=2020-12-21T16:56:24+0800 lvl=info msg="Started container" action=start created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia stateful=false used=2020-12-21T16:48:33+0800 t=2020-12-21T17:01:22+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=-1s used=2020-12-21T16:21:30+0800 t=2020-12-21T17:01:29+0800 lvl=info msg="Shut 
down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=-1s used=2020-12-21T16:21:30+0800 t=2020-12-21T17:01:35+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia timeout=-1s used=2020-12-21T16:56:24+0800 t=2020-12-21T17:01:42+0800 lvl=info msg="Shut down container" action=shutdown created=2019-09-18T10:56:32+0800 ephemeral=false name=wuxinjia timeout=-1s used=2020-12-21T16:56:24+0800 t=2020-12-21T17:01:54+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:01:56+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:02:36+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:02:44+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:02:44+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T16:21:30+0800 t=2020-12-21T17:02:45+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T16:21:30+0800 t=2020-12-21T17:03:32+0800 lvl=info msg="Asked to shutdown by API, shutting down containers" t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=allenzsy t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=anxin t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=dln t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=houfeng t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=kml2 t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update 
backup.yaml at this time" name=liubin t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=lx t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=matlab-caffe2 t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=mcj2 t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=momo t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=pytorch t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=sunliangliang t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tessss t=2020-12-21T17:03:32+0800 lvl=info msg="Shutting down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T17:02:44+0800 t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wangke t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wangke2 t=2020-12-21T17:03:32+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=wuxinjia t=2020-12-21T17:03:35+0800 lvl=info msg="Shut down container" action=shutdown created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao timeout=30s used=2020-12-21T17:02:44+0800 t=2020-12-21T17:03:35+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:03:35+0800 lvl=info msg="Starting shutdown sequence" t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T17:03:35+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/unix.socket t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping /dev/lxd handler" 
t=2020-12-21T17:03:35+0800 lvl=info msg=" - closing socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T17:03:35+0800 lvl=info msg="Closing the database" t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping REST API handler:" t=2020-12-21T17:03:35+0800 lvl=info msg="Stopping /dev/lxd handler" t=2020-12-21T17:03:35+0800 lvl=info msg="Unmounting temporary filesystems" t=2020-12-21T17:03:35+0800 lvl=info msg="Done unmounting temporary filesystems" t=2020-12-21T17:03:35+0800 lvl=info msg="Saving simplestreams cache" t=2020-12-21T17:03:35+0800 lvl=info msg="Saved simplestreams cache" t=2020-12-21T17:04:22+0800 lvl=info msg="LXD 3.0.3 is starting in normal mode" path=/var/lib/lxd t=2020-12-21T17:04:22+0800 lvl=info msg="Kernel uid/gid map:" t=2020-12-21T17:04:22+0800 lvl=info msg=" - u 0 0 4294967295" t=2020-12-21T17:04:22+0800 lvl=info msg=" - g 0 0 4294967295" t=2020-12-21T17:04:22+0800 lvl=info msg="Configured LXD uid/gid map:" t=2020-12-21T17:04:22+0800 lvl=info msg=" - u 0 165536 65536" t=2020-12-21T17:04:22+0800 lvl=info msg=" - g 0 165536 65536" t=2020-12-21T17:04:22+0800 lvl=warn msg="CGroup memory swap accounting is disabled, swap limits will be ignored." 
t=2020-12-21T17:04:22+0800 lvl=info msg="Kernel features:" t=2020-12-21T17:04:22+0800 lvl=info msg=" - netnsid-based network retrieval: no" t=2020-12-21T17:04:22+0800 lvl=info msg=" - unprivileged file capabilities: no" t=2020-12-21T17:04:22+0800 lvl=info msg="Initializing local database" t=2020-12-21T17:04:22+0800 lvl=info msg="Starting /dev/lxd handler:" t=2020-12-21T17:04:22+0800 lvl=info msg=" - binding devlxd socket" socket=/var/lib/lxd/devlxd/sock t=2020-12-21T17:04:22+0800 lvl=info msg="REST API daemon:" t=2020-12-21T17:04:22+0800 lvl=info msg=" - binding Unix socket" inherited=true socket=/var/lib/lxd/unix.socket t=2020-12-21T17:04:22+0800 lvl=info msg="Initializing global database" t=2020-12-21T17:04:22+0800 lvl=info msg="Initializing storage pools" t=2020-12-21T17:04:22+0800 lvl=info msg="Initializing networks" t=2020-12-21T17:04:22+0800 lvl=info msg="Pruning leftover image files" t=2020-12-21T17:04:22+0800 lvl=info msg="Done pruning leftover image files" t=2020-12-21T17:04:22+0800 lvl=info msg="Loading daemon configuration" t=2020-12-21T17:04:22+0800 lvl=info msg="Pruning expired images" t=2020-12-21T17:04:22+0800 lvl=info msg="Done pruning expired images" t=2020-12-21T17:04:22+0800 lvl=info msg="Updating instance types" t=2020-12-21T17:04:22+0800 lvl=info msg="Done updating instance types" t=2020-12-21T17:04:22+0800 lvl=info msg="Expiring log files" t=2020-12-21T17:04:22+0800 lvl=info msg="Done expiring log files" t=2020-12-21T17:04:22+0800 lvl=eror msg="Failed to start container 'tianjimiao': Common start logic: Missing source '/dev/nvidia-uvm' for device 'nvidia-uvm'" t=2020-12-21T17:04:54+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:05:03+0800 lvl=warn msg="Unable to update backup.yaml at this time" name=tianjimiao t=2020-12-21T17:05:03+0800 lvl=info msg="Starting container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T17:02:44+0800 
t=2020-12-21T17:05:03+0800 lvl=warn msg="Failed to update instance types: Get https://images.linuxcontainers.org/meta/instance-types/.yaml: Unable to connect to: images.linuxcontainers.org:443" t=2020-12-21T17:05:04+0800 lvl=info msg="Started container" action=start created=2019-11-19T15:43:25+0800 ephemeral=false name=tianjimiao stateful=false used=2020-12-21T17:02:44+0800