NVIDIA Orin platform fails to boot with extra kernel configs

I downloaded the kernel source from https://developer.nvidia.com/downloads/embedded/l4t/r36_release_v4.3/sources/public_sources.tbz2 and then built it with the extra configs below:

CONFIG_ARM64_CRYPTO=y
CONFIG_CPU_FREQ_GOV_ATTR_SET=y
CONFIG_CPU_FREQ_GOV_COMMON=y
CONFIG_CPU_FREQ_GOV_CONSERVATIVE=y
CONFIG_CPU_FREQ_GOV_ONDEMAND=y
CONFIG_CPU_FREQ_GOV_PERFORMANCE=y
CONFIG_CPU_FREQ_GOV_POWERSAVE=y
CONFIG_CPU_FREQ_GOV_SCHEDUTIL=y
CONFIG_CPU_FREQ_GOV_USERSPACE=y
CONFIG_CPU_FREQ_STAT=y
CONFIG_CPU_IDLE=y
CONFIG_CRYPTO=y
CONFIG_CRYPTO_AES_ARM64_CE=y
CONFIG_CRYPTO_AES_ARM64_CE_BLK=y
CONFIG_CRYPTO_SHA1_ARM64_CE=y
CONFIG_CRYPTO_SHA2_ARM64_CE=y
CONFIG_CRYPTO_USER_API_SKCIPHER=y
CONFIG_DEBUG_LL=y
CONFIG_EARLY_PRINTK=y
CONFIG_EDAC_DEBUG=y
CONFIG_F2FS_FS=y
CONFIG_F2FS_STAT_FS=y
CONFIG_NETFILTER_NETLINK=m
CONFIG_NFSD=y
CONFIG_NFSD_V3=y
CONFIG_NFSD_V4=y
CONFIG_NF_CT_NETLINK=m
CONFIG_PERF_EVENTS=y
CONFIG_PTP_1588_CLOCK_GIANFAR=y
CONFIG_RFKILL=y
CONFIG_TEST_UDELAY=m
CONFIG_TIPC=m
CONFIG_USB_ETH=m
CONFIG_USB_GADGET=y
CONFIG_USB_G_SERIAL=m
CONFIG_USB_MASS_STORAGE=m

CONFIG_DEBUG_INFO=y
CONFIG_DYNAMIC_FTRACE=y
CONFIG_DEBUG_PAGEALLOC=y
CONFIG_GPIO_PCA953X=y
CONFIG_EXPERT=y
CONFIG_ACPI=y
CONFIG_FHANDLE=y
CONFIG_TASKSTATS=y
CONFIG_TASK_DELAY_ACCT=y
CONFIG_TASK_XACCT=y
CONFIG_TASK_IO_ACCOUNTING=y
CONFIG_RCU_NOCB_CPU=y
CONFIG_LOG_BUF_SHIFT=17
CONFIG_CGROUP_PERF=y
CONFIG_CHECKPOINT_RESTORE=y
CONFIG_SGETMASK_SYSCALL=y
CONFIG_KALLSYMS_ALL=y
CONFIG_BPF_SYSCALL=y
CONFIG_KPROBES=y
CONFIG_MODULE_FORCE_LOAD=y
CONFIG_MODULE_FORCE_UNLOAD=y
CONFIG_BLK_DEV_BSGLIB=y
CONFIG_BLK_DEV_INTEGRITY=y
CONFIG_BLK_DEV_THROTTLING=y
CONFIG_BLK_CMDLINE_PARSER=y
CONFIG_PARTITION_ADVANCED=y
CONFIG_IOSCHED_BFQ=y
CONFIG_PCI_DEBUG=y
CONFIG_PCI_REALLOC_ENABLE_AUTO=y
CONFIG_PCIEPORTBUS=y
CONFIG_PCIEAER=y
CONFIG_PCIE_ECRC=y
CONFIG_PCIEAER_INJECT=y
CONFIG_PCIEASPM=y
CONFIG_PCIEASPM_DEFAULT=y
CONFIG_SCHED_MC=y
CONFIG_SCHED_SMT=y
CONFIG_KSM=y
CONFIG_CMA=y
CONFIG_CMA_DEBUG=y
CONFIG_CMA_DEBUGFS=y
CONFIG_ZPOOL=y
CONFIG_ZBUD=y
CONFIG_BINFMT_MISC=y
CONFIG_PRINTK_TIME=y
CONFIG_DEBUG_SECTION_MISMATCH=y
CONFIG_PAGE_EXTENSION=y
CONFIG_SLUB_DEBUG_ON=y
CONFIG_SLUB_STATS=y
CONFIG_DEBUG_KMEMLEAK=y
CONFIG_DEBUG_STACK_USAGE=y
CONFIG_DEBUG_VM=y
CONFIG_DEBUG_VM_VMACACHE=y
CONFIG_DEBUG_VM_RB=y
CONFIG_DEBUG_MEMORY_INIT=y
CONFIG_DEBUG_PER_CPU_MAPS=y
CONFIG_DEBUG_SHIRQ=y
CONFIG_DETECT_HUNG_TASK=y
CONFIG_DEFAULT_HUNG_TASK_TIMEOUT=3000
CONFIG_BOOTPARAM_HUNG_TASK_PANIC=y
CONFIG_PANIC_ON_OOPS=y
CONFIG_SCHED_DEBUG=y
CONFIG_SCHEDSTATS=y
CONFIG_SCHED_STACK_END_CHECK=y
CONFIG_DEBUG_TIMEKEEPING=y
CONFIG_DEBUG_RT_MUTEXES=y
CONFIG_DEBUG_SPINLOCK=y
CONFIG_DEBUG_MUTEXES=y
CONFIG_DEBUG_WW_MUTEX_SLOWPATH=y
CONFIG_DEBUG_LOCK_ALLOC=y
CONFIG_PROVE_LOCKING=y
CONFIG_LOCK_STAT=y
CONFIG_LOCKDEP=y
CONFIG_DEBUG_LOCKDEP=y
CONFIG_DEBUG_KOBJECT_RELEASE=y
CONFIG_DEBUG_LIST=y
CONFIG_DEBUG_SG=y
CONFIG_DEBUG_NOTIFIERS=y
CONFIG_DEBUG_CREDENTIALS=y
CONFIG_RCU_TRACE=y
CONFIG_FAULT_INJECTION=y
CONFIG_FAILSLAB=y
CONFIG_FAIL_PAGE_ALLOC=y
CONFIG_FAIL_MAKE_REQUEST=y
CONFIG_FAIL_IO_TIMEOUT=y
CONFIG_FAULT_INJECTION_DEBUG_FS=y
CONFIG_FAULT_INJECTION_STACKTRACE_FILTER=y
CONFIG_IRQSOFF_TRACER=y
CONFIG_PREEMPT_TRACER=y
CONFIG_SCHED_TRACER=y
CONFIG_STACK_TRACER=y
CONFIG_FUNCTION_PROFILER=y
CONFIG_TRACEPOINT_BENCHMARK=y
CONFIG_RING_BUFFER_BENCHMARK=y
CONFIG_RING_BUFFER_STARTUP_TEST=y
CONFIG_LKDTM=y
CONFIG_TEST_LIST_SORT=y
CONFIG_KPROBES_SANITY_TEST=y
CONFIG_RBTREE_TEST=y

CONFIG_ATOMIC64_SELFTEST=y

CONFIG_TEST_HEXDUMP=y
CONFIG_TEST_STRING_HELPERS=y
CONFIG_TEST_KSTRTOX=y
CONFIG_TEST_RHASHTABLE=y

CONFIG_PID_IN_CONTEXTIDR=y
CONFIG_FW_LOADER=y

#CONFIG_DEBUG_DRIVER=y
#CONFIG_DEBUG_DEVRES=y

CONFIG_DMA_CMA=y
CONFIG_CMA_SIZE_SEL_MBYTES=y
CONFIG_ARM_CCN=y
CONFIG_CONNECTOR=y
CONFIG_PROC_EVENTS=y
CONFIG_BLK_DEV_NULL_BLK=y
CONFIG_BLK_DEV_LOOP=y
CONFIG_BLK_DEV_CRYPTOLOOP=y
CONFIG_BLK_DEV_NBD=y
CONFIG_EEPROM_AT25=y
CONFIG_CHR_DEV_SG=y
CONFIG_MD_RAID456=y
CONFIG_I2C_CHARDEV=y
CONFIG_I2C_MUX=y
CONFIG_I2C_SLAVE=y
CONFIG_I2C_SLAVE_EEPROM=y
CONFIG_I2C_DEBUG_CORE=y
CONFIG_I2C_DEBUG_ALGO=y
CONFIG_I2C_DEBUG_BUS=y

CONFIG_PPS=y
CONFIG_PTP_1588_CLOCK=y
CONFIG_NETWORK_PHY_TIMESTAMPING=y
CONFIG_DP83640_PHY=y
CONFIG_PMBUS=y
CONFIG_THERMAL=y
CONFIG_THERMAL_HWMON=y
CONFIG_THERMAL_OF=y
CONFIG_THERMAL_DEFAULT_GOV_STEP_WISE=y
CONFIG_FB=y
CONFIG_FB_MODE_HELPERS=y
CONFIG_USB_ANNOUNCE_NEW_DEVICES=y
CONFIG_DMATEST=m
CONFIG_STAGING=y
CONFIG_MAILBOX=y
CONFIG_PL320_MBOX=y
CONFIG_EXT4_DEBUG=y
CONFIG_FANOTIFY=y
CONFIG_QUOTA=y
CONFIG_QUOTA_DEBUG=y
CONFIG_FUSE_FS=y
CONFIG_CUSE=y
CONFIG_OVERLAY_FS=y
CONFIG_FSCACHE=y
CONFIG_FSCACHE_STATS=y
CONFIG_FSCACHE_HISTOGRAM=y
CONFIG_FSCACHE_DEBUG=y
CONFIG_FSCACHE_OBJECT_LIST=y
CONFIG_CACHEFILES=y
CONFIG_CACHEFILES_DEBUG=y
CONFIG_CACHEFILES_HISTOGRAM=y
CONFIG_UDF_FS=y
CONFIG_HUGETLBFS=y
CONFIG_CONFIGFS_FS=y

CONFIG_MTD_TESTS=m
CONFIG_USB_TEST=y
CONFIG_GLOB_SELFTEST=y
CONFIG_DEBUG_GPIO=y

CONFIG_DMA_API_DEBUG=y

CONFIG_JBD2_DEBUG=y
CONFIG_BTRFS_DEBUG=y
CONFIG_CIFS_DEBUG=y
CONFIG_CIFS_DEBUG2=y

CONFIG_TEST_LKM=m
CONFIG_TEST_BPF=m
CONFIG_HAVE_DEBUG_BUGVERBOSE=y
CONFIG_SYSCTL_EXCEPTION_TRACE=y
CONFIG_TEST_USER_COPY=m
CONFIG_MEMTEST=y
CONFIG_KGDB=y

CONFIG_NOTIFIER_ERROR_INJECTION=y
CONFIG_KGDB_TESTS=y
CONFIG_KGDB_TESTS_ON_BOOT=y
CONFIG_SAMPLES=y
CONFIG_SAMPLE_TRACE_EVENTS=m
CONFIG_SAMPLE_TRACE_PRINTK=m
CONFIG_SAMPLE_KOBJECT=m
CONFIG_SAMPLE_KPROBES=m
CONFIG_SAMPLE_HW_BREAKPOINT=m
CONFIG_SAMPLE_KFIFO=m
CONFIG_SAMPLE_CONFIGFS=m
CONFIG_VETH=y
CONFIG_SECURITYFS=y
CONFIG_RCU_EXPERT=y
CONFIG_TORTURE_TEST=m
CONFIG_RCU_TORTURE_TEST=m
CONFIG_LOCK_TORTURE_TEST=m

When I boot the system, nothing is displayed on the monitor, and the error below is reported continuously:

[ 1094.156174] tegra-mc 2c00000.memory-controller: nvl1r: read @0x000000dfd727c000: EMEM address decode error (EMEM decode error)
[ 1094.156246] tegra-mc 2c00000.memory-controller: nvl1r: read @0x000000dfd6b4c000: EMEM address decode error (EMEM decode error)

After investigating, I found that the key config is CONFIG_DMA_API_DEBUG, but I am not sure which driver is reading the invalid memory.

Could you please help check it? Or is it a known issue?

thanks,

Limeng

1 Like

Hi,

Are you sure that adding only the above config to the Tegra config also reproduces this error?

No. If I enable only CONFIG_DMA_API_DEBUG, graphics are displayed on the monitor.
So I think the system boots up normally in that case.

Then please figure out which of the other configs you added is causing the crash…

I'm not quite sure what you mean by “I found out the key config is CONFIG_DMA_API_DEBUG”, since that config by itself does not seem to cause the problem.

Is this still an issue that needs support? Are there any results you can share?

I have temporarily removed CONFIG_DMA_API_DEBUG from my project.

thanks,
Limeng

Got it, thanks for your update.