diff --git a/configs/AM62DX/AM62DX_linux_toc.txt b/configs/AM62DX/AM62DX_linux_toc.txt index d84069088..d4c62c308 100644 --- a/configs/AM62DX/AM62DX_linux_toc.txt +++ b/configs/AM62DX/AM62DX_linux_toc.txt @@ -8,9 +8,8 @@ devices/AM62DX/linux/Release_Specific_Release_Notes devices/AM62DX/linux/Release_Specific_Build_Sheet devices/AM62DX/linux/Release_Specific_Yocto_layer_Configuration #devices/AM62DX/linux/Release_Specific_Migration_Guide -#devices/AM62DX/linux/Release_Specific_Kernel_Performance_Guide -#devices/AM62DX/linux/Linux_Performance_Guide -#devices/AM62DX/linux/RT_Linux_Performance_Guide +devices/AM62DX/linux/Release_Specific_Kernel_Performance_Guide +devices/AM62DX/linux/Linux_Performance_Guide #devices/AM62DX/linux/Release_Specific_Workarounds devices/AM62DX/linux/Release_Specific_Supported_Platforms_and_Versions diff --git a/source/devices/AM62DX/linux/Linux_Performance_Guide.rst b/source/devices/AM62DX/linux/Linux_Performance_Guide.rst new file mode 100644 index 000000000..7d132d1ce --- /dev/null +++ b/source/devices/AM62DX/linux/Linux_Performance_Guide.rst @@ -0,0 +1,448 @@ + +==================================== + Linux 11.02.08.02 Performance Guide +==================================== + +.. 
rubric:: **Read This First** + :name: read-this-first-kernel-perf-guide + +**All performance numbers provided in this document are gathered using the +following Evaluation Modules unless otherwise specified.** + ++----------------+----------------------------------------------------------------------------------------------------------------+ +| Name | Description | ++================+================================================================================================================+ ++----------------+----------------------------------------------------------------------------------------------------------------+ +| AM62Dx EVM | AM62Dx Evaluation Module rev E1 with ARM running at 1.4GHz, DDR data rate 3733 MT/s | ++----------------+----------------------------------------------------------------------------------------------------------------+ + +Table: Evaluation Modules + +.. rubric:: About This Manual + :name: about-this-manual-kernel-perf-guide + +This document provides performance data for each of the device drivers +which are part of the Processor SDK Linux package. This document should be +used in conjunction with release notes and user guides provided with the +Processor SDK Linux package for information on specific issues present +with drivers included in a particular release. + +.. rubric:: If You Need Assistance + :name: if-you-need-assistance-kernel-perf-guide + +For further information or to report any problems, contact +https://e2e.ti.com/ or https://support.ti.com/ + +System Benchmarks +----------------- + +LMBench +^^^^^^^ +LMBench is a collection of microbenchmarks of which the memory bandwidth +and latency related ones are typically used to estimate processor +memory system performance. 
More information about lmbench is available at +https://lmbench.sourceforge.net/whatis_lmbench.html and +https://lmbench.sourceforge.net/man/lmbench.8.html + +**Latency**: lat_mem_rd-stride128-szN, where N is equal to or smaller than the cache +size at a given level, measures the cache miss penalty. With N at least +double the size of the last-level cache, it measures the latency to external memory. + +**Bandwidth**: bw_mem_bcopy-N, where N is equal to or smaller than the cache size at +a given level, measures the achievable memory bandwidth from software doing +a memcpy() type operation. Typical use is for external memory bandwidth +calculation. The bandwidth is calculated so that a byte read and written counts +as 1, which should be roughly half of the STREAM copy result. + +Execute the LMBench with the following: + +:: + + cd /opt/ltp + ./runltp -P j721e-idk-gw -f ddt/lmbench -s LMBENCH_L_PERF_0001 + +.. csv-table:: LMBench Benchmarks + :header: "Benchmarks","am62dxx_evm-fs: perf" + + "af_unix_sock_stream_latency (microsec)","30.12 (min 29.31, max 30.82)" + "af_unix_socket_stream_bandwidth (mb\s)","1054.72 (min 1042.80, max 1065.78)" + "bw_file_rd-io-1mb (mb/s)","1394.63 (min 1375.04, max 1403.65)" + "bw_file_rd-o2c-1mb (mb/s)","749.43 (min 694.32, max 788.64)" + "bw_mem-bcopy-16mb (mb/s)","1740.68 (min 1715.63, max 1750.16)" + "bw_mem-bcopy-1mb (mb/s)","1863.03 (min 1842.75, max 1889.39)" + "bw_mem-bcopy-2mb (mb/s)","1625.67 (min 1545.83, max 1692.05)" + "bw_mem-bcopy-4mb (mb/s)","1647.32 (min 1548.79, max 1713.31)" + "bw_mem-bcopy-8mb (mb/s)","1729.40 (min 1707.76, max 1746.34)" + "bw_mem-bzero-16mb (mb/s)","7938.98 (min 7920.79, max 7952.29)" + "bw_mem-bzero-1mb (mb/s)","4881.67 (min 1842.75, max 7925.07)" + "bw_mem-bzero-2mb (mb/s)","4766.95 (min 1545.83, max 7952.29)" + "bw_mem-bzero-4mb (mb/s)","4788.22 (min 1548.79, max 7945.11)" + "bw_mem-bzero-8mb (mb/s)","4831.41 (min 1707.76, max 7947.02)" + "bw_mem-cp-16mb (mb/s)","840.43 (min 834.03, max 852.65)" + "bw_mem-cp-1mb (mb/s)","4506.74 (min 
795.42, max 8218.15)" + "bw_mem-cp-2mb (mb/s)","4415.13 (min 784.93, max 8064.52)" + "bw_mem-cp-4mb (mb/s)","4431.16 (min 849.98, max 8001.45)" + "bw_mem-cp-8mb (mb/s)","4434.57 (min 870.70, max 7984.03)" + "bw_mem-fcp-16mb (mb/s)","1532.91 (min 1509.72, max 1557.94)" + "bw_mem-fcp-1mb (mb/s)","4726.56 (min 1515.15, max 7925.07)" + "bw_mem-fcp-2mb (mb/s)","4700.63 (min 1429.08, max 7952.29)" + "bw_mem-fcp-4mb (mb/s)","4735.69 (min 1504.61, max 7945.11)" + "bw_mem-fcp-8mb (mb/s)","4744.51 (min 1547.39, max 7947.02)" + "bw_mem-frd-16mb (mb/s)","1887.64 (min 1876.61, max 1895.06)" + "bw_mem-frd-1mb (mb/s)","1782.58 (min 1515.15, max 2047.08)" + "bw_mem-frd-2mb (mb/s)","1605.52 (min 1429.08, max 1839.25)" + "bw_mem-frd-4mb (mb/s)","1646.92 (min 1504.61, max 1855.86)" + "bw_mem-frd-8mb (mb/s)","1665.51 (min 1547.39, max 1882.13)" + "bw_mem-fwr-16mb (mb/s)","7962.52 (min 7943.07, max 7974.75)" + "bw_mem-fwr-1mb (mb/s)","5099.94 (min 1932.20, max 8218.15)" + "bw_mem-fwr-2mb (mb/s)","4869.22 (min 1611.08, max 8064.52)" + "bw_mem-fwr-4mb (mb/s)","4872.60 (min 1653.58, max 8001.45)" + "bw_mem-fwr-8mb (mb/s)","4875.39 (min 1660.27, max 7984.03)" + "bw_mem-rd-16mb (mb/s)","1932.53 (min 1913.65, max 1942.22)" + "bw_mem-rd-1mb (mb/s)","1725.48 (min 1225.28, max 2219.76)" + "bw_mem-rd-2mb (mb/s)","1571.95 (min 1133.63, max 1943.32)" + "bw_mem-rd-4mb (mb/s)","1665.97 (min 1365.65, max 1941.12)" + "bw_mem-rd-8mb (mb/s)","1730.15 (min 1454.28, max 1948.61)" + "bw_mem-rdwr-16mb (mb/s)","1672.28 (min 1600.32, max 1718.40)" + "bw_mem-rdwr-1mb (mb/s)","1037.11 (min 795.42, max 1297.02)" + "bw_mem-rdwr-2mb (mb/s)","986.71 (min 784.93, max 1238.39)" + "bw_mem-rdwr-4mb (mb/s)","1135.79 (min 849.98, max 1446.39)" + "bw_mem-rdwr-8mb (mb/s)","1211.02 (min 870.70, max 1599.04)" + "bw_mem-wr-16mb (mb/s)","1619.91 (min 1548.29, max 1668.40)" + "bw_mem-wr-1mb (mb/s)","1255.05 (min 1206.06, max 1308.90)" + "bw_mem-wr-2mb (mb/s)","1195.30 (min 1057.64, max 1289.08)" + "bw_mem-wr-4mb 
(mb/s)","1403.98 (min 1295.97, max 1454.55)" + "bw_mem-wr-8mb (mb/s)","1525.80 (min 1389.37, max 1599.04)" + "bw_mmap_rd-mo-1mb (mb/s)","2117.81 (min 2081.76, max 2139.04)" + "bw_mmap_rd-o2c-1mb (mb/s)","750.19 (min 693.72, max 794.91)" + "bw_pipe (mb/s)","702.59 (min 692.16, max 713.48)" + "bw_unix (mb/s)","1054.72 (min 1042.80, max 1065.78)" + "lat_connect (us)","57.00 (min 56.61, max 57.41)" + "lat_ctx-2-128k (us)","7.85 (min 7.55, max 8.11)" + "lat_ctx-2-256k (us)","7.33 (min 6.40, max 8.28)" + "lat_ctx-4-128k (us)","7.44 (min 7.06, max 7.89)" + "lat_ctx-4-256k (us)","7.12 (min 5.25, max 8.97)" + "lat_fs-0k (num_files)","234.50 (min 215.00, max 251.00)" + "lat_fs-10k (num_files)","113.25 (min 104.00, max 122.00)" + "lat_fs-1k (num_files)","163.75 (min 144.00, max 178.00)" + "lat_fs-4k (num_files)","159.75 (min 144.00, max 174.00)" + "lat_mem_rd-stride128-sz1000k (ns)","31.04 (min 30.78, max 31.41)" + "lat_mem_rd-stride128-sz125k (ns)","5.56 (min 5.53, max 5.61)" + "lat_mem_rd-stride128-sz250k (ns)","5.90 (min 5.83, max 6.36)" + "lat_mem_rd-stride128-sz31k (ns)","3.67 (min 2.16, max 4.19)" + "lat_mem_rd-stride128-sz50 (ns)","2.15" + "lat_mem_rd-stride128-sz500k (ns)","11.25 (min 9.86, max 13.27)" + "lat_mem_rd-stride128-sz62k (ns)","5.15 (min 4.51, max 5.27)" + "lat_mmap-1m (us)","55.75 (min 51.00, max 58.00)" + "lat_ops-double-add (ns)","2.86" + "lat_ops-double-div (ns)","15.75 (min 15.74, max 15.76)" + "lat_ops-double-mul (ns)","2.86" + "lat_ops-float-add (ns)","2.86" + "lat_ops-float-div (ns)","9.30 (min 9.30, max 9.31)" + "lat_ops-float-mul (ns)","2.86" + "lat_ops-int-add (ns)","0.72" + "lat_ops-int-bit (ns)","0.48" + "lat_ops-int-div (ns)","4.29" + "lat_ops-int-mod (ns)","4.53 (min 4.53, max 4.54)" + "lat_ops-int-mul (ns)","3.08 (min 3.07, max 3.09)" + "lat_ops-int64-add (ns)","0.72" + "lat_ops-int64-bit (ns)","0.48" + "lat_ops-int64-div (ns)","6.80" + "lat_ops-int64-mod (ns)","5.25 (min 5.25, max 5.26)" + "lat_ops-int64-mul (ns)","3.55" + "lat_pagefault 
(us)","0.65 (min 0.51, max 1.06)" + "lat_pipe (us)","25.70 (min 25.35, max 26.22)" + "lat_proc-exec (us)","712.79 (min 689.13, max 735.50)" + "lat_proc-fork (us)","624.24 (min 601.00, max 643.00)" + "lat_proc-proccall (us)","0.01" + "lat_select (us)","34.08 (min 33.89, max 34.33)" + "lat_sem (us)","2.99 (min 2.61, max 3.63)" + "lat_sig-catch (us)","5.51 (min 5.27, max 5.71)" + "lat_sig-install (us)","0.67 (min 0.64, max 0.70)" + "lat_sig-prot (us)","0.64 (min 0.46, max 0.80)" + "lat_syscall-fstat (us)","1.98 (min 1.90, max 2.07)" + "lat_syscall-null (us)","0.46 (min 0.46, max 0.50)" + "lat_syscall-open (us)","166.27 (min 150.75, max 200.85)" + "lat_syscall-read (us)","0.82 (min 0.80, max 0.88)" + "lat_syscall-stat (us)","4.79 (min 4.64, max 4.97)" + "lat_syscall-write (us)","0.78 (min 0.75, max 0.83)" + "lat_tcp (us)","0.92 (min 0.91, max 0.97)" + "lat_unix (us)","30.12 (min 29.31, max 30.82)" + "latency_for_0.50_mb_block_size (nanosec)","11.25 (min 9.86, max 13.27)" + "latency_for_1.00_mb_block_size (nanosec)","15.52 (min 0.00, max 31.41)" + "pipe_bandwidth (mb\s)","702.59 (min 692.16, max 713.48)" + "pipe_latency (microsec)","25.70 (min 25.35, max 26.22)" + "procedure_call (microsec)","0.01" + "select_on_200_tcp_fds (microsec)","34.08 (min 33.89, max 34.33)" + "semaphore_latency (microsec)","2.99 (min 2.61, max 3.63)" + "signal_handler_latency (microsec)","0.67 (min 0.64, max 0.70)" + "signal_handler_overhead (microsec)","5.51 (min 5.27, max 5.71)" + "tcp_ip_connection_cost_to_localhost (microsec)","57.00 (min 56.61, max 57.41)" + "tcp_latency_using_localhost (microsec)","0.92 (min 0.91, max 0.97)" + +Dhrystone +^^^^^^^^^ +Dhrystone is a core-only benchmark that runs from warm L1 caches in all +modern processors. It scales linearly with clock speed. + +Please note that different runs may produce slightly different results. +It is advised to run this test multiple times in order to get maximum +performance numbers. 
+ +Execute the benchmark with the following: + +:: + + runDhrystone + +.. csv-table:: Dhrystone Benchmarks + :header: "Benchmarks","am62dxx_evm-fs: perf" + + "cpu_clock (mhz)","1400.00" + "dhrystone_per_mhz (dmips/mhz)","2.90" + "dhrystone_per_second (dhrystonep)","7142857.00" + +Whetstone +^^^^^^^^^ +Whetstone is a benchmark primarily measuring floating-point arithmetic performance. + +Execute the benchmark with the following: + +:: + + runWhetstone + +.. csv-table:: Whetstone Benchmarks + :header: "Benchmarks","am62dxx_evm-fs: perf" + + "whetstone (mips)","7500.00 (min 5000.00, max 10000.00)" + +Linpack +^^^^^^^ +Linpack measures peak double precision (64 bit) floating point performance in +solving a dense linear system. + +.. csv-table:: Linpack Benchmarks + :header: "Benchmarks","am62dxx_evm-fs: perf" + + "linpack (kflops)","576688.25 (min 574136.00, max 578099.00)" + +Stream +^^^^^^ +STREAM is a microbenchmark for measuring data memory system performance without +any data reuse. It is designed to miss on caches and exercise data prefetcher +and speculative accesses. +It uses double precision floating point (64bit) but in +most modern processors the memory access will be the bottleneck. +The four individual scores are copy, scale as in multiply by constant, +add two numbers, and triad for multiply accumulate. +For bandwidth, a byte read counts as one and a byte written counts as one, +resulting in a score that is double the bandwidth LMBench will show. + +Execute the benchmark with the following: + +:: + + stream_c + +.. 
csv-table:: Stream Benchmarks + :header: "Benchmarks","am62dxx_evm-fs: perf" + + "add (mb/s)","2565.85 (min 2558.60, max 2572.00)" + "copy (mb/s)","3569.39 (min 3553.00, max 3582.00)" + "scale (mb/s)","3338.13 (min 3282.60, max 3379.00)" + "triad (mb/s)","2385.28 (min 2379.40, max 2389.10)" + +CoreMarkPro +^^^^^^^^^^^ +CoreMark®-Pro is a comprehensive, advanced processor benchmark that works with +and enhances the market-proven industry-standard EEMBC CoreMark® benchmark. +While CoreMark stresses the CPU pipeline, CoreMark-Pro tests the entire processor, +adding comprehensive support for multicore technology, a combination of integer +and floating-point workloads, and data sets for utilizing larger memory subsystems. + +.. csv-table:: CoreMarkPro Benchmarks + :header: "Benchmarks","am62dxx_evm-fs: perf" + + "cjpeg-rose7-preset (workloads/)","42.00 (min 41.84, max 42.19)" + "core (workloads/)","0.30" + "coremark-pro ()","923.79 (min 903.66, max 936.49)" + "linear_alg-mid-100x100-sp (workloads/)","14.68 (min 14.67, max 14.69)" + "loops-all-mid-10k-sp (workloads/)","0.71" + "nnet_test (workloads/)","1.09 (min 1.08, max 1.09)" + "parser-125k (workloads/)","8.78 (min 8.70, max 8.85)" + "radix2-big-64k (workloads/)","61.55 (min 51.68, max 69.15)" + "sha-test (workloads/)","81.30 (min 80.65, max 81.97)" + "zip-test (workloads/)","22.16 (min 21.74, max 22.22)" + +.. 
csv-table:: CoreMarkProFourCore Benchmarks + :header: "Benchmarks","am62dxx_evm-fs: perf" + + "cjpeg-rose7-preset (workloads/)","160.97 (min 158.73, max 161.29)" + "core (workloads/)","1.20" + "coremark-pro ()","2540.92 (min 2504.79, max 2570.41)" + "linear_alg-mid-100x100-sp (workloads/)","56.35 (min 56.31, max 56.37)" + "loops-all-mid-10k-sp (workloads/)","2.07 (min 2.03, max 2.12)" + "nnet_test (workloads/)","3.62" + "parser-125k (workloads/)","9.29 (min 8.89, max 9.93)" + "radix2-big-64k (workloads/)","81.13 (min 79.71, max 82.65)" + "sha-test (workloads/)","269.38 (min 263.16, max 270.27)" + "zip-test (workloads/)","75.50 (min 72.73, max 76.92)" + +MultiBench +^^^^^^^^^^ +MultiBench™ is a suite of benchmarks that allows processor and system designers to +analyze, test, and improve multicore processors. It uses three forms of concurrency: +Data decomposition: multiple threads cooperating on achieving a unified goal and +demonstrating a processor’s support for fine grain parallelism. +Processing multiple data streams: uses common code running over multiple threads and +demonstrating how well a processor scales over scalable data inputs. +Multiple workload processing: shows the scalability of general-purpose processing, +demonstrating concurrency over both code and data. +MultiBench combines a wide variety of application-specific workloads with the EEMBC +Multi-Instance-Test Harness (MITH), compatible and portable with most any multicore +processors and operating systems. MITH uses a thread-based API (POSIX-compliant) to +establish a common programming model that communicates with the benchmark through an +abstraction layer and provides a flexible interface to allow a wide variety of +thread-enabled workloads to be tested. + +.. 
csv-table:: Multibench Benchmarks + :header: "Benchmarks","am62dxx_evm-fs: perf" + + "4m-check (workloads/)","417.14 (min 415.49, max 418.62)" + "4m-check-reassembly (workloads/)","113.35 (min 111.86, max 115.08)" + "4m-check-reassembly-tcp (workloads/)","58.41 (min 58.14, max 58.69)" + "4m-check-reassembly-tcp-cmykw2-rotatew2 (workloads/)","33.11 (min 32.89, max 33.33)" + "4m-check-reassembly-tcp-x264w2 (workloads/)","1.89 (min 1.87, max 1.91)" + "4m-cmykw2 (workloads/)","240.20 (min 227.02, max 246.61)" + "4m-cmykw2-rotatew2 (workloads/)","49.45 (min 49.14, max 49.75)" + "4m-reassembly (workloads/)","79.96 (min 78.86, max 80.97)" + "4m-rotatew2 (workloads/)","52.44 (min 51.84, max 52.83)" + "4m-tcp-mixed (workloads/)","119.07 (min 118.52, max 120.30)" + "4m-x264w2 (workloads/)","1.97 (min 1.94, max 2.00)" + "idct-4m (workloads/)","19.16 (min 19.14, max 19.20)" + "idct-4mw1 (workloads/)","19.17 (min 19.15, max 19.21)" + "ippktcheck-4m (workloads/)","414.97 (min 413.43, max 417.08)" + "ippktcheck-4mw1 (workloads/)","416.58 (min 413.22, max 418.76)" + "ipres-4m (workloads/)","108.42 (min 107.30, max 109.49)" + "ipres-4mw1 (workloads/)","107.73 (min 106.84, max 109.09)" + "md5-4m (workloads/)","27.55 (min 27.30, max 27.87)" + "md5-4mw1 (workloads/)","27.59 (min 27.32, max 27.78)" + "rgbcmyk-4m (workloads/)","63.65 (min 63.57, max 63.78)" + "rgbcmyk-4mw1 (workloads/)","63.67 (min 63.41, max 63.88)" + "rotate-4ms1 (workloads/)","23.44 (min 23.33, max 23.55)" + "rotate-4ms1w1 (workloads/)","23.47 (min 23.28, max 23.84)" + "rotate-4ms64 (workloads/)","23.71 (min 23.61, max 23.79)" + "rotate-4ms64w1 (workloads/)","23.70 (min 23.57, max 23.76)" + "x264-4mq (workloads/)","0.58" + "x264-4mqw1 (workloads/)","0.58" + +Boot-time Measurement +--------------------- + +Boot media: MMCSD +^^^^^^^^^^^^^^^^^ + +.. 
csv-table:: Linux boot time MMCSD + :header: "Boot Configuration","am62dxx_evm-fs: Boot time in seconds: avg(min,max)" + + "Linux boot time from SD with default rootfs (20 boot cycles)","14.31 (min 12.88, max 20.51)" + +Boot time numbers [avg, min, max] are measured from "Starting kernel" to Linux prompt across 20 boot cycles. + +| + +USB Driver +---------- + +USB Device Controller +^^^^^^^^^^^^^^^^^^^^^ + +.. csv-table:: USBDEVICE HIGHSPEED SLAVE_READ_THROUGHPUT + :header: "Number of Blocks","am62dxx_evm-fs: Throughput (MB/sec)" + + "150","31.79 (min 20.00, max 34.80)" + +.. csv-table:: USBDEVICE HIGHSPEED SLAVE_WRITE_THROUGHPUT + :header: "Number of Blocks","am62dxx_evm-fs: Throughput (MB/sec)" + + "150","30.64 (min 24.70, max 32.80)" + +| + +CRYPTO Driver +------------- + +OpenSSL Performance +^^^^^^^^^^^^^^^^^^^ + +.. csv-table:: OpenSSL Performance + :header: "Algorithm","Buffer Size (in bytes)","am62dxx_evm-fs: throughput (KBytes/Sec)" + + "aes-128-cbc","1024","23511.81 (min 22199.30, max 24003.58)" + "aes-128-cbc","16","424.58 (min 400.86, max 435.84)" + "aes-128-cbc","16384","85633.71 (min 84454.06, max 86250.84)" + "aes-128-cbc","256","7031.72 (min 6708.74, max 7234.22)" + "aes-128-cbc","64","1847.05 (min 1762.45, max 1904.09)" + "aes-128-cbc","8192","72108.37 (min 70328.32, max 72742.23)" + "aes-128-ecb","1024","24118.53 (min 23312.38, max 24716.29)" + "aes-128-ecb","16","436.57 (min 412.31, max 446.68)" + "aes-128-ecb","16384","88354.13 (min 87086.42, max 89161.73)" + "aes-128-ecb","256","7186.42 (min 6870.70, max 7333.55)" + "aes-128-ecb","64","1899.44 (min 1787.95, max 1948.69)" + "aes-128-ecb","8192","74231.47 (min 72373.59, max 74986.84)" + "aes-192-cbc","1024","23054.25 (min 21801.64, max 23675.90)" + "aes-192-cbc","16","426.41 (min 403.57, max 437.48)" + "aes-192-cbc","16384","77032.11 (min 75956.22, max 77736.62)" + "aes-192-cbc","256","6940.00 (min 6559.74, max 7117.23)" + "aes-192-cbc","64","1855.78 (min 1761.34, max 1896.92)" + 
"aes-192-cbc","8192","66243.58 (min 64476.50, max 67100.67)" + "aes-192-ecb","1024","23512.23 (min 22242.65, max 24032.94)" + "aes-192-ecb","16","435.23 (min 416.22, max 443.56)" + "aes-192-ecb","16384","79489.02 (min 77490.86, max 80303.45)" + "aes-192-ecb","256","7143.25 (min 6823.34, max 7303.17)" + "aes-192-ecb","64","1892.40 (min 1786.77, max 1936.68)" + "aes-192-ecb","8192","67959.13 (min 66158.59, max 68741.80)" + "aes-256-cbc","1024","22439.42 (min 21377.71, max 22966.27)" + "aes-256-cbc","16","427.52 (min 403.20, max 438.70)" + "aes-256-cbc","16384","70787.07 (min 69331.63, max 71254.02)" + "aes-256-cbc","256","6881.53 (min 6456.32, max 7109.89)" + "aes-256-cbc","64","1843.97 (min 1729.77, max 1889.94)" + "aes-256-cbc","8192","61376.17 (min 59588.61, max 62046.21)" + "aes-256-ecb","1024","23099.73 (min 22211.93, max 23634.60)" + "aes-256-ecb","16","435.45 (min 415.85, max 443.94)" + "aes-256-ecb","16384","72642.56 (min 71390.55, max 73176.41)" + "aes-256-ecb","256","7103.46 (min 6742.61, max 7271.85)" + "aes-256-ecb","64","1893.37 (min 1771.86, max 1932.05)" + "aes-256-ecb","8192","62965.42 (min 61532.84, max 63539.88)" + "sha256","1024","38004.99 (min 37393.07, max 38651.90)" + "sha256","16","632.01 (min 623.18, max 639.92)" + "sha256","16384","300601.34 (min 296621.40, max 303781.21)" + "sha256","256","9924.28 (min 9777.24, max 10089.73)" + "sha256","64","2500.19 (min 2459.39, max 2530.41)" + "sha256","8192","203442.52 (min 201657.00, max 204671.66)" + "sha512","1024","26159.23 (min 25836.20, max 26417.49)" + "sha512","16","614.39 (min 601.95, max 625.40)" + "sha512","16384","68399.79 (min 68119.21, max 68577.96)" + "sha512","256","8720.94 (min 8533.85, max 8851.97)" + "sha512","64","2456.83 (min 2404.99, max 2503.42)" + "sha512","8192","61606.57 (min 61311.66, max 61794.99)" + +.. 
csv-table:: OpenSSL CPU Load + :header: "Algorithm","am62dxx_evm-fs: CPU Load" + + "aes-128-cbc","31.50 (min 30.00, max 32.00)" + "aes-128-ecb","32.75 (min 31.00, max 34.00)" + "aes-192-cbc","31.50 (min 30.00, max 32.00)" + "aes-192-ecb","32.13 (min 30.00, max 33.00)" + "aes-256-cbc","31.00 (min 29.00, max 32.00)" + "aes-256-ecb","31.63 (min 30.00, max 33.00)" + "sha256","95.50 (min 94.00, max 96.00)" + "sha512","95.63 (min 95.00, max 96.00)" + +Listed for each algorithm are the code snippets used to run each +benchmark test. + +:: + + time -v openssl speed -elapsed -evp aes-128-cbc diff --git a/source/devices/AM62DX/linux/Release_Specific_Kernel_Performance_Guide.rst b/source/devices/AM62DX/linux/Release_Specific_Kernel_Performance_Guide.rst new file mode 100644 index 000000000..e65b22f15 --- /dev/null +++ b/source/devices/AM62DX/linux/Release_Specific_Kernel_Performance_Guide.rst @@ -0,0 +1,8 @@ +######################## +Kernel Performance Guide +######################## + +.. toctree:: + :maxdepth: 4 + + Linux_Performance_Guide diff --git a/source/devices/AM62LX/linux/Linux_Performance_Guide.rst b/source/devices/AM62LX/linux/Linux_Performance_Guide.rst index 180a3a93d..8f68dec10 100644 --- a/source/devices/AM62LX/linux/Linux_Performance_Guide.rst +++ b/source/devices/AM62LX/linux/Linux_Performance_Guide.rst @@ -1,6 +1,6 @@ ==================================== - Linux 11.01.16.13 Performance Guide + Linux 11.02.08.02 Performance Guide ==================================== .. rubric:: **Read This First** @@ -32,17 +32,17 @@ with drivers included in a particular release. For further information or to report any problems, contact https://e2e.ti.com/ or https://support.ti.com/ -System Benchmarks -------------------- +System Benchmarks +----------------- LMBench ^^^^^^^ LMBench is a collection of microbenchmarks of which the memory bandwidth and latency related ones are typically used to estimate processor memory system performance. 
More information about lmbench at -http://lmbench.sourceforge.net/whatis_lmbench.html and -http://lmbench.sourceforge.net/man/lmbench.8.html +https://lmbench.sourceforge.net/whatis_lmbench.html and +https://lmbench.sourceforge.net/man/lmbench.8.html **Latency**: lat_mem_rd-stride128-szN, where N is equal to or smaller than the cache size at given level measures the cache miss penalty. N that is at least @@ -64,126 +64,124 @@ Execute the LMBench with the following: .. csv-table:: LMBench Benchmarks :header: "Benchmarks","am62lxx_evm-fs: perf" - "af_unix_sock_stream_latency (microsec)","33.32 (min 32.78, max 34.30)" - "af_unix_socket_stream_bandwidth (mb\s)","477.67 (min 424.53, max 533.19)" - "bw_file_rd-io-1mb (mb/s)","1017.86 (min 930.23, max 1103.75)" - "bw_file_rd-o2c-1mb (mb/s)","498.42 (min 476.87, max 515.11)" - "bw_mem-bcopy-16mb (mb/s)","785.15 (min 707.87, max 861.19)" - "bw_mem-bcopy-1mb (mb/s)","808.29 (min 696.74, max 916.42)" - "bw_mem-bcopy-2mb (mb/s)","811.05 (min 686.58, max 932.84)" - "bw_mem-bcopy-4mb (mb/s)","835.91 (min 713.78, max 944.51)" - "bw_mem-bcopy-8mb (mb/s)","860.43 (min 743.43, max 972.05)" - "bw_mem-bzero-16mb (mb/s)","2426.00 (min 2106.09, max 2726.19)" - "bw_mem-bzero-1mb (mb/s)","1616.51 (min 696.74, max 2726.28)" - "bw_mem-bzero-2mb (mb/s)","1618.34 (min 686.58, max 2725.72)" - "bw_mem-bzero-4mb (mb/s)","1630.79 (min 713.78, max 2725.26)" - "bw_mem-bzero-8mb (mb/s)","1643.18 (min 743.43, max 2726.19)" - "bw_mem-cp-16mb (mb/s)","454.69 (min 396.23, max 512.71)" - "bw_mem-cp-1mb (mb/s)","1541.45 (min 397.93, max 2954.21)" - "bw_mem-cp-2mb (mb/s)","1490.05 (min 396.47, max 2828.85)" - "bw_mem-cp-4mb (mb/s)","1483.53 (min 419.77, max 2781.64)" - "bw_mem-cp-8mb (mb/s)","1481.96 (min 440.72, max 2755.77)" - "bw_mem-fcp-16mb (mb/s)","788.37 (min 712.79, max 865.71)" - "bw_mem-fcp-1mb (mb/s)","1646.16 (min 767.75, max 2726.28)" - "bw_mem-fcp-2mb (mb/s)","1647.26 (min 767.46, max 2725.72)" - "bw_mem-fcp-4mb (mb/s)","1659.77 (min 742.67, 
max 2725.26)" - "bw_mem-fcp-8mb (mb/s)","1668.94 (min 800.48, max 2726.19)" - "bw_mem-frd-16mb (mb/s)","1412.28 (min 1254.12, max 1571.86)" - "bw_mem-frd-1mb (mb/s)","1117.35 (min 767.75, max 1527.01)" - "bw_mem-frd-2mb (mb/s)","1119.11 (min 767.46, max 1539.94)" - "bw_mem-frd-4mb (mb/s)","1144.37 (min 742.67, max 1557.33)" - "bw_mem-frd-8mb (mb/s)","1161.00 (min 800.48, max 1572.02)" - "bw_mem-fwr-16mb (mb/s)","2441.13 (min 2120.89, max 2737.85)" - "bw_mem-fwr-1mb (mb/s)","1993.66 (min 1208.77, max 2954.21)" - "bw_mem-fwr-2mb (mb/s)","1947.01 (min 1216.92, max 2828.85)" - "bw_mem-fwr-4mb (mb/s)","1937.10 (min 1219.70, max 2781.64)" - "bw_mem-fwr-8mb (mb/s)","1934.21 (min 1245.91, max 2755.77)" - "bw_mem-rd-16mb (mb/s)","1425.70 (min 1267.63, max 1576.67)" - "bw_mem-rd-1mb (mb/s)","1017.79 (min 520.56, max 1563.04)" - "bw_mem-rd-2mb (mb/s)","1013.96 (min 514.87, max 1562.26)" - "bw_mem-rd-4mb (mb/s)","1054.25 (min 594.71, max 1573.56)" - "bw_mem-rd-8mb (mb/s)","1097.67 (min 678.20, max 1575.11)" - "bw_mem-rdwr-16mb (mb/s)","795.82 (min 678.22, max 938.80)" - "bw_mem-rdwr-1mb (mb/s)","548.03 (min 397.93, max 769.82)" - "bw_mem-rdwr-2mb (mb/s)","533.22 (min 396.47, max 744.32)" - "bw_mem-rdwr-4mb (mb/s)","585.02 (min 419.77, max 796.89)" - "bw_mem-rdwr-8mb (mb/s)","621.08 (min 440.72, max 865.33)" - "bw_mem-wr-16mb (mb/s)","815.25 (min 709.75, max 917.80)" - "bw_mem-wr-1mb (mb/s)","630.18 (min 520.56, max 769.82)" - "bw_mem-wr-2mb (mb/s)","617.21 (min 505.50, max 744.32)" - "bw_mem-wr-4mb (mb/s)","689.76 (min 592.33, max 827.22)" - "bw_mem-wr-8mb (mb/s)","753.35 (min 623.59, max 876.71)" - "bw_mmap_rd-mo-1mb (mb/s)","1316.12 (min 1163.76, max 1486.16)" - "bw_mmap_rd-o2c-1mb (mb/s)","501.44 (min 449.51, max 560.70)" - "bw_pipe (mb/s)","451.18 (min 373.01, max 509.56)" - "bw_unix (mb/s)","477.67 (min 424.53, max 533.19)" - "lat_connect (us)","70.44 (min 66.29, max 74.05)" - "lat_ctx-2-128k (us)","14.18 (min 10.78, max 18.24)" - "lat_ctx-2-256k (us)","25.92 (min 17.18, 
max 33.03)" - "lat_ctx-4-128k (us)","15.49 (min 11.20, max 18.76)" - "lat_ctx-4-256k (us)","11.87 (min 2.03, max 17.07)" - "lat_fs-0k (num_files)","196.75 (min 184.00, max 207.00)" - "lat_fs-10k (num_files)","88.13 (min 80.00, max 95.00)" - "lat_fs-1k (num_files)","131.13 (min 117.00, max 140.00)" - "lat_fs-4k (num_files)","131.50 (min 116.00, max 140.00)" - "lat_mem_rd-stride128-sz1000k (ns)","47.61 (min 42.75, max 52.39)" - "lat_mem_rd-stride128-sz125k (ns)","6.19 (min 6.17, max 6.24)" - "lat_mem_rd-stride128-sz250k (ns)","11.95 (min 9.14, max 16.02)" - "lat_mem_rd-stride128-sz31k (ns)","3.78 (min 2.42, max 4.44)" + "af_unix_sock_stream_latency (microsec)","33.14 (min 32.70, max 34.50)" + "af_unix_socket_stream_bandwidth (mb\s)","458.31 (min 416.22, max 548.49)" + "bw_file_rd-io-1mb (mb/s)","971.18 (min 906.62, max 1128.85)" + "bw_file_rd-o2c-1mb (mb/s)","515.41 (min 508.13, max 525.95)" + "bw_mem-bcopy-16mb (mb/s)","742.11 (min 704.91, max 849.57)" + "bw_mem-bcopy-1mb (mb/s)","755.61 (min 687.76, max 942.68)" + "bw_mem-bcopy-2mb (mb/s)","748.93 (min 681.43, max 958.47)" + "bw_mem-bcopy-4mb (mb/s)","781.73 (min 727.40, max 944.73)" + "bw_mem-bcopy-8mb (mb/s)","801.94 (min 738.69, max 994.53)" + "bw_mem-bzero-16mb (mb/s)","2250.16 (min 2104.16, max 2805.54)" + "bw_mem-bzero-1mb (mb/s)","1502.54 (min 687.76, max 2800.63)" + "bw_mem-bzero-2mb (mb/s)","1499.05 (min 681.43, max 2807.02)" + "bw_mem-bzero-4mb (mb/s)","1516.48 (min 727.40, max 2806.03)" + "bw_mem-bzero-8mb (mb/s)","1526.92 (min 738.69, max 2807.02)" + "bw_mem-cp-16mb (mb/s)","422.87 (min 397.28, max 517.95)" + "bw_mem-cp-1mb (mb/s)","1450.86 (min 401.50, max 3062.20)" + "bw_mem-cp-2mb (mb/s)","1387.71 (min 399.24, max 2898.03)" + "bw_mem-cp-4mb (mb/s)","1383.65 (min 434.12, max 2868.93)" + "bw_mem-cp-8mb (mb/s)","1376.95 (min 436.56, max 2827.85)" + "bw_mem-fcp-16mb (mb/s)","751.75 (min 710.13, max 879.75)" + "bw_mem-fcp-1mb (mb/s)","1538.99 (min 777.24, max 2800.63)" + "bw_mem-fcp-2mb (mb/s)","1534.98 
(min 762.92, max 2807.02)" + "bw_mem-fcp-4mb (mb/s)","1547.58 (min 788.72, max 2806.03)" + "bw_mem-fcp-8mb (mb/s)","1556.02 (min 804.67, max 2807.02)" + "bw_mem-frd-16mb (mb/s)","1328.40 (min 1227.75, max 1609.50)" + "bw_mem-frd-1mb (mb/s)","1057.89 (min 777.24, max 1525.94)" + "bw_mem-frd-2mb (mb/s)","1063.22 (min 762.92, max 1550.87)" + "bw_mem-frd-4mb (mb/s)","1080.32 (min 788.72, max 1555.81)" + "bw_mem-frd-8mb (mb/s)","1093.89 (min 804.67, max 1611.60)" + "bw_mem-fwr-16mb (mb/s)","2270.76 (min 2123.71, max 2819.38)" + "bw_mem-fwr-1mb (mb/s)","1876.87 (min 1218.45, max 3062.20)" + "bw_mem-fwr-2mb (mb/s)","1828.62 (min 1203.61, max 2898.03)" + "bw_mem-fwr-4mb (mb/s)","1809.91 (min 1247.47, max 2868.93)" + "bw_mem-fwr-8mb (mb/s)","1802.83 (min 1250.00, max 2827.85)" + "bw_mem-rd-16mb (mb/s)","1345.30 (min 1264.92, max 1616.65)" + "bw_mem-rd-1mb (mb/s)","953.97 (min 525.76, max 1599.43)" + "bw_mem-rd-2mb (mb/s)","940.68 (min 511.31, max 1592.61)" + "bw_mem-rd-4mb (mb/s)","978.01 (min 513.68, max 1601.71)" + "bw_mem-rd-8mb (mb/s)","1032.26 (min 681.02, max 1605.14)" + "bw_mem-rdwr-16mb (mb/s)","732.31 (min 663.63, max 858.23)" + "bw_mem-rdwr-1mb (mb/s)","503.57 (min 401.50, max 680.27)" + "bw_mem-rdwr-2mb (mb/s)","494.06 (min 399.24, max 692.28)" + "bw_mem-rdwr-4mb (mb/s)","553.67 (min 434.12, max 778.21)" + "bw_mem-rdwr-8mb (mb/s)","585.97 (min 436.56, max 857.72)" + "bw_mem-wr-16mb (mb/s)","763.43 (min 702.83, max 927.75)" + "bw_mem-wr-1mb (mb/s)","573.83 (min 525.76, max 686.34)" + "bw_mem-wr-2mb (mb/s)","559.79 (min 507.29, max 692.28)" + "bw_mem-wr-4mb (mb/s)","633.10 (min 513.68, max 800.24)" + "bw_mem-wr-8mb (mb/s)","708.78 (min 627.60, max 871.93)" + "bw_mmap_rd-mo-1mb (mb/s)","1245.57 (min 1156.29, max 1501.22)" + "bw_mmap_rd-o2c-1mb (mb/s)","509.91 (min 505.22, max 519.21)" + "bw_pipe (mb/s)","426.35 (min 382.91, max 518.60)" + "bw_unix (mb/s)","458.31 (min 416.22, max 548.49)" + "lat_connect (us)","72.81 (min 71.39, max 76.51)" + "lat_ctx-2-128k 
(us)","17.46 (min 11.52, max 25.12)" + "lat_ctx-2-256k (us)","31.42 (min 26.43, max 34.63)" + "lat_ctx-4-128k (us)","15.70 (min 12.41, max 17.36)" + "lat_ctx-4-256k (us)","8.13 (min 0.00, max 16.57)" + "lat_fs-0k (num_files)","198.17 (min 189.00, max 213.00)" + "lat_fs-10k (num_files)","84.33 (min 76.00, max 90.00)" + "lat_fs-1k (num_files)","127.00 (min 113.00, max 140.00)" + "lat_fs-4k (num_files)","128.17 (min 119.00, max 134.00)" + "lat_mem_rd-stride128-sz1000k (ns)","49.98 (min 41.71, max 52.46)" + "lat_mem_rd-stride128-sz125k (ns)","6.19 (min 6.16, max 6.22)" + "lat_mem_rd-stride128-sz250k (ns)","13.46 (min 6.99, max 21.17)" + "lat_mem_rd-stride128-sz31k (ns)","3.59 (min 2.42, max 4.45)" "lat_mem_rd-stride128-sz50 (ns)","2.40 (min 2.40, max 2.41)" - "lat_mem_rd-stride128-sz500k (ns)","43.36 (min 37.83, max 47.82)" - "lat_mem_rd-stride128-sz62k (ns)","5.64 (min 4.95, max 5.76)" - "lat_mmap-1m (us)","60.38 (min 57.00, max 68.00)" + "lat_mem_rd-stride128-sz500k (ns)","45.07 (min 38.07, max 48.16)" + "lat_mem_rd-stride128-sz62k (ns)","5.74 (min 5.72, max 5.75)" + "lat_mmap-1m (us)","59.83 (min 57.00, max 70.00)" "lat_ops-double-add (ns)","3.21" "lat_ops-double-div (ns)","17.65 (min 17.64, max 17.66)" - "lat_ops-double-mul (ns)","3.21" + "lat_ops-double-mul (ns)","3.21 (min 3.21, max 3.22)" "lat_ops-float-add (ns)","3.21" - "lat_ops-float-div (ns)","10.43 (min 10.43, max 10.44)" + "lat_ops-float-div (ns)","10.43 (min 10.42, max 10.43)" "lat_ops-float-mul (ns)","3.21" "lat_ops-int-add (ns)","0.80" "lat_ops-int-bit (ns)","0.53" "lat_ops-int-div (ns)","4.82 (min 4.81, max 4.82)" "lat_ops-int-mod (ns)","5.08 (min 5.08, max 5.09)" - "lat_ops-int-mul (ns)","3.48 (min 3.44, max 3.51)" + "lat_ops-int-mul (ns)","3.45 (min 3.44, max 3.46)" "lat_ops-int64-add (ns)","0.80" "lat_ops-int64-bit (ns)","0.53 (min 0.53, max 0.54)" - "lat_ops-int64-div (ns)","7.62 (min 7.62, max 7.63)" + "lat_ops-int64-div (ns)","7.62" "lat_ops-int64-mod (ns)","5.88 (min 5.88, max 5.89)" - 
"lat_ops-int64-mul (ns)","3.99 (min 3.98, max 3.99)" - "lat_pagefault (us)","0.90 (min 0.83, max 0.99)" - "lat_pipe (us)","26.34 (min 25.59, max 27.41)" - "lat_proc-exec (us)","1394.59 (min 1262.00, max 1528.25)" - "lat_proc-fork (us)","1229.03 (min 1120.80, max 1349.80)" + "lat_ops-int64-mul (ns)","3.99 (min 3.98, max 4.04)" + "lat_pagefault (us)","0.93 (min 0.81, max 0.98)" + "lat_pipe (us)","26.36 (min 24.71, max 27.33)" + "lat_proc-exec (us)","1447.93 (min 1267.60, max 1563.25)" + "lat_proc-fork (us)","1269.68 (min 1094.20, max 1328.60)" "lat_proc-proccall (us)","0.01" - "lat_select (us)","38.25 (min 38.05, max 38.51)" - "lat_sem (us)","3.97 (min 3.64, max 4.35)" - "lat_sig-catch (us)","6.05 (min 5.87, max 6.26)" - "lat_sig-install (us)","0.72 (min 0.72, max 0.74)" - "lat_sig-prot (us)","0.62 (min 0.57, max 0.67)" - "lat_syscall-fstat (us)","2.25 (min 2.18, max 2.38)" - "lat_syscall-null (us)","0.52 (min 0.51, max 0.53)" - "lat_syscall-open (us)","493.24 (min 374.64, max 590.10)" - "lat_syscall-read (us)","0.91 (min 0.88, max 0.92)" - "lat_syscall-stat (us)","5.40 (min 5.27, max 5.67)" - "lat_syscall-write (us)","0.87 (min 0.83, max 0.91)" - "lat_tcp (us)","1.05 (min 1.02, max 1.10)" - "lat_unix (us)","33.32 (min 32.78, max 34.30)" - "latency_for_0.50_mb_block_size (nanosec)","43.36 (min 37.83, max 47.82)" - "latency_for_1.00_mb_block_size (nanosec)","23.80 (min 0.00, max 52.39)" - "pipe_bandwidth (mb\s)","451.18 (min 373.01, max 509.56)" - "pipe_latency (microsec)","26.34 (min 25.59, max 27.41)" + "lat_select (us)","38.21 (min 38.12, max 38.41)" + "lat_sem (us)","4.12 (min 3.74, max 4.31)" + "lat_sig-catch (us)","6.22 (min 6.07, max 6.38)" + "lat_sig-install (us)","0.74 (min 0.72, max 0.78)" + "lat_sig-prot (us)","0.69 (min 0.49, max 0.88)" + "lat_syscall-fstat (us)","2.20 (min 2.12, max 2.31)" + "lat_syscall-null (us)","0.51 (min 0.51, max 0.52)" + "lat_syscall-open (us)","403.50 (min 362.00, max 459.33)" + "lat_syscall-read (us)","0.91 (min 0.90, max 0.91)" 
+ "lat_syscall-stat (us)","5.41 (min 5.23, max 5.60)" + "lat_syscall-write (us)","0.86 (min 0.84, max 0.88)" + "lat_tcp (us)","1.02" + "lat_unix (us)","33.14 (min 32.70, max 34.50)" + "latency_for_0.50_mb_block_size (nanosec)","45.07 (min 38.07, max 48.16)" + "latency_for_1.00_mb_block_size (nanosec)","24.99 (min 0.00, max 52.46)" + "pipe_bandwidth (mb/s)","426.35 (min 382.91, max 518.60)" + "pipe_latency (microsec)","26.36 (min 24.71, max 27.33)" "procedure_call (microsec)","0.01" - "select_on_200_tcp_fds (microsec)","38.25 (min 38.05, max 38.51)" - "semaphore_latency (microsec)","3.97 (min 3.64, max 4.35)" - "signal_handler_latency (microsec)","0.72 (min 0.72, max 0.74)" - "signal_handler_overhead (microsec)","6.05 (min 5.87, max 6.26)" - "tcp_ip_connection_cost_to_localhost (microsec)","70.44 (min 66.29, max 74.05)" - "tcp_latency_using_localhost (microsec)","1.05 (min 1.02, max 1.10)" - - + "select_on_200_tcp_fds (microsec)","38.21 (min 38.12, max 38.41)" + "semaphore_latency (microsec)","4.12 (min 3.74, max 4.31)" + "signal_handler_latency (microsec)","0.74 (min 0.72, max 0.78)" + "signal_handler_overhead (microsec)","6.22 (min 6.07, max 6.38)" + "tcp_ip_connection_cost_to_localhost (microsec)","72.81 (min 71.39, max 76.51)" + "tcp_latency_using_localhost (microsec)","1.02" Dhrystone -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^^^ Dhrystone is a core only benchmark that runs from warm L1 caches in all modern processors. It scales linearly with clock speed. @@ -191,7 +189,6 @@ Please take note, different run may produce different slightly results. This is advised to run this test multiple times in order to get maximum performance numbers.
- Execute the benchmark with the following: :: @@ -202,13 +199,11 @@ Execute the benchmark with the following: :header: "Benchmarks","am62lxx_evm-fs: perf" "cpu_clock (mhz)","400.00" - "dhrystone_per_mhz (dmips/mhz)","9.03 (min 8.90, max 9.20)" - "dhrystone_per_second (dhrystonep)","6339605.78 (min 6250000.00, max 6451613.00)" - - + "dhrystone_per_mhz (dmips/mhz)","8.90" + "dhrystone_per_second (dhrystonep)","6250000.00" Whetstone -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^^^ Whetstone is a benchmark primarily measuring floating-point arithmetic performance. Execute the benchmark with the following: @@ -220,24 +215,20 @@ Execute the benchmark with the following: .. csv-table:: Whetstone Benchmarks :header: "Benchmarks","am62lxx_evm-fs: perf" - "whetstone (mips)","5625.00 (min 5000.00, max 10000.00)" - - + "whetstone (mips)","5833.33 (min 5000.00, max 10000.00)" Linpack -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^ Linpack measures peak double precision (64 bit) floating point performance in solving a dense linear system. .. csv-table:: Linpack Benchmarks :header: "Benchmarks","am62lxx_evm-fs: perf" - "linpack (kflops)","513526.67 (min 511598.00, max 515322.00)" - - + "linpack (kflops)","515149.67 (min 514088.00, max 516563.00)" NBench -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^ NBench which stands for Native Benchmark is used to measure macro benchmarks for commonly used operations such as sorting and analysis algorithms. More information about NBench at @@ -247,20 +238,18 @@ https://nbench.io/articles/index.html .. 
csv-table:: NBench Benchmarks :header: "Benchmarks","am62lxx_evm-fs: perf" - "assignment (iterations)","12.93 (min 12.89, max 12.97)" - "fourier (iterations)","20382.13 (min 20379.00, max 20384.00)" - "fp_emulation (iterations)","192.44 (min 192.37, max 192.47)" - "huffman (iterations)","1057.10 (min 1056.70, max 1057.30)" - "idea (iterations)","3075.39 (min 3075.10, max 3075.60)" - "lu_decomposition (iterations)","472.38 (min 471.18, max 473.82)" - "neural_net (iterations)","7.72 (min 7.69, max 7.73)" - "numeric_sort (iterations)","559.37 (min 555.24, max 561.74)" - "string_sort (iterations)","146.37 (min 146.34, max 146.39)" - - + "assignment (iterations)","12.95 (min 12.90, max 12.97)" + "fourier (iterations)","20382.00 (min 20379.00, max 20384.00)" + "fp_emulation (iterations)","192.40 (min 192.33, max 192.47)" + "huffman (iterations)","1057.02 (min 1056.80, max 1057.20)" + "idea (iterations)","3075.14 (min 3074.90, max 3075.50)" + "lu_decomposition (iterations)","473.43 (min 470.10, max 479.32)" + "neural_net (iterations)","7.73 (min 7.72, max 7.73)" + "numeric_sort (iterations)","558.36 (min 555.56, max 562.43)" + "string_sort (iterations)","146.38 (min 146.36, max 146.39)" Stream -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^ STREAM is a microbenchmark for measuring data memory system performance without any data reuse. It is designed to miss on caches and exercise data prefetcher and speculative accesses. @@ -280,16 +269,13 @@ Execute the benchmark with the following: .. 
csv-table:: Stream Benchmarks :header: "Benchmarks","am62lxx_evm-fs: perf" - "add (mb/s)","1814.33 (min 1507.90, max 1859.50)" - "copy (mb/s)","1907.35 (min 1562.40, max 1976.20)" - "scale (mb/s)","2009.28 (min 1651.30, max 2080.60)" - "triad (mb/s)","1792.49 (min 1490.60, max 1837.30)" - - - + "add (mb/s)","1651.55 (min 1501.10, max 1914.10)" + "copy (mb/s)","1735.32 (min 1565.10, max 2033.20)" + "scale (mb/s)","1830.72 (min 1641.00, max 2134.40)" + "triad (mb/s)","1632.43 (min 1491.50, max 1888.40)" CoreMarkPro -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^^^^^ CoreMark®-Pro is a comprehensive, advanced processor benchmark that works with and enhances the market-proven industry-standard EEMBC CoreMark® benchmark. While CoreMark stresses the CPU pipeline, CoreMark-Pro tests the entire processor, @@ -300,37 +286,33 @@ and floating-point workloads, and data sets for utilizing larger memory subsyste .. csv-table:: CoreMarkPro Benchmarks :header: "Benchmarks","am62lxx_evm-fs: perf" - "cjpeg-rose7-preset (workloads/)","37.24 (min 37.04, max 37.45)" + "cjpeg-rose7-preset (workloads/)","37.22 (min 37.04, max 37.31)" "core (workloads/)","0.27" - "coremark-pro ()","714.25 (min 680.43, max 728.34)" - "linear_alg-mid-100x100-sp (workloads/)","13.09 (min 13.07, max 13.10)" - "loops-all-mid-10k-sp (workloads/)","0.58 (min 0.56, max 0.59)" + "coremark-pro ()","705.20 (min 686.04, max 730.09)" + "linear_alg-mid-100x100-sp (workloads/)","13.09 (min 13.06, max 13.11)" + "loops-all-mid-10k-sp (workloads/)","0.57 (min 0.56, max 0.60)" "nnet_test (workloads/)","0.97" - "parser-125k (workloads/)","6.42 (min 5.24, max 7.04)" - "radix2-big-64k (workloads/)","20.92 (min 18.16, max 22.04)" - "sha-test (workloads/)","71.77 (min 69.44, max 72.46)" - "zip-test (workloads/)","19.19 (min 18.87, max 19.61)" - - + "parser-125k (workloads/)","6.35 (min 5.62, max 6.99)" + "radix2-big-64k (workloads/)","19.56 (min 17.06, max 22.07)" + "sha-test (workloads/)","71.11 (min 69.93, max 72.46)" + "zip-test 
(workloads/)","18.99 (min 18.52, max 19.61)" .. csv-table:: CoreMarkProTwoCore Benchmarks :header: "Benchmarks","am62lxx_evm-fs: perf" - "cjpeg-rose7-preset (workloads/)","73.00 (min 71.94, max 73.53)" - "core (workloads/)","0.54" - "coremark-pro ()","1227.03 (min 1186.04, max 1267.74)" - "linear_alg-mid-100x100-sp (workloads/)","26.06 (min 25.92, max 26.14)" - "loops-all-mid-10k-sp (workloads/)","1.03 (min 0.99, max 1.08)" + "cjpeg-rose7-preset (workloads/)","72.89 (min 71.94, max 74.07)" + "core (workloads/)","0.54 (min 0.53, max 0.54)" + "coremark-pro ()","1226.57 (min 1185.87, max 1277.14)" + "linear_alg-mid-100x100-sp (workloads/)","26.03 (min 25.97, max 26.11)" + "loops-all-mid-10k-sp (workloads/)","1.03 (min 1.00, max 1.07)" "nnet_test (workloads/)","1.93 (min 1.93, max 1.94)" - "parser-125k (workloads/)","6.48 (min 5.78, max 7.22)" - "radix2-big-64k (workloads/)","28.01 (min 24.43, max 32.16)" - "sha-test (workloads/)","140.88 (min 136.99, max 142.86)" - "zip-test (workloads/)","34.23 (min 32.79, max 36.36)" - - + "parser-125k (workloads/)","6.48 (min 5.81, max 7.33)" + "radix2-big-64k (workloads/)","28.39 (min 25.03, max 31.84)" + "sha-test (workloads/)","140.47 (min 138.89, max 142.86)" + "zip-test (workloads/)","34.17 (min 32.26, max 35.71)" MultiBench -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^^^^ MultiBench™ is a suite of benchmarks that allows processor and system designers to analyze, test, and improve multicore processors. It uses three forms of concurrency: Data decomposition: multiple threads cooperating on achieving a unified goal and @@ -349,272 +331,107 @@ thread-enabled workloads to be tested. .. 
csv-table:: Multibench Benchmarks :header: "Benchmarks","am62lxx_evm-fs: perf" - "4m-check (workloads/)","280.25 (min 263.49, max 314.58)" - "4m-check-reassembly (workloads/)","56.17 (min 52.44, max 64.10)" - "4m-check-reassembly-tcp (workloads/)","36.29 (min 34.34, max 40.92)" - "4m-check-reassembly-tcp-cmykw2-rotatew2 (workloads/)","15.99 (min 15.14, max 17.81)" - "4m-check-reassembly-tcp-x264w2 (workloads/)","0.92 (min 0.89, max 0.95)" - "4m-cmykw2 (workloads/)","109.32 (min 107.64, max 111.79)" - "4m-cmykw2-rotatew2 (workloads/)","20.95 (min 19.16, max 24.17)" - "4m-reassembly (workloads/)","51.98 (min 48.40, max 60.06)" - "4m-rotatew2 (workloads/)","20.48 (min 18.58, max 22.06)" - "4m-tcp-mixed (workloads/)","99.60 (min 98.16, max 104.58)" + "4m-check (workloads/)","288.19 (min 268.24, max 314.90)" + "4m-check-reassembly (workloads/)","57.34 (min 52.49, max 63.94)" + "4m-check-reassembly-tcp (workloads/)","36.65 (min 34.01, max 40.39)" + "4m-check-reassembly-tcp-cmykw2-rotatew2 (workloads/)","16.34 (min 15.28, max 18.05)" + "4m-check-reassembly-tcp-x264w2 (workloads/)","0.93 (min 0.91, max 0.95)" + "4m-cmykw2 (workloads/)","109.44 (min 107.88, max 112.05)" + "4m-cmykw2-rotatew2 (workloads/)","21.20 (min 19.46, max 23.21)" + "4m-reassembly (workloads/)","52.91 (min 49.41, max 58.24)" + "4m-rotatew2 (workloads/)","21.26 (min 19.25, max 23.63)" + "4m-tcp-mixed (workloads/)","95.76 (min 93.02, max 98.16)" "4m-x264w2 (workloads/)","0.94 (min 0.93, max 0.96)" "empty-wld (workloads/)","1.00" - "idct-4m (workloads/)","16.93 (min 16.59, max 17.09)" - "idct-4mw1 (workloads/)","16.93 (min 16.61, max 17.10)" - "ippktcheck-4m (workloads/)","280.55 (min 264.63, max 314.55)" - "ippktcheck-4mw1 (workloads/)","279.72 (min 264.05, max 312.77)" - "ipres-4m (workloads/)","66.59 (min 62.32, max 76.26)" - "ipres-4mw1 (workloads/)","66.74 (min 62.21, max 77.16)" - "md5-4m (workloads/)","18.51 (min 17.80, max 20.26)" - "md5-4mw1 (workloads/)","18.76 (min 18.18, max 19.69)" - 
"rgbcmyk-4m (workloads/)","56.72 (min 56.23, max 57.41)" - "rgbcmyk-4mw1 (workloads/)","56.78 (min 56.32, max 57.29)" - "rotate-4ms1 (workloads/)","18.75 (min 17.48, max 21.19)" - "rotate-4ms1w1 (workloads/)","18.66 (min 17.66, max 20.72)" - "rotate-4ms64 (workloads/)","18.80 (min 17.77, max 20.95)" - "rotate-4ms64w1 (workloads/)","19.06 (min 17.84, max 22.76)" + "idct-4m (workloads/)","16.97 (min 16.90, max 17.08)" + "idct-4mw1 (workloads/)","16.97 (min 16.89, max 17.09)" + "ippktcheck-4m (workloads/)","288.16 (min 267.84, max 314.11)" + "ippktcheck-4mw1 (workloads/)","287.54 (min 267.58, max 312.77)" + "ipres-4m (workloads/)","68.41 (min 62.50, max 76.69)" + "ipres-4mw1 (workloads/)","68.31 (min 62.47, max 76.18)" + "md5-4m (workloads/)","18.99 (min 17.91, max 20.68)" + "md5-4mw1 (workloads/)","19.11 (min 18.16, max 20.15)" + "rgbcmyk-4m (workloads/)","56.70 (min 56.45, max 57.08)" + "rgbcmyk-4mw1 (workloads/)","56.64 (min 56.32, max 57.01)" + "rotate-4ms1 (workloads/)","19.37 (min 17.85, max 20.73)" + "rotate-4ms1w1 (workloads/)","19.04 (min 17.85, max 20.74)" + "rotate-4ms64 (workloads/)","19.51 (min 18.04, max 22.62)" + "rotate-4ms64w1 (workloads/)","19.33 (min 18.01, max 21.44)" "x264-4mq (workloads/)","0.50 (min 0.50, max 0.51)" - "x264-4mqw1 (workloads/)","0.50 (min 0.50, max 0.51)" - - + "x264-4mqw1 (workloads/)","0.50 (min 0.49, max 0.51)" Boot-time Measurement --------------------- - Boot media: MMCSD ^^^^^^^^^^^^^^^^^ .. csv-table:: Linux boot time MMCSD :header: "Boot Configuration","am62lxx_evm-fs: Boot time in seconds: avg(min,max)" - "Linux boot time from SD with default rootfs (20 boot cycles)","19.88 (min 17.98, max 25.20)" - - + "Linux boot time from SD with default rootfs (20 boot cycles)","19.01 (min 17.68, max 27.66)" Boot time numbers [avg, min, max] are measured from "Starting kernel" to Linux prompt across 20 boot cycles. - | ALSA SoC Audio Driver -------------------------- +--------------------- #. Access type - RW\_INTERLEAVED #. 
Channels - 2 #. Format - S16\_LE #. Period size - 64 - .. csv-table:: Audio Capture :header: "Sampling Rate (Hz)","am62lxx_evm-fs: Throughput (bits/sec)","am62lxx_evm-fs: CPU Load (%)" - "11025","352796.09 (min 352795.00, max 352799.00)","0.30 (min 0.23, max 0.48)" - "16000","511995.18 (min 511993.00, max 511999.00)","0.32 (min 0.20, max 0.55)" - "22050","705582.36 (min 705523.00, max 705596.00)","0.33 (min 0.28, max 0.37)" - "24000","705590.73 (min 705588.00, max 705596.00)","0.38 (min 0.34, max 0.43)" - "32000","1023987.82 (min 1023985.00, max 1023995.00)","0.40 (min 0.21, max 1.18)" - "44100","1411159.45 (min 1410927.00, max 1411193.00)","0.50 (min 0.43, max 0.56)" - "48000","1535980.91 (min 1535976.00, max 1535992.00)","0.75 (min 0.42, max 2.97)" - "88200","2822264.91 (min 2821350.00, max 2822376.00)","0.98 (min 0.86, max 1.08)" - "96000","3071944.73 (min 3071933.00, max 3071967.00)","0.66 (min 0.30, max 3.07)" - - - + "11025","352795.83 (min 352795.00, max 352797.00)","0.38 (min 0.29, max 0.48)" + "16000","511995.00 (min 511994.00, max 511996.00)","0.35 (min 0.20, max 0.79)" + "22050","705589.67 (min 705586.00, max 705594.00)","0.40 (min 0.30, max 0.53)" + "24000","705591.50 (min 705589.00, max 705595.00)","0.47 (min 0.37, max 0.60)" + "32000","1023987.83 (min 1023985.00, max 1023991.00)","0.30 (min 0.21, max 0.40)" + "44100","1411182.17 (min 1411179.00, max 1411186.00)","0.59 (min 0.50, max 0.72)" + "48000","1535980.33 (min 1535976.00, max 1535985.00)","0.91 (min 0.23, max 1.56)" + "88200","2822355.00 (min 2822349.00, max 2822363.00)","1.09 (min 0.93, max 1.20)" + "96000","3071938.67 (min 3071934.00, max 3071943.00)","1.22 (min 0.39, max 3.19)" .. 
csv-table:: Audio Playback :header: "Sampling Rate (Hz)","am62lxx_evm-fs: Throughput (bits/sec)","am62lxx_evm-fs: CPU Load (%)" - "11025","352943.67 (min 352942.00, max 352947.00)","0.31 (min 0.21, max 0.44)" - "16000","512209.17 (min 512205.00, max 512214.00)","0.26 (min 0.17, max 0.37)" - "22050","705876.08 (min 705834.00, max 705889.00)","0.30 (min 0.24, max 0.39)" - "24000","705886.42 (min 705884.00, max 705891.00)","0.35 (min 0.29, max 0.43)" - "32000","1024416.42 (min 1024413.00, max 1024424.00)","0.31 (min 0.21, max 0.69)" - "44100","1411742.25 (min 1411579.00, max 1411784.00)","0.43 (min 0.38, max 0.51)" - "48000","1536623.92 (min 1536619.00, max 1536636.00)","0.60 (min 0.41, max 0.92)" - "88200","2823412.83 (min 2822773.00, max 2823559.00)","0.80 (min 0.73, max 0.91)" - "96000","3073230.64 (min 3073221.00, max 3073254.00)","0.73 (min 0.29, max 2.03)" - - -| - -Ethernet ------------------ -Ethernet performance benchmarks were measured using Netperf 2.7.1 https://hewlettpackard.github.io/netperf/doc/netperf.html -Test procedures were modeled after those defined in RFC-2544: -https://tools.ietf.org/html/rfc2544, where the DUT is the TI device -and the "tester" used was a Linux PC. To produce consistent results, -it is recommended to carry out performance tests in a private network and to avoid -running NFS on the same interface used in the test. In these results, -CPU utilization was captured as the total percentage used across all cores on the device, -while running the performance test over one external interface. - -UDP Throughput (0% loss) was measured by the procedure defined in RFC-2544 section 26.1: Throughput. -In this scenario, netperf options burst_size (-b) and wait_time (-w) are used to limit bandwidth -during different trials of the test, with the goal of finding the highest rate at which -no loss is seen. 
For example, to limit bandwidth to 500Mbits/sec with 1472B datagram: - -:: - - burst_size = / 8 (bits -> bytes) / / 100 (seconds -> 10 ms) - burst_size = 500000000 / 8 / 1472 / 100 = 425 - - wait_time = 10 milliseconds (minimum supported by Linux PC used for testing) - -UDP Throughput (possible loss) was measured by capturing throughput and packet loss statistics when -running the netperf test with no bandwidth limit (remove -b/-w options). - -In order to start a netperf client on one device, the other device must have netserver running. -To start netserver: - -:: - - netserver [-p ] [-4 (IPv4 addressing)] [-6 (IPv6 addressing)] - -Running the following shell script from the DUT will trigger netperf clients to measure -bidirectional TCP performance for 60 seconds and report CPU utilization. Parameter -k is used in -client commands to summarize selected statistics on their own line and -j is used to gain -additional timing measurements during the test. - -:: - - #!/bin/bash - for i in 1 - do - netperf -H -j -c -l 60 -t TCP_STREAM -- - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE & - - netperf -H -j -c -l 60 -t TCP_MAERTS -- - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE & - done - -Running the following commands will trigger netperf clients to measure UDP burst performance for -60 seconds at various burst/datagram sizes and report CPU utilization. - -- For UDP egress tests, run netperf client from DUT and start netserver on tester. - -:: - - netperf -H -j -c -l 60 -t UDP_STREAM -b -w -- -m - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE - -- For UDP ingress tests, run netperf client from tester and start netserver on DUT. 
- -:: - - netperf -H -j -C -l 60 -t UDP_STREAM -b -w -- -m - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE - - -CPSW/CPSW2g/CPSW3g Ethernet Driver -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - - -.. rubric:: TCP Bidirectional Throughput - :name: CPSW2g-tcp-bidirectional-throughput - -.. csv-table:: CPSW2g TCP Bidirectional Throughput - :header: "Command Used","am62lxx_evm-fs: THROUGHPUT (Mbits/sec)","am62lxx_evm-fs: CPU Load % (LOCAL_CPU_UTIL)" - - "netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_STREAM; netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_MAERTS","932.42 (min 315.68, max 1272.81)","85.10 (min 47.92, max 100.00)" - - - - -.. rubric:: TCP Bidirectional Throughput Interrupt Pacing - :name: CPSW2g-tcp-bidirectional-throughput-interrupt-pacing - -.. csv-table:: CPSW2g TCP Bidirectional Throughput Interrupt Pacing - :header: "Command Used","am62lxx_evm-fs: THROUGHPUT (Mbits/sec)","am62lxx_evm-fs: CPU Load % (LOCAL_CPU_UTIL)" - - "netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_STREAM; netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_MAERTS","1224.89 (min 1089.90, max 1387.62)","97.80 (min 92.06, max 99.99)" - - - - -.. rubric:: UDP Throughput - :name: CPSW2g-udp-throughput-0-loss - -.. 
csv-table:: CPSW2g UDP Egress Throughput 0 loss - :header: "Frame Size(bytes)","am62lxx_evm-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62lxx_evm-fs: THROUGHPUT (Mbits/sec)","am62lxx_evm-fs: Packets Per Second (kPPS)","am62lxx_evm-fs: CPU Load % (LOCAL_CPU_UTIL)" - - "64","18.00","41.92 (min 12.23, max 49.53)","91.38 (min 85.00, max 97.00)","81.74 (min 79.77, max 84.67)" - "128","82.00","86.33 (min 50.77, max 97.64)","89.45 (min 77.00, max 95.00)","75.62 (min 50.37, max 83.33)" - "256","210.00","171.57 (min 139.16, max 189.82)","86.25 (min 78.00, max 93.00)","75.94 (min 50.62, max 82.88)" - "1024","978.00","488.10 (min 181.00, max 683.63)","60.10 (min 22.00, max 83.00)","62.42 (min 26.04, max 79.88)" - "1518","1472.00","712.23 (min 653.18, max 870.48)","59.00 (min 54.00, max 74.00)","74.48 (min 72.13, max 80.78)" - - - - -.. csv-table:: CPSW2g UDP Ingress Throughput 0 loss - :header: "Frame Size(bytes)","am62lxx_evm-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62lxx_evm-fs: THROUGHPUT (Mbits/sec)","am62lxx_evm-fs: Packets Per Second (kPPS)","am62lxx_evm-fs: CPU Load % (LOCAL_CPU_UTIL)" - - "64","","2.55 (min 2.15, max 3.33)","5.00 (min 4.00, max 7.00)","4.77 (min 3.83, max 6.57)" - "128","82.00","5.99 (min 4.10, max 7.68)","6.33 (min 4.00, max 8.00)","3.40 (min 1.92, max 6.28)" - "256","210.00","12.24 (min 1.02, max 15.36)","6.09 (min 0.00, max 8.00)","4.60 (min 0.54, max 7.52)" - "1024","978.00","55.74 (min 39.32, max 65.72)","6.83 (min 5.00, max 8.00)","6.64 (min 3.03, max 10.09)" - "1518","1472.00","63.39 (min 8.24, max 98.92)","5.50 (min 1.00, max 8.00)","5.70 (min 0.89, max 10.58)" - - - - -.. 
csv-table:: CPSW2g UDP Ingress Throughput possible loss - :header: "Frame Size(bytes)","am62lxx_evm-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62lxx_evm-fs: THROUGHPUT (Mbits/sec)","am62lxx_evm-fs: Packets Per Second (kPPS)","am62lxx_evm-fs: CPU Load % (LOCAL_CPU_UTIL)","am62lxx_evm-fs: Packet Loss %" - - "64","","72.74 (min 68.22, max 80.12)","142.00 (min 133.00, max 156.00)","83.20 (min 81.93, max 85.28)","74.92 (min 61.45, max 82.42)" - "128","82.00","133.35 (min 64.37, max 165.54)","136.25 (min 98.00, max 162.00)","84.18 (min 72.40, max 88.93)","70.62 (min 52.05, max 85.34)" - "256","210.00","262.08 (min 170.59, max 311.88)","131.45 (min 102.00, max 152.00)","83.40 (min 75.15, max 87.02)","51.76 (min 28.30, max 76.63)" - "1024","978.00","740.76 (min 558.42, max 876.07)","91.08 (min 68.00, max 107.00)","85.63 (min 77.24, max 92.38)","9.14 (min 4.33, max 17.50)" - "1518","1472.00","753.68 (min 444.48, max 895.93)","64.00 (min 38.00, max 76.00)","81.54 (min 60.50, max 90.29)","6.15 (min 0.64, max 9.91)" - + "11025","352943.17 (min 352943.00, max 352944.00)","0.30 (min 0.19, max 0.42)" + "16000","512208.83 (min 512208.00, max 512209.00)","0.26 (min 0.17, max 0.42)" + "22050","705883.83 (min 705882.00, max 705888.00)","0.30 (min 0.25, max 0.41)" + "24000","705886.17 (min 705886.00, max 705887.00)","0.33 (min 0.29, max 0.36)" + "32000","1024415.50 (min 1024414.00, max 1024417.00)","0.30 (min 0.19, max 0.65)" + "44100","1411772.17 (min 1411772.00, max 1411773.00)","0.41 (min 0.38, max 0.45)" + "48000","1536622.00 (min 1536621.00, max 1536623.00)","0.50 (min 0.19, max 0.95)" + "88200","2823534.17 (min 2823531.00, max 2823536.00)","0.77 (min 0.73, max 0.81)" + "96000","3073226.00 (min 3073218.00, max 3073234.00)","0.56 (min 0.31, max 1.58)" | Linux OSPI Flash Driver -------------------------- - - -AM62XX-SK -^^^^^^^^^^^^^^^^^^^^^^^^^^^ - - -RAW -""""""""""""""""""""""""""" - -.. 
csv-table:: OSPI Raw Flash Driver - :header: "File size (Mbytes)","am62lxx_evm-fs: Raw Read Throughput (Mbytes/sec)" - - "50","17.29 (min 16.89, max 17.67)" - - - -AM62LXX-EVM -^^^^^^^^^^^^^^^^^^^^^^^^^^^ - +----------------------- -UBIFS -""""""""""""""""""""""""""" +.. rubric:: UBIFS + :name: am62lxx-evm-ospi-ubifs .. csv-table:: OSPI Flash Driver :header: "Buffer size (bytes)","am62lxx_evm-fs: Write UBIFS Throughput (Mbytes/sec)","am62lxx_evm-fs: Write UBIFS CPU Load (%)","am62lxx_evm-fs: Read UBIFS Throughput (Mbytes/sec)","am62lxx_evm-fs: Read UBIFS CPU Load (%)" - "102400","3.83 (min 3.45, max 4.17)","28.48 (min 24.75, max 32.35)","11.35 (min 11.20, max 11.52)","32.57 (min 27.59, max 37.14)" - "262144","3.76 (min 3.33, max 4.18)","28.21 (min 23.76, max 36.11)","11.33 (min 11.04, max 11.56)","35.23 (min 30.00, max 40.00)" - "524288","3.73 (min 3.34, max 4.19)","28.86 (min 23.81, max 45.61)","11.32 (min 11.14, max 11.58)","33.91 (min 29.03, max 38.89)" - "1048576","3.77 (min 3.33, max 4.22)","28.69 (min 22.55, max 33.65)","11.26 (min 11.09, max 11.46)","35.56 (min 29.03, max 40.54)" + "102400","3.84 (min 3.55, max 4.17)","29.68 (min 24.49, max 34.58)","11.32 (min 11.19, max 11.63)","33.47 (min 31.25, max 35.29)" + "262144","3.77 (min 3.49, max 4.27)","28.92 (min 24.49, max 33.65)","11.31 (min 11.20, max 11.55)","33.93 (min 31.25, max 37.14)" + "524288","3.76 (min 3.45, max 4.15)","28.78 (min 25.49, max 33.98)","11.28 (min 11.19, max 11.50)","33.96 (min 31.25, max 35.29)" + "1048576","3.77 (min 3.44, max 4.13)","28.45 (min 24.72, max 32.20)","11.18 (min 11.05, max 11.31)","37.67 (min 35.29, max 38.89)" - -RAW -""""""""""""""""""""""""""" +.. rubric:: RAW + :name: am62lxx-evm-ospi-raw .. 
csv-table:: OSPI Raw Flash Driver :header: "File size (Mbytes)","am62lxx_evm-fs: Raw Read Throughput (Mbytes/sec)" - "50","17.29 (min 16.89, max 17.67)" - + "50","17.36 (min 16.95, max 17.67)" EMMC Driver ----------- @@ -626,18 +443,16 @@ EMMC Driver sensitive applications, umount the auto-mounted filesystem and re-mount in async mode. - EMMC EXT4 FIO 1G ^^^^^^^^^^^^^^^^ .. csv-table:: EMMC EXT4 FIO 1G :header: "Buffer size (bytes)","am62lxx_evm-fs: Write EXT4 Throughput (Mbytes/sec)","am62lxx_evm-fs: Write EXT4 CPU Load (%)","am62lxx_evm-fs: Read EXT4 Throughput (Mbytes/sec)","am62lxx_evm-fs: Read EXT4 CPU Load (%)" - "1m","128.09 (min 128.00, max 129.00)","8.78 (min 8.62, max 9.02)","179.55 (min 179.00, max 180.00)","8.10 (min 7.36, max 8.35)" - "4m","127.64 (min 125.00, max 129.00)","5.47 (min 5.09, max 5.69)","179.18 (min 179.00, max 180.00)","4.94 (min 4.69, max 5.20)" - "4k","82.85 (min 75.50, max 86.90)","60.78 (min 59.59, max 62.96)","88.41 (min 85.50, max 91.00)","56.55 (min 55.14, max 58.55)" - "256k","122.82 (min 122.00, max 123.00)","11.89 (min 11.32, max 12.14)","178.18 (min 177.00, max 179.00)","10.21 (min 9.89, max 10.55)" - + "1m","128.17 (min 128.00, max 129.00)","8.56 (min 8.30, max 8.86)","179.33 (min 179.00, max 180.00)","7.98 (min 7.62, max 8.22)" + "4m","127.50 (min 125.00, max 128.00)","5.46 (min 5.28, max 5.63)","179.50 (min 179.00, max 180.00)","4.95 (min 4.74, max 5.08)" + "4k","86.62 (min 86.40, max 86.90)","59.76 (min 59.27, max 60.23)","90.67 (min 88.60, max 93.50)","56.33 (min 55.48, max 56.62)" + "256k","122.83 (min 122.00, max 123.00)","11.83 (min 11.60, max 12.02)","178.33 (min 178.00, max 179.00)","10.08 (min 9.65, max 10.27)" EMMC RAW FIO 1G ^^^^^^^^^^^^^^^ @@ -645,11 +460,10 @@ EMMC RAW FIO 1G .. 
csv-table:: EMMC RAW FIO 1G :header: "Buffer size (bytes)","am62lxx_evm-fs: Write Raw Throughput (Mbytes/sec)","am62lxx_evm-fs: Write Raw CPU Load (%)","am62lxx_evm-fs: Read Raw Throughput (Mbytes/sec)","am62lxx_evm-fs: Read Raw CPU Load (%)" - "1m","127.08 (min 122.00, max 129.00)","7.88 (min 7.24, max 8.20)","180.00","7.61 (min 6.21, max 8.13)" - "4m","128.54 (min 128.00, max 129.00)","5.29 (min 4.90, max 5.68)","180.00","4.71 (min 4.39, max 5.05)" - "4k","94.25 (min 90.40, max 96.50)","47.94 (min 46.23, max 49.73)","93.92 (min 91.80, max 96.30)","54.26 (min 52.60, max 57.08)" - "256k","122.77 (min 118.00, max 125.00)","9.94 (min 9.03, max 10.37)","178.54 (min 178.00, max 179.00)","9.33 (min 7.73, max 10.01)" - + "1m","127.83 (min 122.00, max 129.00)","7.85 (min 7.48, max 7.99)","180.00","7.63 (min 7.16, max 8.07)" + "4m","129.00","5.33 (min 5.10, max 5.56)","180.00","4.67 (min 4.51, max 4.96)" + "4k","95.57 (min 93.50, max 96.40)","47.29 (min 45.85, max 48.11)","94.90 (min 94.00, max 95.80)","53.35 (min 52.55, max 54.08)" + "256k","122.67 (min 118.00, max 124.00)","9.76 (min 9.54, max 10.07)","178.17 (min 178.00, max 179.00)","9.31 (min 9.00, max 9.65)" EMMC EXT4 ^^^^^^^^^ @@ -657,51 +471,32 @@ EMMC EXT4 .. 
csv-table:: EMMC EXT4 :header: "Buffer size (bytes)","am62lxx_evm-fs: Write EXT4 Throughput (Mbytes/sec)","am62lxx_evm-fs: Write EXT4 CPU Load (%)","am62lxx_evm-fs: Read EXT4 Throughput (Mbytes/sec)","am62lxx_evm-fs: Read EXT4 CPU Load (%)" - "102400","89.95 (min 81.91, max 99.06)","20.14 (min 16.67, max 26.53)","180.24 (min 178.28, max 181.35)","38.95 (min 36.11, max 41.59)" - "262144","94.39 (min 82.96, max 99.33)","21.11 (min 18.57, max 26.64)","184.25 (min 183.09, max 185.21)","38.34 (min 35.51, max 48.18)" - "524288","95.44 (min 84.33, max 100.71)","21.19 (min 18.69, max 26.21)","186.73 (min 186.35, max 187.13)","33.40 (min 30.84, max 35.14)" - "1048576","95.63 (min 84.01, max 101.22)","20.93 (min 17.84, max 26.61)","186.55 (min 186.13, max 186.94)","32.91 (min 31.78, max 34.55)" - "5242880","95.84 (min 85.17, max 100.83)","20.72 (min 18.31, max 26.10)","186.14 (min 185.24, max 186.78)","33.33 (min 31.48, max 34.82)" - - -EMMC EXT2 -^^^^^^^^^ - - -.. csv-table:: EMMC EXT2 - :header: "Buffer size (bytes)","am62lxx_evm-fs: Write EXT2 Throughput (Mbytes/sec)","am62lxx_evm-fs: Write EXT2 CPU Load (%)","am62lxx_evm-fs: Read EXT2 Throughput (Mbytes/sec)","am62lxx_evm-fs: Read EXT2 CPU Load (%)" - - "102400","33.22 (min 16.63, max 37.66)","15.99 (min 12.80, max 23.97)","174.78 (min 168.57, max 176.68)","39.40 (min 36.70, max 41.59)" - "262144","48.63 (min 20.43, max 63.88)","17.72 (min 12.16, max 25.76)","179.48 (min 175.01, max 181.23)","38.53 (min 36.94, max 40.87)" - "524288","59.55 (min 22.13, max 76.08)","18.73 (min 15.46, max 26.62)","181.73 (min 177.71, max 182.42)","33.12 (min 31.82, max 35.34)" - "1048576","66.02 (min 22.84, max 84.31)","18.83 (min 14.96, max 26.95)","181.17 (min 176.66, max 181.82)","33.17 (min 31.53, max 35.40)" - "5242880","76.28 (min 23.43, max 91.74)","20.31 (min 17.17, max 29.32)","180.86 (min 177.57, max 181.84)","32.91 (min 31.53, max 34.75)" - + "102400","90.91 (min 83.00, max 97.71)","20.38 (min 17.87, max 25.90)","180.36 (min 
177.78, max 181.30)","37.46 (min 36.45, max 39.09)" + "262144","94.89 (min 83.93, max 100.22)","20.88 (min 18.72, max 25.51)","183.72 (min 177.40, max 185.29)","39.71 (min 36.70, max 50.88)" + "524288","95.62 (min 84.98, max 101.40)","20.84 (min 18.31, max 26.53)","186.81 (min 186.21, max 187.09)","32.93 (min 31.82, max 34.26)" + "1048576","95.42 (min 82.97, max 100.97)","21.14 (min 18.45, max 26.53)","186.89 (min 186.56, max 187.07)","32.73 (min 32.11, max 33.33)" + "5242880","96.51 (min 85.25, max 101.40)","20.64 (min 17.87, max 25.82)","186.37 (min 185.98, max 186.68)","32.98 (min 32.43, max 33.64)" EMMC VFAT ^^^^^^^^^ - .. csv-table:: EMMC VFAT :header: "Buffer size (bytes)","am62lxx_evm-fs: Write VFAT Throughput (Mbytes/sec)","am62lxx_evm-fs: Write VFAT CPU Load (%)","am62lxx_evm-fs: Read VFAT Throughput (Mbytes/sec)","am62lxx_evm-fs: Read VFAT CPU Load (%)" - "102400","32.51 (min 16.29, max 36.85)","15.82 (min 13.44, max 19.58)","172.29 (min 169.56, max 173.89)","39.02 (min 36.94, max 40.52)" - "262144","47.09 (min 20.19, max 62.79)","17.59 (min 13.14, max 21.52)","177.08 (min 175.97, max 177.69)","38.17 (min 37.17, max 39.13)" - "524288","56.02 (min 21.98, max 70.61)","18.85 (min 15.85, max 22.42)","177.08 (min 176.50, max 177.67)","32.90 (min 31.30, max 35.04)" - "1048576","61.25 (min 22.84, max 75.98)","19.85 (min 17.81, max 23.49)","177.32 (min 176.61, max 177.85)","32.79 (min 30.97, max 34.19)" - "5242880","70.86 (min 23.63, max 85.00)","20.74 (min 19.31, max 23.77)","176.55 (min 176.03, max 177.18)","32.28 (min 30.97, max 33.90)" - + "102400","32.73 (min 16.59, max 37.40)","15.81 (min 14.03, max 18.56)","173.62 (min 172.15, max 174.70)","39.10 (min 37.72, max 40.52)" + "262144","47.45 (min 20.52, max 63.09)","17.72 (min 13.82, max 23.74)","174.94 (min 164.63, max 177.64)","40.50 (min 36.61, max 55.74)" + "524288","56.02 (min 22.44, max 71.58)","18.76 (min 12.94, max 22.48)","177.43 (min 177.03, max 177.74)","32.31 (min 30.97, max 34.19)" + 
"1048576","61.76 (min 23.47, max 77.61)","19.71 (min 18.09, max 22.20)","177.54 (min 175.95, max 178.35)","34.28 (min 31.62, max 40.71)" + "5242880","71.24 (min 24.09, max 85.03)","20.62 (min 18.65, max 23.67)","176.90 (min 176.63, max 177.31)","32.18 (min 30.70, max 33.90)" UBoot EMMC Driver ----------------- - .. csv-table:: UBOOT EMMC RAW :header: "File size (bytes in hex)","am62lxx_evm-fs: Write Throughput (Kbytes/sec)","am62lxx_evm-fs: Read Throughput (Kbytes/sec)" - "2000000","111773.53 (min 105703.23, max 117870.50)","175229.95" - "4000000","125710.23 (min 123886.58, max 128000.00)","178198.94 (min 178086.96, max 178572.21)" - + "2000000","112634.05 (min 110702.70, max 116198.58)","174765.56 (min 173375.66, max 175229.95)" + "4000000","125497.58 (min 122268.66, max 127254.37)","178086.96" MMCSD ----- @@ -714,18 +509,16 @@ MMCSD sensitive applications, umount the auto-mounted filesystem and re-mount in async mode. - MMC EXT4 FIO 1G ^^^^^^^^^^^^^^^ .. csv-table:: MMC EXT4 FIO 1G :header: "Buffer size (bytes)","am62lxx_evm-fs: Write EXT4 Throughput (Mbytes/sec)","am62lxx_evm-fs: Write EXT4 CPU Load (%)","am62lxx_evm-fs: Read EXT4 Throughput (Mbytes/sec)","am62lxx_evm-fs: Read EXT4 CPU Load (%)" - "1m","18.77 (min 17.90, max 19.80)","2.36 (min 1.91, max 2.69)","85.09 (min 79.70, max 87.30)","5.35 (min 4.63, max 5.70)" - "4m","18.70 (min 17.70, max 19.50)","1.68 (min 1.50, max 1.96)","84.56 (min 76.30, max 86.90)","3.13 (min 2.75, max 3.43)" - "4k","4.47 (min 4.25, max 4.74)","10.39 (min 8.49, max 11.72)","13.52 (min 13.40, max 13.60)","14.22 (min 12.04, max 17.18)" - "256k","18.38 (min 17.30, max 19.20)","3.59 (min 3.08, max 3.96)","82.45 (min 79.50, max 83.60)","6.72 (min 5.94, max 7.40)" - + "1m","35.31 (min 18.70, max 42.30)","3.38 (min 2.18, max 4.24)","87.01 (min 86.40, max 87.50)","5.29 (min 4.42, max 5.60)" + "4m","34.96 (min 18.70, max 42.40)","2.36 (min 1.75, max 2.97)","86.47 (min 83.20, max 87.40)","3.02 (min 2.66, max 3.38)" + "4k","3.23 (min 2.74, 
max 4.29)","7.39 (min 5.78, max 9.52)","13.10 (min 12.90, max 13.50)","12.51 (min 11.54, max 13.83)" + "256k","31.90 (min 18.00, max 38.20)","5.09 (min 3.67, max 6.32)","83.10 (min 82.00, max 83.90)","6.51 (min 5.61, max 6.78)" MMC RAW FIO 1G ^^^^^^^^^^^^^^ @@ -733,11 +526,10 @@ MMC RAW FIO 1G .. csv-table:: MMC RAW FIO 1G :header: "Buffer size (bytes)","am62lxx_evm-fs: Write Raw Throughput (Mbytes/sec)","am62lxx_evm-fs: Write Raw CPU Load (%)","am62lxx_evm-fs: Read Raw Throughput (Mbytes/sec)","am62lxx_evm-fs: Read Raw CPU Load (%)" - "1m","22.89 (min 18.50, max 43.30)","2.23 (min 1.61, max 2.99)","87.52 (min 86.80, max 88.10)","4.48 (min 3.90, max 4.78)" - "4m","22.47 (min 18.50, max 42.50)","1.75 (min 1.35, max 2.22)","87.58 (min 86.90, max 88.20)","2.96 (min 2.51, max 3.36)" - "4k","3.98 (min 2.80, max 4.47)","5.92 (min 4.35, max 7.08)","13.52 (min 13.10, max 13.60)","11.51 (min 9.36, max 13.34)" - "256k","21.43 (min 17.40, max 37.70)","3.21 (min 2.65, max 4.31)","83.23 (min 82.20, max 84.30)","5.82 (min 4.84, max 6.32)" - + "1m","31.02 (min 18.20, max 44.20)","2.80 (min 1.82, max 3.70)","87.63 (min 87.10, max 88.00)","4.61 (min 4.27, max 5.11)" + "4m","30.72 (min 18.20, max 43.60)","2.09 (min 1.32, max 2.68)","87.67 (min 87.00, max 88.10)","3.00 (min 2.61, max 3.48)" + "4k","3.45 (min 2.80, max 4.15)","5.24 (min 4.23, max 6.10)","13.32 (min 13.00, max 13.60)","11.41 (min 10.56, max 12.38)" + "256k","27.70 (min 17.60, max 38.60)","3.72 (min 2.58, max 4.57)","83.30 (min 82.10, max 84.10)","5.72 (min 4.84, max 6.15)" MMC EXT4 ^^^^^^^^ @@ -745,43 +537,16 @@ MMC EXT4 .. 
csv-table:: MMC EXT4 :header: "Buffer size (bytes)","am62lxx_evm-fs: Write Raw Throughput (Mbytes/sec)","am62lxx_evm-fs: Write Raw CPU Load (%)","am62lxx_evm-fs: Read Raw Throughput (Mbytes/sec)","am62lxx_evm-fs: Read Raw CPU Load (%)" - "102400","9.42 (min 8.48, max 10.75)","2.28 (min 1.67, max 3.26)","11.03 (min 10.62, max 11.78)","2.69 (min 2.31, max 2.99)" - "262144","9.41 (min 8.66, max 10.66)","2.29 (min 1.74, max 3.45)","11.06 (min 10.59, max 11.92)","2.39 (min 2.12, max 2.78)" - "524288","9.43 (min 8.71, max 10.85)","2.24 (min 1.71, max 3.47)","11.00 (min 10.74, max 11.26)","2.02 (min 1.76, max 2.24)" - "1048576","9.38 (min 8.86, max 10.52)","2.34 (min 1.62, max 3.95)","11.11 (min 10.82, max 11.48)","2.04 (min 1.79, max 2.26)" - "5242880","9.43 (min 8.83, max 10.68)","2.20 (min 1.62, max 3.92)","11.35 (min 10.84, max 12.01)","2.10 (min 1.71, max 2.35)" - -MMC EXT3 -^^^^^^^^ - -.. csv-table:: MMC EXT3 - :header: "Buffer size (bytes)","am62lxx_evm-fs: Write Raw Throughput (Mbytes/sec)","am62lxx_evm-fs: Write Raw CPU Load (%)","am62lxx_evm-fs: Read Raw Throughput (Mbytes/sec)","am62lxx_evm-fs: Read Raw CPU Load (%)" - - "102400","23.20 (min 15.57, max 40.38)","6.01 (min 3.41, max 14.56)","76.27 (min 71.64, max 78.41)","17.37 (min 14.67, max 20.80)" - "262144","22.76 (min 15.81, max 39.78)","5.79 (min 3.29, max 13.83)","81.99 (min 79.01, max 85.25)","16.70 (min 15.33, max 18.15)" - "524288","23.16 (min 16.44, max 39.82)","5.72 (min 3.30, max 14.22)","86.75 (min 83.12, max 89.74)","15.42 (min 13.25, max 17.32)" - "1048576","22.52 (min 16.11, max 36.71)","5.54 (min 3.17, max 13.11)","88.33 (min 82.79, max 89.91)","15.29 (min 13.55, max 17.99)" - "5242880","22.91 (min 16.00, max 39.33)","5.69 (min 3.34, max 13.42)","87.07 (min 82.59, max 89.42)","15.07 (min 12.80, max 17.15)" - - -MMC EXT2 -^^^^^^^^ - -.. 
csv-table:: MMC EXT2 - :header: "Buffer size (bytes)","am62lxx_evm-fs: Write Raw Throughput (Mbytes/sec)","am62lxx_evm-fs: Write Raw CPU Load (%)","am62lxx_evm-fs: Read Raw Throughput (Mbytes/sec)","am62lxx_evm-fs: Read Raw CPU Load (%)" - - "102400","13.52 (min 2.68, max 19.90)","6.03 (min 4.38, max 8.77)","75.44 (min 71.95, max 78.17)","18.59 (min 15.56, max 24.91)" - "262144","16.84 (min 2.63, max 36.72)","5.59 (min 3.62, max 11.25)","83.89 (min 79.18, max 85.49)","17.55 (min 15.16, max 19.23)" - "524288","17.78 (min 2.61, max 40.70)","5.27 (min 3.51, max 10.25)","88.26 (min 83.81, max 90.12)","15.92 (min 14.10, max 17.72)" - "1048576","18.10 (min 2.91, max 40.66)","5.19 (min 3.61, max 12.89)","86.83 (min 83.40, max 90.09)","15.72 (min 13.10, max 17.20)" - "5242880","18.08 (min 2.91, max 39.87)","5.04 (min 3.29, max 9.56)","88.72 (min 84.09, max 90.20)","15.76 (min 13.10, max 17.30)" + "102400","9.60 (min 8.52, max 10.57)","2.45 (min 1.99, max 3.24)","10.84 (min 10.64, max 11.16)","2.81 (min 2.45, max 3.08)" + "262144","9.45 (min 8.73, max 10.75)","2.46 (min 1.98, max 3.38)","10.99 (min 10.74, max 11.20)","2.35 (min 2.06, max 2.67)" + "524288","9.52 (min 8.75, max 10.56)","2.42 (min 1.92, max 3.28)","11.13 (min 10.90, max 11.49)","2.10 (min 1.94, max 2.18)" + "1048576","9.46 (min 8.86, max 10.52)","2.50 (min 1.96, max 3.77)","11.20 (min 11.08, max 11.38)","2.23 (min 2.01, max 2.66)" + "5242880","9.53 (min 8.79, max 10.77)","2.38 (min 1.91, max 3.95)","11.46 (min 11.05, max 12.02)","2.23 (min 1.96, max 2.49)" The performance numbers were captured using the following: - SanDisk Max Endurance SD card (SDSQQVR-032G-GN6IA) - Partition was mounted with async option - - UBoot MMCSD ----------- @@ -792,93 +557,28 @@ UBOOT MMCSD FAT .. 
csv-table:: UBOOT MMCSD FAT :header: "File size (bytes in hex)","am62lxx_evm-fs: Write Throughput (Kbytes/sec)","am62lxx_evm-fs: Read Throughput (Kbytes/sec)" - "400000","16887.87 (min 13170.42, max 20078.43)","22546.94 (min 22505.49, max 22629.83)" - "800000","17033.13 (min 12681.11, max 19366.43)","23025.64 (min 23011.24, max 23076.06)" - "1000000","15915.67 (min 14499.12, max 17808.70)","23254.39 (min 23239.72, max 23272.73)" - + "400000","17604.61 (min 12962.03, max 19692.31)","22714.58 (min 22505.49, max 22882.68)" + "800000","20272.80 (min 18004.40, max 21501.31)","23152.29 (min 23076.06, max 23206.80)" + "1000000","19450.02 (min 16015.64, max 21250.32)","23311.43 (min 23239.72, max 23339.03)" The performance numbers were captured using the following: - SanDisk Max Endurance SD card (SDSQQVR-032G-GN6IA) - | USB Driver ---------- - USB Device Controller ^^^^^^^^^^^^^^^^^^^^^ .. csv-table:: USBDEVICE HIGHSPEED SLAVE_READ_THROUGHPUT :header: "Number of Blocks","am62lxx_evm-fs: Throughput (MB/sec)" - "150","40.81 (min 37.30, max 43.40)" - - - + "150","41.14 (min 36.20, max 43.50)" .. csv-table:: USBDEVICE HIGHSPEED SLAVE_WRITE_THROUGHPUT :header: "Number of Blocks","am62lxx_evm-fs: Throughput (MB/sec)" - "150","37.14 (min 30.70, max 41.70)" - - -Low Power Performance ---------------------- - -Power Performance -^^^^^^^^^^^^^^^^^ - -These are power measurements taken while the device is in various low power modes like -Deep Sleep and RTC Only + DDR. - -.. csv-table:: Deep Sleep Power Performance - :header: "Rail name","Rail voltage(V)","Power (mW)" - - "vdd_core", "0.75", "5.41" - "soc_dvdd_1v8", "1.80", "0.30" - "soc_dvdd_3v3", "3.29", "3.45" - "vdda_1v8", "1.80", "1.26" - "vdd_lpddr4_pmic2", "1.10", "1.00" - "vdd_rtc", "0.74", "0.02" - "vdd_rtc_1v8", "1.80", "0.02" - "Total"," ","11.47" - -.. 
csv-table:: RTC Only + DDR Power Performance - :header: "Rail name","Rail voltage(V)","Power (mW)" - - "vdd_core", "0.00", "0.00" - "soc_dvdd_1v8", "1.80", "0.36" - "soc_dvdd_3v3", "3.29", "0.93" - "vdda_1v8", "0.00", "0.00" - "vdd_lpddr4_pmic2", "1.10", "1.08" - "vdd_rtc", "0.75", "0.02" - "vdd_rtc_1v8", "1.80", "0.02" - "Total"," ","2.41" - -Resume Latency Performance -^^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. csv-table:: LPM Resume Latency Performance - :header: "Low Power Mode","Total Resume Latency (ms)" - - "RTC Only + DDR", "459.40" - "Deep Sleep", "98.70" - -The performance numbers are measured without the Linux printk logs. To remove the -Linux printk logs, run the following commands in the terminal: - -.. code:: console - - # Detach kernel serial console - consoles=$(find /sys/bus/platform/devices/*.serial/ -name console) - for console in ${consoles}; do - echo -n N > ${console} - done - - -.. note:: - - The measurements shown are from using the default SDK with no extra optimizations. \ No newline at end of file + "150","37.43 (min 31.00, max 41.40)" diff --git a/source/devices/AM62LX/linux/RT_Linux_Performance_Guide.rst b/source/devices/AM62LX/linux/RT_Linux_Performance_Guide.rst index cb13d850b..e2d51c912 100644 --- a/source/devices/AM62LX/linux/RT_Linux_Performance_Guide.rst +++ b/source/devices/AM62LX/linux/RT_Linux_Performance_Guide.rst @@ -1,5 +1,5 @@ ======================================= - RT-linux 11.00.00.00 Performance Guide + RT-linux 11.02.08.02 Performance Guide ======================================= .. rubric:: **Read This First** @@ -72,12 +72,3 @@ default SDK image: Components section: :ref:`building-optee-with-prng`, and enabling the RNG node in the Linux kernel device tree. This way the HW TRNG is accessed from the kernel itself. - -.. csv-table:: - :header: "Latencies","CPU 0","CPU 1" - - "Minimum (us)","5","5" - "Average (us)","8","7" - "Maximum (us)","57","48" - -.. 
image:: img/rt-cpu-method-all-latency-histogram.png diff --git a/source/devices/AM62PX/linux/Linux_Performance_Guide.rst b/source/devices/AM62PX/linux/Linux_Performance_Guide.rst index 59ce73069..d890bb499 100644 --- a/source/devices/AM62PX/linux/Linux_Performance_Guide.rst +++ b/source/devices/AM62PX/linux/Linux_Performance_Guide.rst @@ -1,6 +1,6 @@ =================================== -Linux 11.01.16.13 Performance Guide +Linux 11.02.08.02 Performance Guide =================================== .. rubric:: **Read This First** @@ -33,16 +33,15 @@ For further information or to report any problems, contact https://e2e.ti.com/ or https://support.ti.com/ System Benchmarks -------------------- - +----------------- LMBench ^^^^^^^ LMBench is a collection of microbenchmarks of which the memory bandwidth and latency related ones are typically used to estimate processor memory system performance. More information about lmbench at -http://lmbench.sourceforge.net/whatis_lmbench.html and -http://lmbench.sourceforge.net/man/lmbench.8.html +https://lmbench.sourceforge.net/whatis_lmbench.html and +https://lmbench.sourceforge.net/man/lmbench.8.html **Latency**: lat_mem_rd-stride128-szN, where N is equal to or smaller than the cache size at given level measures the cache miss penalty. N that is at least @@ -64,126 +63,124 @@ Execute the LMBench with the following: .. 
csv-table:: LMBench Benchmarks :header: "Benchmarks","am62pxx_sk-fs: perf" - "af_unix_sock_stream_latency (microsec)","30.00 (min 29.99, max 30.01)" - "af_unix_socket_stream_bandwidth (mb\s)","1140.42 (min 1129.11, max 1151.73)" - "bw_file_rd-io-1mb (mb/s)","1430.38 (min 1396.89, max 1463.86)" - "bw_file_rd-o2c-1mb (mb/s)","704.15 (min 657.68, max 750.61)" - "bw_mem-bcopy-16mb (mb/s)","1732.51 (min 1616.16, max 1848.86)" - "bw_mem-bcopy-1mb (mb/s)","2079.23 (min 2003.28, max 2155.17)" - "bw_mem-bcopy-2mb (mb/s)","1725.21 (min 1723.54, max 1726.87)" - "bw_mem-bcopy-4mb (mb/s)","1671.07 (min 1634.43, max 1707.70)" - "bw_mem-bcopy-8mb (mb/s)","1887.75 (min 1808.93, max 1966.57)" - "bw_mem-bzero-16mb (mb/s)","7962.36 (min 7812.50, max 8112.22)" - "bw_mem-bzero-1mb (mb/s)","5015.40 (min 2003.28, max 8108.62)" - "bw_mem-bzero-2mb (mb/s)","4834.47 (min 1723.54, max 8094.32)" - "bw_mem-bzero-4mb (mb/s)","4812.58 (min 1634.43, max 8104.00)" - "bw_mem-bzero-8mb (mb/s)","4923.05 (min 1808.93, max 8106.74)" - "bw_mem-cp-16mb (mb/s)","951.23 (min 913.71, max 988.75)" - "bw_mem-cp-1mb (mb/s)","4570.21 (min 898.63, max 8395.16)" - "bw_mem-cp-2mb (mb/s)","4506.43 (min 885.74, max 8248.16)" - "bw_mem-cp-4mb (mb/s)","4505.73 (min 943.95, max 8181.35)" - "bw_mem-cp-8mb (mb/s)","4499.51 (min 962.35, max 8150.79)" - "bw_mem-fcp-16mb (mb/s)","1780.36 (min 1722.47, max 1838.24)" - "bw_mem-fcp-1mb (mb/s)","4854.96 (min 1695.23, max 8108.62)" - "bw_mem-fcp-2mb (mb/s)","4835.00 (min 1680.11, max 8094.32)" - "bw_mem-fcp-4mb (mb/s)","4839.75 (min 1664.82, max 8104.00)" - "bw_mem-fcp-8mb (mb/s)","4861.43 (min 1716.00, max 8106.74)" - "bw_mem-frd-16mb (mb/s)","1949.05 (min 1886.79, max 2011.31)" - "bw_mem-frd-1mb (mb/s)","1903.28 (min 1695.23, max 2066.89)" - "bw_mem-frd-2mb (mb/s)","1757.28 (min 1680.11, max 1842.30)" - "bw_mem-frd-4mb (mb/s)","1816.81 (min 1664.82, max 2002.67)" - "bw_mem-frd-8mb (mb/s)","1792.14 (min 1716.00, max 1844.38)" - "bw_mem-fwr-16mb (mb/s)","7986.11 (min 7838.01, 
max 8134.21)" - "bw_mem-fwr-1mb (mb/s)","5128.73 (min 2029.52, max 8395.16)" - "bw_mem-fwr-2mb (mb/s)","4938.53 (min 1734.30, max 8248.16)" - "bw_mem-fwr-4mb (mb/s)","4968.66 (min 1813.78, max 8181.35)" - "bw_mem-fwr-8mb (mb/s)","4909.96 (min 1795.13, max 8150.79)" - "bw_mem-rd-16mb (mb/s)","2002.61 (min 1928.64, max 2076.57)" - "bw_mem-rd-1mb (mb/s)","2071.05 (min 1728.91, max 2346.15)" - "bw_mem-rd-2mb (mb/s)","1814.74 (min 1529.75, max 2051.98)" - "bw_mem-rd-4mb (mb/s)","1865.48 (min 1684.92, max 2033.55)" - "bw_mem-rd-8mb (mb/s)","1926.46 (min 1779.56, max 2073.08)" - "bw_mem-rdwr-16mb (mb/s)","1940.59 (min 1860.47, max 2020.71)" - "bw_mem-rdwr-1mb (mb/s)","1328.43 (min 898.63, max 1780.06)" - "bw_mem-rdwr-2mb (mb/s)","1238.26 (min 885.74, max 1610.05)" - "bw_mem-rdwr-4mb (mb/s)","1365.79 (min 943.95, max 1780.68)" - "bw_mem-rdwr-8mb (mb/s)","1418.89 (min 962.35, max 1931.90)" - "bw_mem-wr-16mb (mb/s)","1910.82 (min 1841.20, max 1980.44)" - "bw_mem-wr-1mb (mb/s)","1803.48 (min 1671.31, max 2033.65)" - "bw_mem-wr-2mb (mb/s)","1602.93 (min 1494.77, max 1777.15)" - "bw_mem-wr-4mb (mb/s)","1751.00 (min 1684.92, max 1820.66)" - "bw_mem-wr-8mb (mb/s)","1848.44 (min 1745.96, max 1936.34)" - "bw_mmap_rd-mo-1mb (mb/s)","2206.82 (min 2128.79, max 2284.84)" - "bw_mmap_rd-o2c-1mb (mb/s)","761.68 (min 727.93, max 795.42)" - "bw_pipe (mb/s)","787.85 (min 749.46, max 826.24)" - "bw_unix (mb/s)","1140.42 (min 1129.11, max 1151.73)" - "lat_connect (us)","56.68 (min 56.35, max 57.00)" - "lat_ctx-2-128k (us)","7.80 (min 7.57, max 8.02)" - "lat_ctx-2-256k (us)","7.17 (min 6.74, max 7.59)" - "lat_ctx-4-128k (us)","7.25 (min 7.22, max 7.27)" - "lat_ctx-4-256k (us)","6.43 (min 6.06, max 6.80)" - "lat_fs-0k (num_files)","233.50 (min 231.00, max 236.00)" - "lat_fs-10k (num_files)","119.50 (min 116.00, max 123.00)" - "lat_fs-1k (num_files)","167.50 (min 163.00, max 172.00)" - "lat_fs-4k (num_files)","160.50 (min 146.00, max 175.00)" - "lat_mem_rd-stride128-sz1000k (ns)","30.43 (min 
29.44, max 31.43)" - "lat_mem_rd-stride128-sz125k (ns)","5.58 (min 5.55, max 5.61)" - "lat_mem_rd-stride128-sz250k (ns)","5.83 (min 5.83, max 5.84)" - "lat_mem_rd-stride128-sz31k (ns)","2.90 (min 2.15, max 3.65)" + "af_unix_sock_stream_latency (microsec)","30.38 (min 29.49, max 31.11)" + "af_unix_socket_stream_bandwidth (mb\s)","1141.99 (min 1114.62, max 1178.85)" + "bw_file_rd-io-1mb (mb/s)","1420.50 (min 1397.38, max 1467.89)" + "bw_file_rd-o2c-1mb (mb/s)","756.14 (min 707.71, max 787.56)" + "bw_mem-bcopy-16mb (mb/s)","1893.33 (min 1820.46, max 1973.12)" + "bw_mem-bcopy-1mb (mb/s)","2039.91 (min 1948.56, max 2126.53)" + "bw_mem-bcopy-2mb (mb/s)","1763.70 (min 1689.19, max 1838.80)" + "bw_mem-bcopy-4mb (mb/s)","1778.31 (min 1643.39, max 1932.06)" + "bw_mem-bcopy-8mb (mb/s)","1862.34 (min 1802.61, max 1939.39)" + "bw_mem-bzero-16mb (mb/s)","7941.37 (min 7807.42, max 8116.33)" + "bw_mem-bzero-1mb (mb/s)","4983.96 (min 1948.56, max 8117.51)" + "bw_mem-bzero-2mb (mb/s)","4846.65 (min 1689.19, max 8105.73)" + "bw_mem-bzero-4mb (mb/s)","4858.50 (min 1643.39, max 8110.85)" + "bw_mem-bzero-8mb (mb/s)","4901.14 (min 1802.61, max 8110.85)" + "bw_mem-cp-16mb (mb/s)","936.73 (min 894.15, max 985.16)" + "bw_mem-cp-1mb (mb/s)","4594.51 (min 890.31, max 8403.36)" + "bw_mem-cp-2mb (mb/s)","4486.54 (min 865.05, max 8255.56)" + "bw_mem-cp-4mb (mb/s)","4485.96 (min 926.14, max 8185.54)" + "bw_mem-cp-8mb (mb/s)","4481.34 (min 948.77, max 8154.94)" + "bw_mem-fcp-16mb (mb/s)","1764.54 (min 1699.96, max 1837.60)" + "bw_mem-fcp-1mb (mb/s)","4843.70 (min 1689.51, max 8117.51)" + "bw_mem-fcp-2mb (mb/s)","4796.57 (min 1575.05, max 8105.73)" + "bw_mem-fcp-4mb (mb/s)","4826.26 (min 1609.87, max 8110.85)" + "bw_mem-fcp-8mb (mb/s)","4831.18 (min 1631.82, max 8110.85)" + "bw_mem-frd-16mb (mb/s)","1908.07 (min 1837.18, max 2011.06)" + "bw_mem-frd-1mb (mb/s)","1907.50 (min 1689.51, max 2142.09)" + "bw_mem-frd-2mb (mb/s)","1705.84 (min 1575.05, max 1836.88)" + "bw_mem-frd-4mb (mb/s)","1764.63 (min 
1609.87, max 1909.31)" + "bw_mem-frd-8mb (mb/s)","1789.25 (min 1631.82, max 1998.75)" + "bw_mem-fwr-16mb (mb/s)","7958.93 (min 7822.69, max 8134.21)" + "bw_mem-fwr-1mb (mb/s)","5153.95 (min 1974.16, max 8403.36)" + "bw_mem-fwr-2mb (mb/s)","4904.86 (min 1597.44, max 8255.56)" + "bw_mem-fwr-4mb (mb/s)","4913.69 (min 1659.06, max 8185.54)" + "bw_mem-fwr-8mb (mb/s)","4917.48 (min 1674.52, max 8154.94)" + "bw_mem-rd-16mb (mb/s)","1983.53 (min 1918.24, max 2065.32)" + "bw_mem-rd-1mb (mb/s)","2035.54 (min 1708.82, max 2331.46)" + "bw_mem-rd-2mb (mb/s)","1794.96 (min 1510.00, max 2037.35)" + "bw_mem-rd-4mb (mb/s)","1864.28 (min 1662.05, max 2055.85)" + "bw_mem-rd-8mb (mb/s)","1901.83 (min 1763.28, max 2069.05)" + "bw_mem-rdwr-16mb (mb/s)","1853.51 (min 1684.21, max 1942.45)" + "bw_mem-rdwr-1mb (mb/s)","1329.35 (min 890.31, max 1855.29)" + "bw_mem-rdwr-2mb (mb/s)","1231.50 (min 865.05, max 1661.96)" + "bw_mem-rdwr-4mb (mb/s)","1342.24 (min 926.14, max 1834.58)" + "bw_mem-rdwr-8mb (mb/s)","1405.93 (min 948.77, max 1942.22)" + "bw_mem-wr-16mb (mb/s)","1883.72 (min 1802.41, max 1975.55)" + "bw_mem-wr-1mb (mb/s)","1779.17 (min 1614.06, max 2043.60)" + "bw_mem-wr-2mb (mb/s)","1589.31 (min 1490.59, max 1853.57)" + "bw_mem-wr-4mb (mb/s)","1739.42 (min 1631.10, max 1869.45)" + "bw_mem-wr-8mb (mb/s)","1824.68 (min 1672.24, max 1942.22)" + "bw_mmap_rd-mo-1mb (mb/s)","2177.27 (min 2111.56, max 2271.54)" + "bw_mmap_rd-o2c-1mb (mb/s)","772.38 (min 680.85, max 826.72)" + "bw_pipe (mb/s)","783.15 (min 729.29, max 819.18)" + "bw_unix (mb/s)","1141.99 (min 1114.62, max 1178.85)" + "lat_connect (us)","56.81 (min 56.67, max 57.00)" + "lat_ctx-2-128k (us)","7.83 (min 7.60, max 8.13)" + "lat_ctx-2-256k (us)","7.72 (min 6.67, max 11.90)" + "lat_ctx-4-128k (us)","7.42 (min 6.78, max 7.96)" + "lat_ctx-4-256k (us)","6.99 (min 6.18, max 8.04)" + "lat_fs-0k (num_files)","239.71 (min 221.00, max 253.00)" + "lat_fs-10k (num_files)","117.29 (min 106.00, max 136.00)" + "lat_fs-1k (num_files)","160.43 
(min 145.00, max 179.00)" + "lat_fs-4k (num_files)","159.43 (min 142.00, max 176.00)" + "lat_mem_rd-stride128-sz1000k (ns)","30.55 (min 29.36, max 31.41)" + "lat_mem_rd-stride128-sz125k (ns)","5.57 (min 5.54, max 5.64)" + "lat_mem_rd-stride128-sz250k (ns)","5.84 (min 5.83, max 5.85)" + "lat_mem_rd-stride128-sz31k (ns)","3.15 (min 2.16, max 4.66)" "lat_mem_rd-stride128-sz50 (ns)","2.15" - "lat_mem_rd-stride128-sz500k (ns)","12.11 (min 10.58, max 13.64)" - "lat_mem_rd-stride128-sz62k (ns)","4.90 (min 4.54, max 5.25)" - "lat_mmap-1m (us)","51.00" + "lat_mem_rd-stride128-sz500k (ns)","10.88 (min 9.02, max 12.76)" + "lat_mem_rd-stride128-sz62k (ns)","5.24 (min 5.20, max 5.26)" + "lat_mmap-1m (us)","52.57 (min 50.00, max 57.00)" "lat_ops-double-add (ns)","2.86" - "lat_ops-double-div (ns)","15.74 (min 15.73, max 15.74)" - "lat_ops-double-mul (ns)","2.87 (min 2.86, max 2.87)" + "lat_ops-double-div (ns)","15.74 (min 15.74, max 15.75)" + "lat_ops-double-mul (ns)","2.86" "lat_ops-float-add (ns)","2.86" - "lat_ops-float-div (ns)","9.30" + "lat_ops-float-div (ns)","9.30 (min 9.30, max 9.31)" "lat_ops-float-mul (ns)","2.86" "lat_ops-int-add (ns)","0.72" "lat_ops-int-bit (ns)","0.48" "lat_ops-int-div (ns)","4.29" - "lat_ops-int-mod (ns)","4.53" - "lat_ops-int-mul (ns)","3.07" + "lat_ops-int-mod (ns)","4.53 (min 4.53, max 4.54)" + "lat_ops-int-mul (ns)","3.08 (min 3.07, max 3.09)" "lat_ops-int64-add (ns)","0.72" "lat_ops-int64-bit (ns)","0.48" "lat_ops-int64-div (ns)","6.80" "lat_ops-int64-mod (ns)","5.25" - "lat_ops-int64-mul (ns)","3.55" - "lat_pagefault (us)","0.51 (min 0.50, max 0.52)" - "lat_pipe (us)","25.78 (min 25.77, max 25.79)" - "lat_proc-exec (us)","706.31 (min 685.11, max 727.50)" - "lat_proc-fork (us)","615.95 (min 598.78, max 633.13)" + "lat_ops-int64-mul (ns)","3.56 (min 3.55, max 3.57)" + "lat_pagefault (us)","0.52 (min 0.50, max 0.54)" + "lat_pipe (us)","25.74 (min 25.17, max 26.44)" + "lat_proc-exec (us)","709.41 (min 689.88, max 728.75)" + "lat_proc-fork 
(us)","616.86 (min 602.89, max 633.11)" "lat_proc-proccall (us)","0.01" - "lat_select (us)","33.79 (min 33.79, max 33.80)" - "lat_sem (us)","2.68 (min 2.48, max 2.89)" - "lat_sig-catch (us)","5.45 (min 5.43, max 5.48)" - "lat_sig-install (us)","0.67" - "lat_sig-prot (us)","0.52 (min 0.51, max 0.54)" - "lat_syscall-fstat (us)","1.98" - "lat_syscall-null (us)","0.47" - "lat_syscall-open (us)","147.83 (min 133.40, max 162.26)" - "lat_syscall-read (us)","0.82 (min 0.81, max 0.82)" - "lat_syscall-stat (us)","4.67 (min 4.64, max 4.71)" - "lat_syscall-write (us)","0.76 (min 0.75, max 0.77)" - "lat_tcp (us)","1.00 (min 0.98, max 1.02)" - "lat_unix (us)","30.00 (min 29.99, max 30.01)" - "latency_for_0.50_mb_block_size (nanosec)","12.11 (min 10.58, max 13.64)" - "latency_for_1.00_mb_block_size (nanosec)","15.22 (min 0.00, max 31.43)" - "pipe_bandwidth (mb\s)","787.85 (min 749.46, max 826.24)" - "pipe_latency (microsec)","25.78 (min 25.77, max 25.79)" + "lat_select (us)","33.97 (min 33.79, max 34.06)" + "lat_sem (us)","3.04 (min 2.65, max 3.79)" + "lat_sig-catch (us)","5.54 (min 5.27, max 5.77)" + "lat_sig-install (us)","0.67 (min 0.65, max 0.71)" + "lat_sig-prot (us)","0.65 (min 0.50, max 0.76)" + "lat_syscall-fstat (us)","1.99 (min 1.90, max 2.07)" + "lat_syscall-null (us)","0.46 (min 0.46, max 0.50)" + "lat_syscall-open (us)","188.47 (min 153.56, max 251.41)" + "lat_syscall-read (us)","0.83 (min 0.80, max 0.88)" + "lat_syscall-stat (us)","4.79 (min 4.67, max 4.97)" + "lat_syscall-write (us)","0.78 (min 0.75, max 0.84)" + "lat_tcp (us)","0.92 (min 0.91, max 0.97)" + "lat_unix (us)","30.38 (min 29.49, max 31.11)" + "latency_for_0.50_mb_block_size (nanosec)","10.88 (min 9.02, max 12.76)" + "latency_for_1.00_mb_block_size (nanosec)","15.28 (min 0.00, max 31.41)" + "pipe_bandwidth (mb\s)","783.15 (min 729.29, max 819.18)" + "pipe_latency (microsec)","25.74 (min 25.17, max 26.44)" "procedure_call (microsec)","0.01" - "select_on_200_tcp_fds (microsec)","33.79 (min 33.79, max 
33.80)" - "semaphore_latency (microsec)","2.68 (min 2.48, max 2.89)" - "signal_handler_latency (microsec)","0.67" - "signal_handler_overhead (microsec)","5.45 (min 5.43, max 5.48)" - "tcp_ip_connection_cost_to_localhost (microsec)","56.68 (min 56.35, max 57.00)" - "tcp_latency_using_localhost (microsec)","1.00 (min 0.98, max 1.02)" - - + "select_on_200_tcp_fds (microsec)","33.97 (min 33.79, max 34.06)" + "semaphore_latency (microsec)","3.04 (min 2.65, max 3.79)" + "signal_handler_latency (microsec)","0.67 (min 0.65, max 0.71)" + "signal_handler_overhead (microsec)","5.54 (min 5.27, max 5.77)" + "tcp_ip_connection_cost_to_localhost (microsec)","56.81 (min 56.67, max 57.00)" + "tcp_latency_using_localhost (microsec)","0.92 (min 0.91, max 0.97)" Dhrystone -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^^^ Dhrystone is a core only benchmark that runs from warm L1 caches in all modern processors. It scales linearly with clock speed. @@ -191,7 +188,6 @@ Please take note, different run may produce different slightly results. This is advised to run this test multiple times in order to get maximum performance numbers. - Execute the benchmark with the following: :: @@ -202,12 +198,11 @@ Execute the benchmark with the following: :header: "Benchmarks","am62pxx_sk-fs: perf" "cpu_clock (mhz)","1400.00" - "dhrystone_per_mhz (dmips/mhz)","2.95 (min 2.90, max 3.00)" - "dhrystone_per_second (dhrystonep)","7275132.25 (min 7142857.00, max 7407407.50)" - + "dhrystone_per_mhz (dmips/mhz)","2.91 (min 2.90, max 3.00)" + "dhrystone_per_second (dhrystonep)","7180649.93 (min 7142857.00, max 7407407.50)" Whetstone -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^^^ Whetstone is a benchmark primarily measuring floating-point arithmetic performance. Execute the benchmark with the following: @@ -219,22 +214,20 @@ Execute the benchmark with the following: .. 
csv-table:: Whetstone Benchmarks :header: "Benchmarks","am62pxx_sk-fs: perf" - "whetstone (mips)","7500.00 (min 5000.00, max 10000.00)" - + "whetstone (mips)","6428.57 (min 5000.00, max 10000.00)" Linpack -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^ Linpack measures peak double precision (64 bit) floating point performance in solving a dense linear system. .. csv-table:: Linpack Benchmarks :header: "Benchmarks","am62pxx_sk-fs: perf" - "linpack (kflops)","575872.00 (min 574616.00, max 577128.00)" - + "linpack (kflops)","575572.00 (min 571460.00, max 577031.00)" NBench -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^ NBench which stands for Native Benchmark is used to measure macro benchmarks for commonly used operations such as sorting and analysis algorithms. More information about NBench at @@ -244,19 +237,18 @@ https://nbench.io/articles/index.html .. csv-table:: NBench Benchmarks :header: "Benchmarks","am62pxx_sk-fs: perf" - "assignment (iterations)","14.47 (min 14.46, max 14.48)" - "fourier (iterations)","22831.50 (min 22831.00, max 22832.00)" - "fp_emulation (iterations)","215.64" - "huffman (iterations)","1184.10 (min 1183.90, max 1184.30)" - "idea (iterations)","3444.85 (min 3444.80, max 3444.90)" - "lu_decomposition (iterations)","530.01 (min 529.95, max 530.06)" - "neural_net (iterations)","8.65" - "numeric_sort (iterations)","628.51 (min 628.05, max 628.96)" - "string_sort (iterations)","163.94" - + "assignment (iterations)","14.48 (min 14.45, max 14.50)" + "fourier (iterations)","22831.29 (min 22831.00, max 22832.00)" + "fp_emulation (iterations)","215.64 (min 215.64, max 215.65)" + "huffman (iterations)","1184.13 (min 1183.30, max 1184.40)" + "idea (iterations)","3444.83 (min 3444.70, max 3444.90)" + "lu_decomposition (iterations)","529.08 (min 526.35, max 533.03)" + "neural_net (iterations)","8.65 (min 8.65, max 8.66)" + "numeric_sort (iterations)","625.73 (min 617.87, max 629.99)" + "string_sort (iterations)","163.94 (min 163.93, max 163.94)" Stream 
-^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^ STREAM is a microbenchmark for measuring data memory system performance without any data reuse. It is designed to miss on caches and exercise data prefetcher and speculative accesses. @@ -276,56 +268,49 @@ Execute the benchmark with the following: .. csv-table:: Stream Benchmarks :header: "Benchmarks","am62pxx_sk-fs: perf" - "add (mb/s)","2693.95 (min 2693.70, max 2694.20)" - "copy (mb/s)","3756.90 (min 3756.30, max 3757.50)" - "scale (mb/s)","3484.05 (min 3482.60, max 3485.50)" - "triad (mb/s)","2400.10 (min 2397.20, max 2403.00)" - + "add (mb/s)","2825.76 (min 2698.10, max 2879.00)" + "copy (mb/s)","3941.66 (min 3718.70, max 4027.40)" + "scale (mb/s)","3624.44 (min 3481.60, max 3704.10)" + "triad (mb/s)","2492.96 (min 2403.50, max 2530.10)" CoreMarkPro -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^^^^^ CoreMark®-Pro is a comprehensive, advanced processor benchmark that works with and enhances the market-proven industry-standard EEMBC CoreMark® benchmark. While CoreMark stresses the CPU pipeline, CoreMark-Pro tests the entire processor, adding comprehensive support for multicore technology, a combination of integer and floating-point workloads, and data sets for utilizing larger memory subsystems. - .. 
csv-table:: CoreMarkPro Benchmarks :header: "Benchmarks","am62pxx_sk-fs: perf" - "cjpeg-rose7-preset (workloads/)","42.19" + "cjpeg-rose7-preset (workloads/)","41.97 (min 41.84, max 42.02)" "core (workloads/)","0.30" - "coremark-pro ()","915.19 (min 905.27, max 925.11)" - "linear_alg-mid-100x100-sp (workloads/)","14.68 (min 14.67, max 14.68)" - "loops-all-mid-10k-sp (workloads/)","0.71" + "coremark-pro ()","927.45 (min 906.93, max 947.60)" + "linear_alg-mid-100x100-sp (workloads/)","14.68 (min 14.68, max 14.70)" + "loops-all-mid-10k-sp (workloads/)","0.71 (min 0.71, max 0.72)" "nnet_test (workloads/)","1.09" - "parser-125k (workloads/)","8.81 (min 8.77, max 8.85)" - "radix2-big-64k (workloads/)","57.20 (min 51.86, max 62.54)" - "sha-test (workloads/)","81.31 (min 80.65, max 81.97)" - "zip-test (workloads/)","21.74" - - - + "parser-125k (workloads/)","8.83 (min 8.77, max 8.85)" + "radix2-big-64k (workloads/)","62.81 (min 53.18, max 74.52)" + "sha-test (workloads/)","81.68 (min 81.30, max 81.97)" + "zip-test (workloads/)","22.15 (min 21.74, max 22.22)" .. 
csv-table:: CoreMarkProTwoCore Benchmarks :header: "Benchmarks","am62pxx_sk-fs: perf" - "cjpeg-rose7-preset (workloads/)","82.99 (min 82.64, max 83.33)" + "cjpeg-rose7-preset (workloads/)","83.45 (min 82.64, max 84.03)" "core (workloads/)","0.60" - "coremark-pro ()","1673.63 (min 1669.43, max 1677.83)" - "linear_alg-mid-100x100-sp (workloads/)","29.37 (min 29.34, max 29.39)" - "loops-all-mid-10k-sp (workloads/)","1.31 (min 1.30, max 1.32)" - "nnet_test (workloads/)","2.17" - "parser-125k (workloads/)","13.95 (min 13.51, max 14.39)" - "radix2-big-64k (workloads/)","72.78 (min 71.34, max 74.21)" + "coremark-pro ()","1670.65 (min 1656.51, max 1691.47)" + "linear_alg-mid-100x100-sp (workloads/)","29.34 (min 29.31, max 29.36)" + "loops-all-mid-10k-sp (workloads/)","1.31 (min 1.30, max 1.31)" + "nnet_test (workloads/)","2.17 (min 2.16, max 2.17)" + "parser-125k (workloads/)","13.95 (min 13.51, max 14.49)" + "radix2-big-64k (workloads/)","71.62 (min 68.31, max 76.15)" "sha-test (workloads/)","162.61 (min 161.29, max 163.93)" "zip-test (workloads/)","42.55" - - MultiBench -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^^^^ MultiBench™ is a suite of benchmarks that allows processor and system designers to analyze, test, and improve multicore processors. It uses three forms of concurrency: Data decomposition: multiple threads cooperating on achieving a unified goal and @@ -344,267 +329,137 @@ thread-enabled workloads to be tested. .. 
csv-table:: Multibench Benchmarks :header: "Benchmarks","am62pxx_sk-fs: perf" - "4m-check (workloads/)","411.93" - "4m-check-reassembly (workloads/)","119.76" - "4m-check-reassembly-tcp (workloads/)","59.24" - "4m-check-reassembly-tcp-cmykw2-rotatew2 (workloads/)","33.15" - "4m-check-reassembly-tcp-x264w2 (workloads/)","1.87" - "4m-cmykw2 (workloads/)","246.31" - "4m-cmykw2-rotatew2 (workloads/)","49.75" - "4m-reassembly (workloads/)","83.13" - "4m-rotatew2 (workloads/)","52.66" - "4m-tcp-mixed (workloads/)","118.52" - "4m-x264w2 (workloads/)","1.95" - "idct-4m (workloads/)","19.24" - "idct-4mw1 (workloads/)","19.22" - "ippktcheck-4m (workloads/)","415.01" - "ippktcheck-4mw1 (workloads/)","413.98" - "ipres-4m (workloads/)","112.11" - "ipres-4mw1 (workloads/)","110.78" - "md5-4m (workloads/)","27.67" - "md5-4mw1 (workloads/)","27.21" - "rgbcmyk-4m (workloads/)","65.88" - "rgbcmyk-4mw1 (workloads/)","65.81" - "rotate-4ms1 (workloads/)","23.44" - "rotate-4ms1w1 (workloads/)","23.42" - "rotate-4ms64 (workloads/)","23.71" - "rotate-4ms64w1 (workloads/)","23.71" - "x264-4mq (workloads/)","0.58" - "x264-4mqw1 (workloads/)","0.58" - - + "4m-check (workloads/)","419.94 (min 412.34, max 431.18)" + "4m-check-reassembly (workloads/)","123.93 (min 120.34, max 128.54)" + "4m-check-reassembly-tcp (workloads/)","59.99 (min 59.10, max 61.27)" + "4m-check-reassembly-tcp-cmykw2-rotatew2 (workloads/)","33.80 (min 33.24, max 34.68)" + "4m-check-reassembly-tcp-x264w2 (workloads/)","1.89 (min 1.87, max 1.91)" + "4m-cmykw2 (workloads/)","243.33 (min 238.66, max 246.61)" + "4m-cmykw2-rotatew2 (workloads/)","50.36 (min 49.71, max 51.37)" + "4m-reassembly (workloads/)","83.96 (min 82.30, max 86.28)" + "4m-rotatew2 (workloads/)","53.30 (min 52.63, max 54.26)" + "4m-tcp-mixed (workloads/)","118.90 (min 118.52, max 119.40)" + "4m-x264w2 (workloads/)","1.95 (min 1.80, max 2.00)" + "idct-4m (workloads/)","19.21 (min 19.18, max 19.23)" + "idct-4mw1 (workloads/)","19.21 (min 19.18, max 19.23)" + 
"ippktcheck-4m (workloads/)","421.59 (min 413.22, max 431.63)" + "ippktcheck-4mw1 (workloads/)","421.60 (min 412.61, max 431.33)" + "ipres-4m (workloads/)","113.14 (min 110.54, max 116.73)" + "ipres-4mw1 (workloads/)","113.31 (min 110.13, max 116.64)" + "md5-4m (workloads/)","27.53 (min 27.10, max 27.88)" + "md5-4mw1 (workloads/)","27.73 (min 27.45, max 27.98)" + "rgbcmyk-4m (workloads/)","64.48 (min 62.70, max 65.81)" + "rgbcmyk-4mw1 (workloads/)","64.46 (min 62.68, max 65.77)" + "rotate-4ms1 (workloads/)","23.74 (min 23.38, max 24.15)" + "rotate-4ms1w1 (workloads/)","23.76 (min 23.41, max 24.21)" + "rotate-4ms64 (workloads/)","24.00 (min 23.66, max 24.49)" + "rotate-4ms64w1 (workloads/)","24.34 (min 23.64, max 26.53)" + "x264-4mq (workloads/)","0.58 (min 0.57, max 0.58)" + "x264-4mqw1 (workloads/)","0.57 (min 0.53, max 0.58)" Boot-time Measurement --------------------- - Boot media: MMCSD ^^^^^^^^^^^^^^^^^ .. csv-table:: Linux boot time MMCSD :header: "Boot Configuration","am62pxx_sk-fs: Boot time in seconds: avg(min,max)" - "Linux boot time from SD with default rootfs (20 boot cycles)","13.40 (min 13.11, max 13.80)" - - + "Linux boot time from SD with default rootfs (20 boot cycles)","13.59 (min 13.10, max 18.72)" Boot time numbers [avg, min, max] are measured from "Starting kernel" to Linux prompt across 20 boot cycles. - - | ALSA SoC Audio Driver -------------------------- +--------------------- #. Access type - RW\_INTERLEAVED #. Channels - 2 #. Format - S16\_LE #. Period size - 64 - .. 
csv-table:: Audio Capture :header: "Sampling Rate (Hz)","am62pxx_sk-fs: Throughput (bits/sec)","am62pxx_sk-fs: CPU Load (%)" - "11025","352799.00 (min 352798.00, max 352800.00)","0.10 (min 0.09, max 0.10)" - "16000","511999.00 (min 511998.00, max 512000.00)","0.08 (min 0.06, max 0.09)" - "22050","705590.00 (min 705587.00, max 705593.00)","0.12 (min 0.11, max 0.13)" - "24000","705594.00 (min 705593.00, max 705595.00)","0.14 (min 0.12, max 0.16)" - "32000","1023994.50 (min 1023994.00, max 1023995.00)","0.10 (min 0.09, max 0.11)" - "44100","1411192.50 (min 1411192.00, max 1411193.00)","0.21 (min 0.20, max 0.21)" - "48000","1535993.00","0.16 (min 0.14, max 0.17)" - "88200","2822383.50 (min 2822383.00, max 2822384.00)","0.36 (min 0.34, max 0.38)" - "96000","3071979.00 (min 3071976.00, max 3071982.00)","0.15 (min 0.13, max 0.17)" - - - + "11025","352798.33 (min 352797.00, max 352800.00)","0.10 (min 0.08, max 0.10)" + "16000","511998.83 (min 511997.00, max 512002.00)","0.23 (min 0.08, max 0.48)" + "22050","705594.83 (min 705589.00, max 705599.00)","0.13 (min 0.11, max 0.15)" + "24000","705597.17 (min 705595.00, max 705599.00)","0.14 (min 0.13, max 0.15)" + "32000","1023996.67 (min 1023994.00, max 1023998.00)","0.23 (min 0.08, max 0.87)" + "44100","1411195.33 (min 1411192.00, max 1411197.00)","0.21 (min 0.20, max 0.23)" + "48000","1535995.17 (min 1535991.00, max 1535998.00)","0.26 (min 0.09, max 0.92)" + "88200","2822388.00 (min 2822381.00, max 2822394.00)","0.38 (min 0.35, max 0.40)" + "96000","3071985.50 (min 3071973.00, max 3071993.00)","0.19 (min 0.17, max 0.21)" .. 
csv-table:: Audio Playback :header: "Sampling Rate (Hz)","am62pxx_sk-fs: Throughput (bits/sec)","am62pxx_sk-fs: CPU Load (%)" - "11025","352945.00 (min 352944.00, max 352946.00)","0.09" - "16000","512211.50 (min 512210.00, max 512213.00)","0.08" - "22050","705861.00 (min 705832.00, max 705890.00)","0.12" - "24000","705890.00 (min 705888.00, max 705892.00)","0.12" - "32000","551611.50 (min 78799.00, max 1024424.00)","0.08 (min 0.07, max 0.09)" - "44100","1411538.00 (min 1411523.00, max 1411553.00)","0.17 (min 0.16, max 0.17)" - "48000","1536631.50 (min 1536627.00, max 1536636.00)","0.13 (min 0.11, max 0.14)" - "88200","2823566.00","0.31" - - + "11025","352946.33 (min 352945.00, max 352947.00)","0.09 (min 0.07, max 0.10)" + "16000","512213.17 (min 512210.00, max 512215.00)","0.08 (min 0.05, max 0.10)" + "22050","705849.17 (min 705824.00, max 705896.00)","0.11 (min 0.09, max 0.12)" + "24000","705891.33 (min 705888.00, max 705896.00)","0.13 (min 0.11, max 0.15)" + "32000","551612.00 (min 78800.00, max 1024427.00)","0.21 (min 0.05, max 0.84)" + "44100","1411628.17 (min 1411540.00, max 1411789.00)","0.18 (min 0.16, max 0.19)" + "48000","1536632.67 (min 1536629.00, max 1536635.00)","0.26 (min 0.12, max 0.51)" + "88200","2823553.00","0.34" + "96000","3073255.00","0.94" | Graphics SGX/RGX Driver -------------------------- - - +----------------------- GFXBench -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^^ Run GFXBench and capture performance reported (Score and Display rate in fps). All display outputs (HDMI, Displayport and/or LCD) are connected when running these tests .. 
csv-table:: GFXBench Performance :header: "Benchmark","am62pxx_sk-fs: Score","am62pxx_sk-fs: Fps" - " GFXBench 3.x gl_manhattan_off","907.49 (min 904.94, max 910.05)","14.64 (min 14.60, max 14.68)" - " GFXBench 3.x gl_trex_off","1587.44 (min 1586.08, max 1588.81)","28.35 (min 28.32, max 28.37)" - " GFXBench 4.x gl_4_off","260.73 (min 260.25, max 261.21)","4.41 (min 4.40, max 4.42)" - " GFXBench 5.x gl_5_high_off","114.18 (min 113.75, max 114.61)","1.78 (min 1.77, max 1.78)" - - - + " GFXBench 3.x gl_manhattan_off","906.46 (min 902.42, max 910.12)","14.62 (min 14.56, max 14.68)" + " GFXBench 3.x gl_trex_off","1582.33 (min 1576.54, max 1589.72)","28.26 (min 28.15, max 28.39)" + " GFXBench 4.x gl_4_off","260.66 (min 259.90, max 261.32)","4.41 (min 4.40, max 4.42)" + " GFXBench 5.x gl_5_high_off","114.64 (min 113.73, max 115.05)","1.78 (min 1.77, max 1.79)" Glmark2 -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^ Run Glmark2 and capture performance reported (Score). All display outputs (HDMI, Displayport and/or LCD) are connected when running these tests .. csv-table:: Glmark2 Performance :header: "Benchmark","am62pxx_sk-fs: Score" - "Glmark2-DRM","331.50 (min 308.00, max 355.00)" - "Glmark2-Wayland","738.00 (min 737.00, max 739.00)" - - -| - -Ethernet ------------------ -Ethernet performance benchmarks were measured using Netperf 2.7.1 https://hewlettpackard.github.io/netperf/doc/netperf.html -Test procedures were modeled after those defined in RFC-2544: -https://tools.ietf.org/html/rfc2544, where the DUT is the TI device -and the "tester" used was a Linux PC. To produce consistent results, -it is recommended to carry out performance tests in a private network and to avoid -running NFS on the same interface used in the test. In these results, -CPU utilization was captured as the total percentage used across all cores on the device, -while running the performance test over one external interface. 
- -UDP Throughput (0% loss) was measured by the procedure defined in RFC-2544 section 26.1: Throughput. -In this scenario, netperf options burst_size (-b) and wait_time (-w) are used to limit bandwidth -during different trials of the test, with the goal of finding the highest rate at which -no loss is seen. For example, to limit bandwidth to 500Mbits/sec with 1472B datagram: - -:: - - burst_size = <bandwidth (bits/sec)> / 8 (bits -> bytes) / <UDP datagram size> / 100 (seconds -> 10 ms) - burst_size = 500000000 / 8 / 1472 / 100 = 425 - - wait_time = 10 milliseconds (minimum supported by Linux PC used for testing) - -UDP Throughput (possible loss) was measured by capturing throughput and packet loss statistics when -running the netperf test with no bandwidth limit (remove -b/-w options). - -In order to start a netperf client on one device, the other device must have netserver running. -To start netserver: - -:: - - netserver [-p <port_number>] [-4 (IPv4 addressing)] [-6 (IPv6 addressing)] - -Running the following shell script from the DUT will trigger netperf clients to measure -bidirectional TCP performance for 60 seconds and report CPU utilization. Parameter -k is used in -client commands to summarize selected statistics on their own line and -j is used to gain -additional timing measurements during the test. - -:: - - #!/bin/bash - for i in 1 - do - netperf -H <tester ip> -j -c -l 60 -t TCP_STREAM -- - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE & - - netperf -H <tester ip> -j -c -l 60 -t TCP_MAERTS -- - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE & - done - -Running the following commands will trigger netperf clients to measure UDP burst performance for -60 seconds at various burst/datagram sizes and report CPU utilization. - -- For UDP egress tests, run netperf client from DUT and start netserver on tester.
- -:: - - netperf -H <tester ip> -j -c -l 60 -t UDP_STREAM -b <burst_size> -w <wait_time> -- -m <UDP datagram size> - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE - -- For UDP ingress tests, run netperf client from tester and start netserver on DUT. - -:: - - netperf -H <DUT ip> -j -C -l 60 -t UDP_STREAM -b <burst_size> -w <wait_time> -- -m <UDP datagram size> - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE - - -CPSW/CPSW2g/CPSW3g Ethernet Driver -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - - -.. rubric:: TCP Bidirectional Throughput - :name: CPSW2g-tcp-bidirectional-throughput - -.. csv-table:: CPSW2g TCP Bidirectional Throughput - :header: "Command Used","am62pxx_sk-fs: THROUGHPUT (Mbits/sec)","am62pxx_sk-fs: CPU Load % (LOCAL_CPU_UTIL)" - - "netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_STREAM; netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_MAERTS","1797.44 (min 1756.87, max 1838.01)","63.06 (min 62.52, max 63.60)" - - - - -.. rubric:: TCP Bidirectional Throughput Interrupt Pacing - :name: CPSW2g-tcp-bidirectional-throughput-interrupt-pacing - -.. csv-table:: CPSW2g TCP Bidirectional Throughput Interrupt Pacing - :header: "Command Used","am62pxx_sk-fs: THROUGHPUT (Mbits/sec)","am62pxx_sk-fs: CPU Load % (LOCAL_CPU_UTIL)" - - "netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_STREAM; netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_MAERTS","1785.70 (min 1694.75, max 1876.65)","37.27 (min 35.52, max 39.01)" - - - - -.. rubric:: UDP Throughput - :name: CPSW2g-udp-throughput-0-loss - -..
csv-table:: CPSW2g UDP Egress Throughput 0 loss - :header: "Frame Size(bytes)","am62pxx_sk-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62pxx_sk-fs: THROUGHPUT (Mbits/sec)","am62pxx_sk-fs: Packets Per Second (kPPS)","am62pxx_sk-fs: CPU Load % (LOCAL_CPU_UTIL)" - - "64","","56.49 (min 56.42, max 56.55)","110.00","40.52 (min 40.38, max 40.65)" - "128","","110.21 (min 110.19, max 110.22)","108.00","40.07 (min 40.03, max 40.10)" - "256","","220.01 (min 219.29, max 220.73)","107.50 (min 107.00, max 108.00)","39.97 (min 39.60, max 40.33)" - "1024","","861.68 (min 859.04, max 864.32)","105.50 (min 105.00, max 106.00)","40.73 (min 40.59, max 40.87)" - "1518","","846.42 (min 840.54, max 852.30)","69.50 (min 69.00, max 70.00)","37.22 (min 37.16, max 37.28)" - + "Glmark2-DRM","314.14 (min 307.00, max 354.00)" + "Glmark2-Wayland","730.75 (min 717.00, max 746.00)" | Linux OSPI Flash Driver -------------------------- - - -AM62PXX-SK -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +----------------------- +.. rubric:: AM62PXX-SK + :name: am62pxx-sk-ospi -UBIFS -""""""""""""""""""""""""""" +.. rubric:: UBIFS + :name: am62pxx-sk-ospi-ubifs .. 
csv-table:: OSPI Flash Driver :header: "Buffer size (bytes)","am62pxx_sk-fs: Write UBIFS Throughput (Mbytes/sec)","am62pxx_sk-fs: Write UBIFS CPU Load (%)","am62pxx_sk-fs: Read UBIFS Throughput (Mbytes/sec)","am62pxx_sk-fs: Read UBIFS CPU Load (%)" - "102400","0.17 (min 0.12, max 0.28)","29.48 (min 24.79, max 33.84)","28.51 (min 28.45, max 28.57)","9.90 (min 6.90, max 12.90)" - "262144","0.14 (min 0.10, max 0.18)","29.48 (min 27.27, max 31.62)","28.46 (min 28.38, max 28.54)","6.73 (min 3.45, max 10.00)" - "524288","0.14 (min 0.10, max 0.19)","29.39 (min 26.96, max 31.81)","28.23 (min 28.10, max 28.36)","8.34 (min 6.67, max 10.00)" - "1048576","0.14 (min 0.10, max 0.18)","29.92 (min 26.75, max 34.88)","28.09 (min 28.07, max 28.11)","9.68" + "102400","0.17 (min 0.12, max 0.28)","28.77 (min 24.69, max 33.84)","28.45 (min 28.34, max 28.64)","7.08 (min 3.57, max 12.50)" + "262144","0.14 (min 0.10, max 0.18)","29.70 (min 25.14, max 35.52)","28.38 (min 28.03, max 28.59)","8.42 (min 3.45, max 12.90)" + "524288","0.14 (min 0.10, max 0.18)","29.68 (min 26.42, max 33.97)","28.23 (min 27.97, max 28.56)","7.52 (min 3.45, max 12.50)" + "1048576","0.14 (min 0.10, max 0.18)","29.89 (min 26.72, max 33.36)","27.96 (min 27.72, max 28.27)","7.96 (min 6.67, max 9.68)" -RAW -""""""""""""""""""""""""""" +.. rubric:: RAW + :name: am62pxx-sk-ospi-raw .. csv-table:: OSPI Raw Flash Driver :header: "File size (Mbytes)","am62pxx_sk-fs: Raw Read Throughput (Mbytes/sec)" - "50","37.88" - + "50","37.79 (min 37.31, max 37.88)" EMMC Driver ----------- @@ -616,21 +471,16 @@ EMMC Driver sensitive applications, umount the auto-mounted filesystem and re-mount in async mode. - - EMMC EXT4 FIO 1G ^^^^^^^^^^^^^^^^ - .. 
csv-table:: EMMC EXT4 FIO 1G :header: "Buffer size (bytes)","am62pxx_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62pxx_sk-fs: Write EXT4 CPU Load (%)","am62pxx_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62pxx_sk-fs: Read EXT4 CPU Load (%)" - "1m","91.85 (min 90.70, max 93.00)","1.62 (min 1.60, max 1.63)","287.00 (min 285.00, max 289.00)","2.73 (min 2.65, max 2.81)" - "4m","97.50 (min 96.30, max 98.70)","1.12 (min 1.07, max 1.16)","288.00 (min 287.00, max 289.00)","2.14 (min 2.04, max 2.24)" - "4k","79.35 (min 79.20, max 79.50)","25.76 (min 25.60, max 25.92)","89.90 (min 89.20, max 90.60)","20.93 (min 20.67, max 21.18)" - "256k","91.85 (min 90.50, max 93.20)","2.08 (min 1.97, max 2.18)","290.50 (min 287.00, max 294.00)","4.03 (min 3.96, max 4.09)" - - + "1m","91.41 (min 90.40, max 92.50)","1.55 (min 1.48, max 1.61)","284.00 (min 276.00, max 289.00)","2.61 (min 2.33, max 2.79)" + "4m","95.41 (min 90.40, max 97.50)","1.06 (min 1.00, max 1.13)","230.14 (min 153.00, max 288.00)","1.72 (min 1.26, max 2.10)" + "4k","79.04 (min 78.90, max 79.30)","25.61 (min 25.54, max 25.65)","91.77 (min 89.20, max 93.10)","21.42 (min 20.63, max 21.94)" + "256k","91.33 (min 90.70, max 91.80)","1.97 (min 1.84, max 2.09)","288.43 (min 280.00, max 291.00)","4.00 (min 3.76, max 4.15)" EMMC RAW FIO 1G ^^^^^^^^^^^^^^^ @@ -638,12 +488,10 @@ EMMC RAW FIO 1G .. 
csv-table:: EMMC RAW FIO 1G :header: "Buffer size (bytes)","am62pxx_sk-fs: Write Raw Throughput (Mbytes/sec)","am62pxx_sk-fs: Write Raw CPU Load (%)","am62pxx_sk-fs: Read Raw Throughput (Mbytes/sec)","am62pxx_sk-fs: Read Raw CPU Load (%)" - "1m","90.00 (min 89.90, max 90.10)","1.36 (min 1.33, max 1.38)","293.00 (min 292.00, max 294.00)","2.61 (min 2.52, max 2.69)" - "4m","97.10 (min 97.00, max 97.20)","1.03 (min 1.01, max 1.05)","293.00 (min 292.00, max 294.00)","2.07 (min 2.05, max 2.08)" - "4k","77.15 (min 76.80, max 77.50)","19.09 (min 19.07, max 19.11)","93.05 (min 93.00, max 93.10)","20.30 (min 19.97, max 20.62)" - "256k","90.25 (min 90.10, max 90.40)","1.76 (min 1.74, max 1.77)","293.00 (min 292.00, max 294.00)","3.80 (min 3.70, max 3.89)" - - + "1m","90.53 (min 89.80, max 91.30)","1.37 (min 1.21, max 1.54)","293.29 (min 292.00, max 294.00)","2.64 (min 2.37, max 2.89)" + "4m","96.93 (min 96.50, max 97.50)","0.97 (min 0.86, max 1.03)","277.00 (min 182.00, max 294.00)","1.90 (min 1.48, max 2.09)" + "4k","76.76 (min 76.40, max 77.10)","18.94 (min 18.79, max 19.25)","92.90 (min 92.50, max 93.10)","20.21 (min 19.71, max 20.64)" + "256k","90.53 (min 89.70, max 91.40)","1.73 (min 1.53, max 1.95)","293.57 (min 293.00, max 294.00)","3.83 (min 3.73, max 3.91)" EMMC EXT4 ^^^^^^^^^ @@ -651,50 +499,32 @@ EMMC EXT4 .. 
csv-table:: EMMC EXT4 :header: "Buffer size (bytes)","am62pxx_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62pxx_sk-fs: Write EXT4 CPU Load (%)","am62pxx_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62pxx_sk-fs: Read EXT4 CPU Load (%)" - "102400","84.05 (min 80.55, max 87.86)","5.95 (min 4.96, max 8.05)","178.95 (min 178.88, max 179.02)","8.77 (min 6.99, max 10.55)" - "262144","82.22 (min 55.62, max 88.94)","5.71 (min 3.58, max 7.89)","181.33 (min 181.30, max 181.36)","8.53 (min 8.33, max 8.73)" - "524288","76.21 (min 48.83, max 88.87)","5.38 (min 3.31, max 8.06)","182.11 (min 182.06, max 182.16)","10.34 (min 6.70, max 13.97)" - "1048576","74.12 (min 49.72, max 89.67)","4.95 (min 2.92, max 7.84)","177.80 (min 173.33, max 182.26)","8.91 (min 6.75, max 11.06)" - "5242880","68.44 (min 48.58, max 88.72)","4.75 (min 2.96, max 7.38)","182.00 (min 181.88, max 182.12)","8.88 (min 7.49, max 10.26)" - - -EMMC EXT2 -^^^^^^^^^ - - -.. csv-table:: EMMC EXT2 - :header: "Buffer size (bytes)","am62pxx_sk-fs: Write EXT2 Throughput (Mbytes/sec)","am62pxx_sk-fs: Write EXT2 CPU Load (%)","am62pxx_sk-fs: Read EXT2 Throughput (Mbytes/sec)","am62pxx_sk-fs: Read EXT2 CPU Load (%)" - - "102400","46.66 (min 23.83, max 53.41)","6.19 (min 4.83, max 10.22)","206.14 (min 200.43, max 211.85)","10.42 (min 10.26, max 10.58)" - "262144","54.96 (min 26.84, max 64.68)","6.91 (min 5.78, max 10.03)","291.88 (min 291.15, max 292.60)","15.85 (min 15.49, max 16.20)" - "524288","64.23 (min 28.34, max 76.47)","6.02 (min 4.83, max 9.01)","296.85 (min 296.22, max 297.48)","14.93 (min 13.77, max 16.08)" - "1048576","65.71 (min 28.66, max 78.49)","6.38 (min 4.49, max 8.85)","294.03 (min 293.85, max 294.20)","16.03 (min 15.97, max 16.08)" - "5242880","70.98 (min 28.72, max 85.64)","6.08 (min 4.55, max 8.90)","295.09 (min 295.08, max 295.10)","14.73 (min 14.18, max 15.28)" - + "102400","83.27 (min 52.29, max 89.46)","5.94 (min 4.97, max 8.11)","178.78 (min 178.64, max 178.91)","8.44 (min 6.58, max 10.13)" + 
"262144","80.06 (min 49.05, max 89.23)","5.71 (min 3.40, max 8.43)","179.72 (min 172.91, max 181.11)","9.36 (min 8.77, max 9.91)" + "524288","75.36 (min 49.32, max 89.16)","5.33 (min 3.06, max 8.14)","180.13 (min 176.40, max 181.89)","8.74 (min 8.26, max 9.87)" + "1048576","75.65 (min 47.53, max 88.93)","5.37 (min 2.72, max 8.45)","181.47 (min 180.95, max 181.87)","8.62 (min 7.86, max 9.44)" + "5242880","76.21 (min 49.34, max 89.86)","5.37 (min 3.02, max 7.98)","180.45 (min 174.59, max 181.97)","8.71 (min 8.30, max 9.52)" EMMC VFAT ^^^^^^^^^ - .. csv-table:: EMMC VFAT :header: "Buffer size (bytes)","am62pxx_sk-fs: Write VFAT Throughput (Mbytes/sec)","am62pxx_sk-fs: Write VFAT CPU Load (%)","am62pxx_sk-fs: Read VFAT Throughput (Mbytes/sec)","am62pxx_sk-fs: Read VFAT CPU Load (%)" - "102400","40.66 (min 11.88, max 52.29)","5.07 (min 3.58, max 6.10)","208.81 (min 208.70, max 208.92)","10.36 (min 10.10, max 10.61)" - "262144","44.56 (min 12.48, max 62.93)","5.60 (min 4.40, max 7.81)","286.09 (min 284.98, max 287.19)","15.45 (min 14.56, max 16.33)" - "524288","50.91 (min 12.75, max 73.51)","5.09 (min 3.68, max 7.64)","287.77 (min 287.04, max 288.49)","14.77 (min 13.89, max 15.65)" - "1048576","55.28 (min 12.88, max 75.16)","5.00 (min 3.83, max 6.45)","287.39 (min 286.35, max 288.43)","14.48 (min 14.38, max 14.58)" - "5242880","56.43 (min 13.03, max 81.90)","5.02 (min 3.73, max 6.68)","287.22 (min 287.00, max 287.43)","14.78 (min 14.48, max 15.07)" - + "102400","39.61 (min 11.80, max 52.28)","5.21 (min 3.66, max 6.47)","208.97 (min 208.62, max 209.38)","11.07 (min 9.23, max 12.81)" + "262144","44.50 (min 12.47, max 62.38)","6.00 (min 4.12, max 9.12)","287.77 (min 285.96, max 289.30)","15.04 (min 12.77, max 16.55)" + "524288","50.98 (min 12.69, max 73.49)","5.12 (min 3.75, max 7.69)","287.10 (min 285.81, max 288.26)","15.14 (min 14.58, max 16.11)" + "1048576","53.77 (min 12.83, max 75.68)","5.03 (min 3.49, max 6.69)","287.01 (min 285.60, max 288.35)","14.66 (min 13.29, 
max 15.75)" + "5242880","55.67 (min 13.01, max 81.71)","5.12 (min 3.81, max 6.94)","286.37 (min 280.42, max 288.38)","13.94 (min 12.77, max 15.75)" UBoot EMMC Driver ----------------- - .. csv-table:: UBOOT EMMC RAW :header: "File size (bytes in hex)","am62pxx_sk-fs: Write Throughput (Kbytes/sec)","am62pxx_sk-fs: Read Throughput (Kbytes/sec)" - "2000000","99571.30 (min 97523.81, max 103044.03)","234574.66 (min 172463.16, max 277694.92)" - "4000000","97976.11 (min 96946.75, max 100054.96)","260546.71 (min 172918.21, max 300623.85)" + "2000000","96461.77 (min 93891.12, max 100515.34)","215037.67 (min 146285.71, max 282482.76)" + "4000000","97228.73 (min 95812.87, max 99447.65)","259335.04 (min 229950.88, max 296542.99)" MMCSD ----- @@ -707,76 +537,39 @@ MMCSD sensitive applications, umount the auto-mounted filesystem and re-mount in async mode. - MMC EXT4 FIO 1G ^^^^^^^^^^^^^^^ - .. csv-table:: MMC EXT4 FIO 1G :header: "Buffer size (bytes)","am62pxx_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62pxx_sk-fs: Write EXT4 CPU Load (%)","am62pxx_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62pxx_sk-fs: Read EXT4 CPU Load (%)" - "1m","41.80 (min 41.60, max 42.00)","1.01","87.30","1.38 (min 1.32, max 1.44)" - "4m","41.95 (min 41.20, max 42.70)","0.75 (min 0.74, max 0.76)","87.15 (min 87.10, max 87.20)","0.97 (min 0.96, max 0.97)" - "4k","2.80 (min 2.78, max 2.83)","1.70 (min 1.66, max 1.73)","12.95 (min 12.90, max 13.00)","4.24 (min 4.17, max 4.30)" - "256k","37.85 (min 37.20, max 38.50)","1.26 (min 1.22, max 1.30)","83.85 (min 83.80, max 83.90)","1.63 (min 1.60, max 1.65)" - - + "1m","42.59 (min 41.40, max 43.40)","1.06 (min 1.01, max 1.16)","87.31 (min 87.20, max 87.40)","1.29 (min 1.15, max 1.39)" + "4m","42.17 (min 41.40, max 43.30)","0.71 (min 0.64, max 0.76)","87.24 (min 87.10, max 87.30)","0.92 (min 0.87, max 0.98)" + "4k","2.80 (min 2.78, max 2.83)","1.67 (min 1.60, max 1.75)","12.94 (min 12.80, max 13.20)","4.31 (min 4.01, max 4.52)" + "256k","38.44 (min 36.60, max 
39.10)","1.25 (min 1.20, max 1.31)","83.47 (min 83.20, max 83.80)","1.52 (min 1.44, max 1.61)" MMC RAW FIO 1G ^^^^^^^^^^^^^^ - .. csv-table:: MMC RAW FIO 1G :header: "Buffer size (bytes)","am62pxx_sk-fs: Write Raw Throughput (Mbytes/sec)","am62pxx_sk-fs: Write Raw CPU Load (%)","am62pxx_sk-fs: Read Raw Throughput (Mbytes/sec)","am62pxx_sk-fs: Read Raw CPU Load (%)" - "1m","44.20 (min 43.70, max 44.70)","0.96 (min 0.93, max 0.98)","88.20","1.18 (min 1.15, max 1.20)" - "4m","43.90 (min 43.70, max 44.10)","0.75 (min 0.72, max 0.77)","88.20","0.92 (min 0.88, max 0.96)" - "4k","2.81","1.35 (min 1.33, max 1.36)","13.05 (min 13.00, max 13.10)","3.95 (min 3.87, max 4.03)" - "256k","39.70 (min 38.30, max 41.10)","1.09 (min 1.05, max 1.12)","84.40 (min 84.30, max 84.50)","1.48 (min 1.47, max 1.49)" + "1m","43.59 (min 42.40, max 45.10)","0.91 (min 0.86, max 1.01)","88.19 (min 88.10, max 88.30)","1.14 (min 1.09, max 1.22)" + "4m","43.20 (min 42.10, max 45.00)","0.70 (min 0.63, max 0.76)","88.14 (min 88.00, max 88.30)","0.90 (min 0.84, max 0.96)" + "4k","2.81 (min 2.80, max 2.83)","1.38 (min 1.33, max 1.43)","13.06 (min 13.00, max 13.10)","3.91 (min 3.82, max 4.06)" + "256k","38.00 (min 36.20, max 41.40)","1.02 (min 0.96, max 1.08)","84.33 (min 84.20, max 84.50)","1.44 (min 1.38, max 1.50)" MMC EXT4 ^^^^^^^^ - .. 
csv-table:: MMC EXT4 :header: "Buffer size (bytes)","am62pxx_sk-fs: Write Raw Throughput (Mbytes/sec)","am62pxx_sk-fs: Write Raw CPU Load (%)","am62pxx_sk-fs: Read Raw Throughput (Mbytes/sec)","am62pxx_sk-fs: Read Raw CPU Load (%)" - "102400","10.86 (min 10.44, max 11.24)","0.84 (min 0.72, max 1.12)","11.82","0.71" - "262144","10.63 (min 10.46, max 10.79)","0.86 (min 0.67, max 1.15)","11.08 (min 11.00, max 11.16)","0.78 (min 0.71, max 0.85)" - "524288","10.41 (min 10.31, max 10.54)","0.79 (min 0.63, max 1.08)","11.29 (min 11.05, max 11.52)","0.69 (min 0.63, max 0.74)" - "1048576","10.54 (min 10.25, max 10.84)","0.85 (min 0.70, max 1.13)","11.05 (min 11.02, max 11.07)","0.66" - "5242880","10.52 (min 10.28, max 10.72)","0.84 (min 0.69, max 1.16)","11.30 (min 11.08, max 11.52)","0.67 (min 0.63, max 0.71)" - - - - -MMC EXT3 -^^^^^^^^ - - -.. csv-table:: MMC EXT3 - :header: "Buffer size (bytes)","am62pxx_sk-fs: Write Raw Throughput (Mbytes/sec)","am62pxx_sk-fs: Write Raw CPU Load (%)","am62pxx_sk-fs: Read Raw Throughput (Mbytes/sec)","am62pxx_sk-fs: Read Raw CPU Load (%)" - - "102400","39.34 (min 33.29, max 41.31)","3.58 (min 2.85, max 6.03)","78.75 (min 77.10, max 80.39)","5.35 (min 4.42, max 6.27)" - "262144","38.50 (min 33.14, max 41.93)","3.38 (min 2.42, max 6.09)","84.29 (min 82.02, max 86.55)","5.69 (min 5.36, max 6.02)" - "524288","36.83 (min 32.58, max 38.61)","3.34 (min 2.45, max 5.43)","90.39 (min 90.30, max 90.48)","5.26 (min 5.16, max 5.36)" - "1048576","38.74 (min 32.47, max 41.44)","3.34 (min 2.37, max 5.98)","90.10 (min 89.80, max 90.39)","5.04 (min 4.93, max 5.15)" - "5242880","38.13 (min 33.25, max 41.45)","3.28 (min 2.33, max 5.60)","90.13 (min 89.93, max 90.33)","5.04 (min 4.73, max 5.34)" - - - -MMC EXT2 -^^^^^^^^ - - -.. 
csv-table:: MMC EXT2 - :header: "Buffer size (bytes)","am62pxx_sk-fs: Write Raw Throughput (Mbytes/sec)","am62pxx_sk-fs: Write Raw CPU Load (%)","am62pxx_sk-fs: Read Raw Throughput (Mbytes/sec)","am62pxx_sk-fs: Read Raw CPU Load (%)" - - "102400","17.50 (min 3.49, max 21.20)","2.52 (min 2.13, max 2.86)","80.73 (min 80.69, max 80.77)","4.44 (min 4.26, max 4.62)" - "262144","30.77 (min 3.87, max 39.22)","3.32 (min 2.15, max 3.89)","86.89 (min 86.64, max 87.13)","5.18 (min 4.96, max 5.39)" - "524288","35.27 (min 3.96, max 44.35)","3.26 (min 2.12, max 4.01)","90.33 (min 90.28, max 90.37)","4.95 (min 4.74, max 5.16)" - "1048576","34.26 (min 4.01, max 43.23)","2.82 (min 1.88, max 3.57)","90.69 (min 90.61, max 90.76)","4.97 (min 4.55, max 5.39)" - "5242880","33.95 (min 4.03, max 42.47)","2.61 (min 1.97, max 3.23)","87.86 (min 85.16, max 90.55)","5.11 (min 4.75, max 5.47)" + "102400","10.75 (min 10.41, max 11.18)","0.83 (min 0.67, max 1.20)","11.19 (min 10.89, max 11.82)","0.75 (min 0.68, max 0.90)" + "262144","10.43 (min 10.25, max 10.62)","0.90 (min 0.68, max 1.46)","11.14 (min 10.99, max 11.22)","0.73 (min 0.63, max 0.78)" + "524288","10.46 (min 10.29, max 10.86)","0.81 (min 0.65, max 1.20)","11.10 (min 10.85, max 11.50)","0.68 (min 0.61, max 0.88)" + "1048576","10.49 (min 10.27, max 10.76)","0.88 (min 0.68, max 1.18)","11.06 (min 10.85, max 11.50)","0.66 (min 0.58, max 0.74)" + "5242880","10.64 (min 10.27, max 11.12)","0.83 (min 0.64, max 1.20)","11.59 (min 10.97, max 12.03)","0.66 (min 0.58, max 0.73)" The performance numbers were captured using the following: @@ -786,188 +579,113 @@ The performance numbers were captured using the following: UBoot MMCSD ----------- - UBOOT MMCSD FAT ^^^^^^^^^^^^^^^ .. 
csv-table:: UBOOT MMCSD FAT :header: "File size (bytes in hex)","am62pxx_sk-fs: Write Throughput (Kbytes/sec)","am62pxx_sk-fs: Read Throughput (Kbytes/sec)" - "400000","36597.69 (min 35617.39, max 37577.98)","82755.92 (min 81920.00, max 83591.84)" - "800000","38524.54 (min 32768.00, max 44281.08)","86690.26 (min 86231.58, max 87148.94)" - "1000000","45309.46 (min 41269.52, max 49349.40)","89530.05" - - + "400000","36689.07 (min 28054.79, max 43574.47)","82875.34 (min 81920.00, max 83591.84)" + "800000","40145.70 (min 33032.26, max 47627.91)","87148.94" + "1000000","48396.32 (min 42555.84, max 51360.50)","89670.60 (min 89530.05, max 90021.98)" The performance numbers were captured using the following: - SanDisk Max Endurance SD card (SDSQQVR-032G-GN6IA) - - | USB Driver -------------------------- +---------- USB Device Controller -^^^^^^^^^^^^^^^^^^^^^^^^^^^ - +^^^^^^^^^^^^^^^^^^^^^ .. csv-table:: USBDEVICE HIGHSPEED SLAVE_READ_THROUGHPUT :header: "Number of Blocks","am62pxx_sk-fs: Throughput (MB/sec)" - "150","38.95 (min 33.90, max 44.00)" - - - + "150","30.13 (min 26.60, max 43.90)" .. csv-table:: USBDEVICE HIGHSPEED SLAVE_WRITE_THROUGHPUT :header: "Number of Blocks","am62pxx_sk-fs: Throughput (MB/sec)" - "150","32.50 (min 27.90, max 37.10)" + "150","25.53 (min 21.90, max 37.10)" | CRYPTO Driver -------------------------- - +------------- OpenSSL Performance -^^^^^^^^^^^^^^^^^^^^^^^^^^^ +^^^^^^^^^^^^^^^^^^^ .. 
csv-table:: OpenSSL Performance :header: "Algorithm","Buffer Size (in bytes)","am62pxx_sk-fs: throughput (KBytes/Sec)" - "aes-128-cbc","1024","22944.60 (min 22896.64, max 22992.55)" - "aes-128-cbc","16","411.11 (min 409.66, max 412.57)" - "aes-128-cbc","16384","84309.33 (min 83656.70, max 84961.96)" - "aes-128-cbc","256","6772.78 (min 6760.02, max 6785.54)" - "aes-128-cbc","64","1800.77 (min 1799.74, max 1801.79)" - "aes-128-cbc","8192","70837.59 (min 70579.54, max 71095.64)" - "aes-128-ecb","1024","23454.04 (min 23428.44, max 23479.64)" - "aes-128-ecb","16","419.04 (min 418.92, max 419.16)" - "aes-128-ecb","16384","87053.65 (min 86736.90, max 87370.41)" - "aes-128-ecb","256","6953.86 (min 6949.72, max 6957.99)" - "aes-128-ecb","64","1843.58 (min 1842.69, max 1844.48)" - "aes-128-ecb","8192","73486.34 (min 73394.86, max 73577.81)" - "aes-192-cbc","1024","22431.23 (min 22398.63, max 22463.83)" - "aes-192-cbc","16","412.38 (min 411.57, max 413.18)" - "aes-192-cbc","16384","76283.90 (min 75776.00, max 76791.81)" - "aes-192-cbc","256","6698.28 (min 6681.17, max 6715.39)" - "aes-192-cbc","64","1806.75 (min 1803.65, max 1809.86)" - "aes-192-cbc","8192","65279.32 (min 65077.25, max 65481.39)" - "aes-192-ecb","1024","22946.13 (min 22890.50, max 23001.77)" - "aes-192-ecb","16","418.73 (min 417.76, max 419.71)" - "aes-192-ecb","16384","78452.05 (min 78386.52, max 78517.59)" - "aes-192-ecb","256","6863.70 (min 6831.53, max 6895.87)" - "aes-192-ecb","64","1837.65 (min 1836.99, max 1838.31)" - "aes-192-ecb","8192","67362.82 (min 67193.51, max 67532.12)" - "aes-256-cbc","1024","21829.12 (min 21806.08, max 21852.16)" - "aes-256-cbc","16","413.87 (min 412.79, max 414.94)" - "aes-256-cbc","16384","69869.57 (min 69637.46, max 70101.67)" - "aes-256-cbc","256","6656.51 (min 6655.06, max 6657.96)" - "aes-256-cbc","64","1801.61 (min 1798.98, max 1804.25)" - "aes-256-cbc","8192","60593.49 (min 60481.54, max 60705.45)" - "aes-256-ecb","1024","22341.97 (min 22245.72, max 22438.23)" - 
"aes-256-ecb","16","419.94 (min 419.53, max 420.34)" - "aes-256-ecb","16384","71841.11 (min 71483.39, max 72198.83)" - "aes-256-ecb","256","6813.27 (min 6799.96, max 6826.58)" - "aes-256-ecb","64","1831.33 (min 1828.18, max 1834.47)" - "aes-256-ecb","8192","61456.38 (min 61265.24, max 61647.53)" - "sha256","1024","38186.15 (min 38049.11, max 38323.20)" - "sha256","16","631.57 (min 630.11, max 633.04)" - "sha256","16384","298710.36 (min 298647.55, max 298773.16)" - "sha256","256","9972.44 (min 9929.05, max 10015.83)" - "sha256","64","2497.73 (min 2488.73, max 2506.73)" - "sha256","8192","202798.42 (min 202312.36, max 203284.48)" - "sha512","1024","26188.97 (min 26184.36, max 26193.58)" - "sha512","16","612.37 (min 610.09, max 614.65)" - "sha512","16384","68296.70 (min 68277.59, max 68315.82)" - "sha512","256","8686.17 (min 8669.53, max 8702.81)" - "sha512","64","2451.79 (min 2442.45, max 2461.12)" - "sha512","8192","61581.99 (min 61562.88, max 61601.11)" - - + "aes-128-cbc","1024","23874.22 (min 22797.65, max 24305.66)" + "aes-128-cbc","16","433.40 (min 414.08, max 439.83)" + "aes-128-cbc","16384","86033.94 (min 84885.50, max 86523.90)" + "aes-128-cbc","256","7133.66 (min 6779.65, max 7281.83)" + "aes-128-cbc","64","1854.41 (min 1809.17, max 1895.91)" + "aes-128-cbc","8192","72677.86 (min 71183.02, max 73187.33)" + "aes-128-ecb","1024","24521.24 (min 23560.19, max 24830.98)" + "aes-128-ecb","16","444.84 (min 423.89, max 450.61)" + "aes-128-ecb","16384","88832.49 (min 87801.86, max 89511.25)" + "aes-128-ecb","256","7297.62 (min 6986.33, max 7385.43)" + "aes-128-ecb","64","1921.89 (min 1846.42, max 1959.10)" + "aes-128-ecb","8192","74998.15 (min 72996.18, max 75606.70)" + "aes-192-cbc","1024","23428.24 (min 22448.13, max 23803.22)" + "aes-192-cbc","16","433.98 (min 413.37, max 440.67)" + "aes-192-cbc","16384","77998.76 (min 76961.11, max 78419.29)" + "aes-192-cbc","256","7084.75 (min 6741.16, max 7235.16)" + "aes-192-cbc","64","1858.29 (min 1806.49, max 1907.71)" + 
"aes-192-cbc","8192","66915.77 (min 65544.19, max 67439.27)" + "aes-192-ecb","1024","24060.10 (min 23176.19, max 24450.05)" + "aes-192-ecb","16","444.52 (min 424.39, max 449.94)" + "aes-192-ecb","16384","80076.41 (min 78779.73, max 80767.66)" + "aes-192-ecb","256","7282.65 (min 6920.45, max 7394.73)" + "aes-192-ecb","64","1914.58 (min 1845.12, max 1949.12)" + "aes-192-ecb","8192","68555.34 (min 67365.55, max 69383.51)" + "aes-256-cbc","1024","22864.60 (min 21938.52, max 23255.72)" + "aes-256-cbc","16","435.49 (min 413.74, max 442.78)" + "aes-256-cbc","16384","70860.02 (min 69817.69, max 71636.31)" + "aes-256-cbc","256","7052.84 (min 6704.38, max 7207.94)" + "aes-256-cbc","64","1867.00 (min 1805.76, max 1916.16)" + "aes-256-cbc","8192","61503.98 (min 60598.95, max 62406.66)" + "aes-256-ecb","1024","23521.77 (min 22587.39, max 23857.15)" + "aes-256-ecb","16","444.28 (min 425.70, max 450.73)" + "aes-256-ecb","16384","72667.72 (min 72176.98, max 73558.70)" + "aes-256-ecb","256","7234.73 (min 6907.56, max 7374.17)" + "aes-256-ecb","64","1913.51 (min 1846.23, max 1957.03)" + "aes-256-ecb","8192","63232.10 (min 62390.27, max 63744.68)" + "sha256","1024","37936.08 (min 37196.12, max 38420.14)" + "sha256","16","632.25 (min 614.09, max 639.77)" + "sha256","16384","299548.67 (min 296605.01, max 302246.57)" + "sha256","256","9906.47 (min 9659.73, max 10023.59)" + "sha256","64","2505.28 (min 2431.06, max 2528.36)" + "sha256","8192","203446.37 (min 199546.20, max 205512.70)" + "sha512","1024","26078.79 (min 25618.77, max 26265.94)" + "sha512","16","612.27 (min 590.90, max 623.37)" + "sha512","16384","68343.91 (min 67993.60, max 68517.89)" + "sha512","256","8707.43 (min 8436.31, max 8843.78)" + "sha512","64","2455.43 (min 2363.48, max 2505.77)" + "sha512","8192","61529.72 (min 61104.13, max 61680.30)" .. 
csv-table:: OpenSSL CPU Load :header: "Algorithm","am62pxx_sk-fs: CPU Load" - "aes-128-cbc","30.50 (min 30.00, max 31.00)" - "aes-128-ecb","32.00" - "aes-192-cbc","30.50 (min 30.00, max 31.00)" - "aes-192-ecb","31.00" - "aes-256-cbc","30.00" - "aes-256-ecb","30.50 (min 30.00, max 31.00)" - "sha256","95.00" - "sha512","94.50 (min 93.00, max 96.00)" + "aes-128-cbc","32.71 (min 31.00, max 33.00)" + "aes-128-ecb","33.86 (min 32.00, max 35.00)" + "aes-192-cbc","32.71 (min 31.00, max 33.00)" + "aes-192-ecb","33.29 (min 32.00, max 34.00)" + "aes-256-cbc","31.57 (min 30.00, max 32.00)" + "aes-256-ecb","32.43 (min 31.00, max 33.00)" + "sha256","95.57 (min 94.00, max 96.00)" + "sha512","95.86 (min 95.00, max 96.00)" +Listed for each algorithm are the code snippets used to run each + benchmark test. - -Low Power Performance ---------------------- - -Power Performance -^^^^^^^^^^^^^^^^^ - -.. csv-table:: Deep Sleep Power Performance - :header: "Rail name","Rail voltage(V)","Power (mW)" - - "vdd_core","0.85","14.36" - "vddr_core","0.85","1.03" - "soc_dvdd_3v3","3.30","6.02" - "soc_dvdd_1v8","1.80","2.78" - "vdda_1v8","1.80","67.41" - "vdd_lpddr4","1.10","4.92" - "Total"," ","96.52" - -.. csv-table:: MCU Only Power Performance - :header: "Rail name","Rail voltage(V)","Power (mW)" - - "vdd_core","0.85","213.68" - "vddr_core","0.85","2.79" - "soc_dvdd_3v3","3.30","7.52" - "soc_dvdd_1v8","1.80","2.85" - "vdda_1v8","1.80","75.91" - "vdd_lpddr4","1.10","5.12" - "Total"," ","307.88" - -Partial I/O Data -- All voltage rails were measured to be near 0V - -.. note:: - - The power consumption on the vdda_1v8 rail is not indicitive of the SoC's power consumption due to an oscillator on the rail - that has significant current consumption. - -.. note:: - - The measurements shown are from an AM62Px SK rev E1-1. Results may vary based off of the board revision being used. - -Further optimizations are possible for these low power modes. 
Please refer to the AM62x Power Consumption App Note (https://www.ti.com/lit/pdf/spradg1) - -Resume Latency Performance -^^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. csv-table:: LPM Resume Latency Performance - :header: "Low Power Mode","Total Resume Latency (ms)" - - "I/O Only + DDR", "716.68" - "Deep Sleep", "150.50" - "MCU Only", "94.06" - -The performance numbers are measured without the Linux printk logs. To remove the -Linux printk logs, run the following commands in the terminal: - -.. code:: console - - # Detach kernel serial console - consoles=$(find /sys/bus/platform/devices/*.serial/ -name console) - for console in ${consoles}; do - echo -n N > ${console} - done - - -.. note:: +:: - The measurements shown are from using the default SDK with no extra optimizations. + time -v openssl speed -elapsed -evp aes-128-cbc diff --git a/source/devices/AM62PX/linux/RT_Linux_Performance_Guide.rst b/source/devices/AM62PX/linux/RT_Linux_Performance_Guide.rst index 6d68d7b90..bf8923f02 100644 --- a/source/devices/AM62PX/linux/RT_Linux_Performance_Guide.rst +++ b/source/devices/AM62PX/linux/RT_Linux_Performance_Guide.rst @@ -1,6 +1,6 @@ -================================= - RT-linux 11.01 Performance Guide -================================= +======================================= + RT-linux 11.02.08.02 Performance Guide +======================================= .. rubric:: **Read This First** :name: read-this-first-kernel-perf-guide @@ -73,12 +73,3 @@ default SDK image Components section: :ref:`building-optee-with-prng`, and enabling the RNG node in the Linux kernel device tree. This way the HW TRNG is accessed from the kernel itself. - -.. csv-table:: - :header: "Latencies","CPU 0","CPU 1","CPU 2","CPU 3" - - "Minimum (usec)","5","5","5","5" - "Average (usec)","6","6","7","6" - "Maximum (usec)","36","34","37","34" - -.. 
image:: img/rt-cpu-method-all-latency-histogram.png diff --git a/source/devices/AM62X/linux/Linux_Performance_Guide.rst b/source/devices/AM62X/linux/Linux_Performance_Guide.rst index 9d5d7844e..174b1ff90 100644 --- a/source/devices/AM62X/linux/Linux_Performance_Guide.rst +++ b/source/devices/AM62X/linux/Linux_Performance_Guide.rst @@ -1,7 +1,7 @@ -============================== - Linux 11.01 Performance Guide -============================== +==================================== + Linux 11.02.08.02 Performance Guide +==================================== .. rubric:: **Read This First** :name: read-this-first-kernel-perf-guide @@ -34,20 +34,17 @@ with drivers included in a particular release. :name: if-you-need-assistance-kernel-perf-guide For further information or to report any problems, contact -http://e2e.ti.com/ or http://support.ti.com/ - +https://e2e.ti.com/ or https://support.ti.com/ System Benchmarks ----------------- - - LMBench ^^^^^^^ -LMBench is a collection of microbenchmarks of which the memory bandwidth -and latency related ones are typically used to estimate processor +LMBench is a collection of microbenchmarks of which the memory bandwidth +and latency related ones are typically used to estimate processor memory system performance. More information about lmbench at -http://lmbench.sourceforge.net/whatis_lmbench.html and -http://lmbench.sourceforge.net/man/lmbench.8.html +https://lmbench.sourceforge.net/whatis_lmbench.html and +https://lmbench.sourceforge.net/man/lmbench.8.html **Latency**: lat_mem_rd-stride128-szN, where N is equal to or smaller than the cache size at given level measures the cache miss penalty. N that is at least @@ -69,123 +66,121 @@ Execute the LMBench with the following: .. 
csv-table:: LMBench Benchmarks :header: "Benchmarks","am62xx_lp_sk-fs: perf","am62xx_sk-fs: perf","am62xxsip_sk-fs: perf" - "af_unix_sock_stream_latency (microsec)","33.72","29.04","33.12" - "af_unix_socket_stream_bandwidth (MBs)","549.13","599.28","654.14" - "bw_file_rd-io-1mb (MB/s)","886.84","947.27","882.30" - "bw_file_rd-o2c-1mb (MB/s)","488.68","501.67","478.39" - "bw_mem-bcopy-16mb (MB/s)","702.31","758.69","750.47" - "bw_mem-bcopy-1mb (MB/s)","731.40","810.64","790.83" - "bw_mem-bcopy-2mb (MB/s)","701.26","754.34","724.51" - "bw_mem-bcopy-4mb (MB/s)","725.16","797.77","742.25" - "bw_mem-bcopy-8mb (MB/s)","737.40","788.49","726.02" - "bw_mem-bzero-16mb (MB/s)","1777.58","1757.08","1747.87" - "bw_mem-bzero-1mb (MB/s)","1249.56 (min 731.40, max 1767.72)","1273.23 (min 810.64, max 1735.81)","1259.27 (min 790.83, max 1727.71)" - "bw_mem-bzero-2mb (MB/s)","1234.34 (min 701.26, max 1767.41)","1244.32 (min 754.34, max 1734.30)","1223.29 (min 724.51, max 1722.06)" - "bw_mem-bzero-4mb (MB/s)","1247.54 (min 725.16, max 1769.91)","1274.42 (min 797.77, max 1751.06)","1240.19 (min 742.25, max 1738.12)" - "bw_mem-bzero-8mb (MB/s)","1251.41 (min 737.40, max 1765.42)","1266.66 (min 788.49, max 1744.82)","1237.62 (min 726.02, max 1749.21)" - "bw_mem-cp-16mb (MB/s)","408.49","454.88","449.99" - "bw_mem-cp-1mb (MB/s)","1146.98 (min 392.46, max 1901.50)","1153.53 (min 430.17, max 1876.88)","1156.08 (min 446.83, max 1865.32)" - "bw_mem-cp-2mb (MB/s)","1126.54 (min 410.09, max 1842.98)","1128.29 (min 438.07, max 1818.51)","1103.62 (min 412.54, max 1794.69)" - "bw_mem-cp-4mb (MB/s)","1103.66 (min 388.31, max 1819.01)","1136.35 (min 485.38, max 1787.31)","1104.23 (min 437.49, max 1770.96)" - "bw_mem-cp-8mb (MB/s)","1122.78 (min 439.68, max 1805.87)","1125.20 (min 477.73, max 1772.66)","1079.77 (min 399.36, max 1760.18)" - "bw_mem-fcp-16mb (MB/s)","696.89","736.95","808.28" - "bw_mem-fcp-1mb (MB/s)","1292.16 (min 816.59, max 1767.72)","1310.31 (min 884.80, max 1735.81)","1264.43 
(min 801.15, max 1727.71)" - "bw_mem-fcp-2mb (MB/s)","1260.50 (min 753.58, max 1767.41)","1303.26 (min 872.22, max 1734.30)","1260.02 (min 797.98, max 1722.06)" - "bw_mem-fcp-4mb (MB/s)","1282.65 (min 795.39, max 1769.91)","1316.69 (min 882.32, max 1751.06)","1256.21 (min 774.29, max 1738.12)" - "bw_mem-fcp-8mb (MB/s)","1283.72 (min 802.01, max 1765.42)","1300.13 (min 855.43, max 1744.82)","1286.00 (min 822.79, max 1749.21)" - "bw_mem-frd-16mb (MB/s)","1022.56","1132.74","1084.82" - "bw_mem-frd-1mb (MB/s)","994.66 (min 816.59, max 1172.73)","1082.72 (min 884.80, max 1280.64)","1006.95 (min 801.15, max 1212.75)" - "bw_mem-frd-2mb (MB/s)","879.12 (min 753.58, max 1004.65)","997.70 (min 872.22, max 1123.17)","937.88 (min 797.98, max 1077.78)" - "bw_mem-frd-4mb (MB/s)","924.01 (min 795.39, max 1052.63)","1003.36 (min 882.32, max 1124.39)","900.76 (min 774.29, max 1027.22)" - "bw_mem-frd-8mb (MB/s)","937.56 (min 802.01, max 1073.11)","988.33 (min 855.43, max 1121.23)","946.94 (min 822.79, max 1071.09)" - "bw_mem-fwr-16mb (MB/s)","1780.94","1753.81","1753.81" - "bw_mem-fwr-1mb (MB/s)","1537.12 (min 1172.73, max 1901.50)","1578.76 (min 1280.64, max 1876.88)","1539.04 (min 1212.75, max 1865.32)" - "bw_mem-fwr-2mb (MB/s)","1423.82 (min 1004.65, max 1842.98)","1470.84 (min 1123.17, max 1818.51)","1436.24 (min 1077.78, max 1794.69)" - "bw_mem-fwr-4mb (MB/s)","1435.82 (min 1052.63, max 1819.01)","1455.85 (min 1124.39, max 1787.31)","1399.09 (min 1027.22, max 1770.96)" - "bw_mem-fwr-8mb (MB/s)","1439.49 (min 1073.11, max 1805.87)","1446.95 (min 1121.23, max 1772.66)","1415.64 (min 1071.09, max 1760.18)" - "bw_mem-rd-16mb (MB/s)","1088.51","1135.96","1081.81" - "bw_mem-rd-1mb (MB/s)","912.37 (min 579.63, max 1245.11)","976.13 (min 648.72, max 1303.54)","946.52 (min 620.54, max 1272.50)" - "bw_mem-rd-2mb (MB/s)","791.99 (min 496.83, max 1087.15)","855.46 (min 573.48, max 1137.44)","828.62 (min 554.25, max 1102.99)" - "bw_mem-rd-4mb (MB/s)","825.24 (min 586.08, max 
1064.40)","899.80 (min 674.42, max 1125.18)","834.36 (min 572.08, max 1096.64)" - "bw_mem-rd-8mb (MB/s)","883.75 (min 679.35, max 1088.14)","942.36 (min 754.93, max 1129.78)","830.91 (min 573.68, max 1088.14)" - "bw_mem-rdwr-16mb (MB/s)","675.96","830.95","597.26" - "bw_mem-rdwr-1mb (MB/s)","475.87 (min 392.46, max 559.28)","538.40 (min 430.17, max 646.62)","527.09 (min 446.83, max 607.35)" - "bw_mem-rdwr-2mb (MB/s)","452.73 (min 410.09, max 495.36)","506.60 (min 438.07, max 575.13)","480.47 (min 412.54, max 548.40)" - "bw_mem-rdwr-4mb (MB/s)","485.45 (min 388.31, max 582.58)","579.51 (min 485.38, max 673.63)","505.73 (min 437.49, max 573.97)" - "bw_mem-rdwr-8mb (MB/s)","567.00 (min 439.68, max 694.32)","619.49 (min 477.73, max 761.25)","487.83 (min 399.36, max 576.29)" - "bw_mem-wr-16mb (MB/s)","745.19","766.06","609.45" - "bw_mem-wr-1mb (MB/s)","569.46 (min 559.28, max 579.63)","647.67 (min 646.62, max 648.72)","613.95 (min 607.35, max 620.54)" - "bw_mem-wr-2mb (MB/s)","496.10 (min 495.36, max 496.83)","574.31 (min 573.48, max 575.13)","551.33 (min 548.40, max 554.25)" - "bw_mem-wr-4mb (MB/s)","584.33 (min 582.58, max 586.08)","674.03 (min 673.63, max 674.42)","573.03 (min 572.08, max 573.97)" - "bw_mem-wr-8mb (MB/s)","686.84 (min 679.35, max 694.32)","758.09 (min 754.93, max 761.25)","574.99 (min 573.68, max 576.29)" - "bw_mmap_rd-mo-1mb (MB/s)","1219.51","1265.82","1244.22" - "bw_mmap_rd-o2c-1mb (MB/s)","472.52","500.92","446.10" - "bw_pipe (MB/s)","462.28","507.32","468.69" - "bw_unix (MB/s)","549.13","599.28","654.14" - "lat_connect (us)","66.58","59.62","66.43" - "lat_ctx-2-128k (us)","8.57","7.38","9.05" - "lat_ctx-2-256k (us)","10.84","10.58","12.25" - "lat_ctx-4-128k (us)","8.82","7.32","8.58" - "lat_ctx-4-256k (us)","9.82","9.93","10.74" - "lat_fs-0k (num_files)","209.00","220.00","182.00" - "lat_fs-10k (num_files)","87.00","96.00","93.00" - "lat_fs-1k (num_files)","126.00","143.00","136.00" - "lat_fs-4k (num_files)","131.00","130.00","123.00" -
"lat_mem_rd-stride128-sz1000k (ns)","54.80","51.88","53.94" - "lat_mem_rd-stride128-sz125k (ns)","6.22","5.57","6.22" - "lat_mem_rd-stride128-sz250k (ns)","6.55","5.84","6.55" - "lat_mem_rd-stride128-sz31k (ns)","4.70","2.16","4.09" - "lat_mem_rd-stride128-sz50 (ns)","2.40","2.15","2.41" - "lat_mem_rd-stride128-sz500k (ns)","15.61","24.71","15.47" - "lat_mem_rd-stride128-sz62k (ns)","5.89","5.25","5.86" - "lat_mmap-1m (us)","60.00","64.00","61.00" - "lat_ops-double-add (ns)","3.21","2.86","3.21" - "lat_ops-double-div (ns)","17.63","15.75","17.63" - "lat_ops-double-mul (ns)","3.21","2.86","3.20" - "lat_ops-float-add (ns)","3.21","2.86","3.21" - "lat_ops-float-div (ns)","10.43","9.31","10.42" - "lat_ops-float-mul (ns)","3.21","2.86","3.21" + "af_unix_sock_stream_latency (microsec)","33.40 (min 32.86, max 34.65)","29.79 (min 28.64, max 30.84)","33.61 (min 33.07, max 34.90)" + "af_unix_socket_stream_bandwidth (mb/s)","532.62 (min 513.45, max 555.88)","602.54 (min 576.79, max 715.30)","728.89 (min 632.89, max 809.03)" + "bw_file_rd-io-1mb (mb/s)","844.54 (min 822.23, max 886.68)","985.59 (min 935.75, max 1129.31)","970.83 (min 868.06, max 1075.08)" + "bw_file_rd-o2c-1mb (mb/s)","460.27 (min 433.28, max 488.60)","520.63 (min 488.28, max 589.88)","545.10 (min 484.50, max 608.46)" + "bw_mem-bcopy-16mb (mb/s)","666.43 (min 656.63, max 698.69)","779.46 (min 755.22, max 916.43)","804.83 (min 710.04, max 926.57)" + "bw_mem-bcopy-1mb (mb/s)","700.75 (min 675.45, max 741.70)","842.36 (min 785.55, max 1038.96)","888.53 (min 745.85, max 1009.08)" + "bw_mem-bcopy-2mb (mb/s)","657.09 (min 645.27, max 687.52)","789.75 (min 751.88, max 965.41)","796.56 (min 719.55, max 885.48)" + "bw_mem-bcopy-4mb (mb/s)","689.78 (min 669.68, max 728.73)","816.64 (min 783.70, max 999.25)","813.86 (min 710.98, max 940.96)" + "bw_mem-bcopy-8mb (mb/s)","699.67 (min 684.46, max 732.80)","822.42 (min 799.44, max 920.70)","807.96 (min 708.84, max 914.81)" + "bw_mem-bzero-16mb (mb/s)","1706.95 (min 1678.03,
max 1776.99)","1798.84 (min 1743.30, max 2125.68)","1932.00 (min 1724.88, max 2128.79)" + "bw_mem-bzero-1mb (mb/s)","1194.75 (min 675.45, max 1771.79)","1310.82 (min 785.55, max 2122.77)","1407.48 (min 745.85, max 2129.17)" + "bw_mem-bzero-2mb (mb/s)","1172.66 (min 645.27, max 1768.35)","1285.64 (min 751.88, max 2123.14)","1361.57 (min 719.55, max 2130.30)" + "bw_mem-bzero-4mb (mb/s)","1189.77 (min 669.68, max 1766.78)","1299.62 (min 783.70, max 2125.78)","1370.93 (min 710.98, max 2129.93)" + "bw_mem-bzero-8mb (mb/s)","1202.52 (min 684.46, max 1767.37)","1310.44 (min 799.44, max 2125.12)","1372.21 (min 708.84, max 2128.79)" + "bw_mem-cp-16mb (mb/s)","381.91 (min 356.51, max 400.99)","466.22 (min 438.89, max 574.16)","470.46 (min 411.22, max 525.11)" + "bw_mem-cp-1mb (mb/s)","1107.67 (min 369.41, max 1907.67)","1193.34 (min 436.81, max 2264.58)","1276.71 (min 394.48, max 2281.80)" + "bw_mem-cp-2mb (mb/s)","1071.32 (min 360.82, max 1842.30)","1160.88 (min 427.53, max 2201.03)","1231.90 (min 381.90, max 2205.48)" + "bw_mem-cp-4mb (mb/s)","1072.77 (min 398.29, max 1814.61)","1162.44 (min 467.24, max 2159.05)","1218.76 (min 398.45, max 2171.16)" + "bw_mem-cp-8mb (mb/s)","1071.48 (min 408.66, max 1804.85)","1164.03 (min 482.77, max 2152.85)","1203.39 (min 386.32, max 2174.80)" + "bw_mem-fcp-16mb (mb/s)","669.23 (min 654.21, max 689.36)","757.23 (min 728.96, max 882.76)","867.40 (min 755.89, max 1002.82)" + "bw_mem-fcp-1mb (mb/s)","1231.51 (min 756.43, max 1771.79)","1338.53 (min 855.29, max 2122.77)","1426.17 (min 823.32, max 2129.17)" + "bw_mem-fcp-2mb (mb/s)","1211.46 (min 718.13, max 1768.35)","1330.64 (min 832.52, max 2123.14)","1411.18 (min 782.78, max 2130.30)" + "bw_mem-fcp-4mb (mb/s)","1222.02 (min 729.13, max 1766.78)","1347.90 (min 869.28, max 2125.78)","1411.80 (min 780.03, max 2129.93)" + "bw_mem-fcp-8mb (mb/s)","1236.32 (min 736.85, max 1767.37)","1366.49 (min 887.71, max 2125.12)","1415.27 (min 788.18, max 2128.79)" + "bw_mem-frd-16mb (mb/s)","1022.55 (min 
981.35, max 1076.35)","1188.74 (min 1132.50, max 1428.19)","1201.69 (min 1025.58, max 1350.67)" + "bw_mem-frd-1mb (mb/s)","958.09 (min 756.43, max 1193.93)","1114.58 (min 855.29, max 1598.58)","1143.78 (min 823.32, max 1534.53)" + "bw_mem-frd-2mb (mb/s)","871.89 (min 718.13, max 1081.28)","1010.04 (min 832.52, max 1378.12)","1048.22 (min 782.78, max 1358.00)" + "bw_mem-frd-4mb (mb/s)","886.22 (min 729.13, max 1068.09)","1041.72 (min 869.28, max 1402.28)","1046.94 (min 780.03, max 1353.41)" + "bw_mem-frd-8mb (mb/s)","895.53 (min 736.85, max 1082.98)","1056.14 (min 887.71, max 1422.22)","1050.26 (min 788.18, max 1356.62)" + "bw_mem-fwr-16mb (mb/s)","1713.36 (min 1690.44, max 1779.76)","1809.72 (min 1752.08, max 2139.90)","1946.08 (min 1751.89, max 2145.35)" + "bw_mem-fwr-1mb (mb/s)","1487.39 (min 1112.70, max 1907.67)","1624.29 (min 1263.54, max 2264.58)","1725.34 (min 1197.40, max 2281.80)" + "bw_mem-fwr-2mb (mb/s)","1388.30 (min 974.34, max 1842.30)","1502.10 (min 1075.85, max 2201.03)","1601.94 (min 1076.57, max 2205.48)" + "bw_mem-fwr-4mb (mb/s)","1378.25 (min 989.12, max 1814.61)","1502.80 (min 1074.98, max 2159.05)","1584.78 (min 1080.94, max 2171.16)" + "bw_mem-fwr-8mb (mb/s)","1373.81 (min 975.73, max 1804.85)","1498.37 (min 1119.66, max 2152.85)","1582.44 (min 1073.39, max 2174.80)" + "bw_mem-rd-16mb (mb/s)","1037.69 (min 1016.97, max 1083.72)","1187.07 (min 1098.90, max 1445.48)","1215.25 (min 1060.59, max 1351.12)" + "bw_mem-rd-1mb (mb/s)","867.03 (min 533.14, max 1234.35)","1028.36 (min 648.40, max 1634.88)","1048.08 (min 572.63, max 1595.18)" + "bw_mem-rd-2mb (mb/s)","767.51 (min 473.20, max 1085.19)","899.44 (min 569.48, max 1419.45)","923.31 (min 506.14, max 1376.70)" + "bw_mem-rd-4mb (mb/s)","798.39 (min 530.01, max 1083.13)","946.09 (min 674.76, max 1435.49)","922.27 (min 522.94, max 1364.26)" + "bw_mem-rd-8mb (mb/s)","831.83 (min 586.17, max 1084.60)","989.49 (min 743.43, max 1446.92)","937.43 (min 563.94, max 1356.62)" + "bw_mem-rdwr-16mb 
(mb/s)","670.46 (min 629.00, max 718.55)","836.08 (min 773.47, max 1046.44)","662.35 (min 584.13, max 754.68)" + "bw_mem-rdwr-1mb (mb/s)","463.26 (min 369.41, max 567.46)","576.99 (min 436.81, max 806.19)","571.73 (min 394.48, max 769.47)" + "bw_mem-rdwr-2mb (mb/s)","429.34 (min 360.82, max 514.07)","532.83 (min 427.53, max 740.60)","529.48 (min 381.90, max 690.25)" + "bw_mem-rdwr-4mb (mb/s)","480.32 (min 398.29, max 593.74)","588.73 (min 467.24, max 879.99)","548.02 (min 398.45, max 723.85)" + "bw_mem-rdwr-8mb (mb/s)","525.75 (min 408.66, max 655.68)","644.03 (min 482.77, max 956.71)","545.57 (min 386.32, max 737.87)" + "bw_mem-wr-16mb (mb/s)","667.31 (min 625.73, max 693.30)","844.62 (min 778.66, max 1039.37)","675.18 (min 587.59, max 771.12)" + "bw_mem-wr-1mb (mb/s)","545.02 (min 524.48, max 572.66)","690.54 (min 638.47, max 819.94)","676.66 (min 572.63, max 781.40)" + "bw_mem-wr-2mb (mb/s)","490.33 (min 468.06, max 525.97)","612.48 (min 567.54, max 740.60)","603.33 (min 506.14, max 707.21)" + "bw_mem-wr-4mb (mb/s)","557.39 (min 494.56, max 593.74)","697.74 (min 605.05, max 879.99)","626.41 (min 522.94, max 725.16)" + "bw_mem-wr-8mb (mb/s)","630.78 (min 586.17, max 671.76)","785.24 (min 709.66, max 1007.68)","648.27 (min 563.94, max 754.36)" + "bw_mmap_rd-mo-1mb (mb/s)","1163.27 (min 1139.38, max 1219.09)","1324.21 (min 1260.35, max 1606.86)","1377.07 (min 1225.06, max 1541.36)" + "bw_mmap_rd-o2c-1mb (mb/s)","455.11 (min 438.28, max 477.55)","500.79 (min 427.78, max 590.67)","519.99 (min 465.91, max 600.69)" + "bw_pipe (mb/s)","443.15 (min 435.10, max 453.94)","515.70 (min 492.51, max 600.38)","498.69 (min 451.80, max 545.64)" + "bw_unix (mb/s)","532.62 (min 513.45, max 555.88)","602.54 (min 576.79, max 715.30)","728.89 (min 632.89, max 809.03)" + "lat_connect (us)","66.67 (min 66.20, max 67.85)","59.11 (min 58.18, max 59.76)","65.67 (min 63.87, max 69.00)" + "lat_ctx-2-128k (us)","8.89 (min 8.32, max 9.14)","7.99 (min 7.63, max 8.34)","8.91 (min 8.50, max 
9.59)" + "lat_ctx-2-256k (us)","13.57 (min 9.14, max 16.40)","9.88 (min 6.84, max 10.92)","12.44 (min 8.10, max 15.04)" + "lat_ctx-4-128k (us)","9.13 (min 8.33, max 9.61)","7.66 (min 7.17, max 8.17)","8.56 (min 8.09, max 8.88)" + "lat_ctx-4-256k (us)","10.98 (min 7.76, max 13.14)","9.48 (min 7.36, max 12.90)","8.46 (min 0.00, max 12.65)" + "lat_fs-0k (num_files)","198.86 (min 177.00, max 227.00)","213.63 (min 195.00, max 235.00)","198.88 (min 192.00, max 210.00)" + "lat_fs-10k (num_files)","92.57 (min 86.00, max 103.00)","102.88 (min 92.00, max 128.00)","93.13 (min 82.00, max 104.00)" + "lat_fs-1k (num_files)","124.29 (min 109.00, max 146.00)","145.63 (min 135.00, max 160.00)","134.75 (min 115.00, max 147.00)" + "lat_fs-4k (num_files)","123.14 (min 107.00, max 130.00)","145.25 (min 128.00, max 159.00)","133.63 (min 123.00, max 158.00)" + "lat_mem_rd-stride128-sz1000k (ns)","56.96 (min 54.29, max 58.01)","50.45 (min 42.65, max 52.51)","48.81 (min 43.55, max 54.17)" + "lat_mem_rd-stride128-sz125k (ns)","6.22 (min 6.20, max 6.26)","5.57 (min 5.54, max 5.58)","6.22 (min 6.20, max 6.26)" + "lat_mem_rd-stride128-sz250k (ns)","6.54 (min 6.54, max 6.56)","5.84 (min 5.83, max 5.85)","6.54 (min 6.53, max 6.54)" + "lat_mem_rd-stride128-sz31k (ns)","4.20 (min 2.42, max 4.70)","3.85 (min 3.65, max 4.19)","3.40 (min 2.41, max 4.70)" + "lat_mem_rd-stride128-sz50 (ns)","2.40 (min 2.40, max 2.41)","2.15","2.40 (min 2.40, max 2.41)" + "lat_mem_rd-stride128-sz500k (ns)","17.11 (min 11.46, max 21.66)","17.27 (min 13.44, max 20.26)","15.35 (min 10.09, max 21.82)" + "lat_mem_rd-stride128-sz62k (ns)","5.77 (min 5.05, max 5.89)","5.24 (min 5.22, max 5.27)","5.87 (min 5.85, max 5.90)" + "lat_mmap-1m (us)","66.14 (min 59.00, max 73.00)","55.13 (min 53.00, max 64.00)","64.75 (min 57.00, max 71.00)" + "lat_ops-double-add (ns)","3.21","2.86 (min 2.86, max 2.87)","3.21" + "lat_ops-double-div (ns)","17.63 (min 17.62, max 17.64)","15.74 (min 15.74, max 15.75)","17.63 (min 17.63, max 17.65)" + 
"lat_ops-double-mul (ns)","3.21","2.86","3.21" + "lat_ops-float-add (ns)","3.21","2.86 (min 2.86, max 2.87)","3.21" + "lat_ops-float-div (ns)","10.43 (min 10.42, max 10.43)","9.30","10.42 (min 10.42, max 10.43)" + "lat_ops-float-mul (ns)","3.21 (min 3.20, max 3.21)","2.86","3.21" "lat_ops-int-add (ns)","0.80","0.72","0.80" - "lat_ops-int-bit (ns)","0.53","0.48","0.53" - "lat_ops-int-div (ns)","4.81","4.29","4.81" - "lat_ops-int-mod (ns)","5.08","4.53","5.08" - "lat_ops-int-mul (ns)","3.51","3.13","3.51" + "lat_ops-int-bit (ns)","0.53","0.48","0.53 (min 0.53, max 0.54)" + "lat_ops-int-div (ns)","4.81 (min 4.81, max 4.82)","4.29 (min 4.29, max 4.30)","4.81" + "lat_ops-int-mod (ns)","5.08","4.53 (min 4.53, max 4.54)","5.08 (min 5.07, max 5.08)" + "lat_ops-int-mul (ns)","3.45 (min 3.45, max 3.46)","3.08 (min 3.07, max 3.10)","3.45 (min 3.44, max 3.46)" "lat_ops-int64-add (ns)","0.80","0.72","0.80" - "lat_ops-int64-bit (ns)","0.53","0.48","0.53" - "lat_ops-int64-div (ns)","7.61","6.80","7.62" - "lat_ops-int64-mod (ns)","5.88","5.25","5.88" - "lat_ops-int64-mul (ns)","3.98","3.55","3.98" - "lat_pagefault (us)","0.78","0.71","1.55" - "lat_pipe (us)","27.48","25.15","28.22" - "lat_proc-exec (us)","1071.80","1023.00","1042.80" - "lat_proc-fork (us)","882.86","852.86","929.00" + "lat_ops-int64-bit (ns)","0.53","0.48","0.53 (min 0.53, max 0.54)" + "lat_ops-int64-div (ns)","7.62 (min 7.61, max 7.62)","6.80","7.62 (min 7.61, max 7.62)" + "lat_ops-int64-mod (ns)","5.88","5.25","5.88 (min 5.87, max 5.89)" + "lat_ops-int64-mul (ns)","3.99 (min 3.98, max 4.04)","3.56 (min 3.55, max 3.61)","3.98" + "lat_pagefault (us)","0.80 (min 0.76, max 0.82)","0.71 (min 0.60, max 0.73)","1.26 (min 0.65, max 1.74)" + "lat_pipe (us)","28.82 (min 28.37, max 29.43)","25.77 (min 25.50, max 26.22)","28.93 (min 28.25, max 29.53)" + "lat_proc-exec (us)","1108.66 (min 1066.20, max 1142.00)","979.70 (min 844.00, max 1031.50)","1006.99 (min 886.29, max 1144.60)" + "lat_proc-fork (us)","940.39 (min 880.50, 
max 1009.50)","831.78 (min 684.14, max 873.14)","857.04 (min 765.86, max 954.67)" "lat_proc-proccall (us)","0.01","0.01","0.01" - "lat_select (us)","38.14","34.07","37.98" - "lat_sem (us)","4.37","2.98","3.22" - "lat_sig-catch (us)","5.97","5.31","6.03" - "lat_sig-install (us)","0.73","0.65","0.73" - "lat_sig-prot (us)","0.78","0.58","0.74" - "lat_syscall-fstat (us)","2.23","1.97","2.22" - "lat_syscall-null (us)","0.52","0.46","0.52" - "lat_syscall-open (us)","185.60","155.14","224.73" - "lat_syscall-read (us)","0.90","0.80","0.90" - "lat_syscall-stat (us)","5.44","4.87","5.44" - "lat_syscall-write (us)","0.91","0.81","0.92" - "lat_tcp (us)","1.04","0.93","1.04" - "lat_unix (us)","33.72","29.04","33.12" - "latency_for_0.50_mb_block_size (nanosec)","15.61","24.71","15.47" - "latency_for_1.00_mb_block_size (nanosec)","27.40 (min 0.00, max 54.80)","25.94 (min 0.00, max 51.88)","26.97 (min 0.00, max 53.94)" - "pipe_bandwidth (MBs)","462.28","507.32","468.69" - "pipe_latency (microsec)","27.48","25.15","28.22" + "lat_select (us)","38.12 (min 37.94, max 38.28)","34.11 (min 33.75, max 34.40)","38.13 (min 37.96, max 38.48)" + "lat_sem (us)","3.53 (min 2.89, max 4.27)","3.09 (min 2.59, max 3.54)","3.36 (min 2.96, max 3.84)" + "lat_sig-catch (us)","6.23 (min 6.03, max 6.45)","5.52 (min 5.27, max 5.68)","6.18 (min 5.95, max 6.37)" + "lat_sig-install (us)","0.74 (min 0.72, max 0.79)","0.66 (min 0.65, max 0.70)","0.75 (min 0.72, max 0.79)" + "lat_sig-prot (us)","0.71 (min 0.55, max 0.93)","0.65 (min 0.48, max 0.80)","0.83 (min 0.58, max 1.48)" + "lat_syscall-fstat (us)","2.21 (min 2.14, max 2.32)","1.98 (min 1.89, max 2.10)","2.22 (min 2.12, max 2.32)" + "lat_syscall-null (us)","0.51 (min 0.51, max 0.52)","0.46 (min 0.46, max 0.50)","0.52 (min 0.51, max 0.56)" + "lat_syscall-open (us)","214.57 (min 153.03, max 305.39)","175.20 (min 155.95, max 202.88)","174.43 (min 153.94, max 210.15)" + "lat_syscall-read (us)","0.92 (min 0.90, max 0.99)","0.82 (min 0.80, max 0.88)","0.92 (min 
0.90, max 0.99)" + "lat_syscall-stat (us)","5.37 (min 5.23, max 5.53)","4.80 (min 4.66, max 5.01)","5.39 (min 5.25, max 5.60)" + "lat_syscall-write (us)","0.86 (min 0.84, max 0.89)","0.78 (min 0.75, max 0.84)","0.87 (min 0.84, max 0.94)" + "lat_tcp (us)","1.02","0.92 (min 0.91, max 0.97)","1.03 (min 1.02, max 1.09)" + "lat_unix (us)","33.40 (min 32.86, max 34.65)","29.79 (min 28.64, max 30.84)","33.61 (min 33.07, max 34.90)" + "latency_for_0.50_mb_block_size (nanosec)","17.11 (min 11.46, max 21.66)","17.27 (min 13.44, max 20.26)","15.35 (min 10.09, max 21.82)" + "latency_for_1.00_mb_block_size (nanosec)","28.48 (min 0.00, max 58.01)","25.22 (min 0.00, max 52.51)","24.41 (min 0.00, max 54.17)" + "pipe_bandwidth (mb/s)","443.15 (min 435.10, max 453.94)","515.70 (min 492.51, max 600.38)","498.69 (min 451.80, max 545.64)" + "pipe_latency (microsec)","28.82 (min 28.37, max 29.43)","25.77 (min 25.50, max 26.22)","28.93 (min 28.25, max 29.53)" "procedure_call (microsec)","0.01","0.01","0.01" - "select_on_200_tcp_fds (microsec)","38.14","34.07","37.98" - "semaphore_latency (microsec)","4.37","2.98","3.22" - "signal_handler_latency (microsec)","0.73","0.65","0.73" - "signal_handler_overhead (microsec)","5.97","5.31","6.03" - "tcp_ip_connection_cost_to_localhost (microsec)","66.58","59.62","66.43" - "tcp_latency_using_localhost (microsec)","1.04","0.93","1.04" - - + "select_on_200_tcp_fds (microsec)","38.12 (min 37.94, max 38.28)","34.11 (min 33.75, max 34.40)","38.13 (min 37.96, max 38.48)" + "semaphore_latency (microsec)","3.53 (min 2.89, max 4.27)","3.09 (min 2.59, max 3.54)","3.36 (min 2.96, max 3.84)" + "signal_handler_latency (microsec)","0.74 (min 0.72, max 0.79)","0.66 (min 0.65, max 0.70)","0.75 (min 0.72, max 0.79)" + "signal_handler_overhead (microsec)","6.23 (min 6.03, max 6.45)","5.52 (min 5.27, max 5.68)","6.18 (min 5.95, max 6.37)" + "tcp_ip_connection_cost_to_localhost (microsec)","66.67 (min 66.20, max 67.85)","59.11 (min 58.18, max 59.76)","65.67 (min
63.87, max 69.00)" + "tcp_latency_using_localhost (microsec)","1.02","0.92 (min 0.91, max 0.97)","1.03 (min 1.02, max 1.09)" Dhrystone ^^^^^^^^^ @@ -193,10 +188,9 @@ Dhrystone is a core only benchmark that runs from warm L1 caches in all modern processors. It scales linearly with clock speed. Please take note, different run may produce different slightly results. -This is advised to run this test multiple times in order to get maximum +It is advised to run this test multiple times in order to get maximum performance numbers. - Execute the benchmark with the following: :: @@ -206,11 +200,9 @@ Execute the benchmark with the following: .. csv-table:: Dhrystone Benchmarks :header: "Benchmarks","am62xx_lp_sk-fs: perf","am62xx_sk-fs: perf","am62xxsip_sk-fs: perf" - "cpu_clock (MHz)","1250.00","1400.00","1250.00" - "dhrystone_per_mhz (DMIPS/MHz)","2.90","2.90","2.90" - "dhrystone_per_second (DhrystoneP)","6451613.00","7142857.00","6451613.00" - - + "cpu_clock (mhz)","1250.00","1400.00","1250.00" + "dhrystone_per_mhz (dmips/mhz)","2.84 (min 2.80, max 2.90)","2.90","2.86 (min 2.80, max 2.90)" + "dhrystone_per_second (dhrystonep)","6336405.57 (min 6250000.00, max 6451613.00)","7142857.00","6376008.13 (min 6250000.00, max 6451613.00)" Whetstone ^^^^^^^^^ @@ -225,9 +217,7 @@ Execute the benchmark with the following: .. csv-table:: Whetstone Benchmarks :header: "Benchmarks","am62xx_lp_sk-fs: perf","am62xx_sk-fs: perf","am62xxsip_sk-fs: perf" - "whetstone (MIPS)","5000.00","5000.00","5000.00" - - + "whetstone (mips)","5000.00","5000.00","5000.00" Linpack ^^^^^^^ @@ -237,9 +227,7 @@ solving a dense linear system. ..
csv-table:: Linpack Benchmarks :header: "Benchmarks","am62xx_lp_sk-fs: perf","am62xx_sk-fs: perf","am62xxsip_sk-fs: perf" - "linpack (Kflops)","515516.00","575242.00","515670.00" - - + "linpack (kflops)","513733.00 (min 511865.00, max 515438.00)","577158.63 (min 576063.00, max 577662.00)","515214.00 (min 513050.00, max 516718.00)" NBench ^^^^^^ @@ -252,17 +240,15 @@ https://nbench.io/articles/index.html .. csv-table:: NBench Benchmarks :header: "Benchmarks","am62xx_lp_sk-fs: perf","am62xx_sk-fs: perf","am62xxsip_sk-fs: perf" - "assignment (Iterations)","12.94","14.49","12.90" - "fourier (Iterations)","20380.00","22832.00","20384.00" - "fp_emulation (Iterations)","192.48","215.64","192.53" - "huffman (Iterations)","1057.10","1184.20","1057.10" - "idea (Iterations)","3075.10","3444.70","3075.50" - "lu_decomposition (Iterations)","473.03","530.04","473.87" - "neural_net (Iterations)","7.73","8.66","7.73" - "numeric_sort (Iterations)","561.61","629.58","557.46" - "string_sort (Iterations)","146.34","163.94","146.35" - - + "assignment (iterations)","12.92 (min 12.80, max 12.95)","14.49 (min 14.44, max 14.53)","12.93 (min 12.85, max 12.96)" + "fourier (iterations)","20380.88 (min 20371.00, max 20385.00)","22828.75 (min 22827.00, max 22831.00)","20383.88 (min 20381.00, max 20385.00)" + "fp_emulation (iterations)","192.50 (min 192.47, max 192.52)","215.61 (min 215.57, max 215.65)","192.52 (min 192.49, max 192.54)" + "huffman (iterations)","1057.11 (min 1056.50, max 1057.40)","1183.90 (min 1183.30, max 1184.30)","1057.24 (min 1056.70, max 1057.40)" + "idea (iterations)","3075.31 (min 3074.90, max 3075.60)","3444.45 (min 3444.20, max 3444.80)","3075.58 (min 3075.30, max 3075.70)" + "lu_decomposition (iterations)","472.14 (min 469.83, max 473.70)","527.41 (min 522.26, max 529.95)","472.13 (min 469.78, max 473.74)" + "neural_net (iterations)","7.73 (min 7.72, max 7.73)","8.65 (min 8.64, max 8.66)","7.72 (min 7.71, max 7.73)" + "numeric_sort (iterations)","559.47 (min 553.45, 
max 562.47)","625.06 (min 616.37, max 629.09)","559.74 (min 550.44, max 561.86)" + "string_sort (iterations)","146.35 (min 146.33, max 146.37)","163.92 (min 163.91, max 163.94)","146.36 (min 146.35, max 146.37)" Stream ^^^^^^ @@ -285,13 +271,10 @@ Execute the benchmark with the following: .. csv-table:: Stream Benchmarks :header: "Benchmarks","am62xx_lp_sk-fs: perf","am62xx_sk-fs: perf","am62xxsip_sk-fs: perf" - "add (MB/s)","1415.00","1447.90","1692.60" - "copy (MB/s)","1455.40","1638.00","1875.50" - "scale (MB/s)","1595.70","1792.70","1938.40" - "triad (MB/s)","1384.60","1477.10","1657.50" - - - + "add (mb/s)","1403.63 (min 1363.30, max 1452.60)","1628.69 (min 1443.40, max 1805.40)","1690.80 (min 1688.10, max 1693.80)" + "copy (mb/s)","1471.36 (min 1421.90, max 1537.40)","1877.63 (min 1635.60, max 2125.00)","1869.34 (min 1836.10, max 1926.50)" + "scale (mb/s)","1605.57 (min 1561.70, max 1663.20)","2031.11 (min 1793.40, max 2270.80)","1937.30 (min 1923.80, max 1949.60)" + "triad (mb/s)","1378.53 (min 1343.40, max 1423.00)","1676.24 (min 1479.30, max 1872.10)","1656.76 (min 1651.70, max 1662.10)" CoreMarkPro ^^^^^^^^^^^ @@ -301,39 +284,33 @@ While CoreMark stresses the CPU pipeline, CoreMark-Pro tests the entire processo adding comprehensive support for multicore technology, a combination of integer and floating-point workloads, and data sets for utilizing larger memory subsystems. - .. 
csv-table:: CoreMarkPro Benchmarks :header: "Benchmarks","am62xx_lp_sk-fs: perf","am62xx_sk-fs: perf","am62xxsip_sk-fs: perf" - "cjpeg-rose7-preset (workloads/)","37.17","41.84","37.59" + "cjpeg-rose7-preset (workloads/)","37.30 (min 37.17, max 37.45)","41.84 (min 41.67, max 42.02)","37.38 (min 36.90, max 37.59)" "core (workloads/)","0.27","0.30","0.27" - "coremark-pro ()","789.18","887.88","823.42" - "linear_alg-mid-100x100-sp (workloads/)","13.10","14.68","13.11" - "loops-all-mid-10k-sp (workloads/)","0.59","0.66","0.63" - "nnet_test (workloads/)","0.97","1.09","0.97" - "parser-125k (workloads/)","7.41","8.20","7.69" - "radix2-big-64k (workloads/)","45.59","53.18","57.64" - "sha-test (workloads/)","71.43","80.65","72.46" - "zip-test (workloads/)","18.52","20.83","18.87" - - - + "coremark-pro ()","784.22 (min 761.93, max 799.55)","874.96 (min 849.21, max 918.16)","800.81 (min 770.03, max 828.46)" + "linear_alg-mid-100x100-sp (workloads/)","13.10 (min 13.09, max 13.11)","14.68 (min 14.66, max 14.70)","13.10 (min 13.09, max 13.11)" + "loops-all-mid-10k-sp (workloads/)","0.59 (min 0.59, max 0.60)","0.67 (min 0.66, max 0.70)","0.62 (min 0.60, max 0.63)" + "nnet_test (workloads/)","0.97","1.09 (min 1.08, max 1.09)","0.97" + "parser-125k (workloads/)","7.38 (min 7.30, max 7.46)","8.30 (min 8.20, max 8.62)","7.64 (min 7.41, max 7.75)" + "radix2-big-64k (workloads/)","42.96 (min 33.97, max 51.13)","46.53 (min 35.36, max 63.36)","46.38 (min 36.20, max 60.27)" + "sha-test (workloads/)","71.81 (min 70.92, max 71.94)","80.56 (min 80.00, max 80.65)","72.14 (min 71.43, max 72.46)" + "zip-test (workloads/)","18.52","20.84 (min 20.41, max 21.28)","18.96 (min 18.52, max 19.23)" .. 
csv-table:: CoreMarkProTwoCore Benchmarks :header: "Benchmarks","am62xx_lp_sk-fs: perf","am62xx_sk-fs: perf","am62xxsip_sk-fs: perf" - "cjpeg-rose7-preset (workloads/)","74.07","83.33","74.07" + "cjpeg-rose7-preset (workloads/)","73.92 (min 73.53, max 74.07)","82.82 (min 81.97, max 83.33)","74.28 (min 73.53, max 74.63)" "core (workloads/)","0.54","0.60","0.54" - "coremark-pro ()","1329.74","1487.25","1358.05" - "linear_alg-mid-100x100-sp (workloads/)","26.21","29.36","26.18" - "loops-all-mid-10k-sp (workloads/)","1.03","1.15","1.05" - "nnet_test (workloads/)","1.94","2.17","1.94" - "parser-125k (workloads/)","9.43","11.70","10.64" - "radix2-big-64k (workloads/)","38.37","38.53","40.37" - "sha-test (workloads/)","140.85","158.73","140.85" - "zip-test (workloads/)","34.48","38.46","34.48" - - + "coremark-pro ()","1335.06 (min 1324.28, max 1347.82)","1527.89 (min 1465.32, max 1576.42)","1407.68 (min 1356.48, max 1438.96)" + "linear_alg-mid-100x100-sp (workloads/)","26.18 (min 26.16, max 26.19)","29.33 (min 29.31, max 29.36)","26.19 (min 26.12, max 26.21)" + "loops-all-mid-10k-sp (workloads/)","1.03 (min 1.02, max 1.05)","1.19 (min 1.14, max 1.24)","1.11 (min 1.04, max 1.13)" + "nnet_test (workloads/)","1.94 (min 1.93, max 1.94)","2.17","1.94 (min 1.93, max 1.94)" + "parser-125k (workloads/)","10.55 (min 10.26, max 10.93)","12.28 (min 11.05, max 13.42)","11.24 (min 10.00, max 12.12)" + "radix2-big-64k (workloads/)","35.17 (min 33.06, max 38.93)","44.61 (min 36.64, max 51.47)","47.05 (min 40.80, max 50.65)" + "sha-test (workloads/)","142.86","160.01 (min 158.73, max 161.29)","143.89 (min 142.86, max 144.93)" + "zip-test (workloads/)","34.49 (min 33.90, max 35.09)","39.14 (min 37.74, max 40.00)","35.96 (min 35.09, max 36.36)" MultiBench ^^^^^^^^^^ @@ -355,57 +332,48 @@ thread-enabled workloads to be tested. .. 
csv-table:: Multibench Benchmarks :header: "Benchmarks","am62xx_lp_sk-fs: perf","am62xx_sk-fs: perf","am62xxsip_sk-fs: perf" - "4m-check (workloads/)","281.25","301.64","283.22" - "4m-check-reassembly (workloads/)","62.19","62.93","59.24" - "4m-check-reassembly-tcp (workloads/)","38.88","40.98","38.76" - "4m-check-reassembly-tcp-cmykw2-rotatew2 (workloads/)","22.26","23.69","22.50" - "4m-check-reassembly-tcp-x264w2 (workloads/)","1.61","1.75","1.59" - "4m-cmykw2 (workloads/)","185.01","199.01","181.32" - "4m-cmykw2-rotatew2 (workloads/)","36.17","39.14","35.38" - "4m-reassembly (workloads/)","46.88","49.53","47.57" - "4m-rotatew2 (workloads/)","41.34","44.29","41.08" - "4m-tcp-mixed (workloads/)","94.67","102.56","94.12" - "4m-x264w2 (workloads/)","1.67","1.83","1.64" + "4m-check (workloads/)","274.66 (min 267.24, max 283.06)","342.64 (min 302.01, max 368.24)","302.78 (min 279.33, max 340.88)" + "4m-check-reassembly (workloads/)","58.33 (min 56.63, max 60.42)","72.79 (min 62.42, max 80.13)","63.46 (min 56.21, max 74.35)" + "4m-check-reassembly-tcp (workloads/)","37.86 (min 36.82, max 38.76)","46.33 (min 41.32, max 49.80)","41.02 (min 37.48, max 46.04)" + "4m-check-reassembly-tcp-cmykw2-rotatew2 (workloads/)","21.83 (min 21.34, max 22.42)","27.22 (min 23.86, max 29.30)","24.15 (min 22.35, max 27.04)" + "4m-check-reassembly-tcp-x264w2 (workloads/)","1.59 (min 1.58, max 1.61)","1.80 (min 1.76, max 1.84)","1.62 (min 1.59, max 1.66)" + "4m-cmykw2 (workloads/)","178.88 (min 173.61, max 184.50)","220.64 (min 194.55, max 242.13)","192.61 (min 172.86, max 216.45)" + "4m-cmykw2-rotatew2 (workloads/)","35.01 (min 34.05, max 35.93)","44.14 (min 38.78, max 47.58)","37.56 (min 33.82, max 41.81)" + "4m-reassembly (workloads/)","46.17 (min 43.86, max 51.57)","57.21 (min 49.58, max 61.27)","50.47 (min 45.79, max 57.44)" + "4m-rotatew2 (workloads/)","40.02 (min 39.09, max 41.03)","49.21 (min 44.25, max 52.47)","43.68 (min 40.95, max 47.92)" + "4m-tcp-mixed (workloads/)","93.04 (min 
91.43, max 95.24)","110.80 (min 103.90, max 115.11)","97.63 (min 93.02, max 104.58)" + "4m-x264w2 (workloads/)","1.63 (min 1.56, max 1.65)","1.87 (min 1.81, max 1.91)","1.65 (min 1.58, max 1.70)" "empty-wld (workloads/)","1.00","1.00","1.00" - "idct-4m (workloads/)","16.83","18.59","16.84" - "idct-4mw1 (workloads/)","16.82","18.59","16.84" - "ippktcheck-4m (workloads/)","282.01","302.52","283.42" - "ippktcheck-4mw1 (workloads/)","282.90","299.76","283.45" - "ipres-4m (workloads/)","59.34","64.32","60.90" - "ipres-4mw1 (workloads/)","60.98","64.91","61.37" - "md5-4m (workloads/)","22.20","24.69","22.06" - "md5-4mw1 (workloads/)","22.63","24.76","22.28" - "rgbcmyk-4m (workloads/)","56.95","63.67","56.77" - "rgbcmyk-4mw1 (workloads/)","57.16","63.55","56.71" - "rotate-4ms1 (workloads/)","16.98","18.11","16.91" - "rotate-4ms1w1 (workloads/)","17.00","18.12","16.89" - "rotate-4ms64 (workloads/)","17.19","18.37","17.05" - "rotate-4ms64w1 (workloads/)","17.18","18.27","16.95" - "x264-4mq (workloads/)","0.50","0.56","0.50" - "x264-4mqw1 (workloads/)","0.50","0.56","0.50" - - - - + "idct-4m (workloads/)","16.71 (min 16.49, max 16.78)","18.89 (min 18.56, max 19.11)","16.89 (min 16.78, max 17.10)" + "idct-4mw1 (workloads/)","16.71 (min 16.49, max 16.79)","18.89 (min 18.56, max 19.11)","16.91 (min 16.76, max 17.10)" + "ippktcheck-4m (workloads/)","274.52 (min 265.53, max 283.67)","340.93 (min 303.62, max 364.38)","302.69 (min 280.36, max 339.58)" + "ippktcheck-4mw1 (workloads/)","274.24 (min 267.87, max 282.61)","342.81 (min 303.21, max 368.08)","302.30 (min 278.27, max 338.89)" + "ipres-4m (workloads/)","58.88 (min 56.58, max 61.63)","73.72 (min 63.94, max 79.79)","66.26 (min 60.61, max 74.85)" + "ipres-4mw1 (workloads/)","58.64 (min 56.97, max 60.66)","73.94 (min 64.16, max 80.30)","66.06 (min 60.68, max 74.55)" + "md5-4m (workloads/)","21.83 (min 21.29, max 22.23)","25.41 (min 24.13, max 26.17)","22.62 (min 21.41, max 23.98)" + "md5-4mw1 (workloads/)","22.12 (min 21.82, max 
22.44)","25.67 (min 24.51, max 26.52)","22.83 (min 22.00, max 24.08)" + "rgbcmyk-4m (workloads/)","56.75 (min 56.35, max 57.18)","64.33 (min 63.35, max 65.02)","56.81 (min 56.58, max 57.05)" + "rgbcmyk-4mw1 (workloads/)","56.65 (min 56.37, max 57.14)","64.40 (min 63.33, max 65.08)","56.79 (min 56.66, max 57.05)" + "rotate-4ms1 (workloads/)","16.66 (min 16.20, max 17.15)","20.43 (min 18.28, max 21.82)","18.07 (min 16.78, max 20.02)" + "rotate-4ms1w1 (workloads/)","16.68 (min 16.31, max 17.16)","20.58 (min 18.29, max 22.77)","18.09 (min 16.95, max 20.03)" + "rotate-4ms64 (workloads/)","16.83 (min 16.47, max 17.25)","20.60 (min 18.40, max 22.02)","18.26 (min 17.09, max 20.15)" + "rotate-4ms64w1 (workloads/)","16.82 (min 16.46, max 17.25)","20.76 (min 18.34, max 23.08)","18.28 (min 17.10, max 20.20)" + "x264-4mq (workloads/)","0.50","0.57 (min 0.56, max 0.57)","0.50 (min 0.50, max 0.51)" + "x264-4mqw1 (workloads/)","0.50","0.56 (min 0.56, max 0.57)","0.50 (min 0.50, max 0.51)" Boot-time Measurement --------------------- - Boot media: MMCSD ^^^^^^^^^^^^^^^^^ .. csv-table:: Linux boot time MMCSD - :header: "Boot Configuration","am62xx_sk-fs: Boot time in seconds: avg(min,max)","am62xxsip_sk-fs: Boot time in seconds: avg(min,max)" - - "Linux boot time from SD with default rootfs (20 boot cycles)","16.24 (min 15.96, max 16.42)","15.09 (min 14.92, max 15.32)" - + :header: "Boot Configuration","am62xx_lp_sk-fs: Boot time in seconds: avg(min,max)","am62xx_sk-fs: Boot time in seconds: avg(min,max)","am62xxsip_sk-fs: Boot time in seconds: avg(min,max)" + "Linux boot time from SD with default rootfs (20 boot cycles)","17.36 (min 15.98, max 25.46)","16.20 (min 14.74, max 22.20)","15.91 (min 14.98, max 25.80)" Boot time numbers [avg, min, max] are measured from "Starting kernel" to Linux prompt across 20 boot cycles. - - | ALSA SoC Audio Driver @@ -416,45 +384,37 @@ ALSA SoC Audio Driver #. Format - S16\_LE #. Period size - 64 - .. 
csv-table:: Audio Capture :header: "Sampling Rate (Hz)","am62xx_lp_sk-fs: Throughput (bits/sec)","am62xx_lp_sk-fs: CPU Load (%)","am62xx_sk-fs: Throughput (bits/sec)","am62xx_sk-fs: CPU Load (%)","am62xxsip_sk-fs: Throughput (bits/sec)","am62xxsip_sk-fs: CPU Load (%)" - "11025","352798.00","0.12","352799.00","0.12","352799.00","0.28" - "16000","511998.00","0.48","511999.00","0.10","512000.00","0.31" - "22050","705593.00","0.16","705596.00","0.16","705594.00","0.31" - "24000","705595.00","0.19","705598.00","0.19","705597.00","0.39" - "32000","1023993.00","0.11","1023996.00","0.11","1023997.00","0.31" - "44100","1411190.00","0.27","1411195.00","0.25","1411196.00","0.48" - "48000","1535990.00","1.02","1535994.00","0.20","1535996.00","0.38" - "88200","2822374.00","0.51","2822385.00","0.51","2822389.00","0.59" - "96000","3071972.00","0.22","3071984.00","0.19","3071987.00","0.36" - - - + "11025","352792.79 (min 352756.00, max 352798.00)","0.19 (min 0.13, max 0.67)","352798.88 (min 352798.00, max 352801.00)","0.13 (min 0.11, max 0.19)","352798.25 (min 352797.00, max 352800.00)","0.14 (min 0.11, max 0.18)" + "16000","511993.07 (min 511964.00, max 511998.00)","0.19 (min 0.11, max 0.55)","511999.38 (min 511997.00, max 512002.00)","0.11 (min 0.09, max 0.17)","511998.17 (min 511996.00, max 512002.00)","0.17 (min 0.08, max 0.33)" + "22050","705595.14 (min 705591.00, max 705613.00)","0.19 (min 0.16, max 0.24)","705594.50 (min 705591.00, max 705597.00)","0.16 (min 0.15, max 0.21)","705594.42 (min 705589.00, max 705600.00)","0.17 (min 0.14, max 0.22)" + "24000","705593.71 (min 705585.00, max 705596.00)","0.21 (min 0.18, max 0.28)","705596.75 (min 705595.00, max 705599.00)","0.19 (min 0.16, max 0.25)","705596.33 (min 705594.00, max 705600.00)","0.19 (min 0.14, max 0.25)" + "32000","1023989.36 (min 1023960.00, max 1023994.00)","0.14 (min 0.10, max 0.26)","1023996.25 (min 1023993.00, max 1023999.00)","0.12 (min 0.10, max 0.17)","1023995.50 (min 1023992.00, max 1024002.00)","0.18 (min 
0.09, max 0.75)" + "44100","1411184.36 (min 1411137.00, max 1411193.00)","0.29 (min 0.26, max 0.35)","1411195.00 (min 1411191.00, max 1411199.00)","0.26 (min 0.23, max 0.31)","1411193.67 (min 1411188.00, max 1411203.00)","0.26 (min 0.23, max 0.32)" + "48000","1535982.00 (min 1535927.00, max 1535992.00)","0.30 (min 0.11, max 1.33)","1535994.50 (min 1535990.00, max 1535999.00)","0.15 (min 0.10, max 0.26)","1535993.17 (min 1535987.00, max 1536003.00)","0.27 (min 0.10, max 0.92)" + "88200","2822360.21 (min 2822256.00, max 2822378.00)","0.52 (min 0.45, max 0.59)","2822385.38 (min 2822376.00, max 2822395.00)","0.49 (min 0.44, max 0.59)","2822380.33 (min 2822369.00, max 2822401.00)","0.48 (min 0.38, max 0.56)" + "96000","3071963.64 (min 3071875.00, max 3071978.00)","0.25 (min 0.17, max 0.50)","3071983.00 (min 3071971.00, max 3071992.00)","0.24 (min 0.19, max 0.39)","3071976.00 (min 3071954.00, max 3071998.00)","0.32 (min 0.16, max 1.26)" .. csv-table:: Audio Playback :header: "Sampling Rate (Hz)","am62xx_lp_sk-fs: Throughput (bits/sec)","am62xx_lp_sk-fs: CPU Load (%)","am62xx_sk-fs: Throughput (bits/sec)","am62xx_sk-fs: CPU Load (%)","am62xxsip_sk-fs: Throughput (bits/sec)","am62xxsip_sk-fs: CPU Load (%)" - "11025","352945.00","0.13","352946.00","0.11","352948.00","0.10" - "16000","512212.00","0.26","512213.00","0.11","512216.00","0.09" - "22050","705888.00","0.14","705892.00","0.12","705887.00","0.12" - "24000","705890.00","0.17","705893.00","0.14","705891.00","0.14" - "32000","1024421.00","0.13","1024426.00","0.10","1024425.00","0.10" - "44100","1411781.00","0.21","1411787.00","0.19","1411789.00","0.18" - "48000","1536633.00","0.22","1536639.00","0.19","","" - "88200","2823558.00","0.36","2823567.00","0.35","","" - "96000","3073259.00","0.28","3073271.00","0.22","","" - - + "11025","352945.43 (min 352945.00, max 352947.00)","0.13 (min 0.12, max 0.14)","352946.86 (min 352946.00, max 352949.00)","0.13 (min 0.09, max 0.17)","352946.13 (min 352945.00, max 352948.00)","0.19 
(min 0.09, max 0.32)" + "16000","512212.00 (min 512211.00, max 512213.00)","0.20 (min 0.11, max 0.54)","512213.29 (min 512211.00, max 512216.00)","0.13 (min 0.08, max 0.30)","512213.25 (min 512211.00, max 512216.00)","0.20 (min 0.10, max 0.31)" + "22050","705887.71 (min 705885.00, max 705892.00)","0.16 (min 0.15, max 0.17)","705888.71 (min 705885.00, max 705891.00)","0.14 (min 0.11, max 0.21)","705888.88 (min 705888.00, max 705890.00)","0.21 (min 0.12, max 0.35)" + "24000","705889.86 (min 705888.00, max 705892.00)","0.18 (min 0.17, max 0.19)","705891.57 (min 705890.00, max 705893.00)","0.17 (min 0.12, max 0.22)","705891.63 (min 705889.00, max 705894.00)","0.24 (min 0.14, max 0.37)" + "32000","1024421.71 (min 1024419.00, max 1024423.00)","0.14 (min 0.13, max 0.15)","1024424.57 (min 1024422.00, max 1024426.00)","0.13 (min 0.09, max 0.21)","1024424.25 (min 1024420.00, max 1024429.00)","0.19 (min 0.10, max 0.30)" + "44100","1411749.57 (min 1411554.00, max 1411783.00)","0.23 (min 0.21, max 0.25)","1411755.43 (min 1411579.00, max 1411787.00)","0.20 (min 0.16, max 0.26)","1411785.25 (min 1411779.00, max 1411793.00)","0.27 (min 0.18, max 0.38)" + "48000","1536632.83 (min 1536629.00, max 1536635.00)","0.26 (min 0.11, max 0.69)","1536637.57 (min 1536633.00, max 1536640.00)","0.16 (min 0.09, max 0.21)","1536636.00 (min 1536630.00, max 1536640.00)","0.29 (min 0.11, max 0.45)" + "88200","2823558.00 (min 2823550.00, max 2823562.00)","0.39 (min 0.38, max 0.42)","2823567.00 (min 2823558.00, max 2823572.00)","0.37 (min 0.32, max 0.41)","2823443.00 (min 2822703.00, max 2823573.00)","0.44 (min 0.34, max 0.58)" + "96000","3073257.40 (min 3073251.00, max 3073262.00)","0.25 (min 0.20, max 0.28)","3073268.57 (min 3073258.00, max 3073274.00)","0.22 (min 0.17, max 0.28)","3073266.57 (min 3073255.00, max 3073276.00)","0.35 (min 0.20, max 0.63)" | Graphics SGX/RGX Driver ----------------------- - - GFXBench ^^^^^^^^ Run GFXBench and capture performance reported (Score and Display rate in 
fps). All display outputs (HDMI, Displayport and/or LCD) are connected when running these tests @@ -462,12 +422,9 @@ Run GFXBench and capture performance reported (Score and Display rate in fps). A .. csv-table:: GFXBench Performance :header: "Benchmark","am62xx_lp_sk-fs: Score","am62xx_lp_sk-fs: Fps","am62xx_sk-fs: Score","am62xx_sk-fs: Fps" - " GFXBench 3.x gl_manhattan_off","80.18","1.29" - " GFXBench 3.x gl_trex_off","125.77","2.25" - " GFXBench 5.x gl_5_high_off","11.41","0.18","11.48","0.18" - - - + " GFXBench 3.x gl_manhattan_off","81.66 (min 80.20, max 82.31)","1.32 (min 1.29, max 1.33)" + " GFXBench 3.x gl_trex_off","123.00 (min 120.86, max 125.32)","2.20 (min 2.16, max 2.24)" + " GFXBench 5.x gl_5_high_off","11.20 (min 11.14, max 11.28)","0.17 (min 0.17, max 0.18)","11.76 (min 11.60, max 11.89)","0.18" Glmark2 ^^^^^^^ @@ -477,173 +434,33 @@ Run Glmark2 and capture performance reported (Score). All display outputs (HDMI, .. csv-table:: Glmark2 Performance :header: "Benchmark","am62xx_lp_sk-fs: Score","am62xx_sk-fs: Score","am62xxsip_sk-fs: Score" - "Glmark2-DRM","51.00","61.00","54.00" - "Glmark2-Wayland","199.00","217.00","210.00" - "Glmark2-Wayland 1920x1080","63.00","66.00" - - - -| - -Ethernet --------- -Ethernet performance benchmarks were measured using Netperf 2.7.1 https://hewlettpackard.github.io/netperf/doc/netperf.html -Test procedures were modeled after those defined in RFC-2544: -https://tools.ietf.org/html/rfc2544, where the DUT is the TI device -and the "tester" used was a Linux PC. To produce consistent results, -it is recommended to carry out performance tests in a private network and to avoid -running NFS on the same interface used in the test. In these results, -CPU utilization was captured as the total percentage used across all cores on the device, -while running the performance test over one external interface. - -UDP Throughput (0% loss) was measured by the procedure defined in RFC-2544 section 26.1: Throughput. 
-In this scenario, netperf options burst_size (-b) and wait_time (-w) are used to limit bandwidth -during different trials of the test, with the goal of finding the highest rate at which -no loss is seen. For example, to limit bandwidth to 500Mbits/sec with 1472B datagram: - -:: - - burst_size = / 8 (bits -> bytes) / / 100 (seconds -> 10 ms) - burst_size = 500000000 / 8 / 1472 / 100 = 425 - - wait_time = 10 milliseconds (minimum supported by Linux PC used for testing) - -UDP Throughput (possible loss) was measured by capturing throughput and packet loss statistics when -running the netperf test with no bandwidth limit (remove -b/-w options). - -In order to start a netperf client on one device, the other device must have netserver running. -To start netserver: - -:: - - netserver [-p ] [-4 (IPv4 addressing)] [-6 (IPv6 addressing)] - -Running the following shell script from the DUT will trigger netperf clients to measure -bidirectional TCP performance for 60 seconds and report CPU utilization. Parameter -k is used in -client commands to summarize selected statistics on their own line and -j is used to gain -additional timing measurements during the test. - -:: - - #!/bin/bash - for i in 1 - do - netperf -H -j -c -l 60 -t TCP_STREAM -- - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE & - - netperf -H -j -c -l 60 -t TCP_MAERTS -- - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE & - done - -Running the following commands will trigger netperf clients to measure UDP burst performance for -60 seconds at various burst/datagram sizes and report CPU utilization. - -- For UDP egress tests, run netperf client from DUT and start netserver on tester. 
- -:: - - netperf -H -j -c -l 60 -t UDP_STREAM -b -w -- -m - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE - -- For UDP ingress tests, run netperf client from tester and start netserver on DUT. - -:: - - netperf -H -j -C -l 60 -t UDP_STREAM -b -w -- -m - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE - - -CPSW/CPSW2g/CPSW3g Ethernet Driver -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -- CPSW3g: AM64x, AM62x, AM62ax, AM62px - - -.. rubric:: TCP Bidirectional Throughput - :name: CPSW2g-tcp-bidirectional-throughput - -.. csv-table:: CPSW2g TCP Bidirectional Throughput - :header: "Command Used","am62xx_lp_sk-fs: THROUGHPUT (Mbits/sec)","am62xx_lp_sk-fs: CPU Load % (LOCAL_CPU_UTIL)","am62xx_sk-fs: THROUGHPUT (Mbits/sec)","am62xx_sk-fs: CPU Load % (LOCAL_CPU_UTIL)","am62xxsip_sk-fs: THROUGHPUT (Mbits/sec)","am62xxsip_sk-fs: CPU Load % (LOCAL_CPU_UTIL)" - - "netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_STREAM; netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_MAERTS","1685.26","64.99","1767.54","66.70","1647.55","62.58" - - - - -.. rubric:: TCP Bidirectional Throughput Interrupt Pacing - :name: CPSW2g-tcp-bidirectional-throughput-interrupt-pacing - -.. csv-table:: CPSW2g TCP Bidirectional Throughput Interrupt Pacing - :header: "Command Used","am62xx_lp_sk-fs: THROUGHPUT (Mbits/sec)","am62xx_lp_sk-fs: CPU Load % (LOCAL_CPU_UTIL)","am62xx_sk-fs: THROUGHPUT (Mbits/sec)","am62xx_sk-fs: CPU Load % (LOCAL_CPU_UTIL)","am62xxsip_sk-fs: THROUGHPUT (Mbits/sec)","am62xxsip_sk-fs: CPU Load % (LOCAL_CPU_UTIL)" - - "netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_STREAM; netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_MAERTS","326.74","11.98","1586.14","47.14","1807.73","48.75" - - - - -.. rubric:: UDP Throughput - :name: CPSW2g-udp-throughput-0-loss - -.. 
csv-table:: CPSW2g UDP Egress Throughput 0 loss - :header: "Frame Size(bytes)","am62xx_lp_sk-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62xx_lp_sk-fs: THROUGHPUT (Mbits/sec)","am62xx_lp_sk-fs: Packets Per Second (kPPS)","am62xx_lp_sk-fs: CPU Load % (LOCAL_CPU_UTIL)","am62xx_sk-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62xx_sk-fs: THROUGHPUT (Mbits/sec)","am62xx_sk-fs: Packets Per Second (kPPS)","am62xx_sk-fs: CPU Load % (LOCAL_CPU_UTIL)","am62xxsip_sk-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62xxsip_sk-fs: THROUGHPUT (Mbits/sec)","am62xxsip_sk-fs: Packets Per Second (kPPS)","am62xxsip_sk-fs: CPU Load % (LOCAL_CPU_UTIL)" - - "64","18.00","40.95","80.00","37.35","18.00","18.74","37.00","10.12","","48.25","94.00","39.37" - "128","82.00","89.57","87.00","38.47","82.00","99.23","97.00","38.69","","97.04","95.00","26.11" - "256","210.00","175.06","85.00","38.18","210.00","198.56","97.00","38.59","","179.37","88.00","38.40" - "1024","978.00","363.71","44.00","21.25","978.00","785.68","96.00","38.33","","708.67","87.00","38.11" - "1518","1472.00","183.19","15.00","10.59","1472.00","770.81","63.00","36.09","","706.43","58.00","35.94" - - - - -.. 
csv-table:: CPSW2g UDP Ingress Throughput 0 loss - :header: "Frame Size(bytes)","am62xx_lp_sk-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62xx_lp_sk-fs: THROUGHPUT (Mbits/sec)","am62xx_lp_sk-fs: Packets Per Second (kPPS)","am62xx_lp_sk-fs: CPU Load % (LOCAL_CPU_UTIL)","am62xx_sk-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62xx_sk-fs: THROUGHPUT (Mbits/sec)","am62xx_sk-fs: Packets Per Second (kPPS)","am62xx_sk-fs: CPU Load % (LOCAL_CPU_UTIL)","am62xxsip_sk-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62xxsip_sk-fs: THROUGHPUT (Mbits/sec)","am62xxsip_sk-fs: Packets Per Second (kPPS)","am62xxsip_sk-fs: CPU Load % (LOCAL_CPU_UTIL)" - - "64","","3.38","7.00","1.44","","3.07","6.00","3.06","","2.92","6.00","0.97" - "128","82.00","6.76","7.00","1.28","82.00","7.58","7.00","2.11","","7.17","7.00","1.63" - "256","210.00","15.77","8.00","4.60","210.00","15.36","8.00","2.22","","15.16","7.00","2.19" - "1024","978.00","60.62","7.00","2.80","978.00","61.44","8.00","1.82","","61.44","8.00","4.89" - "1518","1472.00","38.86","3.00","2.09","1472.00","2.43","0.00","0.59" - - - - -.. 
csv-table:: CPSW2g UDP Ingress Throughput possible loss - :header: "Frame Size(bytes)","am62xx_lp_sk-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62xx_lp_sk-fs: THROUGHPUT (Mbits/sec)","am62xx_lp_sk-fs: Packets Per Second (kPPS)","am62xx_lp_sk-fs: CPU Load % (LOCAL_CPU_UTIL)","am62xx_lp_sk-fs: Packet Loss %","am62xx_sk-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62xx_sk-fs: THROUGHPUT (Mbits/sec)","am62xx_sk-fs: Packets Per Second (kPPS)","am62xx_sk-fs: CPU Load % (LOCAL_CPU_UTIL)","am62xx_sk-fs: Packet Loss %","am62xxsip_sk-fs: UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am62xxsip_sk-fs: THROUGHPUT (Mbits/sec)","am62xxsip_sk-fs: Packets Per Second (kPPS)","am62xxsip_sk-fs: CPU Load % (LOCAL_CPU_UTIL)","am62xxsip_sk-fs: Packet Loss %" - - "64","","71.78","140.00","65.81","74.13","","97.99","191.00","40.57","61.06","","92.95","182.00","42.37","75.92" - "128","82.00","173.15","169.00","45.12","65.86","82.00","193.99","189.00","41.95","67.47","","183.40","179.00","43.96","71.84" - "256","210.00","271.82","133.00","41.55","0.42","210.00","357.95","175.00","41.46","52.51","","324.57","158.00","43.50","58.28" - "1024","978.00","939.00","115.00","44.49","0.03","978.00","904.64","110.00","42.08","0.38","","738.20","90.00","41.83","0.55" - "1518","1472.00","13.16","1.00","20.85","97.98","1472.00","3.90","0.00","24.85","99.58" - - + "Glmark2-DRM","59.00 (min 51.00, max 70.00)","61.00","54.00" + "Glmark2-Wayland","199.00 (min 198.00, max 203.00)","216.00","208.75 (min 208.00, max 209.00)" + "Glmark2-Wayland 1920x1080","62.57 (min 62.00, max 63.00)","66.29 (min 66.00, max 67.00)" | Linux OSPI Flash Driver ----------------------- +.. rubric:: AM62XX-SK + :name: am62xx-sk-ospi-flash-driver -AM62XX-SK -^^^^^^^^^ - - -RAW -""" +.. rubric:: RAW + :name: am62xx-sk-ospi-raw .. csv-table:: OSPI Raw Flash Driver :header: "File size (Mbytes)","am62xx_sk-fs: Raw Read Throughput (Mbytes/sec)" - "50","172.41" + "50","170.77 (min 166.67, max 172.41)" +.. 
rubric:: RAW + :name: am62xx-sk-lp-ospi-raw .. csv-table:: OSPI Raw Flash Driver :header: "File size (Mbytes)","am62xx_lp_sk-fs: Raw Read Throughput (Mbytes/sec)" - "50","29.07" - - + "50","29.24 (min 28.73, max 29.59)" EMMC Driver ----------- @@ -655,141 +472,113 @@ EMMC Driver sensitive applications, umount the auto-mounted filesystem and re-mount in async mode. - - EMMC EXT4 FIO 1G ^^^^^^^^^^^^^^^^ - .. csv-table:: EMMC EXT4 FIO 1G :header: "Buffer size (bytes)","am62xx_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62xx_sk-fs: Write EXT4 CPU Load (%)","am62xx_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62xx_sk-fs: Read EXT4 CPU Load (%)" - "1m","44.60","1.43","174.00","2.30" - "4m","44.90","1.06","174.00","1.70" - "4k","5.32","2.19","36.40","10.09" - "256k","35.40","1.49","173.00","2.84" - - + "1m","55.21 (min 43.80, max 90.90)","1.48 (min 1.08, max 2.52)","174.00 (min 171.00, max 175.00)","2.05 (min 1.79, max 2.27)" + "4m","56.05 (min 43.70, max 96.40)","1.11 (min 0.80, max 1.78)","174.00 (min 171.00, max 175.00)","1.65 (min 1.46, max 1.87)" + "4k","29.97 (min 5.31, max 63.60)","10.46 (min 2.06, max 22.72)","50.86 (min 36.30, max 93.30)","13.38 (min 9.65, max 23.05)" + "256k","50.74 (min 35.00, max 91.30)","1.69 (min 1.11, max 2.90)","173.63 (min 171.00, max 174.00)","2.68 (min 2.25, max 2.96)" .. 
csv-table:: EMMC EXT4 FIO 1G :header: "Buffer size (bytes)","am62xx_lp_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Write EXT4 CPU Load (%)","am62xx_lp_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Read EXT4 CPU Load (%)" - "1m","61.50","1.99","175.00","2.30" - "4m","61.70","1.33","175.00","1.97" - "4k","51.40","19.45","56.80","16.71" - "256k","61.60","2.33","174.00","3.23" + "1m","49.95 (min 42.90, max 58.90)","1.58 (min 1.28, max 1.85)","174.50 (min 174.00, max 175.00)","2.37 (min 1.96, max 2.55)" + "4m","49.89 (min 43.10, max 58.90)","1.27 (min 0.98, max 1.86)","174.70 (min 174.00, max 175.00)","1.91 (min 1.63, max 2.35)" + "4k","23.80 (min 5.24, max 51.70)","9.27 (min 2.38, max 19.72)","44.31 (min 36.40, max 56.30)","13.52 (min 11.10, max 16.93)" + "256k","44.37 (min 34.20, max 58.80)","1.75 (min 1.31, max 2.31)","174.00","3.09 (min 2.66, max 3.23)" +.. csv-table:: EMMC EXT4 FIO 1G + :header: "Buffer size (bytes)","am62xxsip_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62xxsip_sk-fs: Write EXT4 CPU Load (%)","am62xxsip_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62xxsip_sk-fs: Read EXT4 CPU Load (%)" + "1m","92.76 (min 91.00, max 95.90)","2.53 (min 2.25, max 2.94)","171.75 (min 171.00, max 174.00)","2.55 (min 2.22, max 2.87)" + "4m","96.81 (min 92.20, max 98.00)","2.27 (min 2.05, max 2.53)","165.75 (min 141.00, max 173.00)","2.53 (min 2.11, max 2.84)" + "4k","64.16 (min 63.70, max 64.50)","24.79 (min 24.52, max 25.21)","92.38 (min 91.60, max 92.80)","24.06 (min 23.88, max 24.22)" + "256k","91.96 (min 91.00, max 92.80)","2.63 (min 2.38, max 2.93)","171.00 (min 170.00, max 173.00)","2.92 (min 2.64, max 3.14)" EMMC EXT4 ^^^^^^^^^ - .. 
csv-table:: EMMC EXT4 :header: "Buffer size (bytes)","am62xx_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62xx_sk-fs: Write EXT4 CPU Load (%)","am62xx_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62xx_sk-fs: Read EXT4 CPU Load (%)" - "102400","51.83 (min 49.52, max 52.61)","5.03 (min 4.49, max 6.52)","177.99","13.56" - "262144","50.97 (min 48.59, max 51.96)","5.21 (min 4.57, max 6.73)","181.94","14.16" - "524288","50.87 (min 48.19, max 51.68)","5.79 (min 4.94, max 7.10)","182.94","15.35" - "1048576","51.33 (min 48.92, max 52.08)","5.32 (min 4.73, max 6.67)","182.83","15.72" - "5242880","51.15 (min 49.02, max 51.80)","5.18 (min 4.59, max 6.56)","181.99","15.65" - - + "102400","47.27 (min 39.38, max 68.59)","4.63 (min 3.08, max 8.55)","172.03 (min 142.58, max 179.51)","12.04 (min 10.43, max 14.23)" + "262144","46.33 (min 39.08, max 69.36)","4.62 (min 3.09, max 8.92)","171.71 (min 98.67, max 183.00)","12.59 (min 5.84, max 14.54)" + "524288","46.07 (min 39.39, max 69.29)","4.66 (min 3.27, max 8.86)","176.20 (min 132.59, max 182.99)","12.90 (min 9.65, max 14.54)" + "1048576","45.97 (min 38.94, max 67.84)","4.48 (min 3.09, max 8.61)","177.23 (min 139.09, max 182.88)","13.66 (min 10.74, max 15.35)" + "5242880","46.19 (min 39.09, max 68.52)","4.48 (min 2.89, max 8.63)","176.56 (min 136.16, max 182.81)","13.55 (min 11.04, max 15.65)" .. 
csv-table:: EMMC EXT4 :header: "Buffer size (bytes)","am62xx_lp_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Write EXT4 CPU Load (%)","am62xx_lp_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Read EXT4 CPU Load (%)" - "102400","51.16 (min 48.23, max 52.47)","5.88 (min 5.39, max 7.27)","176.55","13.73" - "262144","49.96 (min 47.07, max 50.94)","5.98 (min 5.45, max 7.53)","180.51","15.04" - "524288","49.88 (min 47.07, max 50.91)","6.06 (min 5.47, max 7.62)","182.72","17.03" - "1048576","50.54 (min 47.88, max 51.64)","5.91 (min 5.45, max 7.31)","182.53","16.81" - "5242880","50.27 (min 47.13, max 51.35)","5.73 (min 5.24, max 7.20)","181.68","17.11" - - - - -EMMC EXT2 -^^^^^^^^^ - - -.. csv-table:: EMMC EXT2 - :header: "Buffer size (bytes)","am62xx_sk-fs: Write EXT2 Throughput (Mbytes/sec)","am62xx_sk-fs: Write EXT2 CPU Load (%)","am62xx_sk-fs: Read EXT2 Throughput (Mbytes/sec)","am62xx_sk-fs: Read EXT2 CPU Load (%)" - - "102400","39.34 (min 35.40, max 40.46)","4.49 (min 3.94, max 6.48)","174.99","12.45" - "262144","40.53 (min 36.16, max 41.74)","4.57 (min 3.80, max 6.57)","177.47","15.45" - "524288","40.11 (min 35.88, max 41.23)","4.54 (min 3.93, max 6.59)","178.47","14.59" - "1048576","40.30 (min 36.06, max 41.48)","4.49 (min 3.86, max 6.46)","177.97","14.66" - "5242880","40.32 (min 35.99, max 41.47)","4.52 (min 3.85, max 6.69)","177.38","14.96" - - - -.. 
csv-table:: EMMC EXT2 - :header: "Buffer size (bytes)","am62xx_lp_sk-fs: Write EXT2 Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Write EXT2 CPU Load (%)","am62xx_lp_sk-fs: Read EXT2 Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Read EXT2 CPU Load (%)" - - "102400","50.92 (min 43.73, max 52.79)","6.83 (min 5.89, max 9.41)","173.27","13.56" - "262144","50.82 (min 43.46, max 52.86)","6.61 (min 5.74, max 9.33)","177.56","16.88" - "524288","50.63 (min 43.23, max 52.92)","6.74 (min 5.62, max 9.18)","176.84","16.74" - "1048576","50.67 (min 43.58, max 52.56)","6.62 (min 5.64, max 9.44)","177.34","17.17" - "5242880","50.70 (min 42.92, max 53.20)","6.46 (min 5.52, max 9.29)","177.49","17.45" - + "102400","46.20 (min 39.42, max 53.63)","5.41 (min 3.80, max 7.72)","175.55 (min 167.93, max 177.22)","14.04 (min 13.30, max 14.77)" + "262144","45.84 (min 39.01, max 52.84)","5.56 (min 4.45, max 7.78)","180.66 (min 180.04, max 181.28)","16.55 (min 15.93, max 17.83)" + "524288","45.78 (min 39.45, max 52.65)","5.57 (min 4.50, max 7.95)","182.34 (min 181.72, max 182.77)","17.30 (min 16.67, max 18.26)" + "1048576","45.98 (min 39.10, max 53.29)","5.48 (min 4.24, max 7.77)","181.96 (min 181.42, max 182.45)","17.45 (min 16.74, max 19.48)" + "5242880","46.10 (min 39.39, max 52.97)","5.41 (min 4.42, max 7.81)","181.51 (min 180.56, max 182.12)","17.27 (min 16.37, max 18.26)" +.. 
csv-table:: EMMC EXT4 + :header: "Buffer size (bytes)","am62xxsip_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62xxsip_sk-fs: Write EXT4 CPU Load (%)","am62xxsip_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62xxsip_sk-fs: Read EXT4 CPU Load (%)" + "102400","92.90 (min 35.38, max 100.03)","12.70 (min 5.91, max 26.68)","178.51 (min 178.00, max 178.87)","12.36 (min 10.82, max 14.41)" + "262144","78.13 (min 30.00, max 97.55)","7.26 (min 2.26, max 17.43)","180.57 (min 180.08, max 181.05)","13.93 (min 12.66, max 15.42)" + "524288","77.25 (min 32.87, max 96.72)","6.82 (min 2.00, max 12.76)","181.08 (min 179.75, max 181.56)","14.21 (min 12.61, max 16.81)" + "1048576","75.27 (min 32.45, max 97.43)","6.62 (min 2.05, max 12.64)","181.08 (min 180.11, max 181.60)","13.54 (min 12.28, max 16.67)" + "5242880","73.92 (min 28.97, max 96.92)","6.62 (min 2.03, max 13.75)","180.86 (min 179.21, max 181.48)","13.65 (min 12.55, max 15.95)" EMMC VFAT ^^^^^^^^^ - .. csv-table:: EMMC VFAT :header: "Buffer size (bytes)","am62xx_sk-fs: Write VFAT Throughput (Mbytes/sec)","am62xx_sk-fs: Write VFAT CPU Load (%)","am62xx_sk-fs: Read VFAT Throughput (Mbytes/sec)","am62xx_sk-fs: Read VFAT CPU Load (%)" - "102400","47.06 (min 41.03, max 48.78)","6.33 (min 5.66, max 8.51)","169.15","13.77" - "262144","48.92 (min 42.39, max 50.79)","6.86 (min 6.18, max 9.11)","169.46","15.16" - "524288","48.17 (min 41.79, max 49.95)","6.59 (min 5.95, max 8.88)","169.19","15.32" - "1048576","48.61 (min 42.40, max 50.41)","6.61 (min 5.84, max 9.10)","168.56","14.29" - "5242880","48.94 (min 42.48, max 50.83)","6.65 (min 5.99, max 8.93)","168.66","14.98" - - - + "102400","41.99 (min 33.56, max 50.47)","5.63 (min 3.71, max 8.96)","168.88 (min 167.46, max 171.01)","12.46 (min 11.43, max 13.47)" + "262144","43.21 (min 34.82, max 51.89)","5.89 (min 4.06, max 8.84)","170.74 (min 170.03, max 172.53)","14.81 (min 12.50, max 15.98)" + "524288","43.26 (min 34.68, max 51.97)","5.92 (min 3.98, max 9.32)","169.14 (min 168.50, max 
170.91)","14.50 (min 12.65, max 15.66)" + "1048576","43.40 (min 35.02, max 52.21)","5.83 (min 3.98, max 9.22)","168.62 (min 167.68, max 169.36)","14.54 (min 12.60, max 15.73)" + "5242880","43.37 (min 34.99, max 52.13)","5.80 (min 3.91, max 9.17)","168.87 (min 168.10, max 170.34)","14.71 (min 11.93, max 16.06)" .. csv-table:: EMMC VFAT :header: "Buffer size (bytes)","am62xx_lp_sk-fs: Write VFAT Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Write VFAT CPU Load (%)","am62xx_lp_sk-fs: Read VFAT Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Read VFAT CPU Load (%)" - "102400","46.05 (min 39.74, max 47.77)","6.88 (min 5.82, max 9.39)","168.34","14.29" - "262144","47.61 (min 40.82, max 49.71)","7.33 (min 6.35, max 10.21)","169.78","17.89" - "524288","47.73 (min 40.99, max 49.58)","7.30 (min 6.47, max 9.78)","168.38","18.25" - "1048576","47.70 (min 41.07, max 49.70)","7.31 (min 6.53, max 9.81)","168.33","17.67" - "5242880","47.80 (min 40.93, max 49.80)","7.16 (min 6.26, max 9.67)","167.94","16.87" - + "102400","40.98 (min 31.93, max 49.66)","6.24 (min 4.49, max 9.95)","167.36 (min 165.22, max 169.10)","14.86 (min 13.22, max 16.27)" + "262144","42.56 (min 33.32, max 51.62)","6.69 (min 4.94, max 10.29)","169.22 (min 167.97, max 170.23)","17.21 (min 15.42, max 18.22)" + "524288","42.57 (min 33.42, max 51.68)","6.73 (min 5.00, max 10.84)","167.98 (min 167.06, max 168.70)","16.59 (min 15.51, max 17.67)" + "1048576","42.66 (min 33.48, max 51.79)","6.55 (min 4.89, max 9.98)","167.73 (min 167.03, max 168.46)","16.94 (min 15.85, max 17.74)" + "5242880","42.78 (min 33.53, max 52.13)","6.57 (min 4.94, max 10.26)","167.31 (min 166.74, max 168.09)","16.85 (min 15.73, max 17.93)" +.. 
csv-table:: EMMC VFAT + :header: "Buffer size (bytes)","am62xxsip_sk-fs: Write VFAT Throughput (Mbytes/sec)","am62xxsip_sk-fs: Write VFAT CPU Load (%)","am62xxsip_sk-fs: Read VFAT Throughput (Mbytes/sec)","am62xxsip_sk-fs: Read VFAT CPU Load (%)" + "102400","80.24 (min 45.77, max 96.90)","16.11 (min 5.36, max 29.32)","174.50 (min 173.84, max 174.86)","12.42 (min 10.59, max 15.29)" + "262144","73.99 (min 51.85, max 96.56)","7.98 (min 4.06, max 15.38)","175.43 (min 175.16, max 175.60)","13.91 (min 12.71, max 17.08)" + "524288","72.90 (min 49.94, max 96.87)","7.76 (min 3.53, max 14.31)","174.89 (min 174.56, max 175.13)","13.82 (min 12.97, max 15.90)" + "1048576","74.90 (min 49.90, max 96.59)","8.42 (min 4.81, max 15.75)","174.62 (min 174.19, max 174.99)","13.74 (min 12.66, max 16.60)" + "5242880","75.79 (min 49.91, max 96.31)","8.88 (min 4.68, max 13.65)","174.76 (min 174.11, max 175.19)","13.69 (min 12.61, max 15.61)" UBoot EMMC Driver ----------------- - .. csv-table:: UBOOT EMMC RAW :header: "File size (bytes in hex)","am62xx_sk-fs: Write Throughput (Kbytes/sec)","am62xx_sk-fs: Read Throughput (Kbytes/sec)" - "2000000","99296.97","171560.21" - "4000000","97523.81","175229.95" - - - + "2000000","53539.31 (min 13727.69, max 61134.33)","170336.22 (min 169782.38, max 171560.21)" + "4000000","64033.22 (min 58514.29, max 95533.53)","172287.23 (min 164663.32, max 173835.54)" .. csv-table:: UBOOT EMMC RAW :header: "File size (bytes in hex)","am62xx_lp_sk-fs: Write Throughput (Kbytes/sec)","am62xx_lp_sk-fs: Read Throughput (Kbytes/sec)" - "2000000","57588.75","169782.38" - "4000000","57893.99","173375.66" - + "2000000","60091.96 (min 57186.74, max 62178.37)","170371.91 (min 169782.38, max 170666.67)" + "4000000","61147.19 (min 57893.99, max 62415.24)","165622.92 (min 100824.62, max 174297.87)" .. 
csv-table:: UBOOT EMMC RAW :header: "File size (bytes in hex)","am62xxsip_sk-fs: Write Throughput (Kbytes/sec)","am62xxsip_sk-fs: Read Throughput (Kbytes/sec)" - "2000000","47627.91","91275.77" - "4000000","52261.56","92434.41" - - + "2000000","86450.84 (min 13914.23, max 97523.81)","163230.55 (min 141852.81, max 172463.16)" + "4000000","98727.53 (min 96234.95, max 101448.92)","173236.44 (min 158682.81, max 175229.95)" MMCSD ----- @@ -802,307 +591,188 @@ MMCSD sensitive applications, umount the auto-mounted filesystem and re-mount in async mode. - MMC EXT4 FIO 1G ^^^^^^^^^^^^^^^ - .. csv-table:: MMC EXT4 FIO 1G :header: "Buffer size (bytes)","am62xx_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62xx_sk-fs: Write EXT4 CPU Load (%)","am62xx_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62xx_sk-fs: Read EXT4 CPU Load (%)" - "1m","42.70","1.44","87.30","1.53" - "4m","41.60","1.07","87.20","1.24" - "4k","2.77","1.78","13.00","4.45" - "256k","37.60","1.72","83.70","1.79" - - - + "1m","42.31 (min 40.80, max 43.60)","1.53 (min 1.24, max 1.69)","87.53 (min 87.30, max 88.20)","1.59 (min 1.34, max 1.72)" + "4m","41.66 (min 40.40, max 42.40)","1.03 (min 0.92, max 1.11)","86.67 (min 82.60, max 87.50)","1.19 (min 0.94, max 1.27)" + "4k","2.79 (min 2.76, max 2.83)","1.88 (min 1.71, max 1.99)","12.93 (min 12.80, max 13.00)","4.47 (min 4.27, max 4.71)" + "256k","38.07 (min 36.30, max 39.10)","1.70 (min 1.40, max 1.85)","83.87 (min 83.60, max 84.30)","1.75 (min 1.60, max 1.87)" .. 
csv-table:: MMC EXT4 FIO 1G :header: "Buffer size (bytes)","am62xx_lp_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Write EXT4 CPU Load (%)","am62xx_lp_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Read EXT4 CPU Load (%)" - "1m","42.60","1.57","87.20","1.56" - "4m","42.20","1.07","87.30","1.13" - "4k","2.77","1.99","12.90","5.04" - "256k","38.60","1.70","84.00","1.88" - - - + "1m","42.51 (min 41.90, max 43.60)","1.66 (min 1.59, max 1.74)","87.04 (min 84.90, max 87.40)","1.74 (min 1.66, max 1.87)" + "4m","42.10 (min 40.70, max 43.20)","1.16 (min 1.07, max 1.25)","86.80 (min 84.20, max 87.40)","1.27 (min 1.22, max 1.31)" + "4k","2.79 (min 2.76, max 2.84)","2.12 (min 1.97, max 2.26)","12.90 (min 12.80, max 13.00)","4.96 (min 4.77, max 5.13)" + "256k","37.40 (min 36.10, max 38.50)","1.83 (min 1.64, max 1.93)","83.70 (min 83.30, max 84.30)","1.99 (min 1.87, max 2.06)" .. csv-table:: MMC EXT4 FIO 1G :header: "Buffer size (bytes)","am62xxsip_sk-fs: Write EXT4 Throughput (Mbytes/sec)","am62xxsip_sk-fs: Write EXT4 CPU Load (%)","am62xxsip_sk-fs: Read EXT4 Throughput (Mbytes/sec)","am62xxsip_sk-fs: Read EXT4 CPU Load (%)" - "1m","42.40","1.97","87.30","1.86" - "4m","40.70","1.40","87.00","1.79" - "4k","2.77","2.14","13.20","4.98" - "256k","37.80","1.90","83.40","1.90" - + "1m","39.39 (min 18.80, max 42.80)","1.61 (min 1.16, max 1.88)","87.29 (min 86.60, max 87.70)","1.91 (min 1.67, max 2.13)" + "4m","38.44 (min 18.60, max 42.50)","1.34 (min 0.85, max 1.57)","87.00 (min 86.20, max 87.30)","1.78 (min 1.37, max 2.02)" + "4k","2.96 (min 2.77, max 4.18)","2.17 (min 2.04, max 2.73)","13.00 (min 12.90, max 13.50)","4.93 (min 4.70, max 5.20)" + "256k","35.65 (min 17.70, max 39.60)","1.69 (min 1.15, max 1.92)","83.46 (min 82.20, max 84.00)","1.91 (min 1.68, max 2.08)" MMC EXT4 ^^^^^^^^ - .. 
csv-table:: MMC EXT4 :header: "Buffer size (bytes)","am62xx_sk-fs: Write Raw Throughput (Mbytes/sec)","am62xx_sk-fs: Write Raw CPU Load (%)","am62xx_sk-fs: Read Raw Throughput (Mbytes/sec)","am62xx_sk-fs: Read Raw CPU Load (%)" - "102400","10.57 (min 10.49, max 10.60)","1.19 (min 1.06, max 1.45)","11.06","1.08" - "262144","10.30 (min 9.97, max 10.61)","1.24 (min 1.10, max 1.54)","10.78","1.03" - "524288","10.31 (min 10.18, max 10.46)","1.18 (min 1.02, max 1.55)","11.44","1.01" - "1048576","10.35 (min 10.23, max 10.63)","1.22 (min 1.03, max 1.52)","11.44","1.12" - "5242880","10.55 (min 10.41, max 10.77)","1.20 (min 1.09, max 1.54)","10.95","1.05" - - - + "102400","10.57 (min 10.18, max 10.82)","1.12 (min 0.89, max 1.52)","11.02 (min 10.86, max 11.09)","0.96 (min 0.85, max 1.08)" + "262144","10.35 (min 10.13, max 10.84)","1.14 (min 0.84, max 1.65)","11.11 (min 11.00, max 11.22)","1.02 (min 0.80, max 1.22)" + "524288","10.30 (min 10.10, max 10.73)","1.12 (min 0.85, max 1.59)","11.16 (min 10.82, max 11.45)","0.99 (min 0.85, max 1.18)" + "1048576","10.35 (min 10.17, max 10.78)","1.16 (min 0.86, max 1.73)","11.14 (min 10.98, max 11.52)","0.97 (min 0.82, max 1.08)" + "5242880","10.37 (min 10.13, max 10.71)","1.08 (min 0.84, max 1.58)","11.79 (min 11.23, max 12.02)","1.02 (min 0.80, max 1.20)" .. 
csv-table:: MMC EXT4 :header: "Buffer size (bytes)","am62xx_lp_sk-fs: Write Raw Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Write Raw CPU Load (%)","am62xx_lp_sk-fs: Read Raw Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Read Raw CPU Load (%)" - "102400","10.58 (min 10.19, max 10.92)","1.36 (min 1.22, max 1.63)","11.78","1.10" - "262144","10.12 (min 10.10, max 10.15)","1.42 (min 1.23, max 1.76)","10.95","1.18" - "524288","10.17 (min 10.10, max 10.23)","1.37 (min 1.17, max 1.66)","11.06","1.19" - "1048576","10.20 (min 10.14, max 10.30)","1.38 (min 1.21, max 1.70)","11.05","1.21" - "5242880","10.19 (min 10.16, max 10.28)","1.32 (min 1.14, max 1.81)","11.52","1.13" - - - + "102400","10.53 (min 10.22, max 10.94)","1.33 (min 1.09, max 1.74)","10.99 (min 10.62, max 11.80)","1.05 (min 0.98, max 1.14)" + "262144","10.33 (min 10.09, max 10.82)","1.37 (min 1.18, max 1.97)","11.06 (min 10.73, max 11.21)","1.22 (min 1.08, max 1.31)" + "524288","10.31 (min 10.10, max 10.74)","1.34 (min 1.12, max 1.80)","11.16 (min 11.05, max 11.50)","1.15 (min 1.08, max 1.26)" + "1048576","10.32 (min 10.08, max 10.72)","1.41 (min 1.15, max 1.81)","11.20 (min 10.84, max 11.50)","1.16 (min 1.09, max 1.25)" + "5242880","10.41 (min 10.15, max 10.69)","1.31 (min 1.11, max 1.92)","11.88 (min 11.50, max 12.02)","1.20 (min 1.10, max 1.26)" .. 
csv-table:: MMC EXT4 :header: "Buffer size (bytes)","am62xxsip_sk-fs: Write Raw Throughput (Mbytes/sec)","am62xxsip_sk-fs: Write Raw CPU Load (%)","am62xxsip_sk-fs: Read Raw Throughput (Mbytes/sec)","am62xxsip_sk-fs: Read Raw CPU Load (%)" - "102400","10.51 (min 10.47, max 10.57)","1.40 (min 1.06, max 2.18)","10.87","1.19" - "262144","10.59 (min 10.55, max 10.63)","1.13 (min 0.99, max 1.49)","11.19","1.15" - "524288","10.71 (min 10.54, max 10.82)","1.02 (min 0.92, max 1.16)","11.01","1.08" - "1048576","10.61 (min 10.25, max 10.81)","1.16 (min 1.11, max 1.33)","10.83","1.16" - "5242880","11.04 (min 10.55, max 11.30)","1.11 (min 0.95, max 1.29)","12.02","1.12" - - -MMC EXT3 -^^^^^^^^ - - -.. csv-table:: MMC EXT3 - :header: "Buffer size (bytes)","am62xx_sk-fs: Write Raw Throughput (Mbytes/sec)","am62xx_sk-fs: Write Raw CPU Load (%)","am62xx_sk-fs: Read Raw Throughput (Mbytes/sec)","am62xx_sk-fs: Read Raw CPU Load (%)" - - "102400","36.77 (min 32.06, max 38.32)","4.58 (min 3.89, max 6.66)","79.49","6.11" - "262144","34.68 (min 31.54, max 35.94)","4.19 (min 3.63, max 6.25)","85.12","7.36" - "524288","34.44 (min 29.06, max 36.66)","4.13 (min 3.68, max 5.76)","89.51","7.51" - "1048576","34.73 (min 30.73, max 36.01)","4.02 (min 3.28, max 5.95)","89.59","7.73" - "5242880","38.45 (min 34.26, max 40.01)","4.49 (min 3.77, max 6.55)","84.49","8.22" - - - - -.. 
csv-table:: MMC EXT3 - :header: "Buffer size (bytes)","am62xx_lp_sk-fs: Write Raw Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Write Raw CPU Load (%)","am62xx_lp_sk-fs: Read Raw Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Read Raw CPU Load (%)" - - "102400","35.99 (min 31.77, max 37.53)","5.11 (min 4.33, max 7.44)","79.52","6.86" - "262144","33.79 (min 30.12, max 34.90)","4.95 (min 3.92, max 7.10)","84.64","9.05" - "524288","34.60 (min 30.25, max 35.84)","4.67 (min 3.92, max 7.00)","89.40","8.76" - "1048576","34.20 (min 29.86, max 35.48)","4.64 (min 3.71, max 6.63)","84.61","8.69" - "5242880","34.30 (min 30.30, max 35.96)","4.52 (min 3.81, max 6.73)","88.98","8.53" - - - - -.. csv-table:: MMC EXT3 - :header: "Buffer size (bytes)","am62xxsip_sk-fs: Write Raw Throughput (Mbytes/sec)","am62xxsip_sk-fs: Write Raw CPU Load (%)","am62xxsip_sk-fs: Read Raw Throughput (Mbytes/sec)","am62xxsip_sk-fs: Read Raw CPU Load (%)" - - "102400","35.61 (min 27.97, max 40.71)","5.54 (min 2.82, max 9.13)","79.32","6.99" - "262144","41.13 (min 40.19, max 42.21)","5.30 (min 2.86, max 8.60)","85.39","7.99" - "524288","42.68 (min 41.84, max 43.27)","4.09 (min 2.83, max 7.93)","84.63","7.74" - "1048576","42.30 (min 40.04, max 43.70)","3.76 (min 2.77, max 7.16)","89.59","8.72" - "5242880","42.01 (min 41.13, max 43.09)","3.97 (min 2.62, max 8.43)","89.58","8.33" - - - -MMC EXT2 -^^^^^^^^ - - -.. 
csv-table:: MMC EXT2 - :header: "Buffer size (bytes)","am62xx_sk-fs: Write Raw Throughput (Mbytes/sec)","am62xx_sk-fs: Write Raw CPU Load (%)","am62xx_sk-fs: Read Raw Throughput (Mbytes/sec)","am62xx_sk-fs: Read Raw CPU Load (%)" - - "102400","38.68 (min 34.18, max 40.13)","4.40 (min 3.65, max 6.69)","80.23","6.53" - "262144","35.29 (min 31.27, max 36.87)","4.22 (min 3.38, max 5.82)","85.76","7.80" - "524288","35.20 (min 32.48, max 36.36)","4.16 (min 3.34, max 6.66)","89.26","7.68" - "1048576","34.82 (min 31.53, max 37.17)","4.12 (min 3.34, max 6.15)","84.22","7.47" - "5242880","39.27 (min 35.85, max 40.49)","4.39 (min 3.68, max 6.50)","89.89","7.73" - - - - -.. csv-table:: MMC EXT2 - :header: "Buffer size (bytes)","am62xx_lp_sk-fs: Write Raw Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Write Raw CPU Load (%)","am62xx_lp_sk-fs: Read Raw Throughput (Mbytes/sec)","am62xx_lp_sk-fs: Read Raw CPU Load (%)" - - "102400","38.00 (min 33.58, max 39.35)","4.74 (min 4.13, max 7.07)","75.79","6.22" - "262144","35.16 (min 31.38, max 36.39)","4.55 (min 3.80, max 6.53)","85.71","8.59" - "524288","35.08 (min 31.38, max 36.20)","4.61 (min 3.86, max 6.72)","89.64","8.37" - "1048576","38.47 (min 34.47, max 39.93)","4.85 (min 4.14, max 7.38)","89.35","8.33" - "5242880","35.09 (min 31.53, max 36.31)","4.41 (min 3.64, max 6.68)","89.43","9.15" - - - - -.. 
csv-table:: MMC EXT2 - :header: "Buffer size (bytes)","am62xxsip_sk-fs: Write Raw Throughput (Mbytes/sec)","am62xxsip_sk-fs: Write Raw CPU Load (%)","am62xxsip_sk-fs: Read Raw Throughput (Mbytes/sec)","am62xxsip_sk-fs: Read Raw CPU Load (%)" - - "102400","36.89 (min 27.05, max 39.82)","4.68 (min 2.56, max 7.97)","76.13","6.58" - "262144","43.94 (min 43.06, max 44.49)","3.91 (min 2.71, max 7.56)","86.00","7.44" - "524288","43.69 (min 41.15, max 45.18)","3.87 (min 3.04, max 6.82)","89.93","8.19" - "1048576","44.00 (min 42.71, max 45.20)","3.85 (min 2.86, max 7.47)","89.56","7.96" - "5242880","42.13 (min 40.07, max 44.07)","3.47 (min 2.70, max 5.73)","89.51","8.14" - - - - + "102400","10.42 (min 8.81, max 10.95)","1.34 (min 0.65, max 2.59)","11.17 (min 10.59, max 11.81)","1.26 (min 0.99, max 1.63)" + "262144","10.46 (min 8.73, max 11.13)","0.97 (min 0.66, max 1.95)","11.14 (min 10.78, max 11.92)","1.14 (min 0.94, max 1.79)" + "524288","10.48 (min 9.36, max 10.84)","0.94 (min 0.71, max 1.40)","11.23 (min 10.91, max 12.00)","1.00 (min 0.87, max 1.18)" + "1048576","10.46 (min 9.35, max 10.92)","0.99 (min 0.74, max 1.31)","11.20 (min 10.83, max 12.01)","1.02 (min 0.85, max 1.19)" + "5242880","10.69 (min 9.03, max 11.30)","0.91 (min 0.61, max 1.29)","11.57 (min 10.87, max 12.03)","1.07 (min 0.85, max 1.26)" The performance numbers were captured using the following: - SanDisk Max Endurance SD card (SDSQQVR-032G-GN6IA) - Partition was mounted with async option - UBoot MMCSD ----------- - UBOOT MMCSD FAT ^^^^^^^^^^^^^^^ - .. 
csv-table:: UBOOT MMCSD FAT :header: "File size (bytes in hex)","am62xx_sk-fs: Write Throughput (Kbytes/sec)","am62xx_sk-fs: Read Throughput (Kbytes/sec)" - "400000","39009.52","83591.84" - "800000","40554.46","88086.02" - "1000000","44643.05","89530.05" - - - + "400000","35466.05 (min 16318.73, max 40960.00)","82755.92 (min 81920.00, max 83591.84)" + "800000","42607.92 (min 36735.43, max 46282.49)","87151.41 (min 86231.58, max 88086.02)" + "1000000","46774.89 (min 42335.92, max 49201.20)","89653.03 (min 89530.05, max 90021.98)" .. csv-table:: UBOOT MMCSD FAT :header: "File size (bytes in hex)","am62xx_lp_sk-fs: Write Throughput (Kbytes/sec)","am62xx_lp_sk-fs: Read Throughput (Kbytes/sec)" - "400000","35008.55","81920.00" - "800000","32379.45","87148.94" - "1000000","49799.39","90021.98" - - - + "400000","36399.32 (min 30567.16, max 39766.99)","82636.50 (min 81920.00, max 83591.84)" + "800000","41351.40 (min 35008.55, max 46545.45)","87148.94" + "1000000","48424.06 (min 44281.08, max 50103.98)","89670.60 (min 89530.05, max 90021.98)" .. csv-table:: UBOOT MMCSD FAT :header: "File size (bytes in hex)","am62xxsip_sk-fs: Write Throughput (Kbytes/sec)","am62xxsip_sk-fs: Read Throughput (Kbytes/sec)" - "400000","31507.69","81920.00" - "800000","42890.05","87148.94" - "1000000","49648.48","89530.05" - - + "400000","31694.74 (min 18875.58, max 39384.62)","81820.63 (min 78769.23, max 83591.84)" + "800000","37983.33 (min 20897.96, max 45765.36)","86655.57 (min 85333.33, max 88086.02)" + "1000000","41131.43 (min 21005.13, max 49053.89)","89444.00 (min 88562.16, max 90021.98)" The performance numbers were captured using the following: - SanDisk Max Endurance SD card (SDSQQVR-032G-GN6IA) - | USB Driver ---------- - USB Device Controller ^^^^^^^^^^^^^^^^^^^^^ - .. 
csv-table:: USBDEVICE HIGHSPEED SLAVE_READ_THROUGHPUT :header: "Number of Blocks","am62xx_lp_sk-fs: Throughput (MB/sec)","am62xx_sk-fs: Throughput (MB/sec)","am62xxsip_sk-fs: Throughput (MB/sec)" - "150","33.00","42.50","43.50" - - + "150","33.11 (min 30.30, max 34.50)","43.23 (min 42.60, max 44.20)","44.00 (min 43.60, max 44.40)" .. csv-table:: USBDEVICE HIGHSPEED SLAVE_WRITE_THROUGHPUT :header: "Number of Blocks","am62xx_lp_sk-fs: Throughput (MB/sec)","am62xx_sk-fs: Throughput (MB/sec)","am62xxsip_sk-fs: Throughput (MB/sec)" - "150","30.70","39.80","37.10" - + "150","29.70 (min 26.70, max 32.00)","41.21 (min 40.30, max 42.90)","40.01 (min 37.50, max 42.30)" | CRYPTO Driver ------------- - OpenSSL Performance ^^^^^^^^^^^^^^^^^^^ .. csv-table:: OpenSSL Performance :header: "Algorithm","Buffer Size (in bytes)","am62xx_lp_sk-fs: throughput (KBytes/Sec)","am62xx_sk-fs: throughput (KBytes/Sec)","am62xxsip_sk-fs: throughput (KBytes/Sec)" - "aes-128-cbc","1024","19332.10","21814.61","21901.65" - "aes-128-cbc","16","344.83","380.01","370.25" - "aes-128-cbc","16384","112579.93","116370.09","124261.72" - "aes-128-cbc","256","6121.81","6160.55","6302.89" - "aes-128-cbc","64","1532.95","1542.44","1626.22" - "aes-128-cbc","8192","84322.99","88956.93","93115.73" - "aes-128-ecb","1024","20105.56","22847.49","22268.59" - "aes-128-ecb","16","362.49","383.55","378.92" - "aes-128-ecb","16384","114682.54","120569.86","127860.74" - "aes-128-ecb","256","6092.37","6171.05","6463.66" - "aes-128-ecb","64","1538.13","1548.27","1663.08" - "aes-128-ecb","8192","87067.31","92536.83","95701.67" - "aes-192-cbc","1024","19188.39","21499.22","21587.29" - "aes-192-cbc","16","345.95","383.05","370.81" - "aes-192-cbc","16384","105316.35","109843.80","116539.39" - "aes-192-cbc","256","6100.82","6159.79","6238.46" - "aes-192-cbc","64","1526.98","1543.04","1620.65" - "aes-192-cbc","8192","80538.28","84535.98","89066.15" - "aes-192-ecb","1024","19876.52","22543.70","22193.49" - 
"aes-192-ecb","16","361.37","383.07","382.09" - "aes-192-ecb","16384","111351.13","113628.50","121503.74" - "aes-192-ecb","256","6097.66","6170.03","6481.15" - "aes-192-ecb","64","1538.15","1546.99","1680.51" - "aes-192-ecb","8192","84372.14","88003.93","92105.39" - "aes-256-cbc","1024","18930.69","21275.65","21359.96" - "aes-256-cbc","16","346.96","382.25","370.81" - "aes-256-cbc","16384","98604.37","102520.15","109614.42" - "aes-256-cbc","256","6085.97","6156.37","6247.08" - "aes-256-cbc","64","1530.07","1540.33","1618.54" - "aes-256-cbc","8192","77313.37","81087.15","84762.62" - "aes-256-ecb","1024","19814.06","22423.21","22128.98" - "aes-256-ecb","16","362.64","383.66","376.89" - "aes-256-ecb","16384","103180.97","106779.99","114005.33" - "aes-256-ecb","256","6135.13","6169.94","6384.81" - "aes-256-ecb","64","1537.32","1547.33","1658.11" - "aes-256-ecb","8192","79563.43","84475.90","87960.23" - "sha256","1024","24798.21","29029.38","30274.56" - "sha256","16","426.65","481.71","501.07" - "sha256","16384","242909.18","261947.39","251062.95" - "sha256","256","6633.39","7654.49","7859.88" - "sha256","64","1676.12","1916.42","1985.81" - "sha256","8192","156958.72","174140.07","168424.79" - "sha512","1024","20430.17","23322.97","21332.99" - "sha512","16","398.69","480.28","483.14" - "sha512","16384","59561.30","65650.69","60030.98" - "sha512","256","6163.97","6760.70","6936.66" - "sha512","64","1589.91","1920.30","1929.90" - "sha512","8192","52232.19","58804.91","53398.19" - - + "aes-128-cbc","1024","20907.99 (min 19976.19, max 22306.47)","23639.08 (min 21773.65, max 24485.89)","22077.10 (min 21114.88, max 23049.56)" + "aes-128-cbc","16","364.55 (min 352.28, max 374.50)","387.41 (min 379.85, max 419.58)","380.12 (min 370.18, max 392.97)" + "aes-128-cbc","16384","116402.86 (min 113541.12, max 119870.81)","120229.89 (min 115938.65, max 131110.23)","122670.42 (min 117544.28, max 127505.75)" + "aes-128-cbc","256","5982.09 (min 5769.30, max 6152.11)","6286.31 (min 
6142.29, max 7050.92)","6368.79 (min 6144.85, max 6681.17)" + "aes-128-cbc","64","1497.61 (min 1441.62, max 1537.66)","1584.44 (min 1541.50, max 1818.71)","1617.02 (min 1536.41, max 1708.99)" + "aes-128-cbc","8192","88300.89 (min 85458.94, max 91952.47)","93108.22 (min 88402.60, max 100466.69)","92829.70 (min 89186.30, max 96419.84)" + "aes-128-ecb","1024","21740.50 (min 20489.90, max 22819.16)","24123.86 (min 22792.87, max 25001.98)","22632.58 (min 21597.87, max 23622.31)" + "aes-128-ecb","16","370.24 (min 357.28, max 381.93)","390.43 (min 383.62, max 431.56)","386.75 (min 377.13, max 398.98)" + "aes-128-ecb","16384","120206.68 (min 117850.11, max 123016.53)","124764.84 (min 120045.57, max 136303.96)","126950.06 (min 121247.06, max 131765.59)" + "aes-128-ecb","256","5999.26 (min 5773.74, max 6163.88)","6343.30 (min 6170.97, max 7289.86)","6470.59 (min 6142.12, max 6830.59)" + "aes-128-ecb","64","1505.50 (min 1446.49, max 1541.23)","1624.92 (min 1547.71, max 1877.35)","1642.30 (min 1537.45, max 1747.48)" + "aes-128-ecb","8192","90868.39 (min 88468.14, max 92310.19)","97160.87 (min 91930.62, max 103997.44)","95978.84 (min 92334.76, max 99461.80)" + "aes-192-cbc","1024","20752.00 (min 19784.02, max 22273.71)","23517.06 (min 21488.64, max 24410.45)","21847.89 (min 20898.82, max 22822.57)" + "aes-192-cbc","16","365.52 (min 353.82, max 376.50)","388.34 (min 381.74, max 421.03)","379.18 (min 369.00, max 387.85)" + "aes-192-cbc","16384","110072.49 (min 107440.81, max 112295.94)","113373.87 (min 109625.34, max 124081.49)","116275.20 (min 112104.79, max 120176.64)" + "aes-192-cbc","256","5979.54 (min 5767.85, max 6141.44)","6288.97 (min 6152.28, max 7104.60)","6333.77 (min 6110.21, max 6583.64)" + "aes-192-cbc","64","1498.07 (min 1442.62, max 1538.50)","1588.33 (min 1542.44, max 1838.59)","1615.22 (min 1536.38, max 1698.15)" + "aes-192-cbc","8192","84092.59 (min 81810.77, max 86608.55)","88387.58 (min 84429.48, max 96318.81)","89152.51 (min 85595.48, max 92646.06)" + 
"aes-192-ecb","1024","21486.68 (min 20369.07, max 22924.63)","24089.77 (min 22578.52, max 25076.74)","22564.44 (min 21724.16, max 23545.86)" + "aes-192-ecb","16","370.41 (min 358.32, max 382.93)","390.16 (min 383.19, max 431.48)","387.65 (min 379.52, max 398.96)" + "aes-192-ecb","16384","114104.32 (min 112219.48, max 117456.90)","118111.57 (min 113617.58, max 129111.38)","120551.42 (min 114524.16, max 125572.44)" + "aes-192-ecb","256","5993.78 (min 5765.89, max 6156.20)","6344.05 (min 6169.69, max 7315.54)","6475.15 (min 6148.18, max 6893.74)" + "aes-192-ecb","64","1502.55 (min 1446.85, max 1541.78)","1627.19 (min 1546.43, max 1887.98)","1648.31 (min 1540.27, max 1742.19)" + "aes-192-ecb","8192","87736.66 (min 85093.03, max 91247.96)","92213.59 (min 87569.75, max 99887.79)","92321.11 (min 88678.40, max 95783.59)" + "aes-256-cbc","1024","20581.29 (min 19701.76, max 21914.28)","23211.82 (min 21145.26, max 24292.69)","21607.81 (min 20540.07, max 22718.46)" + "aes-256-cbc","16","365.27 (min 351.82, max 377.43)","388.41 (min 383.25, max 419.81)","379.23 (min 368.19, max 389.95)" + "aes-256-cbc","16384","102187.01 (min 99074.05, max 105633.11)","106252.97 (min 102176.09, max 115627.35)","107868.16 (min 102318.08, max 112678.23)" + "aes-256-cbc","256","5974.42 (min 5769.22, max 6132.31)","6279.75 (min 6146.82, max 7036.33)","6326.14 (min 6087.85, max 6636.97)" + "aes-256-cbc","64","1497.24 (min 1443.63, max 1538.05)","1587.18 (min 1540.95, max 1830.78)","1607.81 (min 1514.67, max 1704.75)" + "aes-256-cbc","8192","80066.90 (min 78809.77, max 81939.11)","84246.19 (min 80595.63, max 91176.96)","84435.29 (min 80655.70, max 87881.05)" + "aes-256-ecb","1024","21426.18 (min 20330.15, max 22955.35)","23968.47 (min 22278.83, max 24843.26)","22376.92 (min 21511.85, max 23244.80)" + "aes-256-ecb","16","370.62 (min 359.25, max 381.87)","390.07 (min 382.78, max 431.39)","387.06 (min 379.45, max 397.67)" + "aes-256-ecb","16384","107402.58 (min 105185.28, max 109685.42)","110622.72 (min 
107080.36, max 120558.93)","112945.83 (min 108505.77, max 117036.37)" + "aes-256-ecb","256","5992.09 (min 5767.00, max 6159.53)","6339.20 (min 6167.81, max 7293.70)","6456.95 (min 6145.62, max 6806.61)" + "aes-256-ecb","64","1502.26 (min 1448.23, max 1542.25)","1624.00 (min 1546.86, max 1885.10)","1648.13 (min 1540.82, max 1750.91)" + "aes-256-ecb","8192","83537.24 (min 81562.28, max 84948.31)","87660.54 (min 84374.87, max 95049.05)","87739.05 (min 84350.29, max 90947.58)" + "sha256","1024","31667.97 (min 30793.05, max 32121.86)","36792.92 (min 36691.63, max 37363.03)","32547.50 (min 31477.76, max 33580.71)" + "sha256","16","535.08 (min 517.10, max 544.56)","581.78 (min 574.87, max 626.29)","546.96 (min 528.06, max 563.91)" + "sha256","16384","259375.10 (min 256791.89, max 261860.01)","294220.46 (min 292962.30, max 298920.62)","263269.72 (min 260674.90, max 268413.61)" + "sha256","256","8403.27 (min 8144.30, max 8599.30)","9269.37 (min 9191.00, max 9772.97)","8519.69 (min 8210.35, max 8809.05)" + "sha256","64","2118.85 (min 2050.79, max 2152.09)","2321.29 (min 2297.30, max 2466.28)","2161.82 (min 2093.80, max 2229.46)" + "sha256","8192","175455.91 (min 172878.51, max 179773.44)","197163.69 (min 196318.55, max 202429.78)","176976.21 (min 172785.66, max 181379.07)" + "sha512","1024","22679.64 (min 22215.00, max 23011.33)","24744.92 (min 24600.58, max 25694.21)","22754.13 (min 22400.00, max 23131.14)" + "sha512","16","522.33 (min 501.00, max 537.31)","577.81 (min 573.24, max 601.51)","529.39 (min 512.75, max 543.56)" + "sha512","16384","60596.22 (min 60304.04, max 60926.63)","67861.16 (min 67671.38, max 68299.43)","60706.82 (min 60342.27, max 61063.17)" + "sha512","256","7290.51 (min 7085.40, max 7548.84)","8234.50 (min 8163.75, max 8537.43)","7490.46 (min 7222.87, max 7709.53)" + "sha512","64","2095.92 (min 2021.93, max 2149.91)","2311.92 (min 2293.89, max 2405.40)","2119.25 (min 2058.05, max 2178.41)" + "sha512","8192","54249.47 (min 53824.17, max 
54613.33)","60518.40 (min 60325.89, max 61390.85)","54479.87 (min 53963.43, max 54910.98)" .. csv-table:: OpenSSL CPU Load :header: "Algorithm","am62xx_lp_sk-fs: CPU Load","am62xx_sk-fs: CPU Load","am62xxsip_sk-fs: CPU Load" - "aes-128-cbc","35.00","35.00","35.00" - "aes-128-ecb","37.00","38.00","36.00" - "aes-192-cbc","35.00","36.00","35.00" - "aes-192-ecb","36.00","37.00","36.00" - "aes-256-cbc","35.00","35.00","34.00" - "aes-256-ecb","36.00","36.00","36.00" - "sha256","94.00","94.00","95.00" - "sha512","94.00","95.00","95.00" - - + "aes-128-cbc","36.63 (min 34.00, max 38.00)","36.88 (min 35.00, max 38.00)","36.38 (min 35.00, max 37.00)" + "aes-128-ecb","38.75 (min 36.00, max 40.00)","39.13 (min 37.00, max 40.00)","38.13 (min 36.00, max 39.00)" + "aes-192-cbc","37.00 (min 35.00, max 39.00)","37.50 (min 36.00, max 39.00)","35.75 (min 32.00, max 38.00)" + "aes-192-ecb","38.50 (min 36.00, max 40.00)","38.38 (min 37.00, max 40.00)","37.88 (min 36.00, max 39.00)" + "aes-256-cbc","36.88 (min 35.00, max 38.00)","36.75 (min 35.00, max 38.00)","36.13 (min 34.00, max 38.00)" + "aes-256-ecb","38.25 (min 36.00, max 40.00)","38.13 (min 37.00, max 39.00)","37.38 (min 35.00, max 39.00)" + "sha256","93.75 (min 93.00, max 94.00)","94.38 (min 93.00, max 95.00)","94.50 (min 93.00, max 95.00)" + "sha512","93.38 (min 92.00, max 94.00)","94.75 (min 94.00, max 95.00)","94.63 (min 94.00, max 95.00)" Listed for each algorithm are the code snippets used to run each benchmark test. @@ -1111,76 +781,12 @@ Listed for each algorithm are the code snippets used to run each time -v openssl speed -elapsed -evp aes-128-cbc - - IPSec Software Performance ^^^^^^^^^^^^^^^^^^^^^^^^^^ .. 
csv-table:: IPSec Software Performance :header: "Algorithm","am62xx_sk-fs: Throughput (Mbps)","am62xx_sk-fs: Packets/Sec","am62xx_sk-fs: CPU Load","am62xxsip_sk-fs: Throughput (Mbps)","am62xxsip_sk-fs: Packets/Sec","am62xxsip_sk-fs: CPU Load" - "aes128","1.20","0.00","51.32","4.20","0.00","70.26" - "aes192","1.30","0.00","51.25","2.90","0.00","79.48" - "aes256","1.20","0.00","51.52","216.40","19.00","28.32" - -Low Power Performance -------------------------- - -Power Performance -^^^^^^^^^^^^^^^^^ - -.. csv-table:: Deep Sleep Power Performance - :header: "Rail name","Rail voltage(V)","Power (mW)" - - "vdd_core","0.85","8.53" - "vddr_core","0.85","n/a" - "soc_dvdd_3v3","3.30","5.19" - "soc_dvdd_1v8","1.80","1.04" - "vdda_1v8","1.80","2.12" - "vdd_ddr4","1.10","7.50" - "Total"," ","24.37" - -.. csv-table:: MCU Only Power Performance - :header: "Rail name","Rail voltage(V)","Power (mW)" - - "vdd_core","0.85","109.46" - "vddr_core","0.85","n/a" - "soc_dvdd_3v3","3.30","12.97" - "soc_dvdd_1v8","1.80","0.77" - "vdda_1v8","1.80","10.94" - "vdd_ddr4","1.10","8.28" - "Total"," ","142.41" - -Partial I/O Data -- All voltage rails were measured to be near 0V - -.. note:: - - The measurements shown are from an SK-AM62B-P1. Results may vary based off of the board variant being used. - -Further optimizations are possible for these low power modes. Please refer to the AM62x Power Consumption App Note (https://www.ti.com/lit/pdf/spradg1) - -Resume Latency Performance -^^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. csv-table:: LPM Resume Latency Performance - :header: "Low Power Mode","Total Resume Latency (ms)" - - "Deep Sleep", "137.03" - "MCU Only", "86.12" - -The performance numbers are measured without the Linux printk logs. To remove the -Linux printk logs, run the following commands in the terminal: - -.. 
code:: console - - # Detach kernel serial console - consoles=$(find /sys/bus/platform/devices/*.serial/ -name console) - for console in ${consoles}; do - echo -n N > ${console} - done - - -.. note:: - - The measurements shown are from using the default SDK with no extra optimizations. + "aes128","121.71 (min 2.30, max 305.50)","10.57 (min 0.00, max 27.00)","48.76 (min 28.52, max 54.93)","135.97 (min 4.10, max 338.50)","11.71 (min 0.00, max 30.00)","52.73 (min 47.19, max 58.90)" + "aes192","75.94 (min 0.20, max 228.80)","6.43 (min 0.00, max 20.00)","42.84 (min 28.19, max 50.88)","2.40 (min 2.20, max 2.60)","0.00","85.06 (min 83.00, max 87.11)" + "aes256","188.42 (min 1.30, max 302.20)","16.33 (min 0.00, max 26.00)","48.78 (min 28.23, max 54.44)","164.90 (min 4.80, max 331.20)","14.33 (min 0.00, max 29.00)","53.12 (min 28.47, max 65.09)" diff --git a/source/devices/AM62X/linux/RT_Linux_Performance_Guide.rst b/source/devices/AM62X/linux/RT_Linux_Performance_Guide.rst index ddc4099f2..7e8bd0727 100644 --- a/source/devices/AM62X/linux/RT_Linux_Performance_Guide.rst +++ b/source/devices/AM62X/linux/RT_Linux_Performance_Guide.rst @@ -1,6 +1,6 @@ -================================= - RT-linux 11.01 Performance Guide -================================= +======================================= + RT-linux 11.02.08.02 Performance Guide +======================================= .. rubric:: **Read This First** :name: read-this-first-kernel-perf-guide @@ -79,12 +79,3 @@ default SDK image using the SK-AM62B-P1_ reference board: Components section: :ref:`building-optee-with-prng`, and enabling the RNG node in the Linux kernel device tree. This way the HW TRNG is accessed from the kernel itself. - -.. csv-table:: - :header: "Latencies","CPU 0","CPU 1","CPU 2","CPU 3" - - "Minimum (usec)","5","5","5","5" - "Average (usec)","6","6","6","6" - "Maximum (usec)","62","46","47","52" - -.. 
image:: img/rt-cpu-method-all-latency-histogram.png diff --git a/source/devices/AM64X/linux/Linux_Performance_Guide.rst b/source/devices/AM64X/linux/Linux_Performance_Guide.rst index ea7ea2ce0..2b2772afa 100644 --- a/source/devices/AM64X/linux/Linux_Performance_Guide.rst +++ b/source/devices/AM64X/linux/Linux_Performance_Guide.rst @@ -1,6 +1,6 @@ -============================== - Linux 11.01 Performance Guide -============================== +==================================== + Linux 11.02.08.02 Performance Guide +==================================== .. rubric:: **Read This First** @@ -29,19 +29,3 @@ with drivers included in a particular release. For further information or to report any problems, contact https://e2e.ti.com/ or https://support.ti.com/ - -Linux OSPI Flash Driver ------------------------ - - -AM64XX-SK -^^^^^^^^^ - - -RAW -""" - -.. csv-table:: OSPI Raw Flash Driver - :header: "File size (Mbytes)","am64xx_sk-fs: Raw Read Throughput (Mbytes/sec)" - - "50","172.41" diff --git a/source/devices/AM64X/linux/RT_Linux_Performance_Guide.rst b/source/devices/AM64X/linux/RT_Linux_Performance_Guide.rst index 64f664c69..8d9e279cf 100644 --- a/source/devices/AM64X/linux/RT_Linux_Performance_Guide.rst +++ b/source/devices/AM64X/linux/RT_Linux_Performance_Guide.rst @@ -1,6 +1,6 @@ -================================ -RT-linux 11.01 Performance Guide -================================ +====================================== +RT-linux 11.02.08.02 Performance Guide +====================================== .. rubric:: **Read This First** :name: read-this-first-rt-kernel-perf-guide @@ -36,60 +36,14 @@ https://e2e.ti.com/ or https://support.ti.com/ System Benchmarks ----------------- -Stress-ng and Cyclic Test -^^^^^^^^^^^^^^^^^^^^^^^^^ - -.. _RT-linux-performance: - -stress-ng (next-generation) will stress test a embedded platform in various selectable ways. -It was designed to exercise various physical subsystems as well as the various -operating system kernel interfaces. 
stress-ng can also measure test throughput rates; -this can be useful to observe performance changes across different operating system or types of hardware. - -Cyclictest is most commonly used for benchmarking RT systems. -It is one of the most frequently used tools for evaluating the relative performance of real-time systems. -Some performance tests which use Cyclictest are System benchmarking, Latency debugging with tracing and -approximating application performance. - -Test commands used for running stress-ng and cyclictest together - -.. code:: console - - stress-ng --cpu-method=all -c 4 & - cyclictest -m -Sp80 -D6h -h400 -i200 -M -q - -The following summarizes the latencies observed using the yocto based -default SDK image: - -.. note:: - - A known issue in this SDK release is affecting this benchmark. - Using OP-TEE's PRNG drivers rather than the hardware accelerated TRNG - drivers restores the context switch latencies to the values you see - here. - - More information on switching to the PRNG drivers can be found in the - Foundational Components section, here :ref:`building-optee-with-prng` - -.. csv-table:: - :header: "Latencies","CPU 0","CPU 1" - - "Minimum (usec)","6","6" - "Average (usec)","10","9" - "Maximum (usec)","77","52" - -.. image:: img/rt-cpu-method-all-latency-histogram.png - -| - LMBench ^^^^^^^ -LMBench is a collection of microbenchmarks of which the memory bandwidth -and latency related ones are typically used to estimate processor -memory system performance. More information about lmbench at -http://lmbench.sourceforge.net/whatis_lmbench.html and -http://lmbench.sourceforge.net/man/lmbench.8.html - +LMBench is a collection of microbenchmarks of which the memory bandwidth +and latency related ones are typically used to estimate processor +memory system performance. 
More information about lmbench at +https://lmbench.sourceforge.net/whatis_lmbench.html and +https://lmbench.sourceforge.net/man/lmbench.8.html + **Latency**: lat_mem_rd-stride128-szN, where N is equal to or smaller than the cache size at given level measures the cache miss penalty. N that is at least double the size of last level cache is the latency to external memory. @@ -110,123 +64,121 @@ Execute the LMBench with the following: .. csv-table:: LMBench Benchmarks :header: "Benchmarks","am64xx-hsevm: perf" - "af_unix_sock_stream_latency (microsec)","43.92 (min 40.29, max 49.64)" - "af_unix_socket_stream_bandwidth (mb\s)","534.11 (min 521.33, max 538.82)" - "bw_file_rd-io-1mb (mb/s)","848.55 (min 833.06, max 870.93)" - "bw_file_rd-o2c-1mb (mb/s)","484.02 (min 461.04, max 493.83)" - "bw_mem-bcopy-16mb (mb/s)","985.60 (min 970.29, max 999.00)" - "bw_mem-bcopy-1mb (mb/s)","948.66 (min 922.65, max 989.94)" - "bw_mem-bcopy-2mb (mb/s)","966.59 (min 936.48, max 1006.88)" - "bw_mem-bcopy-4mb (mb/s)","942.89 (min 904.98, max 972.41)" - "bw_mem-bcopy-8mb (mb/s)","967.26 (min 924.00, max 997.13)" - "bw_mem-bzero-16mb (mb/s)","2116.75 (min 2116.40, max 2116.96)" - "bw_mem-bzero-1mb (mb/s)","1531.23 (min 922.65, max 2117.90)" - "bw_mem-bzero-2mb (mb/s)","1540.94 (min 936.48, max 2118.27)" - "bw_mem-bzero-4mb (mb/s)","1526.44 (min 904.98, max 2113.05)" - "bw_mem-bzero-8mb (mb/s)","1541.80 (min 924.00, max 2118.36)" - "bw_mem-cp-16mb (mb/s)","568.31 (min 522.04, max 598.00)" - "bw_mem-cp-1mb (mb/s)","1609.38 (min 584.20, max 2690.24)" - "bw_mem-cp-2mb (mb/s)","1447.17 (min 534.47, max 2359.88)" - "bw_mem-cp-4mb (mb/s)","1374.97 (min 536.91, max 2217.70)" - "bw_mem-cp-8mb (mb/s)","1342.76 (min 529.07, max 2152.56)" - "bw_mem-fcp-16mb (mb/s)","1012.13 (min 983.47, max 1038.08)" - "bw_mem-fcp-1mb (mb/s)","1597.21 (min 1037.88, max 2117.90)" - "bw_mem-fcp-2mb (mb/s)","1576.33 (min 1004.02, max 2118.27)" - "bw_mem-fcp-4mb (mb/s)","1577.93 (min 985.71, max 2113.05)" - "bw_mem-fcp-8mb 
(mb/s)","1573.48 (min 969.93, max 2118.36)" - "bw_mem-frd-16mb (mb/s)","1302.42 (min 1283.39, max 1312.98)" - "bw_mem-frd-1mb (mb/s)","1176.71 (min 1037.88, max 1287.47)" - "bw_mem-frd-2mb (mb/s)","1173.57 (min 1004.02, max 1329.12)" - "bw_mem-frd-4mb (mb/s)","1164.97 (min 985.71, max 1321.22)" - "bw_mem-frd-8mb (mb/s)","1173.06 (min 969.93, max 1334.22)" - "bw_mem-fwr-16mb (mb/s)","2121.88 (min 2118.36, max 2125.96)" - "bw_mem-fwr-1mb (mb/s)","1951.85 (min 1252.46, max 2690.24)" - "bw_mem-fwr-2mb (mb/s)","1824.75 (min 1296.39, max 2359.88)" - "bw_mem-fwr-4mb (mb/s)","1742.03 (min 1258.06, max 2217.70)" - "bw_mem-fwr-8mb (mb/s)","1729.04 (min 1285.76, max 2152.56)" - "bw_mem-rd-16mb (mb/s)","1338.76 (min 1331.78, max 1342.62)" - "bw_mem-rd-1mb (mb/s)","1078.25 (min 788.52, max 1365.85)" - "bw_mem-rd-2mb (mb/s)","1079.56 (min 790.93, max 1355.01)" - "bw_mem-rd-4mb (mb/s)","1086.93 (min 810.62, max 1351.58)" - "bw_mem-rd-8mb (mb/s)","1111.91 (min 863.19, max 1350.44)" - "bw_mem-rdwr-16mb (mb/s)","860.25 (min 847.73, max 871.32)" - "bw_mem-rdwr-1mb (mb/s)","705.72 (min 584.20, max 847.17)" - "bw_mem-rdwr-2mb (mb/s)","687.14 (min 534.47, max 851.18)" - "bw_mem-rdwr-4mb (mb/s)","681.11 (min 536.91, max 839.72)" - "bw_mem-rdwr-8mb (mb/s)","695.52 (min 529.07, max 856.16)" - "bw_mem-wr-16mb (mb/s)","889.48 (min 888.15, max 890.47)" - "bw_mem-wr-1mb (mb/s)","818.14 (min 785.67, max 847.17)" - "bw_mem-wr-2mb (mb/s)","817.43 (min 773.69, max 851.18)" - "bw_mem-wr-4mb (mb/s)","821.37 (min 784.01, max 843.79)" - "bw_mem-wr-8mb (mb/s)","862.85 (min 844.24, max 885.54)" - "bw_mmap_rd-mo-1mb (mb/s)","1297.19 (min 1274.58, max 1315.05)" - "bw_mmap_rd-o2c-1mb (mb/s)","467.73 (min 455.72, max 477.86)" - "bw_pipe (mb/s)","550.83 (min 538.93, max 563.59)" - "bw_unix (mb/s)","534.11 (min 521.33, max 538.82)" - "lat_connect (us)","76.50 (min 75.69, max 77.20)" - "lat_ctx-2-128k (us)","10.52 (min 9.79, max 11.79)" - "lat_ctx-2-256k (us)","25.39 (min 15.41, max 30.59)" - "lat_ctx-4-128k 
(us)","11.98 (min 11.81, max 12.29)" - "lat_ctx-4-256k (us)","12.54 (min 6.99, max 15.42)" - "lat_fs-0k (num_files)","195.75 (min 188.00, max 202.00)" - "lat_fs-10k (num_files)","86.50 (min 83.00, max 90.00)" - "lat_fs-1k (num_files)","134.25 (min 129.00, max 139.00)" - "lat_fs-4k (num_files)","119.75 (min 112.00, max 128.00)" - "lat_mem_rd-stride128-sz1000k (ns)","48.27 (min 48.18, max 48.38)" - "lat_mem_rd-stride128-sz125k (ns)","7.83 (min 7.81, max 7.86)" - "lat_mem_rd-stride128-sz250k (ns)","12.79 (min 9.36, max 18.06)" - "lat_mem_rd-stride128-sz31k (ns)","5.68 (min 5.13, max 6.57)" + "af_unix_sock_stream_latency (microsec)","42.81 (min 37.94, max 47.17)" + "af_unix_socket_stream_bandwidth (mb\s)","541.45 (min 530.54, max 556.53)" + "bw_file_rd-io-1mb (mb/s)","875.51 (min 850.20, max 890.31)" + "bw_file_rd-o2c-1mb (mb/s)","491.77 (min 456.00, max 508.82)" + "bw_mem-bcopy-16mb (mb/s)","969.07 (min 937.70, max 1007.87)" + "bw_mem-bcopy-1mb (mb/s)","947.26 (min 915.75, max 980.01)" + "bw_mem-bcopy-2mb (mb/s)","934.26 (min 902.53, max 970.87)" + "bw_mem-bcopy-4mb (mb/s)","949.68 (min 911.68, max 983.28)" + "bw_mem-bcopy-8mb (mb/s)","976.43 (min 911.99, max 1010.61)" + "bw_mem-bzero-16mb (mb/s)","2117.38 (min 2116.68, max 2118.08)" + "bw_mem-bzero-1mb (mb/s)","1532.87 (min 915.75, max 2119.87)" + "bw_mem-bzero-2mb (mb/s)","1524.64 (min 902.53, max 2117.90)" + "bw_mem-bzero-4mb (mb/s)","1532.55 (min 911.68, max 2118.64)" + "bw_mem-bzero-8mb (mb/s)","1546.42 (min 911.99, max 2118.36)" + "bw_mem-cp-16mb (mb/s)","592.63 (min 576.54, max 600.85)" + "bw_mem-cp-1mb (mb/s)","1585.65 (min 543.97, max 2718.45)" + "bw_mem-cp-2mb (mb/s)","1432.40 (min 524.11, max 2363.14)" + "bw_mem-cp-4mb (mb/s)","1376.53 (min 523.49, max 2214.43)" + "bw_mem-cp-8mb (mb/s)","1352.70 (min 523.01, max 2157.79)" + "bw_mem-fcp-16mb (mb/s)","1051.58 (min 1000.13, max 1099.43)" + "bw_mem-fcp-1mb (mb/s)","1591.05 (min 1028.10, max 2119.87)" + "bw_mem-fcp-2mb (mb/s)","1567.15 (min 987.33, max 2117.90)" 
+ "bw_mem-fcp-4mb (mb/s)","1565.96 (min 982.08, max 2118.64)" + "bw_mem-fcp-8mb (mb/s)","1571.64 (min 971.46, max 2118.36)" + "bw_mem-frd-16mb (mb/s)","1317.14 (min 1282.36, max 1364.84)" + "bw_mem-frd-1mb (mb/s)","1170.35 (min 1028.10, max 1305.24)" + "bw_mem-frd-2mb (mb/s)","1167.91 (min 987.33, max 1373.86)" + "bw_mem-frd-4mb (mb/s)","1161.96 (min 982.08, max 1330.23)" + "bw_mem-frd-8mb (mb/s)","1175.62 (min 971.46, max 1385.76)" + "bw_mem-fwr-16mb (mb/s)","2122.36 (min 2106.37, max 2131.91)" + "bw_mem-fwr-1mb (mb/s)","1933.56 (min 1216.12, max 2718.45)" + "bw_mem-fwr-2mb (mb/s)","1822.22 (min 1261.83, max 2363.14)" + "bw_mem-fwr-4mb (mb/s)","1754.10 (min 1265.82, max 2214.43)" + "bw_mem-fwr-8mb (mb/s)","1736.68 (min 1236.09, max 2157.79)" + "bw_mem-rd-16mb (mb/s)","1366.15 (min 1338.24, max 1382.65)" + "bw_mem-rd-1mb (mb/s)","1100.78 (min 793.27, max 1403.09)" + "bw_mem-rd-2mb (mb/s)","1101.55 (min 801.18, max 1400.81)" + "bw_mem-rd-4mb (mb/s)","1105.82 (min 824.91, max 1399.09)" + "bw_mem-rd-8mb (mb/s)","1125.63 (min 861.05, max 1393.73)" + "bw_mem-rdwr-16mb (mb/s)","856.58 (min 844.73, max 870.65)" + "bw_mem-rdwr-1mb (mb/s)","693.30 (min 543.97, max 838.64)" + "bw_mem-rdwr-2mb (mb/s)","671.55 (min 524.11, max 834.84)" + "bw_mem-rdwr-4mb (mb/s)","684.01 (min 523.49, max 844.77)" + "bw_mem-rdwr-8mb (mb/s)","701.39 (min 523.01, max 857.08)" + "bw_mem-wr-16mb (mb/s)","893.90 (min 886.48, max 899.79)" + "bw_mem-wr-1mb (mb/s)","819.90 (min 754.86, max 847.17)" + "bw_mem-wr-2mb (mb/s)","814.11 (min 777.91, max 836.35)" + "bw_mem-wr-4mb (mb/s)","828.96 (min 793.41, max 876.33)" + "bw_mem-wr-8mb (mb/s)","864.35 (min 836.65, max 897.06)" + "bw_mmap_rd-mo-1mb (mb/s)","1320.67 (min 1272.50, max 1351.35)" + "bw_mmap_rd-o2c-1mb (mb/s)","474.18 (min 454.27, max 483.64)" + "bw_pipe (mb/s)","540.02 (min 518.86, max 558.01)" + "bw_unix (mb/s)","541.45 (min 530.54, max 556.53)" + "lat_connect (us)","75.76 (min 74.84, max 78.74)" + "lat_ctx-2-128k (us)","10.34 (min 8.76, max 
11.41)" + "lat_ctx-2-256k (us)","22.65 (min 15.21, max 28.60)" + "lat_ctx-4-128k (us)","11.46 (min 10.21, max 12.85)" + "lat_ctx-4-256k (us)","10.78 (min 0.00, max 18.44)" + "lat_fs-0k (num_files)","198.38 (min 194.00, max 203.00)" + "lat_fs-10k (num_files)","88.38 (min 82.00, max 103.00)" + "lat_fs-1k (num_files)","132.88 (min 129.00, max 138.00)" + "lat_fs-4k (num_files)","118.50 (min 107.00, max 126.00)" + "lat_mem_rd-stride128-sz1000k (ns)","47.38 (min 46.80, max 48.23)" + "lat_mem_rd-stride128-sz125k (ns)","7.85 (min 7.80, max 7.97)" + "lat_mem_rd-stride128-sz250k (ns)","12.09 (min 10.07, max 14.63)" + "lat_mem_rd-stride128-sz31k (ns)","5.25 (min 3.07, max 5.90)" "lat_mem_rd-stride128-sz50 (ns)","3.02" - "lat_mem_rd-stride128-sz500k (ns)","43.72 (min 42.55, max 44.62)" - "lat_mem_rd-stride128-sz62k (ns)","7.41 (min 7.37, max 7.47)" - "lat_mmap-1m (us)","71.50 (min 65.00, max 79.00)" - "lat_ops-double-add (ns)","4.02 (min 4.02, max 4.03)" - "lat_ops-double-div (ns)","22.12 (min 22.12, max 22.13)" + "lat_mem_rd-stride128-sz500k (ns)","43.10 (min 41.58, max 44.38)" + "lat_mem_rd-stride128-sz62k (ns)","7.15 (min 6.43, max 7.42)" + "lat_mmap-1m (us)","69.00 (min 65.00, max 76.00)" + "lat_ops-double-add (ns)","4.02" + "lat_ops-double-div (ns)","22.13 (min 22.12, max 22.14)" "lat_ops-double-mul (ns)","4.02 (min 4.02, max 4.03)" "lat_ops-float-add (ns)","4.02" - "lat_ops-float-div (ns)","13.07 (min 13.07, max 13.08)" + "lat_ops-float-div (ns)","13.07" "lat_ops-float-mul (ns)","4.02" "lat_ops-int-add (ns)","1.01" "lat_ops-int-bit (ns)","0.67" - "lat_ops-int-div (ns)","6.04" - "lat_ops-int-mod (ns)","6.38 (min 6.37, max 6.39)" - "lat_ops-int-mul (ns)","4.35 (min 4.32, max 4.40)" + "lat_ops-int-div (ns)","6.03 (min 6.03, max 6.04)" + "lat_ops-int-mod (ns)","6.37 (min 6.37, max 6.39)" + "lat_ops-int-mul (ns)","4.34 (min 4.32, max 4.42)" "lat_ops-int64-add (ns)","1.01" "lat_ops-int64-bit (ns)","0.67" - "lat_ops-int64-div (ns)","9.56 (min 9.55, max 9.56)" - 
"lat_ops-int64-mod (ns)","7.38 (min 7.37, max 7.38)" - "lat_ops-int64-mul (ns)","5.01 (min 4.99, max 5.06)" - "lat_pagefault (us)","1.83 (min 1.81, max 1.84)" - "lat_pipe (us)","26.04 (min 25.91, max 26.16)" - "lat_proc-exec (us)","1208.90 (min 1194.20, max 1221.80)" - "lat_proc-fork (us)","1035.45 (min 1016.67, max 1052.33)" + "lat_ops-int64-div (ns)","9.56 (min 9.55, max 9.57)" + "lat_ops-int64-mod (ns)","7.38 (min 7.37, max 7.39)" + "lat_ops-int64-mul (ns)","5.01 (min 4.99, max 5.13)" + "lat_pagefault (us)","1.81 (min 1.76, max 1.84)" + "lat_pipe (us)","26.34 (min 25.73, max 27.06)" + "lat_proc-exec (us)","1176.48 (min 1144.00, max 1221.00)" + "lat_proc-fork (us)","1019.08 (min 1002.83, max 1054.80)" "lat_proc-proccall (us)","0.01" - "lat_select (us)","47.62 (min 46.19, max 49.96)" - "lat_sem (us)","3.47 (min 3.28, max 3.55)" - "lat_sig-catch (us)","5.64 (min 5.50, max 5.97)" - "lat_sig-install (us)","0.92 (min 0.90, max 0.94)" - "lat_sig-prot (us)","0.77 (min 0.49, max 0.88)" - "lat_syscall-fstat (us)","2.48 (min 2.33, max 2.69)" - "lat_syscall-null (us)","0.57 (min 0.57, max 0.58)" - "lat_syscall-open (us)","415.84 (min 400.86, max 439.75)" - "lat_syscall-read (us)","0.86 (min 0.82, max 0.93)" - "lat_syscall-stat (us)","6.86 (min 6.57, max 7.24)" - "lat_syscall-write (us)","0.80 (min 0.79, max 0.83)" - "lat_tcp (us)","1.10 (min 1.09, max 1.11)" - "lat_unix (us)","43.92 (min 40.29, max 49.64)" - "latency_for_0.50_mb_block_size (nanosec)","43.72 (min 42.55, max 44.62)" - "latency_for_1.00_mb_block_size (nanosec)","24.13 (min 0.00, max 48.38)" - "pipe_bandwidth (mb\s)","550.83 (min 538.93, max 563.59)" - "pipe_latency (microsec)","26.04 (min 25.91, max 26.16)" + "lat_select (us)","46.72 (min 46.13, max 47.43)" + "lat_sem (us)","3.45 (min 3.16, max 3.71)" + "lat_sig-catch (us)","5.78 (min 5.65, max 5.93)" + "lat_sig-install (us)","0.94 (min 0.93, max 1.00)" + "lat_sig-prot (us)","0.75 (min 0.69, max 0.81)" + "lat_syscall-fstat (us)","2.55 (min 2.49, max 2.67)" + 
"lat_syscall-null (us)","0.62 (min 0.60, max 0.68)" + "lat_syscall-open (us)","386.20 (min 345.40, max 419.63)" + "lat_syscall-read (us)","0.83 (min 0.82, max 0.88)" + "lat_syscall-stat (us)","6.88 (min 6.48, max 7.35)" + "lat_syscall-write (us)","0.79 (min 0.77, max 0.83)" + "lat_tcp (us)","1.12 (min 1.10, max 1.16)" + "lat_unix (us)","42.81 (min 37.94, max 47.17)" + "latency_for_0.50_mb_block_size (nanosec)","43.10 (min 41.58, max 44.38)" + "latency_for_1.00_mb_block_size (nanosec)","23.69 (min 0.00, max 48.23)" + "pipe_bandwidth (mb\s)","540.02 (min 518.86, max 558.01)" + "pipe_latency (microsec)","26.34 (min 25.73, max 27.06)" "procedure_call (microsec)","0.01" - "select_on_200_tcp_fds (microsec)","47.62 (min 46.19, max 49.96)" - "semaphore_latency (microsec)","3.47 (min 3.28, max 3.55)" - "signal_handler_latency (microsec)","0.92 (min 0.90, max 0.94)" - "signal_handler_overhead (microsec)","5.64 (min 5.50, max 5.97)" - "tcp_ip_connection_cost_to_localhost (microsec)","76.50 (min 75.69, max 77.20)" - "tcp_latency_using_localhost (microsec)","1.10 (min 1.09, max 1.11)" - - + "select_on_200_tcp_fds (microsec)","46.72 (min 46.13, max 47.43)" + "semaphore_latency (microsec)","3.45 (min 3.16, max 3.71)" + "signal_handler_latency (microsec)","0.94 (min 0.93, max 1.00)" + "signal_handler_overhead (microsec)","5.78 (min 5.65, max 5.93)" + "tcp_ip_connection_cost_to_localhost (microsec)","75.76 (min 74.84, max 78.74)" + "tcp_latency_using_localhost (microsec)","1.12 (min 1.10, max 1.16)" Dhrystone ^^^^^^^^^ @@ -238,9 +190,8 @@ cores the DMIPS/MHz score will be identical with the same compiler and flags. :header: "Benchmarks","am64xx-hsevm: perf" "cpu_clock (mhz)","1000.00" - "dhrystone_per_mhz (dmips/mhz)","2.88 (min 2.80, max 2.90)" - "dhrystone_per_second (dhrystonep)","5096153.75 (min 5000000.00, max 5128205.00)" - + "dhrystone_per_mhz (dmips/mhz)","2.90" + "dhrystone_per_second (dhrystonep)","5128205.00" Whetstone ^^^^^^^^^ @@ -248,9 +199,7 @@ Whetstone .. 
csv-table:: Whetstone Benchmarks :header: "Benchmarks","am64xx-hsevm: perf" - "whetstone (mips)","5000.00" - - + "whetstone (mips)","4583.33 (min 3333.30, max 5000.00)" Linpack ^^^^^^^ @@ -260,8 +209,7 @@ solving a dense linear system. .. csv-table:: Linpack Benchmarks :header: "Benchmarks","am64xx-hsevm: perf" - "linpack (kflops)","409028.75 (min 408609.00, max 409559.00)" - + "linpack (kflops)","407927.00 (min 406745.00, max 408901.00)" CoreMarkPro ^^^^^^^^^^^ @@ -271,36 +219,33 @@ While CoreMark stresses the CPU pipeline, CoreMark-Pro tests the entire processo adding comprehensive support for multicore technology, a combination of integer and floating-point workloads, and data sets for utilizing larger memory subsystems. - .. csv-table:: CoreMarkPro Benchmarks :header: "Benchmarks","am64xx-hsevm: perf" - "cjpeg-rose7-preset (workloads/)","29.56 (min 29.50, max 29.67)" + "cjpeg-rose7-preset (workloads/)","29.58 (min 29.41, max 29.67)" "core (workloads/)","0.21" - "coremark-pro ()","587.32 (min 583.40, max 594.37)" - "linear_alg-mid-100x100-sp (workloads/)","10.41 (min 10.40, max 10.42)" + "coremark-pro ()","588.47 (min 585.75, max 593.10)" + "linear_alg-mid-100x100-sp (workloads/)","10.41 (min 10.41, max 10.42)" "loops-all-mid-10k-sp (workloads/)","0.48" - "nnet_test (workloads/)","0.77" - "parser-125k (workloads/)","5.50 (min 5.35, max 5.71)" - "radix2-big-64k (workloads/)","20.12 (min 19.27, max 21.25)" - "sha-test (workloads/)","57.80" - "zip-test (workloads/)","15.44 (min 15.38, max 15.63)" - + "nnet_test (workloads/)","0.77 (min 0.76, max 0.77)" + "parser-125k (workloads/)","5.46 (min 5.21, max 5.62)" + "radix2-big-64k (workloads/)","20.60 (min 19.46, max 21.53)" + "sha-test (workloads/)","57.72 (min 57.47, max 57.80)" + "zip-test (workloads/)","15.47 (min 15.38, max 15.63)" .. 
csv-table:: CoreMarkProTwoCore Benchmarks :header: "Benchmarks","am64xx-hsevm: perf" - "cjpeg-rose7-preset (workloads/)","58.15 (min 57.47, max 59.17)" - "core (workloads/)","0.43" - "coremark-pro ()","1047.54 (min 1043.17, max 1054.31)" - "linear_alg-mid-100x100-sp (workloads/)","20.80 (min 20.77, max 20.82)" - "loops-all-mid-10k-sp (workloads/)","0.87 (min 0.87, max 0.88)" + "cjpeg-rose7-preset (workloads/)","55.33 (min 38.46, max 59.17)" + "core (workloads/)","0.43 (min 0.42, max 0.43)" + "coremark-pro ()","1041.66 (min 1003.86, max 1052.62)" + "linear_alg-mid-100x100-sp (workloads/)","20.81 (min 20.78, max 20.84)" + "loops-all-mid-10k-sp (workloads/)","0.88 (min 0.87, max 0.89)" "nnet_test (workloads/)","1.54" - "parser-125k (workloads/)","5.84 (min 5.71, max 5.93)" - "radix2-big-64k (workloads/)","32.26 (min 30.87, max 33.46)" - "sha-test (workloads/)","115.28 (min 114.94, max 116.28)" - "zip-test (workloads/)","28.37 (min 28.17, max 28.57)" - + "parser-125k (workloads/)","5.86 (min 5.56, max 6.15)" + "radix2-big-64k (workloads/)","32.59 (min 31.39, max 33.66)" + "sha-test (workloads/)","115.13 (min 114.94, max 116.28)" + "zip-test (workloads/)","28.17 (min 27.78, max 28.57)" MultiBench ^^^^^^^^^^ @@ -322,256 +267,64 @@ thread-enabled workloads to be tested. .. 
csv-table:: Multibench Benchmarks :header: "Benchmarks","am64xx-hsevm: perf" - "4m-check (workloads/)","281.56 (min 281.15, max 281.85)" - "4m-check-reassembly (workloads/)","61.33 (min 61.09, max 61.61)" - "4m-check-reassembly-tcp (workloads/)","36.25 (min 35.77, max 36.60)" - "4m-check-reassembly-tcp-cmykw2-rotatew2 (workloads/)","14.55 (min 14.38, max 14.71)" - "4m-check-reassembly-tcp-x264w2 (workloads/)","0.75 (min 0.74, max 0.76)" - "4m-cmykw2 (workloads/)","85.64 (min 84.64, max 86.24)" - "4m-cmykw2-rotatew2 (workloads/)","18.45 (min 17.29, max 19.80)" - "4m-reassembly (workloads/)","56.74 (min 56.63, max 56.88)" - "4m-rotatew2 (workloads/)","21.89 (min 20.05, max 23.13)" - "4m-tcp-mixed (workloads/)","85.56 (min 85.11, max 86.02)" - "4m-x264w2 (workloads/)","0.76 (min 0.76, max 0.77)" + "4m-check (workloads/)","282.33 (min 280.68, max 284.84)" + "4m-check-reassembly (workloads/)","61.37 (min 61.12, max 61.50)" + "4m-check-reassembly-tcp (workloads/)","36.64 (min 36.39, max 36.93)" + "4m-check-reassembly-tcp-cmykw2-rotatew2 (workloads/)","14.60 (min 14.57, max 14.63)" + "4m-check-reassembly-tcp-x264w2 (workloads/)","0.75 (min 0.74, max 0.75)" + "4m-cmykw2 (workloads/)","85.93 (min 85.80, max 86.17)" + "4m-cmykw2-rotatew2 (workloads/)","17.54 (min 16.62, max 18.35)" + "4m-reassembly (workloads/)","56.76 (min 56.34, max 57.24)" + "4m-rotatew2 (workloads/)","20.14 (min 18.86, max 21.70)" + "4m-tcp-mixed (workloads/)","84.66 (min 83.77, max 85.56)" + "4m-x264w2 (workloads/)","0.77 (min 0.76, max 0.77)" "empty-wld (workloads/)","1.00" - "idct-4m (workloads/)","13.68 (min 13.68, max 13.69)" - "idct-4mw1 (workloads/)","13.68 (min 13.67, max 13.69)" - "ippktcheck-4m (workloads/)","281.33 (min 280.65, max 282.01)" - "ippktcheck-4mw1 (workloads/)","281.37 (min 280.87, max 281.85)" - "ipres-4m (workloads/)","72.63 (min 72.46, max 72.92)" - "ipres-4mw1 (workloads/)","71.88 (min 71.29, max 72.39)" - "md5-4m (workloads/)","19.75 (min 19.58, max 19.93)" - "md5-4mw1 
(workloads/)","19.74 (min 19.45, max 20.00)" - "rgbcmyk-4m (workloads/)","44.70 (min 44.68, max 44.72)" - "rgbcmyk-4mw1 (workloads/)","44.69 (min 44.68, max 44.70)" - "rotate-4ms1 (workloads/)","16.57 (min 16.51, max 16.59)" - "rotate-4ms1w1 (workloads/)","16.60 (min 16.59, max 16.61)" - "rotate-4ms64 (workloads/)","16.79 (min 16.79, max 16.80)" - "rotate-4ms64w1 (workloads/)","16.79 (min 16.76, max 16.80)" + "idct-4m (workloads/)","13.67 (min 13.65, max 13.68)" + "idct-4mw1 (workloads/)","13.67 (min 13.65, max 13.68)" + "ippktcheck-4m (workloads/)","282.00 (min 280.96, max 284.51)" + "ippktcheck-4mw1 (workloads/)","282.27 (min 281.37, max 284.61)" + "ipres-4m (workloads/)","72.04 (min 71.70, max 72.39)" + "ipres-4mw1 (workloads/)","72.29 (min 72.05, max 72.50)" + "md5-4m (workloads/)","19.98 (min 19.88, max 20.02)" + "md5-4mw1 (workloads/)","20.01 (min 19.94, max 20.06)" + "rgbcmyk-4m (workloads/)","44.75 (min 44.72, max 44.77)" + "rgbcmyk-4mw1 (workloads/)","44.72 (min 44.69, max 44.77)" + "rotate-4ms1 (workloads/)","16.62 (min 16.49, max 16.78)" + "rotate-4ms1w1 (workloads/)","16.57 (min 16.30, max 16.74)" + "rotate-4ms64 (workloads/)","16.83 (min 16.77, max 16.95)" + "rotate-4ms64w1 (workloads/)","16.82 (min 16.77, max 16.92)" "x264-4mq (workloads/)","0.41" "x264-4mqw1 (workloads/)","0.41" - - - - Boot-time Measurement --------------------- - Boot media: MMCSD ^^^^^^^^^^^^^^^^^ .. csv-table:: Linux boot time MMCSD :header: "Boot Configuration","am64xx-hsevm: Boot time in seconds: avg(min,max)" - "Linux boot time from SD with default rootfs (20 boot cycles)","22.75 (min 20.01, max 29.10)" - - + "Linux boot time from SD with default rootfs (20 boot cycles)","22.36 (min 20.60, max 27.42)" Boot time numbers [avg, min, max] are measured from "Starting kernel" to Linux prompt across 20 boot cycles. 
- -| - -Ethernet --------- -Ethernet performance benchmarks were measured using Netperf 2.7.1 https://hewlettpackard.github.io/netperf/doc/netperf.html -Test procedures were modeled after those defined in RFC-2544: -https://tools.ietf.org/html/rfc2544, where the DUT is the TI device -and the "tester" used was a Linux PC. To produce consistent results, -it is recommended to carry out performance tests in a private network and to avoid -running NFS on the same interface used in the test. In these results, -CPU utilization was captured as the total percentage used across all cores on the device, -while running the performance test over one external interface. - -UDP Throughput (0% loss) was measured by the procedure defined in RFC-2544 section 26.1: Throughput. -In this scenario, netperf options burst_size (-b) and wait_time (-w) are used to limit bandwidth -during different trials of the test, with the goal of finding the highest rate at which -no loss is seen. For example, to limit bandwidth to 500Mbits/sec with 1472B datagram: - -:: - - burst_size = / 8 (bits -> bytes) / / 100 (seconds -> 10 ms) - burst_size = 500000000 / 8 / 1472 / 100 = 425 - - wait_time = 10 milliseconds (minimum supported by Linux PC used for testing) - -UDP Throughput (possible loss) was measured by capturing throughput and packet loss statistics when -running the netperf test with no bandwidth limit (remove -b/-w options). - -In order to start a netperf client on one device, the other device must have netserver running. -To start netserver: - -:: - - netserver [-p ] [-4 (IPv4 addressing)] [-6 (IPv6 addressing)] - -Running the following shell script from the DUT will trigger netperf clients to measure -bidirectional TCP performance for 60 seconds and report CPU utilization. Parameter -k is used in -client commands to summarize selected statistics on their own line and -j is used to gain -additional timing measurements during the test. 
- -:: - - #!/bin/bash - for i in 1 - do - netperf -H -j -c -l 60 -t TCP_STREAM -- - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE & - - netperf -H -j -c -l 60 -t TCP_MAERTS -- - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE & - done - -Running the following commands will trigger netperf clients to measure UDP burst performance for -60 seconds at various burst/datagram sizes and report CPU utilization. - -- For UDP egress tests, run netperf client from DUT and start netserver on tester. - -:: - - netperf -H -j -c -l 60 -t UDP_STREAM -b -w -- -m - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE - -- For UDP ingress tests, run netperf client from tester and start netserver on DUT. - -:: - - netperf -H -j -C -l 60 -t UDP_STREAM -b -w -- -m - -k DIRECTION,THROUGHPUT,MEAN_LATENCY,LOCAL_CPU_UTIL,REMOTE_CPU_UTIL,LOCAL_BYTES_SENT,REMOTE_BYTES_RECVD,LOCAL_SEND_SIZE - - -CPSW/CPSW2g/CPSW3g Ethernet Driver -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -- CPSW3g: AM64x - - -.. rubric:: TCP Bidirectional Throughput - :name: CPSW2g-tcp-bidirectional-throughput - -.. csv-table:: CPSW2g TCP Bidirectional Throughput - :header: "Command Used","am64xx-hsevm: THROUGHPUT (Mbits/sec)","am64xx-hsevm: CPU Load % (LOCAL_CPU_UTIL)" - - "netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_STREAM; netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_MAERTS","1058.45 (min 964.24, max 1158.01)","88.12 (min 79.19, max 99.75)" - -.. rubric:: TCP Bidirectional Throughput Interrupt Pacing - :name: CPSW2g-tcp-bidirectional-throughput-interrupt-pacing - -.. 
csv-table:: CPSW2g TCP Bidirectional Throughput Interrupt Pacing - :header: "Command Used","am64xx-hsevm: THROUGHPUT (Mbits/sec)","am64xx-hsevm: CPU Load % (LOCAL_CPU_UTIL)" - - "netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_STREAM; netperf -H 192.168.0.1 -j -c -C -l 60 -t TCP_MAERTS","1196.36","99.96" - -.. rubric:: UDP Throughput - :name: CPSW2g-udp-throughput-0-loss - -.. csv-table:: CPSW2g UDP Egress Throughput 0 loss - :header: "UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am64xx-hsevm: THROUGHPUT (Mbits/sec)","am64xx-hsevm: Packets Per Second (kPPS)","am64xx-hsevm: CPU Load % (LOCAL_CPU_UTIL)" - - "64","40.58","80.00","79.03" - "128","79.43","78.00","77.99" - "256","154.99","62.00","77.67" - "1024","577.17","70.00","91.40" - "1472","589.21","49.00","85.92" - -.. csv-table:: CPSW2g UDP Ingress Throughput 0 loss - :header: "UDP Datagram Size(bytes) (LOCAL_SEND_SIZE)","am64xx-hsevm: THROUGHPUT (Mbits/sec)","am64xx-hsevm: Packets Per Second (kPPS)","am64xx-hsevm: CPU Load % (LOCAL_CPU_UTIL)" - - "64","2.92","6.00","0.18" - "128","6.96","7.00","7.83" - "256","15.56","8.00","1.2" - "1024","61.44","8.00","8.39" - "1472","88.32","8.00","8.17" - -ICSSG Ethernet Driver -^^^^^^^^^^^^^^^^^^^^^ - -.. rubric:: TCP Bidirectional Throughput - :name: tcp-bidirectional-throughput - -.. csv-table:: ICSSG TCP Bidirectional Throughput - :header: "Command Used","am64xx-hsevm: THROUGHPUT (Mbits/sec)","am64xx-hsevm: CPU Load % (LOCAL_CPU_UTIL)" - - "netperf -H 192.168.2.1 -j -c -C -l 60 -t TCP_STREAM; netperf -H 192.168.2.1 -j -c -C -l 60 -t TCP_MAERTS","1178","99.98" - - - - -.. rubric:: TCP Bidirectional Throughput Interrupt Pacing - :name: ICSSG-tcp-bidirectional-throughput-interrupt-pacing - -.. 
csv-table:: ICSSG TCP Bidirectional Throughput Interrupt Pacing - :header: "Command Used","am64xx-hsevm: THROUGHPUT (Mbits/sec)","am64xx-hsevm: CPU Load % (LOCAL_CPU_UTIL)" - - "netperf -H 192.168.2.1 -j -c -C -l 60 -t TCP_STREAM; netperf -H 192.168.2.1 -j -c -C -l 60 -t TCP_MAERTS","1198","99.41" - - - - -.. rubric:: UDP Egress Throughput - :name: udp-egress-throughput-0-loss - -.. csv-table:: ICSSG UDP Egress Throughput 0 loss - :header: "UDP Datagram Size(bytes)","am64xx-hsevm: THROUGHPUT (Mbits/sec)","am64xx-hsevm: Packets Per Second (kPPS)","am64xx-hsevm: CPU Load % (LOCAL_CPU_UTIL)" - - "64","41.45","48.87","77.24" - "128","81.40","59.85","76.77" - "256","156.24","65.53","76.00" - "1024","592.23","69.44","74.74" - "1472","834.46","68.89","74.10" - - - - -.. rubric:: UDP Ingress Throughput - :name: udp-ingress-throughput-0-loss - -.. csv-table:: ICSSG UDP Ingress Throughput 0 loss - :header: "UDP Datagram Size(bytes)","am64xx-hsevm: THROUGHPUT (Mbits/sec)","am64xx-hsevm: Packets Per Second (kPPS)","am64xx-hsevm: CPU Load %" - - "64","1.54","3.00","0.10" - "128","4.81","5.00","0.23" - "256","10.24","5.00","7.35" - "1024","40.14","5.00","3.28" - "1472","374.79","32","49.37" - -.. rubric:: Switch Mode - :name: icssg-switch-mode - -.. csv-table:: ICSSG Switch Mode Forwarding - :header: "Mode","am64xx-hsevm: THROUGHPUT (Mbits/sec)","am64xx-hsevm: CPU Load % (SENDER)","am64xx-hsevm: CPU Load % (FORWARDING)","am64xx-hsevm: CPU Load % (RECIEVER)" - - "Switch with HW Offload","929","94.07","0","83.73" - "Switch with SW Offload","915","96.23","30","85.38" - -.. rubric:: HSR Mode - :name: icssg-hsr-mode - -.. 
csv-table:: ICSSG HSR Mode Forwarding - :header: "Mode","am64xx-hsevm: THROUGHPUT (Mbits/sec)","am64xx-hsevm: CPU Load % (SENDER)","am64xx-hsevm: CPU Load % (FORWARDING)","am64xx-hsevm: CPU Load % (RECIEVER)" - - "HSR with HW Offload","466","62.01","0","69.11" - "HSR with SW Offload","387","65","29.96","70" - | OSPI Flash Driver ----------------- -AM64XX-EVM -^^^^^^^^^^ +.. rubric:: AM64XX-EVM + :name: am64xx-evm-ospi -RAW -""" +.. rubric:: RAW + :name: am64xx-evm-ospi-raw .. csv-table:: OSPI Raw Flash Driver :header: "File size (Mbytes)","am64xx-hsevm: Raw Read Throughput (Mbytes/sec)" - "50","142.86" - + "50","139.89 (min 113.64, max 147.06)" EMMC Driver ----------- @@ -583,17 +336,16 @@ EMMC Driver sensitive applications, umount the auto-mounted filesystem and re-mount in async mode. - EMMC EXT4 FIO 1G -"""""""""""""""" +^^^^^^^^^^^^^^^^ .. csv-table:: EMMC EXT4 FIO 1G :header: "Buffer size (bytes)","am64xx-hsevm: Write EXT4 Throughput (Mbytes/sec)","am64xx-hsevm: Write EXT4 CPU Load (%)","am64xx-hsevm: Read EXT4 Throughput (Mbytes/sec)","am64xx-hsevm: Read EXT4 CPU Load (%)" - "1m","60.85 (min 60.00, max 61.40)","3.92 (min 3.78, max 4.06)","175.00","7.36 (min 6.89, max 7.69)" - "4m","60.95 (min 60.10, max 61.60)","2.97 (min 2.80, max 3.07)","174.50 (min 174.00, max 175.00)","6.15 (min 5.69, max 6.48)" - "4k","49.05 (min 48.60, max 49.50)","55.20 (min 54.38, max 56.44)","56.08 (min 55.90, max 56.30)","48.50 (min 46.00, max 50.60)" - "256k","61.00 (min 60.50, max 61.40)","5.92 (min 5.70, max 6.06)","174.00","8.89 (min 8.66, max 9.25)" + "1m","60.75 (min 59.60, max 61.40)","4.00 (min 3.73, max 4.22)","175.00","7.20 (min 6.77, max 7.82)" + "4m","60.83 (min 59.80, max 61.70)","2.88 (min 2.78, max 2.95)","174.75 (min 174.00, max 175.00)","5.76 (min 5.30, max 6.12)" + "4k","49.86 (min 49.10, max 50.40)","52.21 (min 51.71, max 52.53)","56.18 (min 56.00, max 56.40)","47.11 (min 46.00, max 49.21)" + "256k","60.75 (min 59.70, max 61.50)","5.94 (min 5.65, max 
6.25)","174.00","8.90 (min 8.58, max 9.48)" EMMC EXT4 """"""""" @@ -601,23 +353,11 @@ EMMC EXT4 .. csv-table:: EMMC EXT4 :header: "Buffer size (bytes)","am64xx-hsevm: Write EXT4 Throughput (Mbytes/sec)","am64xx-hsevm: Write EXT4 CPU Load (%)","am64xx-hsevm: Read EXT4 Throughput (Mbytes/sec)","am64xx-hsevm: Read EXT4 CPU Load (%)" - "102400","54.23 (min 49.95, max 56.05)","11.05 (min 9.63, max 15.65)","174.86 (min 168.13, max 177.19)","29.58 (min 27.83, max 30.56)" - "262144","53.37 (min 48.45, max 55.70)","10.88 (min 9.40, max 15.57)","180.84 (min 177.78, max 181.98)","33.37 (min 30.28, max 40.18)" - "524288","53.33 (min 49.35, max 55.13)","11.16 (min 9.74, max 14.88)","182.92 (min 182.86, max 183.01)","27.58 (min 27.03, max 27.93)" - "1048576","53.90 (min 49.57, max 56.36)","10.75 (min 9.38, max 14.46)","182.86 (min 182.82, max 182.90)","27.68 (min 26.79, max 28.57)" - "5242880","53.72 (min 49.33, max 55.38)","10.40 (min 9.11, max 14.18)","182.79 (min 182.63, max 182.88)","27.64 (min 27.03, max 28.57)" - -EMMC EXT2 -""""""""" - -.. 
csv-table:: EMMC EXT2 - :header: "Buffer size (bytes)","am64xx-hsevm: Write EXT2 Throughput (Mbytes/sec)","am64xx-hsevm: Write EXT2 CPU Load (%)","am64xx-hsevm: Read EXT2 Throughput (Mbytes/sec)","am64xx-hsevm: Read EXT2 CPU Load (%)" - - "102400","50.24 (min 41.49, max 52.87)","11.45 (min 9.39, max 18.33)","173.05 (min 172.80, max 173.40)","31.11 (min 30.28, max 32.14)" - "262144","51.48 (min 42.38, max 54.31)","11.49 (min 9.18, max 18.46)","176.38 (min 173.55, max 177.82)","32.51 (min 30.28, max 36.28)" - "524288","51.72 (min 42.47, max 54.95)","11.45 (min 9.44, max 18.60)","177.33 (min 174.83, max 178.79)","28.11 (min 27.19, max 28.70)" - "1048576","51.82 (min 42.51, max 54.93)","11.24 (min 9.23, max 18.05)","178.63 (min 178.27, max 178.86)","27.70 (min 27.43, max 27.83)" - "5242880","51.62 (min 41.99, max 54.77)","11.30 (min 9.32, max 18.16)","178.55 (min 178.35, max 178.84)","28.07 (min 27.68, max 28.70)" + "102400","53.87 (min 49.65, max 55.64)","11.09 (min 9.38, max 15.25)","176.52 (min 171.28, max 177.31)","29.36 (min 28.30, max 29.63)" + "262144","53.52 (min 49.20, max 55.06)","11.06 (min 9.50, max 15.22)","181.79 (min 181.43, max 182.11)","30.36 (min 29.36, max 31.53)" + "524288","53.64 (min 49.72, max 55.58)","10.94 (min 9.33, max 14.88)","182.88 (min 182.70, max 183.02)","27.74 (min 26.13, max 29.20)" + "1048576","53.83 (min 49.26, max 55.68)","10.72 (min 9.28, max 14.60)","182.91 (min 182.86, max 183.00)","26.93 (min 25.45, max 28.57)" + "5242880","53.93 (min 49.61, max 56.34)","10.61 (min 9.26, max 14.60)","182.80 (min 182.62, max 182.95)","27.64 (min 26.61, max 28.57)" EMMC VFAT """"""""" @@ -625,11 +365,11 @@ EMMC VFAT .. 
csv-table:: EMMC VFAT :header: "Buffer size (bytes)","am64xx-hsevm: Write VFAT Throughput (Mbytes/sec)","am64xx-hsevm: Write VFAT CPU Load (%)","am64xx-hsevm: Read VFAT Throughput (Mbytes/sec)","am64xx-hsevm: Read VFAT CPU Load (%)" - "102400","48.75 (min 39.83, max 52.16)","13.28 (min 11.30, max 19.92)","166.81 (min 166.61, max 167.05)","31.22 (min 30.70, max 32.17)" - "262144","50.50 (min 41.55, max 53.41)","13.72 (min 11.39, max 20.25)","168.89 (min 164.53, max 170.76)","34.76 (min 30.70, max 46.28)" - "524288","50.46 (min 41.61, max 53.75)","13.86 (min 11.72, max 19.63)","169.99 (min 169.68, max 170.18)","27.74 (min 27.50, max 28.10)" - "1048576","50.81 (min 41.99, max 54.38)","13.60 (min 11.53, max 20.17)","169.57 (min 169.41, max 169.83)","27.50" - "5242880","50.90 (min 41.73, max 54.15)","13.40 (min 11.56, max 19.68)","169.96 (min 169.64, max 170.06)","28.10 (min 27.50, max 28.69)" + "102400","49.34 (min 40.10, max 53.27)","13.58 (min 11.41, max 20.45)","166.32 (min 164.99, max 167.10)","30.88 (min 29.20, max 31.90)" + "262144","50.55 (min 41.76, max 53.49)","13.71 (min 11.72, max 20.37)","168.61 (min 161.34, max 171.00)","35.58 (min 29.57, max 50.82)" + "524288","50.67 (min 41.94, max 53.88)","14.01 (min 11.56, max 20.24)","169.98 (min 169.68, max 170.20)","27.60 (min 27.50, max 28.10)" + "1048576","50.86 (min 41.78, max 54.00)","13.53 (min 11.59, max 20.00)","169.78 (min 169.62, max 169.88)","27.34 (min 26.05, max 28.10)" + "5242880","50.75 (min 41.22, max 54.11)","13.44 (min 11.66, max 19.75)","170.06 (min 169.90, max 170.19)","27.70 (min 27.27, max 28.33)" UBoot EMMC Driver ----------------- @@ -637,8 +377,8 @@ UBoot EMMC Driver .. 
csv-table:: UBOOT EMMC RAW :header: "File size (bytes in hex)","am64xx-hsevm: Write Throughput (Kbytes/sec)","am64xx-hsevm: Read Throughput (Kbytes/sec)" - "2000000","60406.03 (min 60014.65, max 61248.60)","169126.01 (min 168907.22, max 169782.38)" - "4000000","61165.23 (min 60907.06, max 61826.42)","173032.57 (min 172918.21, max 173375.66)" + "2000000","59674.24 (min 56594.13, max 61134.33)","168800.07 (min 168041.03, max 169782.38)" + "4000000","60491.03 (min 57387.04, max 61768.14)","172690.99 (min 172463.16, max 173375.66)" MMCSD ----- @@ -651,68 +391,34 @@ MMCSD sensitive applications, umount the auto-mounted filesystem and re-mount in async mode. - MMC EXT4 FIO 1G -""""""""""""""" - +^^^^^^^^^^^^^^^ .. csv-table:: MMC EXT4 FIO 1G :header: "Buffer size (bytes)","am64xx-hsevm: Write EXT4 Throughput (Mbytes/sec)","am64xx-hsevm: Write EXT4 CPU Load (%)","am64xx-hsevm: Read EXT4 Throughput (Mbytes/sec)","am64xx-hsevm: Read EXT4 CPU Load (%)" - "4m","42.15 (min 41.50, max 43.00)","2.62 (min 2.56, max 2.71)","86.95 (min 86.80, max 87.10)","3.73 (min 3.60, max 3.92)" - "1m","41.95 (min 41.10, max 42.30)","3.52 (min 3.34, max 3.70)","86.95 (min 86.90, max 87.10)","5.01 (min 4.85, max 5.31)" - "4k","2.76 (min 2.71, max 2.82)","7.73 (min 7.65, max 7.76)","12.70 (min 12.50, max 12.80)","15.07 (min 14.49, max 15.69)" - "256k","36.50 (min 35.50, max 37.30)","4.48 (min 4.17, max 4.66)","83.10 (min 83.00, max 83.20)","6.78 (min 5.99, max 7.20)" - + "1m","42.00 (min 41.40, max 42.50)","3.43 (min 3.33, max 3.67)","86.94 (min 86.70, max 87.30)","5.02 (min 4.81, max 5.29)" + "4m","41.90 (min 41.20, max 42.70)","2.59 (min 2.51, max 2.67)","86.33 (min 82.30, max 87.10)","3.73 (min 3.38, max 3.99)" + "4k","2.76 (min 2.70, max 2.87)","7.29 (min 7.00, max 8.06)","12.76 (min 12.70, max 12.80)","14.14 (min 13.37, max 14.99)" + "256k","37.41 (min 36.60, max 38.70)","4.53 (min 4.26, max 4.84)","83.15 (min 82.80, max 83.80)","6.69 (min 6.42, max 7.06)" MMC EXT4 -"""""""" - - +^^^^^^^^ .. 
csv-table:: MMC EXT4 :header: "Buffer size (bytes)","am64xx-hsevm: Write Raw Throughput (Mbytes/sec)","am64xx-hsevm: Write Raw CPU Load (%)","am64xx-hsevm: Read Raw Throughput (Mbytes/sec)","am64xx-hsevm: Read Raw CPU Load (%)" - "102400","35.51 (min 33.07, max 37.45)","7.64 (min 6.31, max 11.15)","73.92 (min 70.24, max 78.38)","13.81 (min 12.28, max 15.00)" - "262144","35.56 (min 34.43, max 37.31)","7.63 (min 6.38, max 11.15)","79.33 (min 76.51, max 82.53)","13.86 (min 13.06, max 14.92)" - "524288","36.53 (min 35.02, max 37.89)","7.53 (min 6.06, max 11.27)","90.56 (min 90.39, max 90.83)","13.27 (min 12.78, max 13.60)" - "1048576","36.79 (min 35.77, max 38.36)","7.50 (min 6.21, max 11.07)","89.75 (min 88.59, max 90.86)","12.83 (min 12.45, max 13.16)" - "5242880","36.94 (min 36.11, max 38.11)","7.24 (min 6.02, max 11.13)","90.18 (min 88.74, max 90.76)","13.42 (min 13.16, max 13.60)" - - -MMC EXT3 -"""""""" - - -.. csv-table:: MMC EXT3 - :header: "Buffer size (bytes)","am64xx-hsevm: Write Raw Throughput (Mbytes/sec)","am64xx-hsevm: Write Raw CPU Load (%)","am64xx-hsevm: Read Raw Throughput (Mbytes/sec)","am64xx-hsevm: Read Raw CPU Load (%)" - - "102400","35.60 (min 29.10, max 38.72)","9.59 (min 7.56, max 16.54)","75.63 (min 73.59, max 77.51)","14.68 (min 13.67, max 15.38)" - "262144","34.94 (min 29.45, max 38.84)","8.94 (min 7.00, max 15.25)","85.00 (min 84.90, max 85.05)","14.19 (min 12.77, max 15.06)" - "524288","35.04 (min 29.43, max 40.16)","8.87 (min 6.99, max 15.13)","89.16 (min 88.79, max 89.60)","13.62 (min 13.36, max 14.29)" - "1048576","34.48 (min 29.87, max 36.97)","8.60 (min 6.82, max 14.08)","88.16 (min 84.43, max 89.47)","13.86 (min 13.42, max 14.22)" - "5242880","36.10 (min 29.24, max 40.71)","8.85 (min 6.89, max 15.43)","85.76 (min 84.45, max 89.52)","14.01 (min 13.58, max 14.69)" - - -MMC EXT2 -"""""""" - -.. 
csv-table:: MMC EXT2 - :header: "Buffer size (bytes)","am64xx-hsevm: Write Raw Throughput (Mbytes/sec)","am64xx-hsevm: Write Raw CPU Load (%)","am64xx-hsevm: Read Raw Throughput (Mbytes/sec)","am64xx-hsevm: Read Raw CPU Load (%)" - - "102400","37.83 (min 32.12, max 39.96)","8.88 (min 7.14, max 14.78)","77.57 (min 77.14, max 77.81)","14.41 (min 13.90, max 15.06)" - "262144","35.82 (min 31.13, max 38.76)","8.27 (min 6.17, max 13.51)","84.06 (min 80.46, max 85.35)","13.15 (min 12.12, max 14.51)" - "524288","37.30 (min 31.09, max 41.07)","8.11 (min 6.16, max 14.38)","87.09 (min 84.25, max 89.67)","13.89 (min 13.52, max 14.29)" - "1048576","35.75 (min 29.84, max 39.26)","7.80 (min 6.20, max 13.56)","89.35 (min 88.93, max 89.64)","13.62 (min 13.36, max 13.85)" - "5242880","36.21 (min 30.33, max 40.10)","7.78 (min 6.06, max 14.01)","88.34 (min 84.79, max 89.80)","14.20 (min 13.85, max 14.69)" - + "102400","29.65 (min 27.48, max 32.92)","6.38 (min 5.22, max 9.52)","38.94 (min 37.34, max 41.04)","7.41 (min 7.07, max 7.77)" + "262144","28.96 (min 27.17, max 31.59)","6.52 (min 5.28, max 9.31)","40.55 (min 39.38, max 41.90)","6.57 (min 6.20, max 7.11)" + "524288","29.58 (min 27.10, max 32.84)","6.12 (min 4.95, max 9.82)","45.12 (min 42.60, max 45.56)","6.75 (min 6.36, max 6.99)" + "1048576","29.85 (min 28.58, max 32.27)","6.13 (min 4.97, max 9.06)","45.39 (min 45.16, max 45.52)","6.71 (min 6.36, max 7.17)" + "5242880","29.78 (min 28.51, max 33.57)","5.85 (min 4.81, max 8.70)","45.22 (min 44.88, max 45.51)","6.85 (min 6.51, max 7.33)" The performance numbers were captured using the following: - SanDisk Max Endurance SD card (SDSQQVR-032G-GN6IA) - Partition was mounted with async option - | CRYPTO Driver @@ -724,68 +430,66 @@ OpenSSL Performance .. 
csv-table:: OpenSSL Performance :header: "Algorithm","Buffer Size (in bytes)","am64xx-hsevm: throughput (KBytes/Sec)" - "aes-128-cbc","1024","20959.06 (min 19965.27, max 21320.36)" - "aes-128-cbc","16","314.21 (min 306.05, max 318.36)" - "aes-128-cbc","16384","133997.91 (min 131858.43, max 135550.29)" - "aes-128-cbc","256","5437.10 (min 5301.33, max 5531.31)" - "aes-128-cbc","64","1338.92 (min 1300.12, max 1358.95)" - "aes-128-cbc","8192","97014.44 (min 95608.83, max 97957.21)" - "aes-128-ecb","1024","20929.19 (min 19151.87, max 21648.38)" - "aes-128-ecb","16","316.54 (min 312.22, max 321.90)" - "aes-128-ecb","16384","138835.29 (min 138067.97, max 139225.77)" - "aes-128-ecb","256","5569.86 (min 5543.42, max 5597.95)" - "aes-128-ecb","64","1381.94 (min 1351.47, max 1404.52)" - "aes-128-ecb","8192","98376.36 (min 97315.50, max 99846.83)" - "aes-192-cbc","1024","20155.73 (min 18997.25, max 21175.98)" - "aes-192-cbc","16","301.27 (min 292.46, max 316.99)" - "aes-192-cbc","16384","126993.75 (min 126528.17, max 127391.06)" - "aes-192-cbc","256","5340.86 (min 5230.76, max 5599.91)" - "aes-192-cbc","64","1325.11 (min 1298.11, max 1391.21)" - "aes-192-cbc","8192","93233.83 (min 92883.63, max 93566.29)" - "aes-192-ecb","1024","21606.31 (min 21497.86, max 21739.18)" - "aes-192-ecb","16","308.54 (min 297.98, max 319.48)" - "aes-192-ecb","16384","130969.60 (min 130804.39, max 131055.62)" - "aes-192-ecb","256","5439.27 (min 5317.21, max 5579.35)" - "aes-192-ecb","64","1347.27 (min 1306.52, max 1391.27)" - "aes-192-ecb","8192","95673.69 (min 95341.23, max 96144.04)" - "aes-256-cbc","1024","20149.93 (min 18618.71, max 21155.16)" - "aes-256-cbc","16","305.02 (min 291.87, max 317.27)" - "aes-256-cbc","16384","119682.39 (min 119177.22, max 120083.80)" - "aes-256-cbc","256","5467.90 (min 5210.97, max 5604.61)" - "aes-256-cbc","64","1361.79 (min 1306.24, max 1398.59)" - "aes-256-cbc","8192","89436.84 (min 89022.46, max 89754.28)" - "aes-256-ecb","1024","21332.99 (min 20724.05, max 
21572.27)" - "aes-256-ecb","16","309.47 (min 297.86, max 319.90)" - "aes-256-ecb","16384","123528.53 (min 122836.31, max 124245.33)" - "aes-256-ecb","256","5514.73 (min 5286.66, max 5620.48)" - "aes-256-ecb","64","1361.30 (min 1325.67, max 1396.20)" - "aes-256-ecb","8192","91379.71 (min 90923.01, max 92198.23)" - "sha256","1024","26057.22 (min 25825.96, max 26321.58)" - "sha256","16","433.83 (min 431.97, max 435.66)" - "sha256","16384","209231.87 (min 208125.95, max 210031.96)" - "sha256","256","6812.05 (min 6772.82, max 6881.45)" - "sha256","64","1721.55 (min 1711.42, max 1737.02)" - "sha256","8192","141288.79 (min 140610.22, max 141890.90)" - "sha512","1024","18045.35 (min 18011.14, max 18106.71)" - "sha512","16","420.20 (min 419.00, max 421.30)" - "sha512","16384","48089.77 (min 48016.04, max 48147.11)" - "sha512","256","5989.50 (min 5978.62, max 6010.03)" - "sha512","64","1682.55 (min 1675.90, max 1690.75)" - "sha512","8192","43149.99 (min 43092.65, max 43242.84)" - + "aes-128-cbc","1024","21201.11 (min 19586.05, max 21629.27)" + "aes-128-cbc","16","305.74 (min 295.07, max 317.97)" + "aes-128-cbc","16384","137300.65 (min 134600.02, max 139203.93)" + "aes-128-cbc","256","5427.83 (min 5317.12, max 5639.77)" + "aes-128-cbc","64","1333.09 (min 1290.43, max 1389.82)" + "aes-128-cbc","8192","98276.35 (min 96264.19, max 99693.91)" + "aes-128-ecb","1024","21623.04 (min 20551.00, max 22215.00)" + "aes-128-ecb","16","312.77 (min 297.66, max 329.37)" + "aes-128-ecb","16384","141950.29 (min 140525.57, max 143638.53)" + "aes-128-ecb","256","5490.12 (min 5154.73, max 5683.37)" + "aes-128-ecb","64","1360.48 (min 1284.46, max 1411.31)" + "aes-128-ecb","8192","101527.21 (min 99691.18, max 102948.86)" + "aes-192-cbc","1024","21028.78 (min 19525.97, max 21523.11)" + "aes-192-cbc","16","311.25 (min 294.13, max 320.98)" + "aes-192-cbc","16384","128866.99 (min 127462.06, max 130378.41)" + "aes-192-cbc","256","5524.78 (min 5259.43, max 5622.10)" + "aes-192-cbc","64","1364.05 (min 
1286.27, max 1390.40)" + "aes-192-cbc","8192","94148.27 (min 92752.55, max 95668.91)" + "aes-192-ecb","1024","21608.83 (min 20942.51, max 22065.83)" + "aes-192-ecb","16","314.19 (min 301.85, max 325.51)" + "aes-192-ecb","16384","132728.15 (min 132104.19, max 133327.53)" + "aes-192-ecb","256","5513.00 (min 5258.24, max 5673.05)" + "aes-192-ecb","64","1369.78 (min 1305.26, max 1411.67)" + "aes-192-ecb","8192","97255.42 (min 96520.87, max 98402.30)" + "aes-256-cbc","1024","21003.86 (min 18761.39, max 21494.78)" + "aes-256-cbc","16","314.16 (min 297.62, max 322.65)" + "aes-256-cbc","16384","121110.53 (min 120105.64, max 122344.79)" + "aes-256-cbc","256","5537.48 (min 5443.41, max 5665.71)" + "aes-256-cbc","64","1377.82 (min 1358.29, max 1398.68)" + "aes-256-cbc","8192","90706.26 (min 89451.18, max 91501.91)" + "aes-256-ecb","1024","21289.98 (min 20055.38, max 21793.11)" + "aes-256-ecb","16","308.54 (min 300.03, max 320.75)" + "aes-256-ecb","16384","125571.07 (min 124474.71, max 127385.60)" + "aes-256-ecb","256","5471.54 (min 5277.53, max 5680.98)" + "aes-256-ecb","64","1351.16 (min 1297.41, max 1409.83)" + "aes-256-ecb","8192","93359.79 (min 92383.91, max 94601.22)" + "sha256","1024","28245.16 (min 27951.45, max 28524.20)" + "sha256","16","471.00 (min 466.66, max 475.25)" + "sha256","16384","218273.11 (min 216738.47, max 220250.11)" + "sha256","256","7394.91 (min 7313.49, max 7465.56)" + "sha256","64","1871.55 (min 1853.21, max 1889.11)" + "sha256","8192","149173.25 (min 148398.08, max 149848.06)" + "sha512","1024","18903.94 (min 18712.58, max 19061.76)" + "sha512","16","449.39 (min 444.90, max 451.80)" + "sha512","16384","48433.15 (min 48059.73, max 48562.18)" + "sha512","256","6372.07 (min 6279.94, max 6436.78)" + "sha512","64","1803.87 (min 1779.22, max 1823.55)" + "sha512","8192","43742.21 (min 43578.71, max 43835.39)" .. 
csv-table:: OpenSSL CPU Load :header: "Algorithm","am64xx-hsevm: CPU Load" - "aes-128-cbc","43.25 (min 43.00, max 44.00)" - "aes-128-ecb","45.00 (min 44.00, max 46.00)" - "aes-192-cbc","42.75 (min 42.00, max 44.00)" - "aes-192-ecb","44.25 (min 44.00, max 45.00)" - "aes-256-cbc","42.75 (min 42.00, max 44.00)" - "aes-256-ecb","43.75 (min 43.00, max 44.00)" + "aes-128-cbc","43.25 (min 42.00, max 44.00)" + "aes-128-ecb","45.13 (min 43.00, max 46.00)" + "aes-192-cbc","43.75 (min 43.00, max 45.00)" + "aes-192-ecb","44.63 (min 44.00, max 45.00)" + "aes-256-cbc","43.63 (min 43.00, max 44.00)" + "aes-256-ecb","43.88 (min 43.00, max 45.00)" "sha256","93.00" - "sha512","93.00" - + "sha512","92.50 (min 90.00, max 93.00)" Listed for each algorithm are the code snippets used to run each benchmark test. @@ -793,11 +497,10 @@ Listed for each algorithm are the code snippets used to run each benchmark test. time -v openssl speed -elapsed -evp aes-128-cbc - | RP Message Inter-Processor Communication (IPC) Latency ------------------------------------------------------- +------------------------------------------------------- RP Message latency Performance ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ @@ -816,14 +519,13 @@ Test commands used for running IPC latency tests: Latencies reported: - .. csv-table:: :header: "Remote Processor","Message Size (in bytes)","Average round trip (usecs)","Max round trip (usecs)" - "R5F0_0","1","32","205" - "R5F0_0","490","162","272" - "M4F","1","41","186" - "M4F","490","301","446" + "R5F0_0","1","34","165" + "R5F0_0","490","155","279" + "M4F","1","45","138" + "M4F","490","285","408" .. image:: img/R5_0_0_m1_ipc_latency.png @@ -832,5 +534,3 @@ Latencies reported: .. image:: img/m4_0_m1_ipc_latency.png .. 
image:: img/m4_0_m490_ipc_latency.png - -| diff --git a/source/devices/AM64X/linux/img/R5_0_0_m1_ipc_latency.png b/source/devices/AM64X/linux/img/R5_0_0_m1_ipc_latency.png index b0c2b199d..f1dd44376 100644 Binary files a/source/devices/AM64X/linux/img/R5_0_0_m1_ipc_latency.png and b/source/devices/AM64X/linux/img/R5_0_0_m1_ipc_latency.png differ diff --git a/source/devices/AM64X/linux/img/R5_0_0_m490_ipc_latency.png b/source/devices/AM64X/linux/img/R5_0_0_m490_ipc_latency.png index 3a8c03dcf..4bf983ffc 100644 Binary files a/source/devices/AM64X/linux/img/R5_0_0_m490_ipc_latency.png and b/source/devices/AM64X/linux/img/R5_0_0_m490_ipc_latency.png differ diff --git a/source/devices/AM64X/linux/img/m4_0_m1_ipc_latency.png b/source/devices/AM64X/linux/img/m4_0_m1_ipc_latency.png index 48bd8c985..f94850b2f 100644 Binary files a/source/devices/AM64X/linux/img/m4_0_m1_ipc_latency.png and b/source/devices/AM64X/linux/img/m4_0_m1_ipc_latency.png differ diff --git a/source/devices/AM64X/linux/img/m4_0_m490_ipc_latency.png b/source/devices/AM64X/linux/img/m4_0_m490_ipc_latency.png index a1cf758d6..6869a47ab 100644 Binary files a/source/devices/AM64X/linux/img/m4_0_m490_ipc_latency.png and b/source/devices/AM64X/linux/img/m4_0_m490_ipc_latency.png differ