clpeak benchmark

AMD EPYC 7262 8-Core testing with a GIGABYTE MZ32-AR0-00 v01000100 (R21 BIOS) and NVIDIA GeForce RTX 4090 24GB on Ubuntu 22.04 via the Phoronix Test Suite.

Compare your own system(s) to this result file with the Phoronix Test Suite by running the command: phoronix-test-suite benchmark 2401230-NE-CLPEAKBEN88
Jump To Table - Results

Statistics

Remove Outliers Before Calculating Averages

Graph Settings

Prefer Vertical Bar Graphs

Multi-Way Comparison

Condense Multi-Option Tests Into Single Result Graphs

Table

Show Detailed System Result Table

Run Management

Result
Identifier
View Logs
Performance Per
Dollar
Date
Run
  Test
  Duration
NVIDIA GeForce RTX 4090
January 23
  5 Minutes
Only show results matching title/arguments (delimit multiple options with a comma):
Do not show results matching title/arguments (delimit multiple options with a comma):


{ "title": "clpeak benchmark", "last_modified": "2024-01-23 23:29:45", "description": "AMD EPYC 7262 8-Core testing with a GIGABYTE MZ32-AR0-00 v01000100 (R21 BIOS) and NVIDIA GeForce RTX 4090 24GB on Ubuntu 22.04 via the Phoronix Test Suite.", "systems": { "NVIDIA GeForce RTX 4090": { "identifier": "NVIDIA GeForce RTX 4090", "hardware": { "Processor": "AMD EPYC 7262 8-Core @ 3.20GHz (8 Cores \/ 16 Threads)", "Motherboard": "GIGABYTE MZ32-AR0-00 v01000100 (R21 BIOS)", "Chipset": "AMD Starship\/Matisse", "Memory": "128GB", "Disk": "1000GB Samsung SSD 980 PRO 1TB", "Graphics": "NVIDIA GeForce RTX 4090 24GB", "Audio": "NVIDIA Device 22ba", "Monitor": "DELL U2720Q", "Network": "2 x Intel I350" }, "software": { "OS": "Ubuntu 22.04", "Kernel": "6.5.0-14-generic (x86_64)", "Desktop": "GNOME Shell 42.9", "Display Server": "X Server 1.21.1.4", "Display Driver": "NVIDIA 535.154.05", "OpenGL": "4.6.0", "OpenCL": "OpenCL 3.0 CUDA 12.2.148", "Vulkan": "1.3.242", "Compiler": "GCC 11.4.0 + CUDA 11.8", "File-System": "ext4", "Screen Resolution": "3840x2160" }, "user": "skinguru", "timestamp": "2024-01-23 23:22:35", "client_version": "10.8.4", "data": { "compiler-configuration": "--build=x86_64-linux-gnu --disable-vtable-verify --disable-werror --enable-bootstrap --enable-cet --enable-checking=release --enable-clocale=gnu --enable-default-pie --enable-gnu-unique-object --enable-languages=c,ada,c++,go,brig,d,fortran,objc,obj-c++,m2 --enable-libphobos-checking=release --enable-libstdcxx-debug --enable-libstdcxx-time=yes --enable-link-serialization=2 --enable-multiarch --enable-multilib --enable-nls --enable-objc-gc=auto --enable-offload-targets=nvptx-none=\/build\/gcc-11-XeT9lY\/gcc-11-11.4.0\/debian\/tmp-nvptx\/usr,amdgcn-amdhsa=\/build\/gcc-11-XeT9lY\/gcc-11-11.4.0\/debian\/tmp-gcn\/usr --enable-plugin --enable-shared --enable-threads=posix --host=x86_64-linux-gnu --program-prefix=x86_64-linux-gnu- --target=x86_64-linux-gnu --with-abi=m64 --with-arch-32=i686 --with-build-config=bootstrap-lto-lean --with-default-libstdcxx-abi=new --with-gcc-major-version-only --with-multilib-list=m32,m64,mx32 --with-target-system-zlib=auto --with-tune=generic --without-cuda-driver -v", "graphics-compute-cores": "16384", "cpu-scaling-governor": "acpi-cpufreq performance (Boost: Enabled)", "cpu-microcode": "0x830107a", "bar1-visible-vram": "256 MiB", "vbios-version": "95.02.18.80.53", "kernel-extra-details": "Transparent Huge Pages: madvise", "security": "gather_data_sampling: Not affected + itlb_multihit: Not affected + l1tf: Not affected + mds: Not affected + meltdown: Not affected + mmio_stale_data: Not affected + retbleed: Mitigation of untrained return thunk; SMT enabled with STIBP protection + spec_rstack_overflow: Mitigation of safe RET + spec_store_bypass: Mitigation of SSB disabled via prctl + spectre_v1: Mitigation of usercopy\/swapgs barriers and __user pointer sanitization + spectre_v2: Mitigation of Retpolines IBPB: conditional STIBP: always-on RSB filling PBRSB-eIBRS: Not affected + srbds: Not affected + tsx_async_abort: Not affected" } } }, "results": { "96386307b2ac998f06ea9a6d1b9c38d8e4a89712": { "identifier": "pts\/clpeak-1.1.0", "title": "clpeak", "app_version": "1.1.2", "arguments": "--kernel-latency", "description": "OpenCL Test: Kernel Latency", "scale": "us", "proportion": "LIB", "display_format": "BAR_GRAPH", "results": { "NVIDIA GeForce RTX 4090": { "value": 6.20999999999999996447286321199499070644378662109375, "raw_values": [ 6.25, 6.17999999999999971578290569595992565155029296875, 6.19000000000000039079850466805510222911834716796875 ], "test_run_times": [ 0.61999999999999999555910790149937383830547332763671875, 0.4699999999999999733546474089962430298328399658203125, 0.460000000000000019984014443252817727625370025634765625 ], "details": { "compiler-options": { "compiler-type": "CXX", "compiler": "g++", "compiler-options": "-O3" } } } } }, "ffb3b54205b8820ee8989e7d07d1cde074069eba": { "identifier": "pts\/clpeak-1.1.0", "title": "clpeak", "app_version": "1.1.2", "arguments": "--compute-integer", "description": "OpenCL Test: Integer Compute", "scale": "GIOPS", "proportion": "HIB", "display_format": "BAR_GRAPH", "results": { "NVIDIA GeForce RTX 4090": { "value": 40578.0999999999985448084771633148193359375, "raw_values": [ 40207.9899999999979627318680286407470703125, 40807.2900000000008731149137020111083984375, 40719.02999999999883584678173065185546875 ], "test_run_times": [ 0.689999999999999946709294817992486059665679931640625, 0.66000000000000003108624468950438313186168670654296875, 0.67000000000000003996802888650563545525074005126953125 ], "details": { "compiler-options": { "compiler-type": "CXX", "compiler": "g++", "compiler-options": "-O3" } } } } }, "debc5751ccf59c27ad9a1f78be4407636859df64": { "identifier": "pts\/clpeak-1.1.0", "title": "clpeak", "app_version": "1.1.2", "arguments": "--compute-intfast", "description": "OpenCL Test: Integer 24-bit Compute", "scale": "GIOPS", "proportion": "HIB", "display_format": "BAR_GRAPH", "results": { "NVIDIA GeForce RTX 4090": { "value": 40776.550000000002910383045673370361328125, "raw_values": [ 40612.3499999999985448084771633148193359375, 40863.91000000000349245965480804443359375, 40853.3799999999973806552588939666748046875 ], "test_run_times": [ 0.68000000000000004884981308350688777863979339599609375, 0.68000000000000004884981308350688777863979339599609375, 0.68000000000000004884981308350688777863979339599609375 ], "details": { "compiler-options": { "compiler-type": "CXX", "compiler": "g++", "compiler-options": "-O3" } } } } }, "e05e38fa90546ff4d13bc1f0e8aa16d1344116a0": { "identifier": "pts\/clpeak-1.1.0", "title": "clpeak", "app_version": "1.1.2", "arguments": "--global-bandwidth", "description": "OpenCL Test: Global Memory Bandwidth", "scale": "GBPS", "proportion": "HIB", "display_format": "BAR_GRAPH", "results": { "NVIDIA GeForce RTX 4090": { "value": 869.3899999999999863575794734060764312744140625, "raw_values": [ 871.6200000000000045474735088646411895751953125, 864.9600000000000363797880709171295166015625, 871.5900000000000318323145620524883270263671875 ], "test_run_times": [ 2.939999999999999946709294817992486059665679931640625, 2.9900000000000002131628207280300557613372802734375, 2.95000000000000017763568394002504646778106689453125 ], "details": { "compiler-options": { "compiler-type": "CXX", "compiler": "g++", "compiler-options": "-O3" } } } } }, "6adc34691ca18c7d011f145ef12644d8cb89cb4d": { "identifier": "pts\/clpeak-1.1.0", "title": "clpeak", "app_version": "1.1.2", "arguments": "--compute-dp", "description": "OpenCL Test: Double-Precision Compute", "scale": "GFLOPS", "proportion": "HIB", "display_format": "BAR_GRAPH", "results": { "NVIDIA GeForce RTX 4090": { "value": 1346.220000000000027284841053187847137451171875, "raw_values": [ 1347.48000000000001818989403545856475830078125, 1345.720000000000027284841053187847137451171875, 1345.470000000000027284841053187847137451171875 ], "test_run_times": [ 8.3599999999999994315658113919198513031005859375, 8.3800000000000007815970093361102044582366943359375, 8.3699999999999992184029906638897955417633056640625 ], "details": { "compiler-options": { "compiler-type": "CXX", "compiler": "g++", "compiler-options": "-O3" } } } } }, "6f3c90b9a8b1544a888d3789724ed63af4d5d42b": { "identifier": "pts\/clpeak-1.1.0", "title": "clpeak", "app_version": "1.1.2", "arguments": "--compute-sp", "description": "OpenCL Test: Single-Precision Compute", "scale": "GFLOPS", "proportion": "HIB", "display_format": "BAR_GRAPH", "results": { "NVIDIA GeForce RTX 4090": { "value": 78861.240000000005238689482212066650390625, "raw_values": [ 77849.979999999995925463736057281494140625, 79352.740000000005238689482212066650390625, 79381.009999999994761310517787933349609375 ], "test_run_times": [ 0.70999999999999996447286321199499070644378662109375, 0.7199999999999999733546474089962430298328399658203125, 0.70999999999999996447286321199499070644378662109375 ], "details": { "compiler-options": { "compiler-type": "CXX", "compiler": "g++", "compiler-options": "-O3" } } } } }, "684173101726f852674e4d11d7fd63a3716942c9": { "identifier": "pts\/clpeak-1.1.0", "title": "clpeak", "app_version": "1.1.2", "arguments": "--transfer-bandwidth #read", "description": "OpenCL Test: Transfer Bandwidth enqueueReadBuffer", "scale": "GBPS", "proportion": "HIB", "display_format": "BAR_GRAPH", "results": { "NVIDIA GeForce RTX 4090": { "value": 9.32000000000000028421709430404007434844970703125, "raw_values": [ 9.2400000000000002131628207280300557613372802734375, 9.3599999999999994315658113919198513031005859375, 9.3599999999999994315658113919198513031005859375 ], "test_run_times": [ 37.4500000000000028421709430404007434844970703125, 36.97999999999999687361196265555918216705322265625, 37.1099999999999994315658113919198513031005859375 ], "details": { "compiler-options": { "compiler-type": "CXX", "compiler": "g++", "compiler-options": "-O3" } } } } }, "b6832318594b001f05c201b0906eb4f564cbe3d8": { "identifier": "pts\/clpeak-1.1.0", "title": "clpeak", "app_version": "1.1.2", "arguments": "--transfer-bandwidth #write", "description": "OpenCL Test: Transfer Bandwidth enqueueWriteBuffer", "scale": "GBPS", "proportion": "HIB", "display_format": "BAR_GRAPH", "results": { "NVIDIA GeForce RTX 4090": { "value": 11.71000000000000085265128291212022304534912109375, "raw_values": [ 11.839999999999999857891452847979962825775146484375, 11.7200000000000006394884621840901672840118408203125, 11.5800000000000000710542735760100185871124267578125 ], "test_run_times": [ 38.53999999999999914734871708787977695465087890625, 37.35000000000000142108547152020037174224853515625, 36.530000000000001136868377216160297393798828125 ], "details": { "compiler-options": { "compiler-type": "CXX", "compiler": "g++", "compiler-options": "-O3" } } } } } } }