From d4b208ca881acb3be102f3c0c28813d39dc73318 Mon Sep 17 00:00:00 2001 From: rfjakob Date: Sun, 5 Jun 2016 14:36:36 +0200 Subject: Created CPU Benchmarks (markdown) --- CPU-Benchmarks.md | 96 +++++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 96 insertions(+) create mode 100644 CPU-Benchmarks.md diff --git a/CPU-Benchmarks.md b/CPU-Benchmarks.md new file mode 100644 index 0000000..4225178 --- /dev/null +++ b/CPU-Benchmarks.md @@ -0,0 +1,96 @@ +Originally written by [@lxp](https://github.com/lxp) in [Issue #23](https://github.com/rfjakob/gocryptfs/issues/23) + +``` +$ go version +go version go1.6 linux/amd64 +``` + +### AES-NI +**Skylake (Launch: Q3'15)** +``` +$ cat /proc/cpuinfo +model name : Intel(R) Core(TM) i3-6100U CPU @ 2.30GHz +flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall nx pdpe1gb rdtscp lm constant_tsc arch_perfmon pebs bts rep_good nopl xtopology nonstop_tsc aperfmperf eagerfpu pni pclmulqdq dtes64 monitor ds_cpl vmx est tm2 ssse3 sdbg fma cx16 xtpr pdcm pcid sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand lahf_lm abm 3dnowprefetch ida arat epb pln pts dtherm hwp hwp_notify hwp_act_window hwp_epp intel_pt tpr_shadow vnmi flexpriority ept vpid fsgsbase tsc_adjust bmi1 hle avx2 smep bmi2 erms invpcid rtm mpx rdseed adx smap clflushopt xsaveopt xsavec xgetbv1 +$ ./stupidgcm.test -test.bench . 
+PASS +Benchmark4kEncStupidGCM-4 200000 10688 ns/op 383.22 MB/s +Benchmark4kEncGoGCM-4 300000 4073 ns/op 1005.57 MB/s +``` +**Haswell (Launch: Q2'14)** +``` +$ cat /proc/cpuinfo +model name : Intel(R) Core(TM) i5-4690K CPU @ 3.50GHz +flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall nx pdpe1gb rdtscp lm constant_tsc arch_perfmon pebs bts rep_good nopl xtopology nonstop_tsc aperfmperf eagerfpu pni pclmulqdq dtes64 monitor ds_cpl vmx est tm2 ssse3 sdbg fma cx16 xtpr pdcm pcid sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand lahf_lm abm epb tpr_shadow vnmi flexpriority ept vpid fsgsbase tsc_adjust bmi1 hle avx2 smep bmi2 erms invpcid rtm xsaveopt dtherm ida arat pln pts +$ ./stupidgcm.test -test.bench . +PASS +Benchmark4kEncStupidGCM-4 200000 6710 ns/op 610.43 MB/s +Benchmark4kEncGoGCM-4 500000 2422 ns/op 1690.86 MB/s +``` + +**Ivy Bridge (Launch: Q2'12)** +``` +$ cat /proc/cpuinfo +model name : Intel(R) Core(TM) i5-3570 CPU @ 3.40GHz +flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall nx rdtscp lm constant_tsc arch_perfmon pebs bts rep_good nopl xtopology nonstop_tsc aperfmperf eagerfpu pni pclmulqdq dtes64 monitor ds_cpl vmx smx est tm2 ssse3 cx16 xtpr pdcm pcid sse4_1 sse4_2 x2apic popcnt tsc_deadline_timer aes xsave avx f16c rdrand lahf_lm ida arat epb xsaveopt pln pts dtherm tpr_shadow vnmi flexpriority ept vpid fsgsbase smep erms +$ ./stupidgcm.test -test.bench . 
+PASS +Benchmark4kEncStupidGCM-4 200000 14684 ns/op 278.94 MB/s +Benchmark4kEncGoGCM-4 300000 7792 ns/op 525.62 MB/s +``` + +**Sandy Bridge (Launch: Q1'11)** +``` +$ cat /proc/cpuinfo +model name : Intel(R) Core(TM) i5-2520M CPU @ 2.50GHz +flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall nx rdtscp lm constant_tsc arch_perfmon pebs bts nopl xtopology nonstop_tsc aperfmperf eagerfpu pni pclmulqdq dtes64 monitor ds_cpl vmx smx est tm2 ssse3 cx16 xtpr pdcm pcid sse4_1 sse4_2 x2apic popcnt tsc_deadline_timer aes xsave avx lahf_lm ida arat epb xsaveopt pln pts dtherm tpr_shadow vnmi flexpriority ept vpid +$ ./stupidgcm.test -test.bench . +PASS +Benchmark4kEncStupidGCM-4 100000 19070 ns/op 214.78 MB/s +Benchmark4kEncGoGCM-4 200000 10981 ns/op 373.01 MB/s +``` + +**Westmere (Launch: Q1'10)** +``` +$ cat /proc/cpuinfo +model name : Intel(R) Xeon(R) CPU E5620 @ 2.40GHz +flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall nx pdpe1gb rdtscp lm constant_tsc arch_perfmon pebs bts rep_good nopl xtopology nonstop_tsc aperfmperf pni pclmulqdq dtes64 monitor ds_cpl vmx smx est tm2 ssse3 cx16 xtpr pdcm pcid dca sse4_1 sse4_2 popcnt aes lahf_lm epb tpr_shadow vnmi flexpriority ept vpid dtherm ida arat +$ ./stupidgcm.test -test.bench . 
+PASS +Benchmark4kEncStupidGCM-16 100000 18297 ns/op 223.85 MB/s +Benchmark4kEncGoGCM-16 200000 9579 ns/op 427.58 MB/s +``` + +### no AES-NI + +**Ivy Bridge (Launch: Q1'13)** +``` +$ cat /proc/cpuinfo +model name : Intel(R) Pentium(R) CPU G2130 @ 3.20GHz +flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall nx rdtscp lm constant_tsc arch_perfmon pebs bts rep_good nopl xtopology nonstop_tsc aperfmperf eagerfpu pni pclmulqdq dtes64 monitor ds_cpl vmx est tm2 ssse3 cx16 xtpr pdcm pcid sse4_1 sse4_2 popcnt tsc_deadline_timer xsave lahf_lm arat epb xsaveopt pln pts dtherm tpr_shadow vnmi flexpriority ept vpid fsgsbase smep erms +$ ./stupidgcm.test -test.bench . +PASS +Benchmark4kEncStupidGCM-2 100000 22691 ns/op 180.51 MB/s +Benchmark4kEncGoGCM-2 20000 92810 ns/op 44.13 MB/s +``` + +**Nehalem (Launch: Q3'09)** +``` +$ cat /proc/cpuinfo +model name : Intel(R) Xeon(R) CPU X3460 @ 2.80GHz +flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall nx rdtscp lm constant_tsc arch_perfmon pebs bts rep_good nopl xtopology nonstop_tsc aperfmperf pni dtes64 monitor ds_cpl vmx smx est tm2 ssse3 cx16 xtpr pdcm sse4_1 sse4_2 popcnt lahf_lm ida dtherm tpr_shadow vnmi flexpriority ept vpid +$ ./stupidgcm.test -test.bench . +PASS +Benchmark4kEncStupidGCM-8 50000 35247 ns/op 116.21 MB/s +Benchmark4kEncGoGCM-8 20000 92230 ns/op 44.41 MB/s +``` + +**Core (Launch: Q1'08)** +``` +$ cat /proc/cpuinfo +model name : Intel(R) Core(TM)2 Duo CPU E7400 @ 2.80GHz +flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall nx lm constant_tsc arch_perfmon pebs bts rep_good nopl aperfmperf pni dtes64 monitor ds_cpl est tm2 ssse3 cx16 xtpr pdcm sse4_1 xsave lahf_lm dtherm +$ ./stupidgcm.test -test.bench . 
+PASS +Benchmark4kEncStupidGCM-2 30000 46697 ns/op 87.71 MB/s +Benchmark4kEncGoGCM-2 10000 194095 ns/op 21.10 MB/s +``` \ No newline at end of file -- cgit v1.2.3