Skip to content
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.

Commit 28daee3

Browse files
authoredJul 22, 2020
Rollup merge of #74367 - Neutron3529:patch-1, r=nagisa
Rearrange the pipeline of `pow` to gain efficiency The check of the `exp` parameter seems useless if we execute the while-loop more than once. The original implementation of `pow` function using one more comparison if the `exp==0` and may break the pipeline of the cpu, which may generate a slower code. The performance gap between the old and the new implementation may be small, but IMO, at least the newer one looks more beautiful. --- bench prog: ``` #![feature(test)] extern crate test; #[macro_export]macro_rules! timing{ ($a:expr)=>{let time=std::time::Instant::now();{$a;}print!("{:?} ",time.elapsed())}; ($a:expr,$b:literal)=>{let time=std::time::Instant::now();let mut a=0;for _ in 0..$b{a^=$a;}print!("{:?} {} ",time.elapsed(),a)} } #[inline] pub fn pow_rust(x:i64, mut exp: u32) -> i64 { let mut base = x; let mut acc = 1; while exp > 1 { if (exp & 1) == 1 { acc = acc * base; } exp /= 2; base = base * base; } if exp == 1 { acc = acc * base; } acc } #[inline] pub fn pow_new(x:i64, mut exp: u32) -> i64 { if exp==0{ 1 }else{ let mut base = x; let mut acc = 1; while exp > 1 { if (exp & 1) == 1 { acc = acc * base; } exp >>= 1; base = base * base; } acc * base } } fn main(){ let a=2i64; let b=1_u32; println!(); timing!(test::black_box(a).pow(test::black_box(b)),100000000); timing!(pow_new(test::black_box(a),test::black_box(b)),100000000); timing!(pow_rust(test::black_box(a),test::black_box(b)),100000000); println!(); timing!(test::black_box(a).pow(test::black_box(b)),100000000); timing!(pow_new(test::black_box(a),test::black_box(b)),100000000); timing!(pow_rust(test::black_box(a),test::black_box(b)),100000000); println!(); timing!(test::black_box(a).pow(test::black_box(b)),100000000); timing!(pow_new(test::black_box(a),test::black_box(b)),100000000); timing!(pow_rust(test::black_box(a),test::black_box(b)),100000000); println!(); timing!(test::black_box(a).pow(test::black_box(b)),100000000); timing!(pow_new(test::black_box(a),test::black_box(b)),100000000); 
timing!(pow_rust(test::black_box(a),test::black_box(b)),100000000); println!(); timing!(test::black_box(a).pow(test::black_box(b)),100000000); timing!(pow_new(test::black_box(a),test::black_box(b)),100000000); timing!(pow_rust(test::black_box(a),test::black_box(b)),100000000); println!(); timing!(test::black_box(a).pow(test::black_box(b)),100000000); timing!(pow_new(test::black_box(a),test::black_box(b)),100000000); timing!(pow_rust(test::black_box(a),test::black_box(b)),100000000); println!(); timing!(test::black_box(a).pow(test::black_box(b)),100000000); timing!(pow_new(test::black_box(a),test::black_box(b)),100000000); timing!(pow_rust(test::black_box(a),test::black_box(b)),100000000); println!(); timing!(test::black_box(a).pow(test::black_box(b)),100000000); timing!(pow_new(test::black_box(a),test::black_box(b)),100000000); timing!(pow_rust(test::black_box(a),test::black_box(b)),100000000); println!(); } ``` bench in my laptop: ``` neutron@Neutron:/me/rust$ rc commit.rs rustc commit.rs && ./commit 3.978419716s 0 4.079765171s 0 3.964630622s 0 3.997127013s 0 4.260304804s 0 3.997638211s 0 3.963195544s 0 4.11657718s 0 4.176054164s 0 3.830128579s 0 3.980396122s 0 3.937258567s 0 3.986055948s 0 4.127804162s 0 4.018943411s 0 4.185568857s 0 4.217512517s 0 3.98313603s 0 3.863018225s 0 4.030447988s 0 3.694878237s 0 4.206987927s 0 4.137608047s 0 4.115564664s 0 neutron@Neutron:/me/rust$ rc commit.rs -O rustc commit.rs -O && ./commit 162.111993ms 0 165.107125ms 0 166.26924ms 0 175.20479ms 0 205.062565ms 0 176.278791ms 0 174.408975ms 0 166.526899ms 0 201.857604ms 0 146.190062ms 0 168.592821ms 0 154.61411ms 0 199.678912ms 0 168.411598ms 0 162.129996ms 0 147.420765ms 0 209.759326ms 0 154.807907ms 0 165.507134ms 0 188.476239ms 0 157.351524ms 0 121.320123ms 0 126.401229ms 0 114.86428ms 0 ```
2 parents 298a38b + 364cacb commit 28daee3

File tree

3 files changed

+101
-44
lines changed

3 files changed

+101
-44
lines changed
 

‎src/libcore/num/mod.rs

+44-43
Original file line numberDiff line numberDiff line change
@@ -1095,6 +1095,9 @@ $EndFeature, "
10951095
without modifying the original"]
10961096
#[inline]
10971097
pub const fn checked_pow(self, mut exp: u32) -> Option<Self> {
1098+
if exp == 0 {
1099+
return Some(1);
1100+
}
10981101
let mut base = self;
10991102
let mut acc: Self = 1;
11001103

@@ -1105,15 +1108,11 @@ $EndFeature, "
11051108
exp /= 2;
11061109
base = try_opt!(base.checked_mul(base));
11071110
}
1108-
1111+
// Since exp != 0, exp must be exactly 1 at this point.
11091112
// Deal with the final bit of the exponent separately, since
11101113
// squaring the base afterwards is not necessary and may cause a
11111114
// needless overflow.
1112-
if exp == 1 {
1113-
acc = try_opt!(acc.checked_mul(base));
1114-
}
1115-
1116-
Some(acc)
1115+
Some(try_opt!(acc.checked_mul(base)))
11171116
}
11181117
}
11191118

@@ -1622,6 +1621,9 @@ $EndFeature, "
16221621
without modifying the original"]
16231622
#[inline]
16241623
pub const fn wrapping_pow(self, mut exp: u32) -> Self {
1624+
if exp == 0 {
1625+
return 1;
1626+
}
16251627
let mut base = self;
16261628
let mut acc: Self = 1;
16271629

@@ -1633,14 +1635,11 @@ $EndFeature, "
16331635
base = base.wrapping_mul(base);
16341636
}
16351637

1638+
// Since exp != 0, exp must be exactly 1 at this point.
16361639
// Deal with the final bit of the exponent separately, since
16371640
// squaring the base afterwards is not necessary and may cause a
16381641
// needless overflow.
1639-
if exp == 1 {
1640-
acc = acc.wrapping_mul(base);
1641-
}
1642-
1643-
acc
1642+
acc.wrapping_mul(base)
16441643
}
16451644
}
16461645

@@ -1989,6 +1988,9 @@ $EndFeature, "
19891988
without modifying the original"]
19901989
#[inline]
19911990
pub const fn overflowing_pow(self, mut exp: u32) -> (Self, bool) {
1991+
if exp == 0 {
1992+
return (1,false);
1993+
}
19921994
let mut base = self;
19931995
let mut acc: Self = 1;
19941996
let mut overflown = false;
@@ -2007,16 +2009,13 @@ $EndFeature, "
20072009
overflown |= r.1;
20082010
}
20092011

2012+
// Since exp != 0, exp must be exactly 1 at this point.
20102013
// Deal with the final bit of the exponent separately, since
20112014
// squaring the base afterwards is not necessary and may cause a
20122015
// needless overflow.
2013-
if exp == 1 {
2014-
r = acc.overflowing_mul(base);
2015-
acc = r.0;
2016-
overflown |= r.1;
2017-
}
2018-
2019-
(acc, overflown)
2016+
r = acc.overflowing_mul(base);
2017+
r.1 |= overflown;
2018+
r
20202019
}
20212020
}
20222021

@@ -2040,6 +2039,9 @@ $EndFeature, "
20402039
#[inline]
20412040
#[rustc_inherit_overflow_checks]
20422041
pub const fn pow(self, mut exp: u32) -> Self {
2042+
if exp == 0 {
2043+
return 1;
2044+
}
20432045
let mut base = self;
20442046
let mut acc = 1;
20452047

@@ -2051,14 +2053,11 @@ $EndFeature, "
20512053
base = base * base;
20522054
}
20532055

2056+
// Since exp != 0, exp must be exactly 1 at this point.
20542057
// Deal with the final bit of the exponent separately, since
20552058
// squaring the base afterwards is not necessary and may cause a
20562059
// needless overflow.
2057-
if exp == 1 {
2058-
acc = acc * base;
2059-
}
2060-
2061-
acc
2060+
acc * base
20622061
}
20632062
}
20642063

@@ -3295,6 +3294,9 @@ assert_eq!(", stringify!($SelfT), "::MAX.checked_pow(2), None);", $EndFeature, "
32953294
without modifying the original"]
32963295
#[inline]
32973296
pub const fn checked_pow(self, mut exp: u32) -> Option<Self> {
3297+
if exp == 0 {
3298+
return Some(1);
3299+
}
32983300
let mut base = self;
32993301
let mut acc: Self = 1;
33003302

@@ -3306,14 +3308,12 @@ assert_eq!(", stringify!($SelfT), "::MAX.checked_pow(2), None);", $EndFeature, "
33063308
base = try_opt!(base.checked_mul(base));
33073309
}
33083310

3311+
// Since exp != 0, exp must be exactly 1 at this point.
33093312
// Deal with the final bit of the exponent separately, since
33103313
// squaring the base afterwards is not necessary and may cause a
33113314
// needless overflow.
3312-
if exp == 1 {
3313-
acc = try_opt!(acc.checked_mul(base));
3314-
}
33153315

3316-
Some(acc)
3316+
Some(try_opt!(acc.checked_mul(base)))
33173317
}
33183318
}
33193319

@@ -3704,6 +3704,9 @@ assert_eq!(3u8.wrapping_pow(6), 217);", $EndFeature, "
37043704
without modifying the original"]
37053705
#[inline]
37063706
pub const fn wrapping_pow(self, mut exp: u32) -> Self {
3707+
if exp == 0 {
3708+
return 1;
3709+
}
37073710
let mut base = self;
37083711
let mut acc: Self = 1;
37093712

@@ -3715,14 +3718,11 @@ assert_eq!(3u8.wrapping_pow(6), 217);", $EndFeature, "
37153718
base = base.wrapping_mul(base);
37163719
}
37173720

3721+
// Since exp != 0, exp must be exactly 1 at this point.
37183722
// Deal with the final bit of the exponent separately, since
37193723
// squaring the base afterwards is not necessary and may cause a
37203724
// needless overflow.
3721-
if exp == 1 {
3722-
acc = acc.wrapping_mul(base);
3723-
}
3724-
3725-
acc
3725+
acc.wrapping_mul(base)
37263726
}
37273727
}
37283728

@@ -4029,6 +4029,9 @@ assert_eq!(3u8.overflowing_pow(6), (217, true));", $EndFeature, "
40294029
without modifying the original"]
40304030
#[inline]
40314031
pub const fn overflowing_pow(self, mut exp: u32) -> (Self, bool) {
4032+
if exp == 0{
4033+
return (1,false);
4034+
}
40324035
let mut base = self;
40334036
let mut acc: Self = 1;
40344037
let mut overflown = false;
@@ -4047,16 +4050,14 @@ assert_eq!(3u8.overflowing_pow(6), (217, true));", $EndFeature, "
40474050
overflown |= r.1;
40484051
}
40494052

4053+
// Since exp != 0, exp must be exactly 1 at this point.
40504054
// Deal with the final bit of the exponent separately, since
40514055
// squaring the base afterwards is not necessary and may cause a
40524056
// needless overflow.
4053-
if exp == 1 {
4054-
r = acc.overflowing_mul(base);
4055-
acc = r.0;
4056-
overflown |= r.1;
4057-
}
4057+
r = acc.overflowing_mul(base);
4058+
r.1 |= overflown;
40584059

4059-
(acc, overflown)
4060+
r
40604061
}
40614062
}
40624063

@@ -4077,6 +4078,9 @@ Basic usage:
40774078
#[inline]
40784079
#[rustc_inherit_overflow_checks]
40794080
pub const fn pow(self, mut exp: u32) -> Self {
4081+
if exp == 0 {
4082+
return 1;
4083+
}
40804084
let mut base = self;
40814085
let mut acc = 1;
40824086

@@ -4088,14 +4092,11 @@ Basic usage:
40884092
base = base * base;
40894093
}
40904094

4095+
// Since exp != 0, exp must be exactly 1 at this point.
40914096
// Deal with the final bit of the exponent separately, since
40924097
// squaring the base afterwards is not necessary and may cause a
40934098
// needless overflow.
4094-
if exp == 1 {
4095-
acc = acc * base;
4096-
}
4097-
4098-
acc
4099+
acc * base
40994100
}
41004101
}
41014102

‎src/libcore/tests/num/int_macros.rs

+32-1
Original file line numberDiff line numberDiff line change
@@ -255,12 +255,43 @@ macro_rules! int_module {
255255
#[test]
256256
fn test_pow() {
257257
let mut r = 2 as $T;
258-
259258
assert_eq!(r.pow(2), 4 as $T);
260259
assert_eq!(r.pow(0), 1 as $T);
260+
assert_eq!(r.wrapping_pow(2), 4 as $T);
261+
assert_eq!(r.wrapping_pow(0), 1 as $T);
262+
assert_eq!(r.checked_pow(2), Some(4 as $T));
263+
assert_eq!(r.checked_pow(0), Some(1 as $T));
264+
assert_eq!(r.overflowing_pow(2), (4 as $T, false));
265+
assert_eq!(r.overflowing_pow(0), (1 as $T, false));
266+
assert_eq!(r.saturating_pow(2), 4 as $T);
267+
assert_eq!(r.saturating_pow(0), 1 as $T);
268+
269+
r = MAX;
270+
// use `^` to represent .pow() with no overflow.
271+
// if itest::MAX == 2^j-1, then itest is a `j+1` bit signed int (one bit is the sign),
272+
// so that `itest::MAX*itest::MAX == 2^(2*j)-2^(j+1)+1`,
273+
// thus the wrapped (overflowing) result is exactly 1.
274+
assert_eq!(r.wrapping_pow(2), 1 as $T);
275+
assert_eq!(r.checked_pow(2), None);
276+
assert_eq!(r.overflowing_pow(2), (1 as $T, true));
277+
assert_eq!(r.saturating_pow(2), MAX);
278+
// test for negative base.
261279
r = -2 as $T;
262280
assert_eq!(r.pow(2), 4 as $T);
263281
assert_eq!(r.pow(3), -8 as $T);
282+
assert_eq!(r.pow(0), 1 as $T);
283+
assert_eq!(r.wrapping_pow(2), 4 as $T);
284+
assert_eq!(r.wrapping_pow(3), -8 as $T);
285+
assert_eq!(r.wrapping_pow(0), 1 as $T);
286+
assert_eq!(r.checked_pow(2), Some(4 as $T));
287+
assert_eq!(r.checked_pow(3), Some(-8 as $T));
288+
assert_eq!(r.checked_pow(0), Some(1 as $T));
289+
assert_eq!(r.overflowing_pow(2), (4 as $T, false));
290+
assert_eq!(r.overflowing_pow(3), (-8 as $T, false));
291+
assert_eq!(r.overflowing_pow(0), (1 as $T, false));
292+
assert_eq!(r.saturating_pow(2), 4 as $T);
293+
assert_eq!(r.saturating_pow(3), -8 as $T);
294+
assert_eq!(r.saturating_pow(0), 1 as $T);
264295
}
265296
}
266297
};

‎src/libcore/tests/num/uint_macros.rs

+25
Original file line numberDiff line numberDiff line change
@@ -184,6 +184,31 @@ macro_rules! uint_module {
184184
assert_eq!($T::from_str_radix("Z", 10).ok(), None::<$T>);
185185
assert_eq!($T::from_str_radix("_", 2).ok(), None::<$T>);
186186
}
187+
188+
#[test]
189+
fn test_pow() {
190+
let mut r = 2 as $T;
191+
assert_eq!(r.pow(2), 4 as $T);
192+
assert_eq!(r.pow(0), 1 as $T);
193+
assert_eq!(r.wrapping_pow(2), 4 as $T);
194+
assert_eq!(r.wrapping_pow(0), 1 as $T);
195+
assert_eq!(r.checked_pow(2), Some(4 as $T));
196+
assert_eq!(r.checked_pow(0), Some(1 as $T));
197+
assert_eq!(r.overflowing_pow(2), (4 as $T, false));
198+
assert_eq!(r.overflowing_pow(0), (1 as $T, false));
199+
assert_eq!(r.saturating_pow(2), 4 as $T);
200+
assert_eq!(r.saturating_pow(0), 1 as $T);
201+
202+
r = MAX;
203+
// use `^` to represent .pow() with no overflow.
204+
// if itest::MAX == 2^j-1, then itest is a `j` bit int,
205+
// so that `itest::MAX*itest::MAX == 2^(2*j)-2^(j+1)+1`,
206+
// thus the wrapped (overflowing) result is exactly 1.
207+
assert_eq!(r.wrapping_pow(2), 1 as $T);
208+
assert_eq!(r.checked_pow(2), None);
209+
assert_eq!(r.overflowing_pow(2), (1 as $T, true));
210+
assert_eq!(r.saturating_pow(2), MAX);
211+
}
187212
}
188213
};
189214
}

0 commit comments

Comments
 (0)
Please sign in to comment.