Eric Dumazet | 6a2d7a9 | 2006-12-13 00:34:27 -0800 | [diff] [blame] | 1 | #ifndef _LINUX_RECIPROCAL_DIV_H |
| 2 | #define _LINUX_RECIPROCAL_DIV_H |
| 3 | |
| 4 | #include <linux/types.h> |
| 5 | |
/*
 * This algorithm is based on the paper "Division by Invariant
 * Integers Using Multiplication" by Torbjörn Granlund and Peter
 * L. Montgomery.
 *
 * The assembler implementation from Agner Fog, which this code is
 * based on, can be found here:
 * http://www.agner.org/optimize/asmlib.zip
 *
 * This optimization for A/B is helpful if the divisor B is mostly
 * runtime invariant. The reciprocal of B is calculated in the
 * slow-path with reciprocal_value(). The fast-path can then just use
 * a much faster multiplication operation with a variable dividend A
 * to calculate the division A/B.
 */
| 21 | |
Hannes Frederic Sowa | 809fa97 | 2014-01-22 02:29:41 +0100 | [diff] [blame^] | 22 | struct reciprocal_value { |
| 23 | u32 m; |
| 24 | u8 sh1, sh2; |
| 25 | }; |
Eric Dumazet | 6a2d7a9 | 2006-12-13 00:34:27 -0800 | [diff] [blame] | 26 | |
Hannes Frederic Sowa | 809fa97 | 2014-01-22 02:29:41 +0100 | [diff] [blame^] | 27 | struct reciprocal_value reciprocal_value(u32 d); |
Eric Dumazet | 6a2d7a9 | 2006-12-13 00:34:27 -0800 | [diff] [blame] | 28 | |
Hannes Frederic Sowa | 809fa97 | 2014-01-22 02:29:41 +0100 | [diff] [blame^] | 29 | static inline u32 reciprocal_divide(u32 a, struct reciprocal_value R) |
Eric Dumazet | 6a2d7a9 | 2006-12-13 00:34:27 -0800 | [diff] [blame] | 30 | { |
Hannes Frederic Sowa | 809fa97 | 2014-01-22 02:29:41 +0100 | [diff] [blame^] | 31 | u32 t = (u32)(((u64)a * R.m) >> 32); |
| 32 | return (t + ((a - t) >> R.sh1)) >> R.sh2; |
Eric Dumazet | 6a2d7a9 | 2006-12-13 00:34:27 -0800 | [diff] [blame] | 33 | } |
Hannes Frederic Sowa | 809fa97 | 2014-01-22 02:29:41 +0100 | [diff] [blame^] | 34 | |
| 35 | #endif /* _LINUX_RECIPROCAL_DIV_H */ |