00001 /* 00002 * See the dyninst/COPYRIGHT file for copyright information. 00003 * 00004 * We provide the Paradyn Tools (below described as "Paradyn") 00005 * on an AS IS basis, and do not warrant its validity or performance. 00006 * We reserve the right to update, modify, or discontinue this 00007 * software at any time. We shall have no obligation to supply such 00008 * updates or modifications or any other form of support to you. 00009 * 00010 * By your use of Paradyn, you understand and agree that we (or any 00011 * other person or entity with proprietary rights in Paradyn) are 00012 * under no obligation to provide either maintenance services, 00013 * update services, notices of latent defects, or correction of 00014 * defects for Paradyn. 00015 * 00016 * This library is free software; you can redistribute it and/or 00017 * modify it under the terms of the GNU Lesser General Public 00018 * License as published by the Free Software Foundation; either 00019 * version 2.1 of the License, or (at your option) any later version. 00020 * 00021 * This library is distributed in the hope that it will be useful, 00022 * but WITHOUT ANY WARRANTY; without even the implied warranty of 00023 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 00024 * Lesser General Public License for more details. 00025 * 00026 * You should have received a copy of the GNU Lesser General Public 00027 * License along with this library; if not, write to the Free Software 00028 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 00029 */ 00030 00031 #include "common/h/headers.h" 00032 #include "common/h/irixKludges.h" 00033 00034 // copied from solarisKludges.C 00035 unsigned long long PDYN_div1000(unsigned long long in) { 00036 /* Divides by 1000 without an integer division instruction or library call, both of 00037 * which are slow. 00038 * We do only shifts, adds, and subtracts. 00039 * 00040 * We divide by 1000 in this way: 00041 * multiply by 1/1000, or multiply by (1/1000)*2^30 and then right-shift by 30. 00042 * So what is 1/1000 * 2^30? 00043 * It is 1,073,742. (actually this is rounded) 00044 * So we can multiply by 1,073,742 and then right-shift by 30 (neat, eh?) 00045 * 00046 * Now for multiplying by 1,073,742... 00047 * 1,073,742 = (1,048,576 + 16384 + 8192 + 512 + 64 + 8 + 4 + 2) 00048 * or, slightly optimized: 00049 * = (1,048,576 + 16384 + 8192 + 512 + 64 + 16 - 2) 00050 * for a total of 8 shifts and 6 add/subs, or 14 operations. 00051 * 00052 */ 00053 00054 unsigned long long temp = in << 20; // multiply by 1,048,576 00055 // beware of overflow; left shift by 20 is quite a lot. 00056 // If you know that the input fits in 32 bits (4 billion) then 00057 // no problem. But if it's much bigger then start worrying... 00058 00059 temp += in << 14; // 16384 00060 temp += in << 13; // 8192 00061 temp += in << 9; // 512 00062 temp += in << 6; // 64 00063 temp += in << 4; // 16 00064 temp -= in >> 2; // 2 00065 00066 return (temp >> 30); // divide by 2^30 00067 } 00068 00069 // copied from solarisKludges.C 00070 unsigned long long PDYN_divMillion(unsigned long long in) { 00071 /* Divides by 1,000,000 without an integer division instruction or library call, 00072 * both of which are slow. 00073 * We do only shifts, adds, and subtracts. 00074 * 00075 * We divide by 1,000,000 in this way: 00076 * multiply by 1/1,000,000, or multiply by (1/1,000,000)*2^30 and then right-shift 00077 * by 30. So what is 1/1,000,000 * 2^30? 00078 * It is 1,074. (actually this is rounded) 00079 * So we can multiply by 1,074 and then right-shift by 30 (neat, eh?) 00080 * 00081 * Now for multiplying by 1,074 00082 * 1,074 = (1024 + 32 + 16 + 2) 00083 * for a total of 4 shifts and 4 add/subs, or 8 operations. 00084 * 00085 * Note: compare with div1000 -- it's cheaper to divide by a million than 00086 * by a thousand (!) 00087 * 00088 */ 00089 00090 unsigned long long temp = in << 10; // multiply by 1024 00091 // beware of overflow...if the input arg uses more than 52 bits 00092 // than start worrying about whether (in << 10) plus the smaller additions 00093 // we're gonna do next will fit in 64... 00094 00095 temp += in << 5; // 32 00096 temp += in << 4; // 16 00097 temp += in << 1; // 2 00098 00099 return (temp >> 30); // divide by 2^30 00100 } 00101 00102 // copied from solarisKludges.C 00103 unsigned long long PDYN_mulMillion(unsigned long long in) { 00104 unsigned long long result = in; 00105 00106 /* multiply by 125 by multiplying by 128 and subtracting 3x */ 00107 result = (result << 7) - result - result - result; 00108 00109 /* multiply by 125 again, for a total of 15625x */ 00110 result = (result << 7) - result - result - result; 00111 00112 /* multiply by 64, for a total of 1,000,000x */ 00113 result <<= 6; 00114 00115 /* cost was: 3 shifts and 6 subtracts 00116 * cost of calling mul1000(mul1000()) would be: 6 shifts and 4 subtracts 00117 * 00118 * Another algorithm is to multiply by 2^6 and then 5^6. 00119 * The former is super-cheap (one shift); the latter is more expensive. 00120 * 5^6 = 15625 = 16384 - 512 - 256 + 8 + 1 00121 * so multiplying by 5^6 means 4 shift operations and 4 add/sub ops 00122 * so multiplying by 1000000 means 5 shift operations and 4 add/sub ops. 00123 * That may or may not be cheaper than what we're doing (3 shifts; 6 subtracts); 00124 * I'm not sure. --ari 00125 */ 00126 00127 return result; 00128 }
1.6.1