~ubuntu-branches/ubuntu/lucid/silo/lucid

« back to all changes in this revision

Viewing changes to common/urem.S

Committer: Bazaar Package Importer
Author(s): Fabio M. Di Nitto
Date: 2007-10-25 09:28:08 UTC
mto: This revision was merged to the branch mainline in revision 16.
Revision ID: james.westby@ubuntu.com-20071025092808-pnva6x2ggmlkd65e

Tags: upstream-1.4.13a+git20070930

Import upstream version 1.4.13a+git20070930

files added:
COPYING

Makefile

Rules.make

common

common/Makefile

common/bin2h.c

common/console.c

common/divdi3.S

common/ffs.c

common/inflate.c

common/jmp.S

common/malloc.c

common/printf.c

common/prom.c

common/rem.S

common/sdiv.S

common/stringops1.c

common/stringops2.c

common/tree.c

common/udiv.S

common/udivdi3.S

common/urem.S

docs

docs/README

docs/README.tilo

etc/silo.conf

first

first-isofs

first-isofs/Makefile

first-isofs/README.SILO_ISOFS

first-isofs/crt0.S

first-isofs/isofs.c

first/Makefile

first/fd.S

first/first.S

first/generic.S

first/ieee32.S

first/ieee32.h

first/ultra.S

include

include/asm

include/asm/idprom.h

include/asm/machines.h

include/asm/mostek.h

include/asm/openprom.h

include/et

include/et/com_err.h

include/ext2fs

include/ext2fs/bitops.h

include/ext2fs/ext2_err.h

include/ext2fs/ext2_io.h

include/ext2fs/ext2fs.h

include/md-int.h

include/non-linux

include/non-linux/ext2_fs.h

include/non-linux/types.h

include/non-linux/ufs_fs.h

include/promlib.h

include/rock.h

include/silo.h

include/stringops.h

include/ufs

include/ufs/ufs_fs.h

include/ufs/ufs_fs_i.h

include/ufs/ufs_fs_sb.h

man/maketilo.1

man/silo.8

man/silo.conf.5

man/tilo.1

second

second/Makefile

second/bmark.S

second/cfg.c

second/cmdline.c

second/crt0.S

second/decomp.c

second/disk.c

second/file.c

second/file.h

second/fs

second/fs/ext2.c

second/fs/iom.c

second/fs/isofs.c

second/fs/romfs.c

second/fs/ufs.c

second/ls.c

second/main.c

second/mark.S

second/memory.c

second/misc.c

second/mul.S

second/muldi3.S

second/ranges.c

second/strtol.c

second/timer.c

second/umul.S

second/util.c

silo

silo.spec

silo/Makefile

silo/confcheck.c

silo/floppy.label

silo/prom.c

silo/prom.h

silo/silo.c

silo/silocheck.c

tilo

tilo/Makefile

tilo/crt0.S

tilo/maketilo.c

tilo/tilo.c

tilo/tilo.sh

files removed:
.bzr-builddeb

.bzr-builddeb/default.conf

debian

debian/README.build

debian/TODO

debian/changelog

debian/compat

debian/control

debian/copyright

debian/local

debian/local/siloconfig

debian/packages.d

debian/packages.d/silo.in

debian/patches

debian/patches/10-silo_new_ufs_superblock.patch

debian/patches/30-silo_use_bash_because_dash_sucks.patch

debian/patches/40-silo_needs_ufs_headers.patch

debian/patches/50-silo_needs_printf_instead_of_echo.patch

debian/rules

debian/scripts

debian/scripts/dbs-build.mk

debian/scripts/dh_split

debian/scripts/file2cat

silo-1.4.13.tar.bz2

Show diffs side-by-side

added added

removed removed

common/urem.S

/* $Id: urem.S,v 1.2 2001/06/06 17:04:50 bencollins Exp $
 * urem.S: This routine was taken from glibc-1.09 and is covered
 * by the GNU Library General Public License Version 2.
 */

/* This file is generated from divrem.m4; DO NOT EDIT! */

/*
 * Division and remainder, from Appendix E of the Sparc Version 8
 * Architecture Manual, with fixes from Gordon Irlam.
 */

/*
 * Input: dividend and divisor in %o0 and %o1 respectively.
 *
 * m4 parameters:
 *  .urem	name of function to generate
 *  rem		rem=div => %o0 / %o1; rem=rem => %o0 % %o1
 *  false	false=true => signed; false=false => unsigned
 *
 * Algorithm parameters:
 *  N		how many bits per iteration we try to get (4)
 *  WORDSIZE	total number of bits (32)
 *
 * Derived constants:
 *  TOPBITS	number of bits in the top decade of a number
 *
 * Important variables:
 *  Q		the partial quotient under development (initially 0)
 *  R		the remainder so far, initially the dividend
 *  ITER	number of main division loop iterations required;
 *		equal to ceil(log2(quotient) / N). Note that this
 *		is the log base (2^N) of the quotient.
 *  V		the current comparand, initially divisor*2^(ITER*N-1)
 *
 * Cost:
 *  Current estimate for non-large dividend is
 *	ceil(log2(quotient) / N) * (10 + 7N/2) + C
 *  A large dividend is one greater than 2^(31-TOPBITS) and takes a
 *  different path, as the upper bits of the quotient must be developed
 *  one bit at a time.
 */

/*
 * .urem -- unsigned 32-bit remainder: %o0 = %o0 % %o1.
 *
 * In:   %o0 = dividend, %o1 = divisor
 * Out:  %o0 = remainder; 0 when the divisor is 0 (no trap is taken)
 * Leaf routine: returns with retl and makes no stack references.
 *
 * Register roles:
 *   %o3  R     remainder so far (starts as the dividend)
 *   %o5  V     current comparand (scaled copy of the divisor)
 *   %o2  Q     partial quotient (maintained, but not returned)
 *   %o4  ITER  number of 4-bit main-loop iterations still to run
 *   %g7        number of single-bit steps on the large-dividend path
 *   %g1        scratch, holds 1 << (32 - 4 - 1)
 * The integer condition codes are clobbered as well.
 *
 * The numeric local labels (1, 2, 3, 9) are the targets of the
 * 1f/1b/2f/2b/3f/9f branches; an instruction indented by one extra
 * space sits in the delay slot of the branch above it.
 */
	.globl .urem
.urem:
	! Ready to divide. Compute size of quotient; scale comparand.
	orcc	%o1, %g0, %o5
	bne	1f
	 mov	%o0, %o3

	! Divide by zero trap. If it returns, return 0 (about as
	! wrong as possible, but that is what SunOS does...).
	! ta	ST_DIV0 -- Not for SILO
	retl
	 clr	%o0

1:
	cmp	%o3, %o5		! if %o1 exceeds %o0, done
	blu	Lgot_result		! (and algorithm fails otherwise)
	 clr	%o2
	sethi	%hi(1 << (32 - 4 - 1)), %g1
	cmp	%o3, %g1
	blu	Lnot_really_big
	 clr	%o4

	! Here the dividend is >= 2**(31-N) or so. We must be careful here,
	! as our usual N-at-a-shot divide step will cause overflow and havoc.
	! The number of bits in the result here is N*ITER+SC, where SC <= N.
	! Compute ITER in an unorthodox manner: know we need to shift V into
	! the top decade: so do not even bother to compare to R.
1:
	cmp	%o5, %g1
	bgeu	3f
	 mov	1, %g7
	sll	%o5, 4, %o5
	b	1b
	 add	%o4, 1, %o4

	! Now compute %g7.
2:
	addcc	%o5, %o5, %o5
	bcc	Lnot_too_big
	 add	%g7, 1, %g7

	! We get here if the %o1 overflowed while shifting.
	! This means that %o3 has the high-order bit set.
	! Restore %o5 and subtract from %o3.
	sll	%g1, 4, %g1		! high order bit
	srl	%o5, 1, %o5		! rest of %o5
	add	%o5, %g1, %o5
	b	Ldo_single_div
	 sub	%g7, 1, %g7

Lnot_too_big:
3:
	cmp	%o5, %o3
	blu	2b
	 nop
	be	Ldo_single_div
	 nop
	/* NB: these are commented out in the V8-Sparc manual as well */
	/* (I do not understand this) */
	! %o5 > %o3: went too far: back up 1 step
	!	srl	%o5, 1, %o5
	!	dec	%g7
	! do single-bit divide steps
	!
	! We have to be careful here. We know that %o3 >= %o5, so we can do the
	! first divide step without thinking. BUT, the others are conditional,
	! and are only done if %o3 >= 0. Because both %o3 and %o5 may have the high-
	! order bit set in the first step, just falling into the regular
	! division loop will mess up the first time around.
	! So we unroll slightly...
Ldo_single_div:
	subcc	%g7, 1, %g7
	bl	Lend_regular_divide
	 nop
	sub	%o3, %o5, %o3
	mov	1, %o2
	b	Lend_single_divloop
	 nop
Lsingle_divloop:
	sll	%o2, 1, %o2
	bl	1f
	 srl	%o5, 1, %o5
	! %o3 >= 0
	sub	%o3, %o5, %o3
	b	2f
	 add	%o2, 1, %o2
1:	! %o3 < 0
	add	%o3, %o5, %o3
	sub	%o2, 1, %o2
2:
Lend_single_divloop:
	subcc	%g7, 1, %g7
	bge	Lsingle_divloop
	 tst	%o3
	b,a	Lend_regular_divide	! annulled: no delay-slot instruction runs

Lnot_really_big:
1:
	sll	%o5, 4, %o5
	cmp	%o5, %o3
	bleu	1b
	 addcc	%o4, 1, %o4
	be	Lgot_result
	 sub	%o4, 1, %o4

	tst	%o3			! set up for initial iteration
Ldivloop:
	sll	%o2, 4, %o2
	! depth 1, accumulated bits 0
	bl	L.1.16
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	! depth 2, accumulated bits 1
	bl	L.2.17
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	! depth 3, accumulated bits 3
	bl	L.3.19
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	! depth 4, accumulated bits 7
	bl	L.4.23
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (7*2+1), %o2

L.4.23:
	! remainder is negative
	addcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (7*2-1), %o2

L.3.19:
	! remainder is negative
	addcc	%o3,%o5,%o3
	! depth 4, accumulated bits 5
	bl	L.4.21
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (5*2+1), %o2

L.4.21:
	! remainder is negative
	addcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (5*2-1), %o2

L.2.17:
	! remainder is negative
	addcc	%o3,%o5,%o3
	! depth 3, accumulated bits 1
	bl	L.3.17
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	! depth 4, accumulated bits 3
	bl	L.4.19
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (3*2+1), %o2

L.4.19:
	! remainder is negative
	addcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (3*2-1), %o2

L.3.17:
	! remainder is negative
	addcc	%o3,%o5,%o3
	! depth 4, accumulated bits 1
	bl	L.4.17
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (1*2+1), %o2

L.4.17:
	! remainder is negative
	addcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (1*2-1), %o2

L.1.16:
	! remainder is negative
	addcc	%o3,%o5,%o3
	! depth 2, accumulated bits -1
	bl	L.2.15
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	! depth 3, accumulated bits -1
	bl	L.3.15
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	! depth 4, accumulated bits -1
	bl	L.4.15
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (-1*2+1), %o2

L.4.15:
	! remainder is negative
	addcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (-1*2-1), %o2

L.3.15:
	! remainder is negative
	addcc	%o3,%o5,%o3
	! depth 4, accumulated bits -3
	bl	L.4.13
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (-3*2+1), %o2

L.4.13:
	! remainder is negative
	addcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (-3*2-1), %o2

L.2.15:
	! remainder is negative
	addcc	%o3,%o5,%o3
	! depth 3, accumulated bits -3
	bl	L.3.13
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	! depth 4, accumulated bits -5
	bl	L.4.11
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (-5*2+1), %o2

L.4.11:
	! remainder is negative
	addcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (-5*2-1), %o2

L.3.13:
	! remainder is negative
	addcc	%o3,%o5,%o3
	! depth 4, accumulated bits -7
	bl	L.4.9
	 srl	%o5,1,%o5
	! remainder is positive
	subcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (-7*2+1), %o2

L.4.9:
	! remainder is negative
	addcc	%o3,%o5,%o3
	b	9f
	 add	%o2, (-7*2-1), %o2

9:
Lend_regular_divide:
	subcc	%o4, 1, %o4
	bge	Ldivloop
	 tst	%o3
	bl,a	Lgot_result
	! non-restoring fixup here (one instruction only!)
	 add	%o3, %o1, %o3		! annulled slot: runs only when %o3 < 0

Lgot_result:
	retl
	 mov	%o3, %o0		! return the remainder

/*
 * .urem_patch -- unsigned 32-bit remainder built from the hardware
 * divide and multiply instructions:
 *	%o0 = %o0 - (%o0 / %o1) * %o1
 *
 * In:   %o0 = dividend, %o1 = divisor
 * Out:  %o0 = remainder
 * Clobbers %o2 and %y.
 *
 * NOTE(review): presumably a drop-in replacement for .urem on CPUs
 * that implement udiv/umul -- confirm against whatever references
 * .urem_patch.
 * NOTE(review): unlike .urem there is no explicit divisor == 0 check
 * here; confirm that callers can tolerate the udiv behaviour.
 */
	.globl .urem_patch
.urem_patch:
	wr	%g0, 0x0, %y		! %y = 0: high word of the udiv dividend
	nop				! three instructions separate the wr
	nop				! from the udiv that reads %y
	nop
	udiv	%o0, %o1, %o2		! %o2 = %o0 / %o1
	umul	%o2, %o1, %o2		! %o2 = quotient * divisor (low 32 bits)
	retl
	 sub	%o0, %o2, %o0		! delay slot: remainder = dividend - %o2

Older »