~jderose/ubuntu/raring/python3.3/fix-1131183

« back to all changes in this revision

Viewing changes to debian/pyhtml2devhelp.py

Committer: Package Import Robot
Author(s): Matthias Klose
Date: 2013-01-26 15:47:17 UTC
Revision ID: package-import@ubuntu.com-20130126154717-9mu2ob20tnuxbkok

Tags: 3.3.0-10ubuntu1

* Merge with Debian; remaining changes:
- Build-depend on python3:any instead of python3.

files added:
debian/patches/config-update.diff

files removed:
debian/patches/cross-build.diff

files modified:
debian/changelog

debian/control

debian/control.in

debian/depgraph.py

debian/libPVER-dbg.overrides.in

debian/mincheck.py

debian/patches/hg-updates.diff

debian/patches/hurd-path_max.diff

debian/patches/multiarch.diff

debian/patches/series.in

debian/patches/site-locations.diff

debian/pyhtml2devhelp.py

debian/pymindeps.py

debian/rules

debian/script.py

Show diffs side-by-side

added added

removed removed

debian/pyhtml2devhelp.py

#! /usr/bin/python

#! /usr/bin/python3

import formatter, htmllib

from html.parser import HTMLParser

import formatter

import os, sys, re

class PyHTMLParser(htmllib.HTMLParser):

class PyHTMLParser(HTMLParser):

pages_to_include = set(('whatsnew/index.html', 'tutorial/index.html', 'using/index.html',

'reference/index.html', 'library/index.html', 'howto/index.html',

'extending/index.html', 'c-api/index.html', 'install/index.html',

'distutils/index.html'))

def __init__(self, formatter, basedir, fn, indent, parents=set()):

htmllib.HTMLParser.__init__(self, formatter)

HTMLParser.__init__(self, formatter)

self.basedir = basedir

self.dir, self.fn = os.path.split(fn)

self.data = ''

text = self.link['text']

indent = self.indent + self.sub_indent

if self.last_indent == indent:

print '%s</sub>' % (' ' * self.last_indent)

print('%s</sub>' % (' ' * self.last_indent))

self.sub_count -= 1

print '%s<sub link="%s" name="%s">' % (' ' * indent, new_href, text)

print('%s<sub link="%s" name="%s">' % (' ' * indent, new_href, text))

self.sub_count += 1

self.last_indent = self.indent + self.sub_indent

def handle_starttag(self, tag, attrs):

if tag == 'a':

self.start_a(attrs)

elif tag == 'li':

self.start_li(attrs)

def handle_endtag(self, tag):

if tag == 'a':

self.end_a()

elif tag == 'li':

self.end_li()

def start_li(self, attrs):

self.sub_indent += 1

self.next_link = True

def end_li(self):

indent = self.indent + self.sub_indent

if self.sub_count > 0:

print '%s</sub>' % (' ' * self.last_indent)

print('%s</sub>' % (' ' * self.last_indent))

self.sub_count -= 1

self.last_indent -= 1

self.sub_indent -= 1

'license.html', 'copyright.html'):

return

if self.link.has_key('class'):

if 'class' in self.link:

if self.link['class'] in ('biglink'):

process = True

if self.link['class'] in ('reference external'):

100

101

def finish(self):

102

if self.sub_count > 0:

print '%s</sub>' % (' ' * self.last_indent)

103

print('%s</sub>' % (' ' * self.last_indent))

104

105

def handle_data(self, data):

106

self.data += data

112

parser = PyHTMLParser(formatter.NullFormatter(),

100

113

self.basedir, href, self.indent + 1,

101

114

self.parents)

102

text = file(self.basedir + '/' + href).read()

115

text = open(self.basedir + '/' + href, encoding='latin_1').read()

103

116

parser.feed(text)

104

117

parser.finish()

105

118

parser.close()

106

119

if parent in self.parents:

107

120

self.parents.remove(parent)

108

121

109

class PyIdxHTMLParser(htmllib.HTMLParser):

122

class PyIdxHTMLParser(HTMLParser):

110

123

def __init__(self, formatter, basedir, fn, indent):

111

htmllib.HTMLParser.__init__(self, formatter)

124

HTMLParser.__init__(self, formatter)

112

125

self.basedir = basedir

113

126

self.dir, self.fn = os.path.split(fn)

114

127

self.data = ''

136

149

# Save it in case we need it again

137

150

self.last_text = re.sub(' \([\w\-\.\s]+\)', '', text)

138

151

indent = self.indent

139

print '%s<function link="%s" name="%s"/>' % (' ' * indent, new_href, text)

152

print('%s<function link="%s" name="%s"/>' % (' ' * indent, new_href, text))

153

154

def handle_starttag(self, tag, attrs):

155

if tag == 'a':

156

self.start_a(attrs)

157

elif tag == 'dl':

158

self.start_dl(attrs)

159

elif tag == 'dt':

160

self.start_dt(attrs)

161

elif tag == 'h2':

162

self.start_h2(attrs)

163

elif tag == 'td':

164

self.start_td(attrs)

165

elif tag == 'table':

166

self.start_table(attrs)

167

168

def handle_endtag(self, tag):

169

if tag == 'a':

170

self.end_a()

171

elif tag == 'dl':

172

self.end_dl()

173

elif tag == 'dt':

174

self.end_dt()

175

elif tag == 'h2':

176

self.end_h2()

177

elif tag == 'td':

178

self.end_td()

179

elif tag == 'table':

180

self.end_table()

140

181

141

182

def start_dl(self, attrs):

142

183

if self.last_text:

165

206

if v == '_':

166

207

self.active = True

167

208

209

def end_h2(self):

210

pass

211

168

212

def start_td(self, attrs):

169

213

self.indented = False

170

214

self.last_text = ''

171

215

216

def end_td(self):

217

pass

218

172

219

def start_table(self, attrs):

173

220

pass

174

221

184

231

self.data = ''

185

232

186

233

def end_a(self):

187

text = self.data.replace('\t', '').replace('\n', ' ').replace('&', '&amp;').replace('<', '&lt;').replace('>', '&gt;')

234

text = self.data.replace('\t', '').replace('\n', ' ')

235

text = text.replace("Whats ", "What's ")

188

236

self.link['text'] = text

189

237

# handle a tag without href attribute

190

238

try:

196

244

def handle_data(self, data):

197

245

self.data += data

198

246

247

def handle_entityref(self, name):

248

self.data += '&%s;' % name

249

199

250

def main():

200

251

base = sys.argv[1]

201

252

fn = sys.argv[2]

202

253

version = sys.argv[3]

203

254

204

255

parser = PyHTMLParser(formatter.NullFormatter(), base, fn, indent=0)

205

print '<?xml version="1.0" encoding="iso-8859-1"?>'

206

print '<book title="Python %s Documentation" name="Python %s" version="%s" link="index.html">' % (version, version, version)

207

print '<chapters>'

256

print('<?xml version="1.0" encoding="iso-8859-1"?>')

257

print('<book title="Python %s Documentation" name="Python %s" version="%s" link="index.html">' % (version, version, version))

258

print('<chapters>')

208

259

parser.parse_file(fn)

209

print '</chapters>'

260

print('</chapters>')

210

261

211

print '<functions>'

262

print('<functions>')

212

263

213

264

fn = 'genindex-all.html'

214

265

parser = PyIdxHTMLParser(formatter.NullFormatter(), base, fn, indent=1)

215

text = file(base + '/' + fn).read()

266

text = open(base + '/' + fn, encoding='latin_1').read()

216

267

parser.feed(text)

217

268

parser.close()

218

269

219

print '</functions>'

220

print '</book>'

270

print('</functions>')

271

print('</book>')

221

272

222

273

main()

Older »