2000-07-20 18:29:24 -04:00
|
|
|
|
#!/usr/bin/env python
|
|
|
|
|
"""
|
|
|
|
|
convert PEP's to (X)HTML - courtesy of /F
|
|
|
|
|
|
2000-08-28 12:00:49 -04:00
|
|
|
|
Usage: %(PROGRAM)s [options] [peps]
|
|
|
|
|
|
2000-08-15 01:53:19 -04:00
|
|
|
|
Options:
|
2000-07-24 23:51:44 -04:00
|
|
|
|
|
2000-08-28 12:00:49 -04:00
|
|
|
|
-u/--user
|
|
|
|
|
SF username
|
|
|
|
|
|
2000-08-15 01:53:19 -04:00
|
|
|
|
-i/--install
|
2001-03-20 10:07:21 -05:00
|
|
|
|
After generating the HTML, install it and the plain text source file
|
|
|
|
|
(.txt) on SourceForge. In that case the user's name is used in the scp
|
|
|
|
|
and ssh commands, unless sf_username is given (in which case, it is
|
|
|
|
|
used instead). Without -i, sf_username is ignored.
|
2000-07-24 23:51:44 -04:00
|
|
|
|
|
2000-11-03 10:43:28 -05:00
|
|
|
|
-q/--quiet
|
|
|
|
|
Turn off verbose messages.
|
|
|
|
|
|
2000-08-15 01:53:19 -04:00
|
|
|
|
-h/--help
|
|
|
|
|
Print this help message and exit.
|
2001-11-12 09:58:07 -05:00
|
|
|
|
|
|
|
|
|
The optional argument `peps' is a list of either pep numbers or .txt files.
|
2000-07-20 18:29:24 -04:00
|
|
|
|
"""
|
|
|
|
|
|
2000-08-15 01:53:19 -04:00
|
|
|
|
import sys
|
|
|
|
|
import os
|
|
|
|
|
import re
|
|
|
|
|
import cgi
|
|
|
|
|
import glob
|
|
|
|
|
import getopt
|
2001-07-05 14:44:20 -04:00
|
|
|
|
import errno
|
2000-07-20 18:29:24 -04:00
|
|
|
|
|
2000-08-15 01:53:19 -04:00
|
|
|
|
# Name this script was invoked as; interpolated into the usage text.
PROGRAM = sys.argv[0]
# URL templates, filled in with an integer RFC / PEP number.
RFCURL = 'http://www.faqs.org/rfcs/rfc%d.html'
PEPURL = 'pep-%04d.html'

HOST = "shell.sourceforge.net" # host for update
HDIR = "/home/groups/p/py/python/htdocs/peps" # target host directory
# Marker line of the trailing Emacs block; conversion stops when it is seen.
LOCALVARS = "Local Variables:"

# The generated HTML doesn't validate -- you cannot use <hr> and <h3> inside
# <pre> tags. But if I change that, the result doesn't look very nice...
DTD = ('<!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.0 Transitional//EN"\n'
       ' "http://www.w3.org/TR/REC-html40/loose.dtd">')

# Matches, in order of preference: an http/ftp URL, a pep-NNNN[.txt] file
# name, an "RFC n" reference, a "PEP n" reference, or any single character
# (so that every character of a line passes through fixanchor()).
# Raw strings keep the regex escapes intact, and the dot before "txt" is
# escaped so that only a literal ".txt" suffix is accepted.
fixpat = re.compile(r"((http|ftp):[-_a-zA-Z0-9/.+~:?#$=&,]+)|(pep-\d+(\.txt)?)|"
                    r"(RFC[- ]?(?P<rfcnum>\d+))|"
                    r"(PEP\s+(?P<pepnum>\d+))|"
                    r".")

EMPTYSTRING = ''
SPACE = ' '
|
|
|
|
|
|
2000-08-15 01:53:19 -04:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def usage(code, msg=''):
    """Print the usage text, and msg if given, to stderr, then exit.

    The usage text is the module docstring with the module globals
    interpolated into it.  code is passed to sys.exit().
    """
    err = sys.stderr
    helptext = __doc__ % globals()
    print >> err, helptext
    if msg:
        print >> err, msg
    sys.exit(code)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2000-07-24 23:51:44 -04:00
|
|
|
|
def fixanchor(current, match):
    """Return the HTML replacement text for one fixpat match.

    current is the name (or path) of the PEP file being converted and match
    is a match object produced by fixpat.  http:/ftp: URLs, pep-NNNN[.txt]
    file names other than the current file, "PEP n" references and "RFC n"
    references are wrapped in an <a> element.  Everything else is returned
    HTML-escaped.
    """
    text = match.group(0)
    link = None
    if text.startswith('http:') or text.startswith('ftp:'):
        # Strip off trailing punctuation.  Pattern taken from faqwiz.
        link = text.rstrip('();:,.?\'"<>')
    elif text.startswith('pep-') and text != os.path.basename(current):
        # Compare against the base name so that a PEP converted through a
        # directory path still does not link to itself.
        link = os.path.splitext(text)[0] + ".html"
    elif text.startswith('PEP'):
        link = PEPURL % int(match.group('pepnum'))
    elif text.startswith('RFC'):
        link = RFCURL % int(match.group('rfcnum'))
    if link:
        # The link goes into an attribute value, so it must be escaped too:
        # fixpat accepts "&" inside URLs.
        return '<a href="%s">%s</a>' % (cgi.escape(link, 1), cgi.escape(text))
    return cgi.escape(text) # really slow, but it works...
|
2000-07-20 18:29:24 -04:00
|
|
|
|
|
2000-08-15 01:53:19 -04:00
|
|
|
|
|
|
|
|
|
|
2000-07-20 18:29:24 -04:00
|
|
|
|
def fixfile(infile, outfile):
|
2001-08-14 12:45:19 -04:00
|
|
|
|
basename = os.path.basename(infile)
|
2000-07-20 18:29:24 -04:00
|
|
|
|
# convert plain text pep to minimal XHTML markup
|
2001-07-05 14:44:20 -04:00
|
|
|
|
try:
|
|
|
|
|
fi = open(infile)
|
|
|
|
|
except IOError, e:
|
|
|
|
|
if e.errno <> errno.ENOENT: raise
|
|
|
|
|
print >> sys.stderr, 'Error: Skipping missing PEP file:', e.filename
|
|
|
|
|
return
|
2000-07-20 18:29:24 -04:00
|
|
|
|
fo = open(outfile, "w")
|
2001-08-14 12:45:19 -04:00
|
|
|
|
print >> fo, DTD
|
|
|
|
|
print >> fo, '<html>'
|
|
|
|
|
print >> fo, '<head>'
|
2000-07-20 18:29:24 -04:00
|
|
|
|
# head
|
|
|
|
|
header = []
|
2000-07-20 18:44:36 -04:00
|
|
|
|
pep = ""
|
|
|
|
|
title = ""
|
2000-07-20 18:29:24 -04:00
|
|
|
|
while 1:
|
|
|
|
|
line = fi.readline()
|
2000-07-27 15:18:59 -04:00
|
|
|
|
if not line.strip():
|
2000-07-20 18:29:24 -04:00
|
|
|
|
break
|
2000-07-27 15:18:59 -04:00
|
|
|
|
if line[0].strip():
|
|
|
|
|
if ":" not in line:
|
|
|
|
|
break
|
|
|
|
|
key, value = line.split(":", 1)
|
|
|
|
|
value = value.strip()
|
|
|
|
|
header.append((key, value))
|
|
|
|
|
else:
|
|
|
|
|
# continuation line
|
|
|
|
|
key, value = header[-1]
|
|
|
|
|
value = value + line
|
|
|
|
|
header[-1] = key, value
|
2000-07-20 18:29:24 -04:00
|
|
|
|
if key.lower() == "title":
|
2000-07-20 18:44:36 -04:00
|
|
|
|
title = value
|
2000-07-27 15:18:59 -04:00
|
|
|
|
elif key.lower() == "pep":
|
2000-07-20 18:44:36 -04:00
|
|
|
|
pep = value
|
|
|
|
|
if pep:
|
|
|
|
|
title = "PEP " + pep + " -- " + title
|
|
|
|
|
if title:
|
2001-08-14 12:45:19 -04:00
|
|
|
|
print >> fo, ' <title>%s</title>' % cgi.escape(title)
|
|
|
|
|
print >> fo, ' <link rel="STYLESHEET" href="style.css">'
|
|
|
|
|
print >> fo, '</head>'
|
2000-07-20 18:29:24 -04:00
|
|
|
|
# body
|
2001-08-14 12:45:19 -04:00
|
|
|
|
print >> fo, '<body bgcolor="white">'
|
|
|
|
|
print >> fo, '<div class="navigation">'
|
|
|
|
|
print >> fo, '[<b><a href="../">home</a></b>]'
|
|
|
|
|
if basename <> 'pep-0000.txt':
|
|
|
|
|
print >> fo, '[<b><a href=".">index</a></b>]'
|
|
|
|
|
print >> fo, '[<b><a href="pep-%04d.txt">PEP source</a></b>]' % int(pep)
|
|
|
|
|
print >> fo, '</div>'
|
|
|
|
|
print >> fo, '<div class="header">\n<table border="0">'
|
2000-07-20 18:29:24 -04:00
|
|
|
|
for k, v in header:
|
2001-03-21 12:26:05 -05:00
|
|
|
|
if k.lower() in ('author', 'discussions-to'):
|
2000-08-17 00:27:04 -04:00
|
|
|
|
mailtos = []
|
|
|
|
|
for addr in v.split():
|
|
|
|
|
if '@' in addr:
|
|
|
|
|
mailtos.append(
|
|
|
|
|
'<a href="mailto:%s?subject=PEP%%20%s">%s</a>' %
|
|
|
|
|
(addr, pep, addr))
|
2001-03-21 13:59:03 -05:00
|
|
|
|
elif addr.startswith('http:'):
|
|
|
|
|
mailtos.append(
|
|
|
|
|
'<a href="%s">%s</a>' % (addr, addr))
|
2000-08-17 00:27:04 -04:00
|
|
|
|
else:
|
|
|
|
|
mailtos.append(addr)
|
2001-08-14 17:42:39 -04:00
|
|
|
|
v = SPACE.join(mailtos)
|
2001-03-21 12:26:05 -05:00
|
|
|
|
elif k.lower() in ('replaces', 'replaced-by'):
|
|
|
|
|
peps = ''
|
|
|
|
|
for pep in v.split():
|
|
|
|
|
pep = int(pep)
|
|
|
|
|
peps += '<a href="pep-%04d.html">%i</a> ' % (pep, pep)
|
|
|
|
|
v = peps
|
2000-08-17 00:27:04 -04:00
|
|
|
|
else:
|
|
|
|
|
v = cgi.escape(v)
|
2001-08-14 12:45:19 -04:00
|
|
|
|
print >> fo, ' <tr><th align="right">%s:</th><td>%s</td></tr>' % (
|
|
|
|
|
cgi.escape(k), v)
|
|
|
|
|
print >> fo, '</table>'
|
|
|
|
|
print >> fo, '</div>'
|
|
|
|
|
print >> fo, '<hr />'
|
|
|
|
|
print >> fo, '<pre>'
|
2000-07-20 18:29:24 -04:00
|
|
|
|
while 1:
|
|
|
|
|
line = fi.readline()
|
|
|
|
|
if not line:
|
|
|
|
|
break
|
2001-08-14 12:45:19 -04:00
|
|
|
|
if line[0] == '\f':
|
|
|
|
|
continue
|
|
|
|
|
if line.strip() == LOCALVARS:
|
|
|
|
|
break
|
|
|
|
|
if line[0].strip():
|
|
|
|
|
if line.strip() == LOCALVARS:
|
|
|
|
|
break
|
|
|
|
|
print >> fo, '</pre>'
|
|
|
|
|
print >> fo, '<h3>%s</h3>' % line.strip()
|
|
|
|
|
print >> fo, '<pre>',
|
|
|
|
|
else:
|
|
|
|
|
# PEP 0 has some special treatment
|
|
|
|
|
if basename == 'pep-0000.txt':
|
|
|
|
|
parts = line.split()
|
|
|
|
|
if len(parts) > 1 and re.match(r'\s*\d{1,4}', parts[1]):
|
|
|
|
|
# This is a PEP summary line, which we need to hyperlink
|
|
|
|
|
url = PEPURL % int(parts[1])
|
|
|
|
|
print >> fo, re.sub(
|
|
|
|
|
parts[1],
|
|
|
|
|
'<a href="%s">%s</a>' % (url, parts[1]),
|
|
|
|
|
line, 1),
|
|
|
|
|
continue
|
|
|
|
|
elif parts and '@' in parts[-1]:
|
|
|
|
|
# This is a pep email address line, so hyperlink it
|
|
|
|
|
url = '<a href="mailto:%s">%s</a>' % (parts[-1], parts[-1])
|
|
|
|
|
print >> fo, re.sub(
|
|
|
|
|
parts[-1], url, line, 1),
|
|
|
|
|
continue
|
|
|
|
|
line = fixpat.sub(lambda x, c=infile: fixanchor(c, x), line)
|
|
|
|
|
fo.write(line)
|
|
|
|
|
print >> fo, '</pre>'
|
|
|
|
|
print >> fo, '</body>'
|
|
|
|
|
print >> fo, '</html>'
|
2000-07-25 00:12:28 -04:00
|
|
|
|
fo.close()
|
|
|
|
|
os.chmod(outfile, 0664)
|
2000-07-20 18:29:24 -04:00
|
|
|
|
|
2001-08-14 12:45:19 -04:00
|
|
|
|
|
2000-08-28 12:00:49 -04:00
|
|
|
|
|
|
|
|
|
def find_pep(pep_str):
    """Find the .txt file indicated by a cmd line argument.

    pep_str is either the path of an existing file, which is returned
    unchanged, or a PEP number, which is turned into "pep-NNNN.txt".
    An argument that is neither is returned unchanged, so that the
    missing file is reported when it is opened instead of failing here
    with a ValueError from int().
    """
    if os.path.exists(pep_str):
        return pep_str
    try:
        num = int(pep_str)
    except ValueError:
        return pep_str
    return "pep-%04d.txt" % num
|
|
|
|
|
|
2000-09-06 21:26:46 -04:00
|
|
|
|
def make_html(file, verbose=0):
|
2000-08-28 12:00:49 -04:00
|
|
|
|
newfile = os.path.splitext(file)[0] + ".html"
|
2000-09-06 21:26:46 -04:00
|
|
|
|
if verbose:
|
|
|
|
|
print file, "->", newfile
|
2000-08-28 12:00:49 -04:00
|
|
|
|
fixfile(file, newfile)
|
|
|
|
|
return newfile
|
2000-07-24 23:51:44 -04:00
|
|
|
|
|
2001-03-20 10:07:21 -05:00
|
|
|
|
def _run_or_exit(command):
    """Run command through os.system(); exit the program if it fails."""
    rc = os.system(command)
    if not rc:
        return
    # On Unix os.system() returns a wait()-style status word, not an exit
    # code.  Passing it straight to sys.exit() would truncate e.g. 256
    # (exit code 1) to a process exit status of 0, hiding the failure.
    if hasattr(os, 'WIFEXITED'):
        if os.WIFEXITED(rc):
            rc = os.WEXITSTATUS(rc)
        else:
            rc = 1
    sys.exit(rc or 1)


def push_pep(htmlfiles, txtfiles, username, verbose):
    """Copy the HTML files, text files and style.css to HDIR on HOST.

    The files are copied with scp (run with -q unless verbose is true),
    then everything in HDIR is made mode 664 with ssh.  username, when
    non-empty, is used as the remote login name.  The program exits with
    a non-zero status if either command fails.
    """
    if verbose:
        quiet = ""
    else:
        quiet = "-q"
    if username:
        username = username + "@"
    target = username + HOST + ":" + HDIR
    files = htmlfiles[:]
    files.extend(txtfiles)
    files.append("style.css")
    filelist = SPACE.join(files)
    _run_or_exit("scp %s %s %s" % (quiet, filelist, target))
    _run_or_exit("ssh %s%s chmod 664 %s/*" % (username, HOST, HDIR))
|
|
|
|
|
|
2000-08-15 01:53:19 -04:00
|
|
|
|
|
2000-07-24 23:51:44 -04:00
|
|
|
|
def main():
|
2000-08-15 01:53:19 -04:00
|
|
|
|
# defaults
|
|
|
|
|
update = 0
|
|
|
|
|
username = ''
|
2000-09-06 21:26:46 -04:00
|
|
|
|
verbose = 1
|
2000-08-15 01:53:19 -04:00
|
|
|
|
|
|
|
|
|
try:
|
2000-11-01 18:45:47 -05:00
|
|
|
|
opts, args = getopt.getopt(sys.argv[1:], 'ihqu:',
|
|
|
|
|
['install', 'help', 'quiet', 'user='])
|
2000-08-15 01:53:19 -04:00
|
|
|
|
except getopt.error, msg:
|
|
|
|
|
usage(1, msg)
|
|
|
|
|
|
|
|
|
|
for opt, arg in opts:
|
|
|
|
|
if opt in ('-h', '--help'):
|
|
|
|
|
usage(0)
|
|
|
|
|
elif opt in ('-i', '--install'):
|
|
|
|
|
update = 1
|
2000-08-28 12:00:49 -04:00
|
|
|
|
elif opt in ('-u', '--user'):
|
2000-09-08 11:31:36 -04:00
|
|
|
|
username = arg
|
2000-09-06 21:26:46 -04:00
|
|
|
|
elif opt in ('-q', '--quiet'):
|
|
|
|
|
verbose = 0
|
2000-08-15 01:53:19 -04:00
|
|
|
|
|
2000-08-28 12:00:49 -04:00
|
|
|
|
if args:
|
2001-03-20 10:07:21 -05:00
|
|
|
|
peptxt = []
|
2000-08-28 12:00:49 -04:00
|
|
|
|
html = []
|
|
|
|
|
for pep in args:
|
|
|
|
|
file = find_pep(pep)
|
2001-03-20 10:07:21 -05:00
|
|
|
|
peptxt.append(file)
|
2000-09-06 21:26:46 -04:00
|
|
|
|
newfile = make_html(file, verbose=verbose)
|
2000-08-28 12:00:49 -04:00
|
|
|
|
html.append(newfile)
|
|
|
|
|
else:
|
|
|
|
|
# do them all
|
2001-03-20 10:07:21 -05:00
|
|
|
|
peptxt = []
|
2000-08-28 12:00:49 -04:00
|
|
|
|
for file in glob.glob("pep-*.txt"):
|
2001-03-20 10:07:21 -05:00
|
|
|
|
peptxt.append(file)
|
2000-09-06 21:26:46 -04:00
|
|
|
|
make_html(file, verbose=verbose)
|
2000-09-08 11:31:36 -04:00
|
|
|
|
html = ["pep-*.html"]
|
2000-07-24 23:51:44 -04:00
|
|
|
|
if update:
|
2001-03-20 10:07:21 -05:00
|
|
|
|
push_pep(html, peptxt, username, verbose)
|
2000-07-24 23:51:44 -04:00
|
|
|
|
|
2001-08-14 12:45:19 -04:00
|
|
|
|
|
2000-08-15 01:53:19 -04:00
|
|
|
|
|
2000-07-24 23:51:44 -04:00
|
|
|
|
# Run the converter only when executed as a script, not when imported.
if __name__ == "__main__":
    main()
|