1996-11-27 15:52:01 -04:00
|
|
|
#! /usr/bin/env python
|
1994-05-27 10:32:41 -03:00
|
|
|
#######################################################################
|
|
|
|
# Newslist $Revision$
|
|
|
|
#
|
|
|
|
# Syntax:
|
|
|
|
# newslist [ -a ]
|
|
|
|
#
|
2004-07-18 02:56:09 -03:00
|
|
|
# This is a program to create a directory full of HTML pages
|
1994-05-27 10:32:41 -03:00
|
|
|
# which between them contain links to all the newsgroups available
|
|
|
|
# on your server.
|
|
|
|
#
|
2004-07-18 02:56:09 -03:00
|
|
|
# The -a option causes a complete list of all groups to be read from
|
1994-05-27 10:32:41 -03:00
|
|
|
# the server rather than just the ones which have appeared since last
|
|
|
|
# execution. This recreates the local list from scratch. Use this on
|
1994-05-27 10:33:17 -03:00
|
|
|
# the first invocation of the program, and from time to time thereafter.
|
2004-07-18 02:56:09 -03:00
|
|
|
# When new groups are first created they may appear on your server as
|
1994-05-27 10:33:17 -03:00
|
|
|
# empty groups. By default, empty groups are ignored by the -a option.
|
|
|
|
# However, these new groups will not be created again, and so will not
|
|
|
|
# appear in the server's list of 'new groups' at a later date. Hence they
|
|
|
|
# won't appear until you do a '-a' after some articles have appeared.
|
2004-07-18 02:56:09 -03:00
|
|
|
#
|
1994-05-27 10:33:17 -03:00
|
|
|
# I should really keep a list of ignored empty groups and re-check them
|
|
|
|
# for articles on every run, but I haven't got around to it yet.
|
1994-05-27 10:32:41 -03:00
|
|
|
#
|
|
|
|
# This assumes an NNTP news feed.
|
|
|
|
#
|
2004-07-18 02:56:09 -03:00
|
|
|
# Feel free to copy, distribute and modify this code for
|
|
|
|
# non-commercial use. If you make any useful modifications, let me
|
1994-05-27 10:32:41 -03:00
|
|
|
# know!
|
|
|
|
#
|
|
|
|
# (c) Quentin Stafford-Fraser 1994
|
|
|
|
# fraser@europarc.xerox.com qs101@cl.cam.ac.uk
|
|
|
|
# #
|
|
|
|
#######################################################################
|
|
|
|
import sys,nntplib, string, marshal, time, os, posix, string
|
|
|
|
|
|
|
|
#######################################################################
|
|
|
|
# Check these variables before running! #
|
|
|
|
|
|
|
|
# Root directory for everything this script reads and writes.
# Any filename below that doesn't start with / is taken relative to it.
topdir = '/anfs/qsbigdisc/web/html/newspage'

# Hostname of the NNTP server to query, for example:
#   newshost = 'nntp-serv.cl.cam.ac.uk'
# To take the name from the NNTPSERVER environment variable instead:
#   newshost = posix.environ['NNTPSERVER']
newshost = 'nntp-serv.cl.cam.ac.uk'

# File holding the local cache of the newsgroup list.
treefile = 'grouptree'

# File holding descriptions of newsgroups.
# I found a suitable one at ftp.uu.net in /uunet-info/newgroups.gz
# Set this to '' if you don't wish to use one.
descfile = 'newsgroups'

# Directory in which the HTML pages should be created, for example:
#   pagedir = '/usr/local/lib/html/newspage'
#   pagedir = 'pages'
pagedir = topdir

# HTML prefix which will refer to that directory, for example:
#   httppref = '/newspage/'
# or leave it blank for relative links between pages (recommended):
#   httppref = ''
httppref = ''

# Name of the 'root' news page in this directory.
# A .html suffix will be added.
rootpage = 'root'

# Set skipempty to 0 if you wish to see links to empty groups as well.
# Only affects the -a option.
skipempty = 1

# pagelinkicon can contain HTML to put an icon after links to further
# pages.  This helps to make important links stand out.
# Set to '' if not wanted; '...' is quite a good one.
pagelinkicon = '... <img src="http://pelican.cl.cam.ac.uk/icons/page.xbm"> '

# ---------------------------------------------------------------------
# Less important personal preferences:

# sublistsize controls the maximum number of items that will appear as
# an indented sub-list before the whole thing is moved onto a different
# page.  The smaller this is, the more pages you will have, but the
# shorter each will be.
sublistsize = 4
|
|
|
|
|
|
|
|
# That should be all. #
|
|
|
|
#######################################################################
|
|
|
|
|
1994-08-19 12:02:57 -03:00
|
|
|
# Look for a per-user settings file, first in the current directory and
# then in the home directory; only the first one found is used.  It is
# executed in this module's namespace so it can rebind module-level names.
# NOTE(review): this runs arbitrary Python found in the current working
# directory -- only start newslist from a directory you trust.
# expanduser('~') is used instead of os.environ['HOME'] so that an unset
# HOME does not abort the script with a KeyError.
for rcdir in os.curdir, os.path.expanduser('~'):
    rcfile = os.path.join(rcdir, '.newslistrc.py')
    if os.path.exists(rcfile):
        print(rcfile)
        # execfile() does not exist in Python 3.  Compiling with the real
        # filename keeps tracebacks pointing at the rc file.
        with open(rcfile) as rcsource:
            exec(compile(rcsource.read(), rcfile, 'exec'))
        break
|
1994-08-19 12:02:57 -03:00
|
|
|
|
1994-05-27 10:32:41 -03:00
|
|
|
from nntplib import NNTP
|
|
|
|
from stat import *
|
|
|
|
|
1997-12-09 15:39:12 -04:00
|
|
|
# Version-control keyword; when expanded it looks like '$Revision: 1.5 $'.
# Keep only the words that carry no '$' marker, i.e. the bare revision
# number (or an empty string while the keyword is unexpanded).
# str.split()/str.join() are used because string.split()/string.join()
# were removed in Python 3.
rcsrev = '$Revision$'
rcsrev = ' '.join(word for word in rcsrev.split() if '$' not in word)
|
1994-05-27 10:32:41 -03:00
|
|
|
# Maps a newsgroup name to its description; filled in by readdesc().
desc = {}

# Make (possibly) relative filenames into absolute ones.  os.path.join()
# returns its second argument unchanged when that is already absolute.
treefile = os.path.join(topdir, treefile)
# An empty descfile means "no description file"; joining it would produce
# 'topdir/' and hide that from readdesc()'s descfile == '' check.
if descfile:
    descfile = os.path.join(topdir, descfile)
# The joined path used to be stored only in `page`, which nothing else in
# this file reads, so a relative pagedir was never resolved against topdir.
pagedir = os.path.join(topdir, pagedir)
page = pagedir  # previous name for the same value, kept for compatibility
|
|
|
|
|
|
|
|
# First the bits for creating trees ---------------------------
|
|
|
|
|
|
|
|
# Addtotree creates/augments a tree from a list of group names
|
|
|
|
def addtotree(tree, groups):
    """Add every newsgroup name in *groups* to the nested dict *tree*.

    Each name is split on '.' and the resulting components are passed to
    makeleaf(), which updates *tree* in place.  Nothing is returned.
    """
    print('Updating tree...')
    for group in groups:
        # string.splitfields() was removed in Python 3; str.split with an
        # explicit separator is the equivalent.
        makeleaf(tree, group.split('.'))
|
1994-05-27 10:32:41 -03:00
|
|
|
|
|
|
|
# Makeleaf makes a leaf and the branch leading to it if necessary
|
|
|
|
def makeleaf(tree,path):
    """Create the branch named by *path* in *tree* and mark its end as a leaf.

    tree -- nested dict, modified in place.
    path -- non-empty sequence of name components, outermost first.

    Missing intermediate dicts are created on the way down; the final
    component's dict receives the marker entry '.' -> '.'.
    """
    node = tree
    # Walk (and create where needed) every level above the leaf.
    for name in path[:-1]:
        node = node.setdefault(name, {})
    # The last component is the group itself.
    leaf = node.setdefault(path[-1], {})
    leaf['.'] = '.'
|
1994-05-27 10:32:41 -03:00
|
|
|
|
2004-07-18 02:56:09 -03:00
|
|
|
# Then the bits for outputting trees as pages ----------------
|
1994-05-27 10:32:41 -03:00
|
|
|
|
|
|
|
# Createpage creates an HTML file named <root>.html containing links
|
|
|
|
# to those groups beginning with <root>.
|
|
|
|
|
|
|
|
def createpage(root, tree, p):
    """Write the HTML page <pagedir>/<root>.html for the groups in *tree*.

    root -- page name without the '.html' suffix; when it equals rootpage
            the title and heading carry no ' under ...' qualifier.
    tree -- nested dict of group-name components to render.
    p    -- dotted name prefix handed unchanged to printtree().
    """
    filename = os.path.join(pagedir, root + '.html')
    detail = '' if root == rootpage else ' under ' + root

    # The with-block closes the page even when printtree() raises part-way
    # through; with a plain open()/close() pair the handle leaked then.
    with open(filename, 'w') as f:
        f.write('<TITLE>Newsgroups available' + detail + '</TITLE>\n')
        f.write('<H1>Newsgroups available' + detail +'</H1>\n')
        f.write('<A HREF="'+httppref+rootpage+'.html">Back to top level</A><P>\n')
        printtree(f, tree, 0, p)
        f.write('<I>This page automatically created by \'newslist\' v. '+rcsrev+'.')
        f.write(time.ctime(time.time()) + '</I><P>')
|
1994-05-27 10:32:41 -03:00
|
|
|
|
|
|
|
# Printtree prints the groups as a bulleted list. Groups with
|
|
|
|
# more than <sublistsize> subgroups will be put on a separate page.
|
|
|
|
# Other sets of subgroups are just indented.
|
|
|
|
|
|
|
|
def printtree(f, tree, indent, p):
    """Write *tree* to the open file *f* as nested HTML bullet lists.

    f      -- writable file object receiving the HTML.
    tree   -- nested dict; the key '.' marks a newsgroup at this node and
              every other key names a sub-hierarchy.
    indent -- current nesting depth, 0 at the top of a page.
    p      -- dotted name of this node with a leading '.', so p[1:] is the
              name that is displayed.

    A nested node holding more than sublistsize entries is not expanded
    inline: a link is written and createpage() renders it on its own page.
    """
    name = p[1:]
    count = len(tree)

    if count > sublistsize and indent > 0:
        # Too many entries for a sub-list: link to a separate page.
        f.write('<LI><B><A HREF="' + httppref + name + '.html">')
        f.write(name + '.*')
        f.write('</A></B>' + pagelinkicon + '\n')
        createpage(name, tree, p)
        return

    wrapped = count > 1
    if wrapped:
        # A nested list gets a labelled bullet; the outermost one does not.
        f.write(('<LI>' + name + '\n<UL>') if indent > 0 else '<UL>')
        indent += 1

    for key in sorted(tree):
        if key != '.':
            # A sub-hierarchy: recurse with the extended dotted name.
            printtree(f, tree[key], indent, p + '.' + key)
            continue
        # The newsgroup itself, followed by its description when known.
        f.write('<LI><A HREF="news:' + name + '">' + name + '</A> ')
        f.write((' <I>' + desc[name] + '</I>\n') if name in desc else '\n')

    if wrapped:
        f.write('\n</UL>')
|
1994-05-27 10:32:41 -03:00
|
|
|
|
|
|
|
# Reading descriptions file ---------------------------------------
|
|
|
|
|
|
|
|
# This returns an array mapping group name to its description
|
|
|
|
|
1994-05-27 10:33:17 -03:00
|
|
|
def readdesc(descfile):
    """Load newsgroup descriptions from *descfile* into the global desc.

    Each line is split on whitespace: the first word is the group name and
    the remaining words, re-joined with single spaces, are its description.
    desc is reset to {} first.  Blank lines are skipped, as are
    descriptions of one character or fewer.

    If *descfile* is '' nothing is read.  If the file cannot be opened a
    message is printed and desc is left empty.
    """
    global desc
    desc = {}

    if descfile == '':
        return

    try:
        d = open(descfile, 'r')
    except IOError:
        print('Failed to open description file ' + descfile)
        return

    print('Reading descriptions...')
    # The with-block closes the file, which was previously left open.
    with d:
        for line in d:
            # str.split()/str.join() replace string.split()/string.join(),
            # which were removed in Python 3.
            bits = line.split()
            if not bits:
                continue  # blank line: no group name to record
            dsc = ' '.join(bits[1:])
            if len(dsc) > 1:
                desc[bits[0]] = dsc
|
1994-05-27 10:32:41 -03:00
|
|
|
|
1994-05-27 10:33:17 -03:00
|
|
|
# Check that output directory exists, -----------------------------
|
|
|
|
# and offer to create it if not
|
1994-05-27 10:32:41 -03:00
|
|
|
|
1994-05-27 10:33:17 -03:00
|
|
|
def checkopdir(pagedir):
    """Make sure the output directory *pagedir* exists.

    If it is missing, the user is asked on stdin whether to create it.
    The process exits with status 1 when the answer does not start with
    'y' or when the directory cannot be created.  Returns None otherwise.
    """
    if os.path.isdir(pagedir):
        return

    print('Directory '+pagedir+' does not exist.')
    print('Shall I create it for you? (y/n)')
    # Slice instead of indexing: at end-of-file readline() returns '' and
    # [0] would raise IndexError rather than taking the "no" path.
    if sys.stdin.readline()[:1] != 'y':
        print('OK. Exiting.')
        sys.exit(1)

    try:
        os.mkdir(pagedir, 0o777)
    except OSError:
        # Only filesystem errors are expected here; a bare except would
        # also swallow KeyboardInterrupt and SystemExit.
        print('Sorry - failed!')
        sys.exit(1)
|
1994-05-27 10:32:41 -03:00
|
|
|
|
1994-05-27 10:33:17 -03:00
|
|
|
# Read and write current local tree ----------------------------------
|
1994-05-27 10:32:41 -03:00
|
|
|
|
1994-05-27 10:33:17 -03:00
|
|
|
def readlocallist(treefile):
    """Load the cached group tree from *treefile*.

    Returns a tuple (tree, treedate).  tree is the object unmarshalled
    from the file, or {} if the file could not be opened.  treedate is
    the file's modification date in local time, formatted 'YYMMDD'.

    Exits with status 1 (after printing a hint about the -a option) when
    the file cannot be stat'ed.
    """
    print('Reading current local group list...')
    tree = {}
    try:
        treetime = time.localtime(os.stat(treefile).st_mtime)
    except OSError:
        print('\n*** Failed to open local group cache '+treefile)
        print('If this is the first time you have run newslist, then')
        print('use the -a option to create it.')
        sys.exit(1)
    treedate = '%02d%02d%02d' % (treetime[0] % 100, treetime[1], treetime[2])
    try:
        # marshal data is binary: on Python 3 a text-mode file makes
        # marshal.load() fail.  The with-block also closes the file if
        # loading raises.
        with open(treefile, 'rb') as dump:
            tree = marshal.load(dump)
    except IOError:
        print('Cannot open local group list ' + treefile)
    return (tree, treedate)
|
1994-05-27 10:33:17 -03:00
|
|
|
|
|
|
|
def writelocallist(treefile, tree):
    """Save *tree* to *treefile* in marshal format.

    Prints a confirmation on success.  If the file cannot be written, or
    *tree* cannot be marshalled, an explanation is printed and the
    process exits with status 1.
    """
    try:
        # Binary mode is required for marshal.dump() on Python 3; the
        # with-block closes the file even when dumping fails.
        with open(treefile, 'wb') as dump:
            marshal.dump(tree, dump)
        print('Saved list to '+treefile+'\n')
    except (OSError, ValueError):
        # OSError: open/write failure.  ValueError: marshal met a value
        # it cannot serialise.  Anything else is a bug and should surface.
        print('Sorry - failed to write to local group cache '+treefile)
        print('Does it (or its directory) have the correct permissions?')
        sys.exit(1)
|
1994-05-27 10:33:17 -03:00
|
|
|
|
|
|
|
# Return list of all groups on server -----------------------------
|
|
|
|
|
|
|
|
def getallgroups(server):
    """Return the names of all groups reported by server.list().

    server -- object whose list() method returns a pair; the second item
              is iterated, and each entry is indexed as [0] group name,
              [1] and [2] article numbers.
              NOTE(review): per the NNTP LIST reply these are presumably
              the last and first article numbers -- confirm against the
              nntplib version in use.

    When the module-level skipempty is true, entries whose [1] value is
    numerically below their [2] value are treated as empty groups: they
    are printed to stdout and left out of the result.
    """
    print('Getting list of all groups...')
    info = server.list()[1]
    groups = []
    print('Processing...')
    if skipempty:
        print('\nIgnoring following empty groups:')
    for entry in info:
        # str.split()/int() replace string.split()/string.atoi(), which
        # were removed in Python 3.
        grpname = entry[0].split()[0]
        if skipempty and int(entry[1]) < int(entry[2]):
            print(grpname+' ', end=' ')
        else:
            groups.append(grpname)
    print('\n')
    if skipempty:
        print('(End of empty groups)')
    return groups
|
1994-05-27 10:33:17 -03:00
|
|
|
|
|
|
|
# Return list of new groups on server -----------------------------
|
|
|
|
|
|
|
|
def getnewgroups(server, treedate):
    """Return the names of groups created on the server since *treedate*.

    server   -- object whose newgroups(date, time) method returns a pair;
                the second item is a sequence of text lines, each
                beginning with a group name.
    treedate -- date string, passed on together with the time '000001'.

    NOTE(review): newer nntplib releases changed newgroups() to take a
    date/datetime object -- confirm which API the target Python provides.
    """
    print('Getting list of new groups since start of '+treedate+'...', end=' ')
    info = server.newgroups(treedate,'000001')[1]
    print('got %d.' % len(info))
    print('Processing...', end=' ')
    # The group name is the first whitespace-separated word of each line.
    # str.split() replaces string.split(), which was removed in Python 3.
    groups = [line.split()[0] for line in info]
    print('Done')
    return groups
|
1994-05-27 10:33:17 -03:00
|
|
|
|
|
|
|
# Now the main program --------------------------------------------
|
1994-05-27 10:32:41 -03:00
|
|
|
|
1994-05-27 10:33:17 -03:00
|
|
|
def main():
    """Build the newsgroup pages.

    Steps, in order:
      1. make sure the output directory exists (checkopdir);
      2. try to connect to newshost;
      3. with a connection and '-a' as the first argument, fetch the full
         group list; otherwise load the local cache and, if connected,
         fetch only the groups created since the cache was last modified;
      4. if connected, merge the fetched groups into the tree and save it;
      5. read the group descriptions and write the HTML pages.

    If the connection fails the pages are rebuilt from the local cache.
    """
    tree = {}

    # Check that the output directory exists
    checkopdir(pagedir)

    try:
        print('Connecting to '+newshost+'...')
        s = NNTP(newshost)
        connected = 1
    except (nntplib.error_temp, nntplib.error_perm, OSError) as x:
        # OSError covers socket-level failures (unknown host, connection
        # refused, ...), which should fall back to the local list just
        # like a protocol-level refusal does.
        print('Error connecting to host:', x)
        print('I\'ll try to use just the local list.')
        connected = 0

    # If -a is specified, read the full list of groups from server
    if connected and len(sys.argv) > 1 and sys.argv[1] == '-a':
        groups = getallgroups(s)

    # Otherwise just read the local file and then add
    # groups created since local file last modified.
    else:
        (tree, treedate) = readlocallist(treefile)
        if connected:
            groups = getnewgroups(s, treedate)

    # `groups` is only bound on the connected paths above.
    if connected:
        addtotree(tree, groups)
        writelocallist(treefile, tree)

    # Read group descriptions
    readdesc(descfile)

    print('Creating pages...')
    createpage(rootpage, tree, '')
    print('Done')
|
1994-05-27 10:32:41 -03:00
|
|
|
|
2004-09-11 13:34:35 -03:00
|
|
|
# Run the page generator only when executed as a script, not on import.
if __name__ == '__main__':
    main()
|
1994-05-27 10:32:41 -03:00
|
|
|
|
|
|
|
# That's all folks
|
|
|
|
######################################################################
|