X-Git-Url: https://codewiz.org/gitweb?a=blobdiff_plain;f=geekigeeki.py;h=b34f152188b0544747471a796258d521f9eb0aba;hb=014d5c705784bfe7b47731ad5cc50568fc5e63cf;hp=a0345ee950f0c0fc750e874717dc9d5e34ddbad6;hpb=727c1cfdb0040ca5d95efb81c975d36d1f568c0b;p=geekigeeki.git diff --git a/geekigeeki.py b/geekigeeki.py index a0345ee..b34f152 100755 --- a/geekigeeki.py +++ b/geekigeeki.py @@ -1,8 +1,9 @@ -#! /usr/bin/env python +#!/usr/bin/python +# -*- coding: utf-8 -*- # # Copyright 1999, 2000 Martin Pool # Copyright 2002 Gerardo Poggiali -# Copyright 2007 Bernardo Innocenti +# Copyright 2007, 2008 Bernardo Innocenti # # This program is free software: you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by @@ -17,15 +18,18 @@ # You should have received a copy of the GNU General Public License # along with this program. If not, see . -__version__ = '$Id$'[4:-2] +__version__ = '$Id$'[4:12] -import cgi, sys, string, os, re, errno, time, stat +from time import clock +start_time = clock() + +import cgi, sys, os, re, errno, stat from os import path, environ # Regular expression defining a WikiWord # (but this definition is also assumed in other places) -file_re = re.compile(r"^\b([A-Za-z0-9_\.\-]+)\b$") -word_re = re.compile(r"^\b([A-Z][a-z]+){2,}\b$") +file_re = re.compile(r"^\b([A-Za-z0-9_\.\-/]+)\b$") +word_re = re.compile(r"^\b((([A-Z][a-z]+){2,}/)*([A-Z][a-z]+){2,})\b$") img_re = re.compile(r"^.*\.(png|gif|jpg|jpeg)$", re.IGNORECASE) url_re = re.compile(r"^[a-z]{3,8}://[^\s'\"]+\S$") @@ -53,25 +57,33 @@ def get_hostname(addr): try: from socket import gethostbyaddr return gethostbyaddr(addr)[0] + ' (' + addr + ')' - except: + except Exception, er: return addr +def relative_url(pathname, privileged=False): + if not (url_re.match(pathname) or pathname.startswith('/')): + if privileged: + url = privileged_path() + else: + url = script_name() + pathname = url + '/' + pathname + return pathname + # Formatting stuff -------------------------------------------------- -def emit_header(type="text/html"): - print "Content-type: " + type + "; charset=utf-8" - print +def emit_header(mime_type="text/html"): + print "Content-type: " + mime_type + "; charset=utf-8\n" -def send_guru(msg, msg_type): - if msg is None or msg == '': return +def send_guru(msg_text, msg_type): + if not msg_text: return print '
'
     if msg_type == 'error':
         print '    Software Failure.  Press left mouse button to continue.\n'
-    print msg
+    print msg_text
     if msg_type == 'error':
         print '      Guru Meditation #DEADBEEF.ABADC0DE'
     print '
' - # FIXME: This simple JS snippet is harder to pass than ACID 3.0 + # FIXME: This little JS snippet is harder to pass than ACID 3.0 print """ """ -def send_title(name, text="Limbo", msg=None, msg_type='error'): +def send_title(name, text="Limbo", msg_text=None, msg_type='error'): global title_done if title_done: return # Head emit_header() - print """ - -""" + print '' + print '' + + site_name = globals().get('site_name', 'Unconfigured Site') print "%s: %s" % (site_name, text) print ' ' if not name: print ' ' - if css_url: - print ' ' % css_url + for css in css_url: + print ' ' % relative_url(css) print '' # Body @@ -119,24 +132,26 @@ def send_title(name, text="Limbo", msg=None, msg_type='error'): print '' title_done = True - send_guru(msg, msg_type) + send_guru(msg_text, msg_type) # Navbar print '' -def link_tag(params, text=None, ss_class=None, authentication=False): +def link_tag(params, text=None, ss_class=None, privileged=False): if text is None: text = params # default classattr = '' @@ -155,11 +170,9 @@ def link_tag(params, text=None, ss_class=None, authentication=False): # Prevent crawlers from following links potentially added by spammers or to generated pages if ss_class == 'external' or ss_class == 'navlink': classattr += 'rel="nofollow" ' - if authentication: - path = privileged_path() - else: - path = script_name() - return '%s' % (classattr, path, params, text) + elif url_re.match(params): + classattr += 'rel="nofollow" ' + return '%s' % (classattr, relative_url(params, privileged=privileged), text) # Search --------------------------------------------------- @@ -184,13 +197,12 @@ def do_fullsearch(needle): for (count, page_name) in hits: print '
  • ' + Page(page_name).link_to() print ' . . . . ' + `count` - print ['match', 'matches'][count <> 1] + print ['match', 'matches'][count != 1] print '

  • ' print "" print_search_stats(len(hits), len(all_pages)) - def do_titlesearch(needle): # TODO: check needle is legal -- but probably we can just accept any RE send_title(None, "Title search for \"" + needle + '"') @@ -206,18 +218,13 @@ def do_titlesearch(needle): print_search_stats(len(hits), len(all_pages)) - def print_search_stats(hits, searched): print "

    %d hits out of %d pages searched.

    " % (hits, searched) -def do_edit(pagename): - Page(pagename).send_editor() - def do_raw(pagename): Page(pagename).send_raw() -def do_savepage(pagename): - global form +def do_edit(pagename): pg = Page(pagename) if 'preview' in form: pg.send_editor(form['savetext'].value) @@ -225,40 +232,32 @@ def do_savepage(pagename): pg.save_text(form['savetext'].value) pg.send_page() elif 'cancel' in form: - pg.msg = 'Editing canceled' + pg.msg_text = 'Editing canceled' pg.msg_type = 'notice' pg.send_page() else: - raise 'What did you press?' + pg.send_editor() def make_index_key(): - s = '

    ' - links = map(lambda ch: '%s' % (ch, ch), - string.lowercase) - s = s + string.join(links, ' | ') - s = s + '

    ' - return s - + links = map(lambda ch: '%s' % (ch, ch), 'abcdefghijklmnopqrstuvwxyz') + return '

    '+ ' | '.join(links) + '

    ' def page_list(): - return filter(word_re.match, os.listdir(text_dir)) - + return filter(word_re.match, os.listdir(data_dir)) def send_footer(name, mod_string=None): - if debug_cgi: + if globals().get('debug_cgi', False): cgi.print_arguments() cgi.print_form(cgi.FieldStorage()) cgi.print_environ() - global __version__ print '' - # ---------------------------------------------------------- # Macros def _macro_TitleSearch(*vargs): @@ -291,8 +290,8 @@ def _macro_WordIndex(*vargs): last_letter = None # set title for word in all_words: - letter = string.lower(word[0]) - if letter <> last_letter: + letter = word[0].lower() + if letter != last_letter: s = s + ';

    %s

    ' % (letter, letter) last_letter = letter @@ -313,13 +312,13 @@ def _macro_TitleIndex(*vargs): pages.sort() current_letter = None for name in pages: - letter = string.lower(name[0]) - if letter <> current_letter: - s = s + '

    %s

    ' % (letter, letter) + letter = name[0].lower() + if letter != current_letter: + s += '

    %s

    ' % (letter, letter) current_letter = letter else: - s = s + '
    ' - s = s + Page(name).link_to() + s += '
    ' + s += Page(name).link_to() return s @@ -332,23 +331,28 @@ class PageFormatter: """ def __init__(self, raw): self.raw = raw - self.is_em = self.is_b = 0 self.h_level = 0 - self.h_count = 0 - self.list_indents = [] - self.in_pre = False - self.in_table = False - self.tr_cnt = 0 - self.in_var = False + self.in_pre = self.in_table = False self.in_header = True + self.list_indents = [] + self.tr_cnt = self.h_cnt = 0 + self.styles = { + #wiki html enabled? + "//": ["em", False], + "''": ["em", False], + "**": ["b", False], + "'''": ["b", False], + "##": ["tt", False], + "``": ["tt", False], + "__": ["u", False], + "^^": ["sup", False], + ",,": ["sub", False] + } - def _emph_repl(self, word): - if len(word) == 3: - self.is_b = not self.is_b - return ['', ''][self.is_b] - else: - self.is_em = not self.is_em - return ['', ''][self.is_em] + def _b_repl(self, word): + style = self.styles[word] + style[1] = not style[1] + return ['' def _tit_repl(self, word): if self.h_level: @@ -356,10 +360,14 @@ class PageFormatter: self.h_level = 0 else: self.h_level = len(word) - 1 - self.h_count += 1 - result = '* ' % (self.h_level, self.h_count, self.h_count) + self.h_cnt += 1 + #abridged = re.sub('[^a-z_]', '', word.lower().replace(' ', '_')) + result = '¶ ' % (self.h_level, self.h_cnt, self.h_cnt) return result + def _br_repl(self, word): + return '
    ' + def _rule_repl(self, word): return self._undent() + '\n
    \n' % (len(word) - 2) @@ -367,7 +375,7 @@ class PageFormatter: return Page(word).link_to() def _img_repl(self, word): - path = script_name() + '/' + word; + path = relative_url(word) return '' % (path, path) def _url_repl(self, word): @@ -377,21 +385,22 @@ class PageFormatter: return '%s' % (word, word) def _hurl_repl(self, word): - m = re.compile("\[\[(\S+)([^\]]*)\]\]").match(word) + m = re.compile("\[\[([^ \t\n\r\f\v\|]+)(?:\s*\|\s*([^\]]+)|)\]\]").match(word) name = m.group(1) - descr = m.group(2).strip() or name + descr = m.group(2) or name macro = globals().get('_macro_' + name) if macro: return apply(macro, (name, descr)) elif img_re.match(name): - return '%s' % (name, name, descr) - elif url_re.match(name): - return '%s' % (name, descr) - elif name.startswith('/'): - return '%s' % (name, descr) + name = relative_url(name) + # The "extthumb" nonsense works around a limitation of the HTML block model + return '
    %s
    %s
    ' % (name, name, descr, descr) else: - return link_tag(name, descr) + if img_re.match(descr): + descr = '' + + return link_tag(name, descr, 'wikilink') def _email_repl(self, word): return '%s' % (word, word) @@ -417,22 +426,7 @@ class PageFormatter: return '' def _hi_repl(self, word): - if word == 'FIXME': - cl = 'error' - elif word == 'DONE': - cl = 'success' - elif word == 'TODO': - cl = 'notice' - return '' + word + '' - - def _var_repl(self, word): - if word == '{{' and not self.in_var: - self.in_var = True - return '' - elif self.in_var: - self.in_var = False - return '' - return '' + return '' + word + '' def _tr_repl(self, word): out = '' @@ -441,16 +435,17 @@ class PageFormatter: self.tr_cnt = 0 out = '

    \n' self.tr_cnt += 1 - return out + '' + return out + ['' + return ['', ''][word.strip() == '||='] return '' def _indent_level(self): @@ -488,12 +483,13 @@ class PageFormatter: # For each line, we scan through looking for magic # strings, outputting verbatim any intervening text - # TODO: highlight search words (look at referer) + # TODO: highlight search words (look at referrer) scan_re = re.compile( r"(?:" # Formatting - + r"(?P'{2,3})" + + r"(?P\*\*|'''|//|''|##|``|__|\^\^|,,)" + r"|(?P\={2,6})" + + r"|(?P
    \\\\)" + r"|(?P^-{3,})" + r"|(?P<(/|)(div|span|iframe)[^<>]*>)" + r"|(?P[<>&])" @@ -502,34 +498,33 @@ class PageFormatter: # Links + r"|(?P\b[a-zA-Z0-9_-]+\.(png|gif|jpg|jpeg|bmp))" + r"|(?P\b(?:[A-Z][a-z]+){2,}\b)" - + r"|(?P\[\[\S+[^\]]*\]\])" + + r"|(?P\[\[([^ \t\n\r\f\v\|]+)(?:\s*\|\s*([^\]]+)|)\]\])" + r"|(?P(http|https|ftp|mailto)\:[^\s'\"]+\S)" + r"|(?P[-\w._+]+\@[\w.-]+)" # Lists, divs, spans - + r"|(?P
  • ^\s+\*)" - + r"|(?P
    (\{\{\{|\s*\}\}\}))"
    -            + r"|(?P(\{\{|\}\}))"
    +            + r"|(?P
  • ^\s+[\*#] +)" + + r"|(?P
    \{\{\{|\s*\}\}\})"
     
                 # Tables
    -            + r"|(?P
  • ^\s*\|\|\s*)" - + r"|(?P\s*\|\|\s*$)" - + r"|(?P^\s*\|\|(=|)\s*)" + + r"|(?P\s*\|\|(=|)\s*$)" + + r"|(?P
    ' + out = out + '
    ', ''][word.strip() == '||='] - def _tre_repl(self, word): + def _td_repl(self, word): if self.in_table: - return '
    ', ''][word.strip() == '||='] return '' - def _td_repl(self, word): + def _tre_repl(self, word): if self.in_table: - return '' + return ['
    \s*\|\|\s*)" + + r"|(?P
    \s*\|\|(=|)\s*)" + r")") pre_re = re.compile( r"(?:" + r"(?P
    \s*\}\}\})"
    +            + r"|(?P[<>&])"
                 + r")")
             blank_re = re.compile(r"^\s*$")
             indent_re = re.compile(r"^\s*")
             tr_re = re.compile(r"^\s*\|\|")
             eol_re = re.compile(r"\r?\n")
    -        raw = string.expandtabs(self.raw)
    -        for line in eol_re.split(raw):
    +        for line in eol_re.split(self.raw.expandtabs()):
                 # Skip ACLs
                 if self.in_header:
                     if line.startswith('#'):
    -                   continue
    +                    continue
                     self.in_header = False
     
                 if self.in_pre:
    @@ -555,30 +550,27 @@ class PageFormatter:
     class Page:
         def __init__(self, page_name):
             self.page_name = page_name
    -        self.msg = ''
    +        self.msg_text = ''
             self.msg_type = 'error'
    -        self.attrs = {}
     
         def split_title(self):
    -        # look for the end of words and the start of a new word,
    -        # and insert a space there
    +        # look for the end of words and the start of a new word and insert a space there
             return re.sub('([a-z])([A-Z])', r'\1 \2', self.page_name)
     
         def _text_filename(self):
    -        return path.join(text_dir, self.page_name)
    +        return path.join(data_dir, self.page_name)
     
         def _tmp_filename(self):
    -        return path.join(text_dir, ('#' + self.page_name + '.' + `os.getpid()` + '#'))
    +        return path.join(data_dir, ('#' + self.page_name.replace('/','_') + '.' + `os.getpid()` + '#'))
     
         def exists(self):
             try:
                 os.stat(self._text_filename())
    -            return 1
    +            return True
             except OSError, er:
                 if er.errno == errno.ENOENT:
    -                return 0
    -            else:
    -                raise er
    +                return False
    +            raise er
     
         def link_to(self):
             word = self.page_name
    @@ -589,17 +581,18 @@ class Page:
     
         def get_raw_body(self):
             try:
    -            return open(self._text_filename(), 'rt').read()
    +            return open(self._text_filename(), 'rb').read()
             except IOError, er:
                 if er.errno == errno.ENOENT:
    -                # just doesn't exist, use default
    -                return 'Describe %s here.' % self.page_name
    -            else:
    -                raise er
    +                return '' # just doesn't exist, use default
    +            if er.errno == errno.EISDIR:
    +                return 'DIR'
    +            raise er
     
         def get_attrs(self):
    -        if self.attrs:
    +        if self.__dict__.has_key('attrs'):
                 return self.attrs
    +        self.attrs = {}
             try:
                 file = open(self._text_filename(), 'rt')
                 attr_re = re.compile(r"^#(\S*)(.*)$")
    @@ -614,18 +607,17 @@ class Page:
                     raise er
             return self.attrs
     
    +    def get_attr(self, name, default):
    +        return self.get_attrs().get(name, default)
    +
         def can(self, action, default=True):
    -        attrs = self.get_attrs()
             try:
    -            # SomeUser:read,write All:read
    -            acl = attrs["acl"]
    +            #acl SomeUser:read,write All:read
    +            acl = self.get_attr("acl", None)
                 for rule in acl.split():
    -                (user,perms) = rule.split(':')
    +                (user, perms) = rule.split(':')
                     if user == remote_user() or user == "All":
    -                    if action in perms.split(','):
    -                        return True
    -                    else:
    -                        return False
    +                    return action in perms.split(',')
                 return False
             except Exception, er:
                 pass
    @@ -641,7 +633,12 @@ class Page:
             page_name = None
             if self.can_write():
                 page_name = self.page_name
    -        send_title(page_name, self.split_title(), msg=self.msg, msg_type=self.msg_type)
    +
    +        #css foo.css bar.css
    +        global css_url
    +        css_url = self.get_attr("css", "").split() + css_url
    +
    +        send_title(page_name, self.split_title(), msg_text=self.msg_text, msg_type=self.msg_type)
             if self.can_read():
                 PageFormatter(self.get_raw_body()).print_html()
             else:
    @@ -649,14 +646,17 @@ class Page:
             send_footer(page_name, self._last_modified())
     
         def _last_modified(self):
    -        if not self.exists():
    +        try:
    +            from time import localtime, strftime
    +            modtime = localtime(os.stat(self._text_filename())[stat.ST_MTIME])
    +        except OSError, er:
    +            if er.errno != errno.ENOENT:
    +                raise er
                 return None
    -        from time import localtime, strftime
    -        modtime = localtime(os.stat(self._text_filename())[stat.ST_MTIME])
             return strftime(datetime_fmt, modtime)
     
         def send_editor(self, preview=None):
    -        send_title(None, 'Edit ' + self.split_title(), msg=self.msg, msg_type=self.msg_type)
    +        send_title(None, 'Edit ' + self.split_title(), msg_text=self.msg_text, msg_type=self.msg_type)
             if not self.can_write():
                 send_guru("Write access denied by ACLs", "error")
                 return
    @@ -665,9 +665,9 @@ class Page:
                 + ' for ' + cgi.escape(remote_user())
                 + ' from ' + cgi.escape(get_hostname(remote_host()))
                 + '

    ') - print '
    ' % (script_name(), self.page_name) - print '' % (self.page_name) - print """""" % (preview or self.get_raw_body()) + print '
    ' % relative_url(self.page_name) + print '' % (self.page_name) + print """""" % (preview or self.get_raw_body()) print """
    @@ -683,12 +683,13 @@ class Page: print "
    " send_footer(self.page_name) - def send_raw(self): - if not self.can_read(): - send_title(None, msg='Read access denied by ACLs', msg_type='notice') - return - emit_header("text/plain") - print self.get_raw_body() + def send_raw(self, mimetype='text/plain'): + if self.can_read(): + body = self.get_raw_body() + emit_header(mimetype) + print body + else: + send_title(None, msg_text='Read access denied by ACLs', msg_type='notice') def _write_file(self, text): tmp_filename = self._tmp_filename() @@ -699,12 +700,12 @@ class Page: try: os.remove(text) except OSError, er: - if er.errno <> errno.ENOENT: raise er + if er.errno != errno.ENOENT: raise er os.rename(tmp_filename, text) def save_text(self, newtext): if not self.can_write(): - self.msg = 'Write access denied by ACLs' + self.msg_text = 'Write access denied by ACLs' self.msg_type = 'error' return @@ -713,55 +714,32 @@ class Page: if post_edit_hook: # FIXME: what's the std way to perform shell quoting in python? cmd = ( post_edit_hook - + " '" + text_dir + '/' + self.page_name + + " '" + data_dir + '/' + self.page_name + "' '" + remote_user() + "' '" + remote_host() + "'" ) out = os.popen(cmd) - msg = out.read() + output = out.read() rc = out.close() if rc: - self.msg += "Post-editing hook returned %d.\n" % rc - self.msg += 'Command was: ' + cmd + '\n' - if msg: - self.msg += 'Output follows:\n' + msg + self.msg_text += "Post-editing hook returned %d.\n" % rc + self.msg_text += 'Command was: ' + cmd + '\n' + if output: + self.msg_text += 'Output follows:\n' + output else: - self.msg = 'Thank you for your contribution. Your attention to detail is appreciated.' + self.msg_text = 'Thank you for your contribution. Your attention to detail is appreciated.' self.msg_type = 'success' -def send_verbatim(filename, mime_type='application/octet-stream'): - pathname = path.join(text_dir, filename) - data = open(pathname, 'rb').read() - emit_header(mime_type) - sys.stdout.write(data) - # Main --------------------------------------------------------------- try: - # Configuration values - site_name = 'Codewiz' - - # set to None for read-only sites, leave empty ('') to allow anonymous edits - # otherwise, set to a URL that requires authentication - privileged_url = 'https://www.codewiz.org/~bernie/wiki' - - data_dir = '/home/bernie/public_html/wiki' - text_dir = path.join(data_dir, 'text') - css_url = '../wikidata/geekigeeki.css' # optional stylesheet link - history_url = '../wikigit/wiki.git' - post_edit_hook = './post_edit_hook.sh' - datetime_fmt = '%a %d %b %Y %I:%M %p' - allow_edit = True # Is it possible to edit pages? - show_hosts = True # show hostnames? - nonexist_pfx = '' # prefix before nonexistent link (usually '?') - debug_cgi = False # Set to True for CGI var dump - + execfile("geekigeeki.conf.py") form = cgi.FieldStorage() - - handlers = { 'fullsearch': do_fullsearch, - 'titlesearch': do_titlesearch, - 'edit': do_edit, - 'raw': do_raw, - 'savepage': do_savepage } + handlers = { + 'fullsearch': do_fullsearch, + 'titlesearch': do_titlesearch, + 'edit': do_edit, + 'raw': do_raw, + } for cmd in handlers.keys(): if form.has_key(cmd): @@ -779,19 +757,19 @@ try: Page(query).send_page() elif img_re.match(query): #FIXME: use correct mime type - send_verbatim(query, 'image/jpeg') + Page(query).send_raw(mimetype='image/jpeg') else: - send_verbatim(query) + Page(query).send_raw(mimetype='application/octet-stream') else: - # TODO: return 404? - send_title(None, msg='Can\'t work out query: ' + query) -except: + print "Status: 404 Not Found" + send_title(None, msg_text='Can\'t work out query: ' + query) +except Exception: import traceback - msg=traceback.format_exc() + msg_text = traceback.format_exc() if title_done: - send_guru(msg, "error") + send_guru(msg_text, "error") else: - send_title(None, msg=msg) + send_title(None, msg_text=msg_text) send_footer(None) sys.stdout.flush()