2 # -*- coding: utf-8 -*-
4 # Copyright 1999, 2000 Martin Pool <mbp@humbug.org.au>
5 # Copyright 2002 Gerardo Poggiali
6 # Copyright 2007, 2008 Bernie Innocenti <bernie@codewiz.org>
8 # This program is free software: you can redistribute it and/or modify
9 # it under the terms of the GNU General Public License as published by
10 # the Free Software Foundation, either version 3 of the License, or
11 # (at your option) any later version.
13 # This program is distributed in the hope that it will be useful, but
14 # WITHOUT ANY WARRANTY; without even the implied warranty of
15 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 # General Public License for more details.
18 # You should have received a copy of the GNU General Public License
19 # along with this program. If not, see <http://www.gnu.org/licenses/>.
21 __version__ = '$Id$'[4:12]
23 from time import clock
26 import cgi, sys, os, re, errno, stat
27 from os import path, environ
# Regular expression defining a WikiWord
# (but this definition is also assumed in other places)
word_re = re.compile(r"^\b((([A-Z][a-z0-9]+){2,}/)*([A-Z][a-z0-9]+){2,})\b$")
# Relative file name made only of letters, digits, '_', '-', '.' and '/'.
# The negative lookahead rejects any "/../" component, so a name such as
# foo/../bar can no longer climb out of the directory it is joined to.
# (A leading or trailing ".." is already impossible: the first character
# cannot be '.', and the closing \b needs a word character at the end.)
file_re = re.compile(r"^\b(?!.*/\.\./)([A-Za-z0-9_\-][A-Za-z0-9_\.\-/]*)\b$")
# Names ending in a known image extension (case-insensitive)
img_re = re.compile(r"^.*\.(png|gif|jpg|jpeg|bmp|ico)$", re.IGNORECASE)
# Absolute URL: 3 to 8 lowercase scheme letters followed by "://"
url_re = re.compile(r"^[a-z]{3,8}://[^\s'\"]+\S$")
# [[target|description]] or {{target|description}}: group 1 is the target,
# group 2 the optional description.  Written as a raw string because the
# pattern contains backslash sequences that are not Python string escapes.
link_re = re.compile(r"(?:\[\[|{{)([^\s\|]+)(?:\s*\|\s*([^\]]+)|)(?:\]\]|}})")
41 # CGI stuff ---------------------------------------------------------
44 return environ.get('SCRIPT_NAME', '')
def privileged_path():
    """Return the base URL to use for privileged (editing/login) links.

    This is the configured privileged_url when it is set to a truthy
    value, otherwise whatever script_name() returns.
    """
    if privileged_url:
        return privileged_url
    return script_name()
50 user = environ.get('REMOTE_USER', '')
51 if user is None or user == '' or user == 'anonymous':
52 user = 'AnonymousCoward'
56 return environ.get('REMOTE_ADDR', '')
58 def get_hostname(addr):
60 from socket import gethostbyaddr
61 return gethostbyaddr(addr)[0] + ' (' + addr + ')'
65 def relative_url(pathname, privileged=False):
66 if not (url_re.match(pathname) or pathname.startswith('/')):
68 url = privileged_path()
71 pathname = url + '/' + pathname
75 return re.sub(' ', '-', re.sub('[^a-z0-9_ ]', '', s.lower()).strip())
77 # Formatting stuff --------------------------------------------------
def emit_header(mime_type="text/html"):
    """Print the Content-type header for mime_type.

    The charset is always declared as utf-8.  The header text already ends
    with a newline and print appends another one, which yields the blank
    line that terminates the header section.
    """
    header = "Content-type: " + mime_type + "; charset=utf-8\n"
    print(header)
81 def send_guru(msg_text, msg_type):
82 if not msg_text: return
83 print '<pre id="guru" onclick="this.style.display = \'none\'" class="' + msg_type + '">'
84 if msg_type == 'error':
85 print ' Software Failure. Press left mouse button to continue.\n'
87 if msg_type == 'error':
88 print ' Guru Meditation #DEADBEEF.ABADC0DE'
90 # FIXME: This little JS snippet is harder to pass than ACID 3.0
92 <script language="JavaScript" type="text/javascript">
93 var guru = document.getElementById('guru');
94 // Firefox 2.0 doesn't take border-color, but returns border-top-color fine
95 var color = document.defaultView.getComputedStyle(guru,null).getPropertyValue('border-top-color');
98 guru.style.setProperty('border-color', color, '');
99 setTimeout('guruOff()', 1000);
102 guru.style.setProperty('border-color', '#000000', '');
103 setTimeout('guruOn()', 1000);
105 // Safari 2.0 returns this rgba crap
106 // Konqueror 3.5.6 doesn't seem to support computed properties
107 if (color && color != 'rgba(0, 0, 0, 0)') {
108 //window.alert("enabled! color='" + color + "'");
113 def send_title(name, text="Limbo", msg_text=None, msg_type='error', writable=False):
115 if title_done: return
119 print '<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"'
120 print ' "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">'
121 print '<html xmlns="http://www.w3.org/1999/xhtml" lang="en" xml:lang="en">'
123 site_name = globals().get('site_name', 'Unconfigured Site')
124 print "<head><title>%s: %s</title>" % (site_name, text)
125 print ' <meta http-equiv="Content-Type" content="application/xhtml+xml; charset=utf-8" />'
127 print ' <meta name="robots" content="noindex,nofollow" />'
129 print ' <link rel="stylesheet" type="text/css" href="%s" />' % relative_url(css)
131 print ' <link rel="icon" href="%s" />' % relative_url(icon_url)
133 if name and writable and privileged_url is not None:
134 print ' <link rel="alternate" type="application/x-wiki" title="Edit this page" href="%s" \>' \
135 % (privileged_path() + '?edit=' + name)
137 if history_url is not None:
138 print ' <link rel="alternate" type="application/rss+xml" title="RSS" href="%s" />' \
139 % (history_url + '?a=rss')
144 if name and writable and privileged_url is not None:
145 print '<body ondblclick="location.href=\'' + privileged_path() + '?edit=' + name + '\'">'
150 send_guru(msg_text, msg_type)
153 print '<div class="nav">'
155 print ' <b>' + link_tag('?fullsearch=' + name, text, 'navlink') + '</b> '
157 print ' <b>' + text + '</b> '
158 print ' | ' + link_tag('FrontPage', 'Home', 'navlink')
159 print ' | ' + link_tag('FindPage', 'Find Page', 'navlink')
160 if 'history_url' in globals():
161 print ' | <a href="' + history_url + '" class="navlink">Recent Changes</a>'
163 print ' | <a href="' + history_url + '?a=history;f=' + name + '" class="navlink">Page History</a>'
166 print ' | ' + link_tag('?raw=' + name, 'Raw Text', 'navlink')
167 if privileged_url is not None:
169 print ' | ' + link_tag('?edit=' + name, 'Edit', 'navlink', privileged=True)
171 print ' | ' + link_tag(name, 'Login', 'navlink', privileged=True)
174 print ' | <i>Immutable Page</i>'
177 if user != 'AnonymousCoward':
178 print ' | <span class="login"><i>logged in as <b>' + cgi.escape(user) + '</b></i></span>'
182 def link_tag(params, text=None, ss_class=None, privileged=False):
184 text = params # default
187 classattr += 'class="%s" ' % ss_class
188 # Prevent crawlers from following links potentially added by spammers or to generated pages
189 if ss_class == 'external' or ss_class == 'navlink':
190 classattr += 'rel="nofollow" '
191 elif url_re.match(params):
192 classattr += 'rel="nofollow" '
193 return '<a %shref="%s">%s</a>' % (classattr, relative_url(params, privileged=privileged), text)
195 # Search ---------------------------------------------------
197 def handle_fullsearch(needle):
198 send_title(None, 'Full text search for "%s"' % (needle))
200 needle_re = re.compile(needle, re.IGNORECASE)
202 all_pages = page_list()
203 for page_name in all_pages:
204 body = Page(page_name).get_raw_body()
205 count = len(needle_re.findall(body))
207 hits.append((count, page_name))
209 # The default comparison for tuples compares elements in order,
210 # so this sorts by number of hits
215 for (count, page_name) in hits:
216 print '<li><p>' + Page(page_name).link_to()
217 print ' . . . . ' + `count`
218 print ['match', 'matches'][count != 1]
222 print_search_stats(len(hits), len(all_pages))
224 def handle_titlesearch(needle):
225 # TODO: check needle is legal -- but probably we can just accept any RE
226 send_title(None, "Title search for \"" + needle + '"')
228 needle_re = re.compile(needle, re.IGNORECASE)
229 all_pages = page_list()
230 hits = filter(needle_re.search, all_pages)
233 for filename in hits:
234 print '<li><p>' + Page(filename).link_to() + "</p></li>"
237 print_search_stats(len(hits), len(all_pages))
def print_search_stats(hits, searched):
    """Print an HTML paragraph summarising a search.

    hits     -- number of matching pages
    searched -- number of pages that were examined
    """
    summary = "<p>%d hits out of %d pages searched.</p>" % (hits, searched)
    print(summary)
def handle_raw(pagename):
    """Handler for raw requests: send page `pagename` through Page.send_raw()
    using that method's default arguments."""
    page = Page(pagename)
    page.send_raw()
245 def handle_edit(pagename):
248 if form['file'].value:
249 pg.save(form['file'].file.read())
251 pg.save(form['savetext'].value.replace('\r\n', '\n'))
253 elif 'cancel' in form:
254 pg.msg_text = 'Editing canceled'
255 pg.msg_type = 'notice'
257 else: # preview or edit
259 if 'preview' in form:
260 text = form['savetext'].value
def make_index_key():
    """Return an HTML paragraph holding a centered row of in-page anchor
    links, one per lowercase ASCII letter (#a ... #z), separated by ' | '."""
    anchors = ['<a href="#%s">%s</a>' % (letter, letter)
               for letter in 'abcdefghijklmnopqrstuvwxyz']
    return '<p><center>' + ' | '.join(anchors) + '</center></p>'
def page_list(dir = None, re = word_re):
    """Return the entries of a directory whose names match a pattern.

    dir -- directory to list; data_dir is used when this is falsy
    re  -- compiled pattern whose match() selects entries (WikiWords by
           default)

    Note that both parameter names hide other names inside this function
    (the builtin dir and the re module); they are kept because they are
    part of the calling interface.
    """
    directory = dir or data_dir
    return [entry for entry in os.listdir(directory) if re.match(entry)]
270 def send_footer(name, mod_string=None):
271 if globals().get('debug_cgi', False):
272 cgi.print_arguments()
275 print '<div id="footer"><hr />'
276 print ('<p class="copyright"><span class="benchmark">generated in %0.3fs</span>' +
277 ' by <a href="http://www.codewiz.org/wiki/GeekiGeeki">GeekiGeeki</a>' +
278 ' version %s</p>') % (clock() - start_time, __version__)
280 print '<p class="modified">last modified %s</p>' % mod_string
281 print '</div></body></html>'
284 """Object that turns Wiki markup into HTML.
286 All formatting commands can be parsed one line at a time, though
287 some state is carried over between lines.
289 def __init__(self, raw):
292 self.in_pre = self.in_html = self.in_table = self.in_li = False
293 self.in_header = True
294 self.list_indents = []
305 "^^": ["sup", False],
309 def _b_repl(self, word):
310 style = self.styles[word]
311 style[1] = not style[1]
312 return ['</', '<'][style[1]] + style[0] + '>'
314 def _tit_repl(self, word):
316 result = '</h%d><p>\n' % self.h_level
319 self.h_level = len(word) - 1
320 link = permalink(self.line)
321 result = '\n</p><h%d id="%s"><a class="heading" href="#%s">¶</a> ' % (self.h_level, link, link)
324 def _br_repl(self, word):
327 def _rule_repl(self, word):
328 return self._undent() + '\n<hr size="%d" noshade="noshade" />\n' % (len(word) - 2)
def _word_repl(self, word):
    """Turn a WikiWord into the link produced by Page(word).link_to()."""
    target = Page(word)
    return target.link_to()
def _img_repl(self, word):
    """Return an inline image that links to itself.

    `word` is passed through relative_url(); the result is used both as
    the link target and as the image source.
    """
    url = relative_url(word)
    template = '<a href="%s"><img border="0" src="%s" /></a>'
    return template % (url, url)
def _url_repl(self, word):
    """Render a bare URL found in the page text.

    A URL matching img_re becomes an inline image linking to itself; any
    other URL becomes an external link marked rel="nofollow" whose text is
    the URL itself.
    """
    is_image = img_re.match(word)
    if not is_image:
        return '<a href="%s" rel="nofollow" class="external">%s</a>' % (word, word)
    return '<a href="%s"><img border="0" src="%s" /></a>' % (word, word)
343 def _macro_repl(self, word):
344 m = re.compile("\<\<([^\s\|\>]+)(?:\s*\|\s*([^\>]+)|)\>\>").match(word)
348 argv.extend(m.group(2).split('|'))
349 argv = map(str.strip, argv)
351 macro = globals().get('_macro_' + name)
353 execfile("macros/" + name + ".py", globals())
354 macro = globals().get('_macro_' + name)
358 return '<strong class="error"><<' + '|'.join(argv) + '>></strong>'
360 def _hurl_repl(self, word):
361 m = link_re.match(word)
363 if m.group(2) is None:
365 elif img_re.match(m.group(2)):
366 descr = '<img border="0" src="' + descr + '" />'
370 return link_tag(name, descr, 'wikilink')
372 def _inl_repl(self, word):
373 m = link_re.match(word)
375 descr = m.group(2) or name
376 name = relative_url(name)
377 argv = descr.split('|')
381 args = '?' + '&'.join(argv)
386 # The "extthumb" nonsense works around a limitation of the HTML block model
387 return '<div class="extthumb"><div class="thumb"><a href="%s"><img border="0" src="%s" alt="%s" /></a><div class="caption">%s</div></div></div>' \
388 % (name, name + args, descr, descr)
390 return '<a href="%s"><img border="0" src="%s" /></a>' % (name, name + args)
392 def _email_repl(self, word):
393 return '<a href="mailto:%s">%s</a>' % (word, word)
395 def _html_repl(self, word):
397 return word; # Pass through
399 def _ent_repl(self, s):
400 if self.in_html and s == '>':
403 return {'&': '&',
407 def _li_repl(self, match):
414 def _pre_repl(self, word):
415 if word == '{{{' and not self.in_pre:
423 def _hi_repl(self, word):
424 return '<strong class="highlight ' + word + '">' + word + '</strong>'
426 def _tr_repl(self, word):
428 if not self.in_table:
431 out = '</p><table><tbody>\n'
433 out = out + '<tr class="' + ['even', 'odd'][self.tr_cnt % 2] + '">'
434 return out + ['<td>', '<th>'][word.strip() == '||=']
436 def _td_repl(self, word):
438 return ['</td><td>', '</th><th>'][word.strip() == '||=']
441 def _tre_repl(self, word):
443 return ['</td></tr>', '</th></tr>'][word.strip() == '||=']
446 def _indent_level(self):
447 return len(self.list_indents) and self.list_indents[-1]
449 def _indent_to(self, new_level):
450 if self._indent_level() == new_level:
453 while self._indent_level() > new_level:
454 del(self.list_indents[-1])
457 self.in_li = False # FIXME
459 while self._indent_level() < new_level:
460 self.list_indents.append(new_level)
467 res += '</ul>' * len(self.list_indents)
469 self.list_indents = []
def replace(self, match):
    """Dispatch a regex match to the handler of the named group that hit.

    Used as the replacement callback passed to re.sub() in print_html.
    For the first named group of `match` holding a non-empty value, the
    method self._<group name>_repl is called with the matched text and
    its result is returned.

    Raises ValueError when no named group holds a non-empty value.  (The
    original raised a plain string, which is not a valid exception object
    and itself fails with TypeError on Python 2.6 and later.)
    """
    for group_name, hit in match.groupdict().items():
        if hit:
            handler = getattr(self, '_' + group_name + '_repl')
            return handler(hit)
    raise ValueError("Can't handle match " + repr(match))
479 def print_html(self):
480 print '<div class="wiki"><p>'
482 # For each line, we scan through looking for magic
483 # strings, outputting verbatim any intervening text
484 # TODO: highlight search words (look at referrer)
485 scan_re = re.compile(
488 + r"(?P<b>\*\*|'''|//|''|##|``|__|\^\^|,,)"
489 + r"|(?P<tit>\={2,6})"
491 + r"|(?P<rule>^-{3,})"
492 + r"|(?P<hi>\b(FIXME|TODO|DONE)\b)"
495 + r"|(?P<macro>\<\<([^\s\|\>]+)(?:\s*\|\s*([^\>]+)|)\>\>)"
496 + r"|(?P<hurl>\[\[([^\s\|]+)(?:\s*\|\s*([^\]]+)|)\]\])"
499 + r"|(?P<html><(/|)(br|hr|div|form|iframe|input|span))"
502 # Auto links (LEGACY)
503 + r"|(?P<img>\b[a-zA-Z0-9_/-]+\.(png|gif|jpg|jpeg|bmp|ico))"
504 + r"|(?P<word>\b(?:[A-Z][a-z]+){2,}\b)"
505 + r"|(?P<url>(http|https|ftp|mailto)\:[^\s'\"]+\S)"
506 + r"|(?P<email>[-\w._+]+\@[\w.-]+)"
509 + r"|(?P<li>^\s+[\*#] +)"
510 + r"|(?P<pre>\{\{\{|\s*\}\}\})"
511 + r"|(?P<inl>\{\{([^\s\|]+)(?:\s*\|\s*([^\]]+)|)\}\})"
514 + r"|(?P<tr>^\s*\|\|(=|)\s*)"
515 + r"|(?P<tre>\s*\|\|(=|)\s*$)"
516 + r"|(?P<td>\s*\|\|(=|)\s*)"
520 + r"(?P<pre>\s*\}\}\})"
523 blank_re = re.compile(r"^\s*$")
524 indent_re = re.compile(r"^\s*")
525 tr_re = re.compile(r"^\s*\|\|")
526 eol_re = re.compile(r"\r?\n")
527 for self.line in eol_re.split(self.raw.expandtabs()):
530 if self.line.startswith('#'):
532 self.in_header = False
535 print re.sub(pre_re, self.replace, self.line)
537 if self.in_table and not tr_re.match(self.line):
538 self.in_table = False
539 print '</tbody></table><p>'
541 if blank_re.match(self.line):
544 indent = indent_re.match(self.line)
545 print self._indent_to(len(indent.group(0)))
546 print re.sub(scan_re, self.replace, self.line)
548 if self.in_pre: print '</pre>'
549 if self.in_table: print '</tbody></table><p>'
554 def __init__(self, page_name):
555 self.page_name = page_name
557 self.msg_type = 'error'
def split_title(self):
    """Return the page name with a space inserted wherever a lowercase
    letter is directly followed by an uppercase one
    (e.g. "FrontPage" -> "Front Page")."""
    word_boundary = re.compile('([a-z])([A-Z])')
    return word_boundary.sub(r'\1 \2', self.page_name)
564 return path.join(data_dir, self.page_name)
def _tmp_filename(self):
    """Return the path of this page's temporary file inside data_dir.

    The file name is '#' + the page name with every '/' replaced by '_' +
    '.' + the current process id + '#'.
    """
    flat_name = self.page_name.replace('/', '_')
    basename = '#' + flat_name + '.' + repr(os.getpid()) + '#'
    return path.join(data_dir, basename)
571 os.stat(self._filename())
574 if er.errno == errno.ENOENT:
579 word = self.page_name
581 return link_tag(word, word, 'wikilink')
583 return link_tag(word, nonexist_pfx + word, 'nonexistent')
585 def get_raw_body(self):
587 return open(self._filename(), 'rb').read()
589 if er.errno == errno.ENOENT:
590 return '' # just doesn't exist, use default
591 if er.errno == errno.EISDIR:
592 return self.format_dir()
595 def format_dir(self):
598 for dir in self.page_name.split('/'):
599 path = (path + '/' + dir) if path else dir
600 out += '[[' + path + '|' + dir + ']]/'
603 for file in page_list(self._filename(), file_re):
604 if img_re.match(file):
606 maxwidth_arg = '|maxwidth=' + str(image_maxwidth)
607 out += '{{' + self.page_name + '/' + file + '|' + file + maxwidth_arg + '}}\n'
609 out += ' * [[' + self.page_name + '/' + file + ']]\n'
612 if 'attrs' in self.__dict__:
616 file = open(self._filename(), 'rt')
617 attr_re = re.compile(r"^#(\S*)(.*)$")
619 m = attr_re.match(line)
622 self.attrs[m.group(1)] = m.group(2).strip()
623 #print "bernie: attrs[" + m.group(1) + "] = " + m.group(2) + "<br>\n"
625 if er.errno != errno.ENOENT:
def get_attr(self, name, default):
    """Return the value stored under `name` in the mapping returned by
    self.get_attrs(), or `default` when there is no such entry."""
    attrs = self.get_attrs()
    return attrs.get(name, default)
632 def can(self, action, default=True):
635 #acl SomeUser:read,write All:read
636 acl = self.get_attr("acl", None)
637 for rule in acl.split():
638 (user, perms) = rule.split(':')
639 if user == remote_user() or user == "All":
640 return action in perms.split(',')
642 except Exception, er:
644 self.msg_text = 'Illegal acl line: ' + acl
648 return self.can("write", True)
651 return self.can("read", True)
653 def send_naked(self):
655 WikiFormatter(self.get_raw_body()).print_html()
657 send_guru("Read access denied by ACLs", "notice")
662 css_url = self.get_attr("css", "").split() + css_url
664 send_title(self.page_name, self.split_title(),
665 msg_text=self.msg_text, msg_type=self.msg_type, writable=self.can_write())
667 send_footer(self.page_name, self._last_modified())
669 def _last_modified(self):
671 from time import localtime, strftime
672 modtime = localtime(os.stat(self._filename())[stat.ST_MTIME])
674 if er.errno != errno.ENOENT:
677 return strftime(datetime_fmt, modtime)
679 def send_editor(self, preview=None):
680 send_title(None, 'Edit ' + self.split_title(), msg_text=self.msg_text, msg_type=self.msg_type)
681 if not self.can_write():
682 send_guru("Write access denied by ACLs", "error")
687 file = form['file'].value
689 print ('<p><b>Editing ' + self.page_name
690 + ' for ' + cgi.escape(remote_user())
691 + ' from ' + cgi.escape(get_hostname(remote_host()))
693 print '<div class="editor"><form method="post" enctype="multipart/form-data" action="%s">' % relative_url(self.page_name)
694 print '<input type="hidden" name="edit" value="%s">' % (self.page_name)
695 print '<textarea wrap="off" spellcheck="true" id="editor" name="savetext" rows="17" cols="100">%s</textarea>' % (preview or self.get_raw_body())
696 print 'Or upload a file: <input type="file" name="file" value="%s" />' % file
699 <input type="submit" name="save" value="Save" />
700 <input type="submit" name="preview" value="Preview" />
701 <input type="reset" value="Reset" />
702 <input type="submit" name="cancel" value="Cancel" />
705 print "<p>" + Page('EditingTips').link_to() + "</p>"
707 print "<div class='preview'>"
708 WikiFormatter(preview).print_html()
710 send_footer(self.page_name)
712 def send_raw(self, mimetype='text/plain'):
714 body = self.get_raw_body()
715 emit_header(mimetype)
718 send_title(None, msg_text='Read access denied by ACLs', msg_type='notice')
720 def send_image(self, mimetype, args=[]):
721 if 'maxwidth' in args:
723 emit_header(mimetype)
725 subprocess.check_call(['gm', 'convert', self._filename(),
726 '-scale', args['maxwidth'].value + ' >', '-'])
728 self.send_raw(mimetype)
730 def _write_file(self, data):
731 tmp_filename = self._tmp_filename()
732 open(tmp_filename, 'wb').write(data)
733 name = self._filename()
735 # Bad Bill! POSIX rename ought to replace. :-(
739 if er.errno != errno.ENOENT: raise er
740 os.rename(tmp_filename, name)
742 def save(self, newdata):
743 if not self.can_write():
744 self.msg_text = 'Write access denied by ACLs'
745 self.msg_type = 'error'
748 self._write_file(newdata)
751 # FIXME: what's the std way to perform shell quoting in python?
752 cmd = ( post_edit_hook
753 + " '" + data_dir + '/' + self.page_name
754 + "' '" + remote_user()
755 + "' '" + remote_host() + "'"
761 self.msg_text += "Post-editing hook returned %d.\n" % rc
762 self.msg_text += 'Command was: ' + cmd + '\n'
764 self.msg_text += 'Output follows:\n' + output
766 self.msg_text = 'Thank you for your contribution. Your attention to detail is appreciated.'
767 self.msg_type = 'success'
769 # Main ---------------------------------------------------------------
771 execfile("geekigeeki.conf.py")
772 form = cgi.FieldStorage()
775 handler = globals().get('handle_' + cmd)
777 handler(form[cmd].value)
780 path_info = environ.get('PATH_INFO', '')
781 if len(path_info) and path_info[0] == '/':
782 query = path_info[1:] or 'FrontPage'
784 query = environ.get('QUERY_STRING', '') or 'FrontPage'
786 if file_re.match(query):
787 if word_re.match(query):
790 from mimetypes import MimeTypes
791 type, encoding = MimeTypes().guess_type(query)
792 #type = type or 'text/plain'
793 #Page(query).send_raw(mimetype=type)
795 if type.startswith('image/'):
796 Page(query).send_image(mimetype=type,args=form)
798 Page(query).send_raw(mimetype=type)
802 print "Status: 404 Not Found"
803 send_title(None, msg_text='Can\'t work out query: ' + query)
807 msg_text = traceback.format_exc()
809 send_guru(msg_text, "error")
811 send_title(None, msg_text=msg_text)