2007-05-27 05:25:55 -06:00
|
|
|
#!/usr/local/plan9/bin/rc
|
2008-09-26 06:23:19 -06:00
|
|
|
# Load the CGI helper library that sits next to this script.
# NOTE(review): helpers used below but not defined in this file (template,
# perm_redirect, dprint, get_post_args, ...) presumably come from it - confirm.
. ./cgilib.rc

# The rest of the script uses paths relative to the parent directory
# (etc/initrc, lib/, sites/).
cd ..

# Bracket expression matching any character that is not allowed in a request
# path; used when sanitising the URI and when filtering directory listings.
forbidden_uri_chars = '[^a-zA-Z0-9_+\-\/\.]'

# Output mode checked at the end of the script: html or raw.
response_format = html
|
|
|
|
|
2008-09-24 12:21:32 -06:00
|
|
|
# Print (without a trailing newline) the path of library file $1, taking the
# first copy that exists in this order:
#   1. $sitedir/_werc/lib/            (the current site)
#   2. sites/$masterSite/_werc/lib/   (only when masterSite is set)
#   3. lib/                           (global)
# Prints nothing when no copy exists.
fn get_lib_file {
    wantedfile = $1
    if(test -f $sitedir/_werc/lib/$wantedfile) {
        echo -n $sitedir/_werc/lib/$wantedfile
    }
    if not if(! ~ $#masterSite 0 && test -f sites/$masterSite/_werc/lib/$wantedfile) {
        echo -n sites/$masterSite/_werc/lib/$wantedfile
    }
    if not if(test -f lib/$wantedfile) {
        echo -n lib/$wantedfile
    }
}
|
|
|
|
|
2007-05-28 20:04:05 -06:00
|
|
|
# Title
# Print the page header: an <h1> linking to the site root that holds the site
# title followed by the subtitle in a nested <span>.
fn gentitle {
    echo '<h1 class="headerTitle"><a href="/">'^$"siteTitle^' <span id="headerSubTitle">'^$"siteSubTitle^'</span></a></h1>'
}
|
|
|
|
|
2007-06-14 22:36:06 -06:00
|
|
|
# Don't change var name or trailing ';', some dirs change the filter!
# sed script applied to `ls -F` output before it is turned into links:
#   - drop entries with a path element starting with '.' or '_'
#   - drop entries containing a character from $forbidden_uri_chars
#   - drop robots.txt and sitemap.txt
#   - strip the leading './' and the .md / .html / .txt suffixes
# The robots rule used to read 'robots.\txt', with the backslash on the wrong
# character, so the dot was an unescaped wildcard.
dirfilter = '/\/[._]/d; /'^$forbidden_uri_chars^'/d; /\/robots\.txt$/d; /\/sitemap\.txt$/d; s,^\./,,; s,\.md$,,; s,\.html,,; s,\.txt,,; '
|
2008-07-04 20:32:29 -06:00
|
|
|
|
2008-09-24 12:21:32 -06:00
|
|
|
# To be used from config files
# Append one delete rule per argument to $dirfilter, so that entries matching
# the argument (a sed regexp, anchored at both ends) are left out of listings.
fn hide_paths {
    # Uses its own loop variable instead of `i`: rc variables are global, and
    # the config files that call this function are sourced from inside the
    # top-level `for(i in ...)` loop, which reads $i again after sourcing them.
    for(hide_paths_arg in $*)
        dirfilter = $dirfilter^'/^'^$hide_paths_arg^'$/d; '
}
|
2007-06-03 21:26:58 -06:00
|
|
|
|
2007-05-27 20:07:40 -06:00
|
|
|
# Sidebar
# Print a <ul class="side-bar"> for directory $1 with one <li> per entry that
# survives $dirfilter. The entry lying on the path of REQUEST_URI is marked
# with class "thisPage"; when it is a directory its contents are listed
# recursively by running `menu` again in a child rc.
fn menu {
    ls -F $1 | sed $dirfilter | awk -F/ '
    BEGIN { print "<ul class=\"side-bar\">" }
    END { print "</ul>" }

    # Should add \. to the list of allowed chars in file names, but need to find a way to filter out .txt and so on
    /^([a-zA-Z0-9+_\-]+[\/*]?)+$/ && $NF != "index" {
        # Remember whether the entry ended in a slash, then strip the trailing / or *
        is_dir = match($0, "/$")
        sub("[*/]$", "")

        # Link text: last path element, without a leading NN_ prefix, underscores shown as spaces
        href = label = $0
        sub("^(.*/)?([0-9]+_)?", "", label)
        gsub("_", " ", label)

        if(is_dir) {
            label = label "/"
            href = href "/"
        }

        if(index(ENVIRON["REQUEST_URI"] "/", "/" href) == 1) {
            print "<li><a href=\"/" href "\" class=\"thisPage\">»<i> " label "</i></a>"
            # Only directories have something to expand
            if(is_dir)
                system("rc -c ''menu " href "''")
        } else {
            print "<li><a href=\"/" href "\">› " label "</a>"
        }

        print "</li>"
    }'
}
|
|
|
|
|
|
|
|
# Print the sidebar menu for the whole site. The work is done in a subshell
# (@{...}) so the cd into $sitedir does not affect the caller.
fn gensidebar {
    @{ cd $sitedir; menu . }
}
|
|
|
|
|
2007-06-02 23:36:01 -06:00
|
|
|
# List the post files (names starting with digits and ending in .md) found in
# the directories given as arguments, in reverse sort order. Prints nothing
# when called without arguments.
fn sortedBlogPostList {
    if(! ~ $#* 0) {
        # the /./ is added so we can sort -t. and order only the file name
        ls $*^'/./' | grep '/[0-9]+.*\.md$' | sort -r -t. +1
    }
}
|
2007-05-27 20:07:40 -06:00
|
|
|
|
2008-09-21 09:01:51 -06:00
|
|
|
# Print a markdown "##" heading for the post file $1: the title linked to the
# post's permalink, followed by an optional "By ..." credit and the
# modification date taken from `ls -l`.
fn gen_blog_post_title {
    # Fields of the long listing; 4 is used as the author, 7 8 9 as the date.
    # NOTE(review): the field positions assume the Plan 9 `ls -l` layout - confirm.
    du=`{ls -l $1}

    # Title: file name without its leading digits/dashes prefix and .md suffix,
    # underscores shown as spaces.
    title=`{basename $1 | sed 's/^[0-9\-]*_(.*)\.md$/\1/; s/_/ /g' }

    # Permalink: path with the site prefix and the .md suffix removed.
    permlink= `{echo $1 | sed 's,^/[a-z/]*www/,/,; s,^sites/[^/]*/*/,/,; s/\.md$//' }

    # An explicit blogAuthor wins; otherwise credit the file owner, but only
    # when exactly one blog directory is configured.
    by = ''
    if(! ~ $#blogAuthor 0) {
        by='By '^$"blogAuthor
    }
    if not if(~ $#blogDirs 1) {
        by='By '^$du(4)
    }

    echo '##<a href="'^$"permlink^'">' $"title^'</a> *( '^$by Last mod: $du(7 8 9) ' )*'
}
|
|
|
|
|
2008-07-15 19:05:41 -06:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Handlers
# Record the handler function to run (first argument) and the arguments to
# run it with (everything after it); genbody invokes them later.
fn set_handler {
    handler = $1; shift
    handler_args = $*
}
|
|
|
|
|
2008-09-26 02:35:12 -06:00
|
|
|
# Feed the given file(s) through the command stored in $formatter.
fn md_handler {
    cat $* | $formatter
}
|
2008-07-15 19:05:41 -06:00
|
|
|
|
2008-09-26 02:35:12 -06:00
|
|
|
# Expand the template file $1 with the `template` helper (not defined in this
# file; presumably provided by cgilib.rc).
fn tpl_handler {
    template $1
}
|
2008-07-15 19:05:41 -06:00
|
|
|
|
|
|
|
# Print the part of HTML file $1 that lies between the line containing the
# opening <body ...> tag and the line containing </body>; both of those lines
# are dropped. /bin/sed is called by absolute path; the 0,/re/ address form
# used here is a GNU sed extension.
fn html_handler {
    cat $1 | /bin/sed -e '0,/<[Bb][Oo][Dd][Yy][^>]*>/d' -e '/<\/[Bb][Oo][Dd][Yy]>/,$d'
}
|
|
|
|
|
|
|
|
# Print plain-text file $1 inside a <pre> element, re-flowed by fmt.
fn txt_handler {
    echo '<pre>'
    # XXX Inserting a blank line between lines in input is good for fortunes.txt, but maybe not for other .txt files
    # XXX Words are not broken, even if they are way beyond 82 chars long
    # The text is untrusted as far as markup goes: escape &, < and > so file
    # contents cannot inject HTML. & is handled first so the entities produced
    # for < and > are not escaped a second time. In a sed replacement a bare &
    # stands for the matched text, hence the \& for a literal ampersand.
    cat $1 |sed 's/$/\n/g; s/&/\&amp;/g; s/</\&lt;/g; s/>/\&gt;/g' |fmt -l 82 -j
    echo '</pre>'
}
|
|
|
|
|
|
|
|
# Print a heading and a <ul> of links for the directory part of $1.
fn dir_listing_handler {
    d = `{basename -d $1}

    # Heading: drop everything up to the last "//", drop a trailing slash and
    # put spaces around the remaining slashes.
    # NOTE(review): the "//" presumably comes from the caller joining $sitedir
    # and a path that starts with a slash - confirm.
    echo '<h1 style="text-transform: capitalize;">' `{echo $d | sed -e 's,.*//,,g; s,/$,,; s,/, / ,g'} '</h1>'

    echo '<ul style="text-transform: capitalize;">'
    # Inside a bracket expression $ is literal, so [^$] requires the captured
    # name to start with a character other than a dollar sign.
    ls -F $d | sed -e $dirfilter^' s,^'^$sitedir^'/.*/([^$].*),<li><a href="\1">\1</a></li>,' # XXX I'm not sure what the [^$] does there
    echo '</ul>'
}
|
|
|
|
|
2008-10-13 17:40:20 -06:00
|
|
|
# Render the 404 template, located through get_lib_file.
fn 404_handler {
    template `{ get_lib_file 404.tpl }
}
|
2008-07-15 19:05:41 -06:00
|
|
|
|
|
|
|
# Render blog post $1: first the generated title line, then the post itself,
# each through its own run of $formatter.
fn blog_post_handler {
    gen_blog_post_title $1 | $formatter
    $formatter < $1
}
|
|
|
|
|
|
|
|
# Dump the HTML-escaped environment, a separator line and the current umask
# inside a <pre> element.
fn debug_handler {
    echo '<pre>'
    env | escape_html
    echo ---------------------
    umask
    echo '</pre>'
}
|
|
|
|
|
|
|
|
|
|
|
|
# Pick the handler for the current request and record it with set_handler.
# $body is the requested path under $sitedir without extension. The first
# matching rule wins:
#   $body.md, */_debug, $body.tpl, $body.html, explicit .html URL (redirect),
#   RSS feed, blog index, global template in lib/, $body.txt,
#   directory listing, and finally the 404 handler.
# May also change uri, blogDirs, master_template, response_format and
# extraHeaders, and stores a posted comment when comments are enabled.
fn select_handler {
    if (test -f $body.md) {
        if (! ~ $#inBlog 0)
            set_handler blog_post_handler $body.md
        if not
            set_handler md_handler $body.md

        # Store a posted comment as a record file next to the page.
        if (! ~ $#allowComments 0 && ~ $REQUEST_METHOD POST) {
            get_post_args comment_user_name comment_text
            ddir = $body.md_werc/comments/
            umask 002
            mkdir -m 775 -p $ddir
            d = `{date -n} # Obvious race
            # $" flattens each field to a single string, so an empty field does
            # not abort the concatenation and a multi-word field does not
            # repeat the header once per word.
            { echo '% user_name='^$"comment_user_name^'
'^$"comment_text } > $ddir/$d.rec
        }
    }
    if not if (~ $body */_debug)
        set_handler debug_handler
    if not if (test -f $body.tpl)
        set_handler tpl_handler $body.tpl

    if not if (test -f $body.html)
        set_handler html_handler $body.html

    # Explicit .html urls, unfortunately usually the web server will handle this as static files
    # The dot is escaped and an optional query string is carried over; without
    # that a request like /page.html?x=1 was left unchanged by sed and
    # (presumably) redirected to itself.
    if not if (~ $body *.html && test -f $body)
        perm_redirect `{ echo $REQUEST_URI|sed 's/\.html(\?.*)?$/\1/' }

    # Rss feeds. TODO: we should check that the request is for a real blog dir
    if not if (~ $REQUEST_URI */index.rss) {
        uri = `{echo $uri | sed 's/index\.rss$//'}
        if (~ $#blogDirs 0)
            blogDirs = $sitedir^$uri
        uri=$baseuri$"uri
        master_template=feeds/rss20.tpl
        response_format=raw
    }

    # Blog handler
    if not if (~ $body */[bB]log/index */[bB]log//index || ! ~ $#blogDirs 0) {
        if (~ $#blogDirs 0)
            blogDirs = `{basename -d $body}

        # Advertise the feed that lives next to the blog index.
        rssuri=`{basename -d $uri}
        rssuri=$baseuri`{cleanname $"rssuri^/index.rss}
        extraHeaders=$"extraHeaders ^ \
'<link rel="alternate" type="application/rss+xml" title="RSS" href="'$rssuri'" />
'
        set_handler tpl_handler lib/feeds/html.tpl
    }

    # Global tpl (eg sitemap.tpl)
    if not if (test -f lib/^$uri^.tpl)
        set_handler tpl_handler lib/^$uri^.tpl

    if not if (test -f $body.txt)
        set_handler txt_handler $body.txt

    # Dir listing
    if not if(~ $body */index)
        set_handler dir_listing_handler $body

    # File not found
    if not {
        set_handler 404_handler $body
        dprint 'NOT FOUND: '$SERVER_NAME^$REQUEST_URI^' - '^$"HTTP_REFERER^' - '^$"HTTP_USER_AGENT
        echo 'Status: 404 Not Found'
    }
}
|
2007-05-27 20:07:40 -06:00
|
|
|
|
2007-06-02 23:36:01 -06:00
|
|
|
|
2008-07-15 19:05:41 -06:00
|
|
|
# Run the handler chosen by set_handler with its recorded arguments.
fn genbody { $handler $handler_args }
|
2008-09-16 18:16:33 -06:00
|
|
|
|
|
|
|
|
|
|
|
# Careful, the proper p9p path might not be set until initrc.local is sourced
path=(. $PLAN9/bin ./bin/ /bin/ /usr/bin)

# Defaults; etc/initrc, etc/initrc.local and the per-directory config files
# sourced later may override them.
site=$SERVER_NAME
headers=lib/headers.tpl
master_template=default_master.tpl
sidebar=sidebar
baseuri=http://$site/

# Start these as empty strings rather than unset variables.
for(i in siteTitle siteSubTitle pageTitle extraHeaders) {
    $i = ''
}

# Global configuration, then the optional local overrides.
. etc/initrc

if(test -f etc/initrc.local) {
    . etc/initrc.local
}
|
|
|
|
|
|
|
|
|
|
|
|
# Parse request URL
# Sanitise the first line of REQUEST_URI: drop the query string, remove every
# forbidden character and collapse runs of dots into a single dot.
uri = `{echo -n $REQUEST_URI | sed -e 's/\?.*//; s/'^$forbidden_uri_chars^'//g; s/\.\.*/./g;' -e '1q'}

# Split the sanitised path into its elements; ifs is changed for this one
# command only.
ifs='/' { args = `{echo -n $uri} }

if(! ~ $#debug 0) {
    dprint ' ' $SERVER_NAME^$REQUEST_URI^' - '^$"HTTP_USER_AGENT
}

# Hack: preload post data so we can access it from templates where the cgi's stdin is not accessible
if(~ $REQUEST_METHOD POST) {
    get_post_args
    login_user
}
|
2008-09-21 09:01:51 -06:00
|
|
|
|
2007-06-03 21:26:58 -06:00
|
|
|
# Derive the page title and body path from the path elements in $args.
# The emptiness test counts the elements: the previous `~ $args ''` could not
# match, because backquote splitting produces no empty words, so the
# root-request branch below was never taken.
if (! ~ $#args 0) {
    # /dir/index is served as /dir/; an optional query string is carried over
    # so the redirect target really differs from the request.
    if (~ $args($#args) 'index')
        perm_redirect `{ echo $REQUEST_URI | sed 's,/index(\?.*)?$,/\1,' }

    # Default title: path elements joined with " - ", underscores as spaces.
    pageTitle=`{echo $args | sed -e 's/ / - /g' -e 's/_/ /g'}
    body=$uri
}
if not {
    # Request for the site root.
    body='/'
}
|
2007-06-02 23:36:01 -06:00
|
|
|
|
2007-06-03 21:26:58 -06:00
|
|
|
# Walk from the site root down to the requested path, sourcing the config
# files found at each level so that deeper directories override shallower ones.
fpath=$sitedir
for(i in ('' $args)) {
    fpath = $fpath/$i

    # We don't want blog settings to cascade into posts, note that we are inBlog instead
    if(! ~ $#blogDirs 0 && ! ~ $body */index.rss */[bB]log */[bB]log/) {
        inBlog = $blogDirs
        blogDirs = ()
    }

    if(test -f $fpath/_config) {
        . $fpath/_config # DEPRECATED
    }
    if(test -f $fpath/_werc/config) {
        . $fpath/_werc/config
    }

    # A directory named blog/Blog counts as a blog even without configuration.
    # NOTE(review): the sourced config files share the global $i read here.
    if(~ $#blogDirs 0 && ~ $#inBlog 0 && ~ $i [Bb]log) {
        inBlog = 'yes'
    }
}
|
2007-06-02 23:36:01 -06:00
|
|
|
|
2008-07-06 21:40:39 -06:00
|
|
|
# Redirections and other preprocessing
# One element in redirectPermanent: redirect unconditionally to that target.
if(~ $#redirectPermanent 1) {
    perm_redirect $"redirectPermanent
}
# Two elements: a regexp and its replacement, applied to host+URI.
if not if(~ $#redirectPermanent 2 && {echo $SERVER_NAME^$REQUEST_URI | grep -s $redirectPermanent(1)}) {
    # Experimental regexp sub-based redirect, probably should find a nicer interface
    # For now only used at sites/harmful.cat-v.org/software/OO_programming/_config
    to=`{echo $SERVER_NAME^$REQUEST_URI | sed 's@'^$redirectPermanent(1)^'@'^$redirectPermanent(2)^'@'}
    if(! ~ $to $REQUEST_URI) {
        perm_redirect $to
    }
}
|
|
|
|
|
2008-09-21 09:01:51 -06:00
|
|
|
# Set Page title
# With no page-specific title, use the site title and subtitle alone;
# otherwise put the page title in front of them.
# Every variable is flattened with $": `~` never matches when its subject is
# an empty list, so an unset pageTitle used to fall through to the second
# branch and produce a title starting with " | ".
if(~ $"pageTitle '')
    pageTitle=$"siteTitle^' '^$"siteSubTitle
if not
    pageTitle=$"pageTitle^' | '^$"siteTitle^' '^$"siteSubTitle
|
2008-06-27 16:53:24 -06:00
|
|
|
|
2007-06-04 12:57:18 -06:00
|
|
|
|
|
|
|
# Turn the request path into a path under the site directory.
body=$sitedir/$body
if (test -d $body) {
    # Directories are served with a trailing slash. The slash is inserted in
    # front of any query string: appending it to the whole REQUEST_URI turned
    # /dir?x=1 into /dir?x=1/, which still names /dir without a slash.
    if(! ~ $body */)
        perm_redirect `{echo $REQUEST_URI | sed 's,(\?.*)?$,/\1,'}
    # A directory request is answered by its index page.
    body=$body/index
}
|
|
|
|
|
2008-09-25 03:06:14 -06:00
|
|
|
# Choose the handler for this request; genbody runs it later.
select_handler

# Template/body selection
# Resolve the master template name to the site, master-site or global copy.
master_template= `{get_lib_file $master_template}

# html: headers plus master template, followed by the closing tags.
if(~ $response_format html) {
    # Is awk_buffer really useful?
    template $headers $master_template | awk_buffer
    echo '</body></html>'
}
# raw: the master template alone, read from standard input.
if not if(~ $response_format raw)
    template < $master_template
|