# Apache configuration for COCANWIKI.
-# $Id: cocanwiki.conf,v 1.22 2005/11/16 16:06:33 rich Exp $
+# $Id: cocanwiki.conf,v 1.23 2005/11/23 11:32:37 rich Exp $
# Uncomment the following lines if necessary. You will probably need
# to adjust the paths to reflect where cocanwiki is really installed.
RewriteRule ^/_recent.rss$ /_bin/recent_rss.cmo [PT,L,QSA]
RewriteRule ^/_search$ /_bin/search.cmo [PT,L,QSA]
RewriteRule ^/_sitemap$ /_bin/sitemap.cmo [PT,L,QSA]
+RewriteRule ^/sitemap\.xml$ /_bin/sitemap_xml.cmo [PT,L,QSA]
RewriteRule ^/_userprefs$ /_bin/user_prefs_form.cmo [PT,L,QSA]
RewriteRule ^/_users$ /_bin/users.cmo [PT,L,QSA]
(* COCANWIKI - a wiki written in Objective CAML.
* Written by Richard W.M. Jones <rich@merjis.com>.
* Copyright (C) 2004 Merjis Ltd.
- * $Id: cocanwiki_date.ml,v 1.2 2005/04/02 17:30:54 rich Exp $
+ * $Id: cocanwiki_date.ml,v 1.3 2005/11/23 11:32:38 rich Exp $
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
let printable_date_time (date, time) =
sprintf "%d %s %04d %02d:%02d" date.Dbi.day (short_month date.Dbi.month)
date.Dbi.year time.Dbi.hour time.Dbi.min
+
+(* ISO 8601 timestamp.
+ *
+ * Formats a Dbi (date, time) pair as "YYYY-MM-DDThh:mm:ss" followed by a
+ * zone designator: "Z" when the time carries no timezone, otherwise a
+ * signed offset such as "+01:00" or "-05:00".  The timezone value is
+ * treated as a whole number of hours, so the minutes part is always "00".
+ *)
+let iso_8601_date_time (date, time) =
+  let zone =
+    match time.Dbi.timezone with
+    | None -> "Z"
+    | Some t ->
+      (* Emit the sign separately: a hard-coded "+" in front of %02d
+       * would render a negative offset as the invalid "+-5:00". *)
+      sprintf "%c%02d:00" (if t < 0 then '-' else '+') (abs t)
+  in
+  sprintf "%04d-%02d-%02dT%02d:%02d:%02d%s"
+    date.Dbi.year date.Dbi.month date.Dbi.day
+    time.Dbi.hour time.Dbi.min time.Dbi.sec zone
--- /dev/null
+(* COCANWIKI - a wiki written in Objective CAML.
+ * Written by Richard W.M. Jones <rich@merjis.com>.
+ * Copyright (C) 2004 Merjis Ltd.
+ * $Id: sitemap_xml.ml,v 1.1 2005/11/23 11:32:37 rich Exp $
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; see the file COPYING. If not, write to
+ * the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+ * Boston, MA 02111-1307, USA.
+ *)
+
+open Apache
+open Registry
+open Cgi
+open Printf
+
+open Cocanwiki
+open Cocanwiki_template
+open Cocanwiki_date
+open Cocanwiki_strings
+
+(* For Google sitemap.xml specification, please see:
+ * https://www.google.com/webmasters/sitemaps/docs/en_GB/protocol.html
+ *)
+
+let run r (q : cgi) (dbh : Dbi.connection) hostid { hostname = hostname } _ = (* Script handler: fills the "sitemap.xml" template with one row per page of host [hostid] and sends it via [q]. *)
+ let template = get_template dbh hostid "sitemap.xml" in
+
+ (* Pull out all the current pages: rows for this host with a non-null url and no redirect.  Column 2 (url = 'index') is ordered descending, then url, so the index row is expected to sort first (assumes true sorts above false in the database -- confirm). *)
+ let sth = dbh#prepare_cached "select p.url, p.url = 'index',
+ p.last_modified_date
+ from pages p
+ where p.hostid = ? and p.url is not null
+ and p.redirect is null
+ order by 2 desc, 1" in
+ sth#execute [`Int hostid];
+
+ let table = (* One list of template bindings per row returned by the query. *)
+ sth#map
+ (function [`String url; `Bool is_index;
+ `Timestamp last_modified_date] ->
+ let url = if is_index then "" else url in (* The index page is emitted with an empty path. *)
+ let last_modified_date = iso_8601_date_time last_modified_date in
+ let priority = if is_index then "1.0" else "0.5" in (* The index page gets priority 1.0; every other page gets 0.5. *)
+ [ "url", Template.VarString url;
+ "last_modified_date", Template.VarString last_modified_date;
+ "priority", Template.VarString priority ]
+ | xs -> failwith (Dbi.sdebug xs)) in (* Any other row shape raises Failure carrying Dbi.sdebug's rendering of the row. *)
+
+ template#set "hostname" hostname;
+ template#table "sitemap" table;
+
+ q#template ~content_type:"application/xml" template (* Send the filled template with an explicit XML content type. *)
+
+let () =
+ register_script ~restrict:[CanView] run (* Register [run] as this script's handler; presumably only users holding CanView may invoke it -- confirm against register_script. *)
--- /dev/null
+<?xml version="1.0" encoding="UTF-8"?>
+<urlset xmlns="http://www.google.com/schemas/sitemap/0.84">
+
+<url>
+<loc>http://::hostname::/_recent</loc>
+<changefreq>daily</changefreq>
+</url>
+
+<url>
+<loc>http://::hostname::/_sitemap</loc>
+</url>
+
+::table(sitemap)::<url>
+<loc>http://::hostname::/::url_html::</loc>
+<lastmod>::last_modified_date_html::</lastmod>
+<priority>::priority_html::</priority>
+</url>
+::end::
+
+</urlset>
\ No newline at end of file