yacy_search_server/htroot/Wiki.java
orbiter c08f9b36a4 refactoring of wiki parser.
This was done to prepare the wiki parser as parser for wikipedia dumps, which will be used for performance test (to omit crawling)

git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5785 6c8d7289-2bf4-0310-a012-ef5d649a1542
2009-04-08 15:28:45 +00:00

275 lines
12 KiB
Java

// Wiki.java
// -----------------------
// part of the AnomicHTTPD caching proxy
// (C) by Michael Peter Christen; mc@yacy.net
// first published on http://www.anomic.de
// Frankfurt, Germany, 2004
// last major change: 01.07.2003
//
// This program is free software; you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation; either version 2 of the License, or
// (at your option) any later version.
//
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with this program; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
// Contains contributions from Alexander Schier [AS]
// and Marc Nause [MN]
// You must compile this file with
// javac -classpath .:../classes Wiki.java
// if the shell's current path is HTROOT
import java.io.IOException;
import java.io.UnsupportedEncodingException;
import java.text.SimpleDateFormat;
import java.util.Date;
import java.util.HashMap;
import java.util.Iterator;
import de.anomic.data.diff;
import de.anomic.data.wiki.wikiBoard;
import de.anomic.http.httpRequestHeader;
import de.anomic.plasma.plasmaSwitchboard;
import de.anomic.server.serverObjects;
import de.anomic.server.serverSwitch;
import de.anomic.yacy.yacyNewsPool;
import de.anomic.yacy.yacyNewsRecord;
public class Wiki {
//private static String ListLevel = "";
//private static String numListLevel = "";
private static SimpleDateFormat SimpleFormatter = new SimpleDateFormat("yyyy/MM/dd HH:mm:ss");
public static String dateString(final Date date) {
return SimpleFormatter.format(date);
}
public static serverObjects respond(final httpRequestHeader header, serverObjects post, final serverSwitch<?> env) throws IOException {
final plasmaSwitchboard sb = (plasmaSwitchboard) env;
final serverObjects prop = new serverObjects();
if (post == null) {
post = new serverObjects();
post.put("page", "start");
}
final boolean authenticated = sb.adminAuthenticated(header) >= 2;
final int display = ((post == null) || (!authenticated)) ? 0 : post.getInt("display", 0);
prop.put("display", display);
String access = sb.getConfig("WikiAccess", "admin");
final String pagename = get(post, "page", "start");
final String ip = get(post, httpRequestHeader.CONNECTION_PROP_CLIENTIP, "127.0.0.1");
String author = get(post, "author", "anonymous");
if (author.equals("anonymous")) {
author = wikiBoard.guessAuthor(ip);
if (author == null) {
if (sb.webIndex.peers().mySeed() == null) author = "anonymous";
else author = sb.webIndex.peers().mySeed().get("Name", "anonymous");
}
}
if (post != null && post.containsKey("access")) {
// only the administrator may change the access right
if (!sb.verifyAuthentication(header, true)) {
// check access right for admin
prop.put("AUTHENTICATE", "admin log-in"); // force log-in
return prop;
}
access = post.get("access", "admin");
sb.setConfig("WikiAccess", access);
}
if (access.equals("admin")) prop.put("mode_access", "0");
if (access.equals("all")) prop.put("mode_access", "1");
wikiBoard.entry page = sb.wikiDB.read(pagename);
if (post != null && post.containsKey("submit")) {
if ((access.equals("admin") && (!sb.verifyAuthentication(header, true)))) {
// check access right for admin
prop.put("AUTHENTICATE", "admin log-in"); // force log-in
return prop;
}
// store a new page
byte[] content;
try {
content = post.get("content", "").getBytes("UTF-8");
} catch (final UnsupportedEncodingException e) {
content = post.get("content", "").getBytes();
}
final wikiBoard.entry newEntry = sb.wikiDB.newEntry(pagename, author, ip, post.get("reason", "edit"), content);
sb.wikiDB.write(newEntry);
// create a news message
final HashMap<String, String> map = new HashMap<String, String>();
map.put("page", pagename);
map.put("author", author.replace(',', ' '));
if (post.get("content", "").trim().length() > 0 && !page.page().equals(content))
sb.webIndex.peers().newsPool.publishMyNews(yacyNewsRecord.newRecord(sb.webIndex.peers().mySeed(), yacyNewsPool.CATEGORY_WIKI_UPDATE, map));
page = newEntry;
prop.putHTML("LOCATION", "/Wiki.html?page=" + pagename);
}
if (post != null && post.containsKey("edit")) {
if ((access.equals("admin") && (!sb.verifyAuthentication(header, true)))) {
// check access right for admin
prop.put("AUTHENTICATE", "admin log-in"); // force log-in
return prop;
}
// edit the page
try {
prop.put("mode", "1"); //edit
prop.putHTML("mode_author", author);
prop.putHTML("mode_page-code", new String(page.page(), "UTF-8"));
prop.putHTML("mode_pagename", pagename);
} catch (final UnsupportedEncodingException e) {}
}
//contributed by [MN]
else if (post != null && post.containsKey("preview")) {
// preview the page
prop.put("mode", "2");//preview
prop.putHTML("mode_pagename", pagename);
prop.putHTML("mode_author", author);
prop.put("mode_date", dateString(new Date()));
prop.putWiki("mode_page", post.get("content", ""));
prop.putHTML("mode_page-code", post.get("content", ""));
}
//end contrib of [MN]
else if (post != null && post.containsKey("index")) {
// view an index
prop.put("mode", "3"); //Index
String subject;
try {
final Iterator<byte[]> i = sb.wikiDB.keys(true);
wikiBoard.entry entry;
int count=0;
while (i.hasNext()) {
subject = new String(i.next());
entry = sb.wikiDB.read(subject);
prop.putHTML("mode_pages_"+count+"_name",wikiBoard.webalize(subject));
prop.putHTML("mode_pages_"+count+"_subject", subject);
prop.put("mode_pages_"+count+"_date", dateString(entry.date()));
prop.putHTML("mode_pages_"+count+"_author", entry.author());
count++;
}
prop.put("mode_pages", count);
} catch (final IOException e) {
prop.put("mode_error", "1"); //IO Error reading Wiki
prop.putHTML("mode_error_message", e.getMessage());
}
prop.putHTML("mode_pagename", pagename);
}
else if (post != null && post.containsKey("diff")) {
// Diff
prop.put("mode", "4");
prop.putHTML("mode_page", pagename);
prop.putHTML("mode_error_page", pagename);
try {
final Iterator<byte[]> it = sb.wikiDB.keysBkp(true);
wikiBoard.entry entry;
wikiBoard.entry oentry = null;
wikiBoard.entry nentry = null;
int count = 0;
boolean oldselected = false, newselected = false;
while (it.hasNext()) {
entry = sb.wikiDB.readBkp(new String(it.next()));
prop.put("mode_error_versions_" + count + "_date", wikiBoard.dateString(entry.date()));
prop.put("mode_error_versions_" + count + "_fdate", dateString(entry.date()));
if (wikiBoard.dateString(entry.date()).equals(post.get("old", null))) {
prop.put("mode_error_versions_" + count + "_oldselected", "1");
oentry = entry;
oldselected = true;
} else if (wikiBoard.dateString(entry.date()).equals(post.get("new", null))) {
prop.put("mode_error_versions_" + count + "_newselected", "1");
nentry = entry;
newselected = true;
}
count++;
}
count--; // don't show current version
if (!oldselected) // select latest old entry
prop.put("mode_error_versions_" + (count - 1) + "_oldselected", "1");
if (!newselected) // select latest new entry (== current)
prop.put("mode_error_curselected", "1");
if (count == 0) {
prop.put("mode_error", "2"); // no entries found
} else {
prop.put("mode_error_versions", count);
}
entry = sb.wikiDB.read(pagename);
if (entry != null) {
prop.put("mode_error_curdate", wikiBoard.dateString(entry.date()));
prop.put("mode_error_curfdate", dateString(entry.date()));
}
if (nentry == null) nentry = entry;
if (post.containsKey("compare") && oentry != null && nentry != null) {
// TODO: split into paragraphs and compare them with the same diff-algo
final diff diff = new diff(
new String(oentry.page(), "UTF-8"),
new String(nentry.page(), "UTF-8"), 3);
prop.put("mode_versioning_diff", de.anomic.data.diff.toHTML(new diff[] { diff }));
prop.put("mode_versioning", "1");
} else if (post.containsKey("viewold") && oentry != null) {
prop.put("mode_versioning", "2");
prop.putHTML("mode_versioning_pagename", pagename);
prop.putHTML("mode_versioning_author", oentry.author());
prop.put("mode_versioning_date", dateString(oentry.date()));
prop.putWiki("mode_versioning_page", oentry.page());
prop.putHTML("mode_versioning_page-code", new String(oentry.page(), "UTF-8"));
}
} catch (final IOException e) {
prop.put("mode_error", "1"); //IO Error reading Wiki
prop.putHTML("mode_error_message", e.getMessage());
}
}
else {
// show page
prop.put("mode", "0"); //viewing
prop.putHTML("mode_pagename", pagename);
prop.putHTML("mode_author", page.author());
prop.put("mode_date", dateString(page.date()));
prop.putWiki("mode_page", page.page());
prop.put("controls", "0");
prop.putHTML("controls_pagename", pagename);
}
// return rewrite properties
return prop;
}
/**
* get key from post, use dflt if (not present or post == null)
*
* @param post
* @param string
* @param string2
* @return
*/
private static String get(final serverObjects post, final String key, final String dflt) {
return (post == null ? dflt : post.get(key, dflt));
}
}