yacy_search_server/source/de/anomic/tools/loaderThreads.java
orbiter c12bb8a6d0 - refactoring of the http client
- added a protection against memory leaks for the access tracker

git-svn-id: https://svn.berlios.de/svnroot/repos/yacy/trunk@5621 6c8d7289-2bf4-0310-a012-ef5d649a1542
2009-02-19 16:24:46 +00:00

221 lines
7.5 KiB
Java

// loaderThreads.java
// ---------------------------
// (C) by Michael Peter Christen; mc@yacy.net
// first published on http://www.anomic.de
// Frankfurt, Germany, 2004
// last major change: 28.09.2004
//
// This program is free software; you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation; either version 2 of the License, or
// (at your option) any later version.
//
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with this program; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
package de.anomic.tools;
import java.util.ArrayList;
import java.util.Hashtable;
import de.anomic.crawler.HTTPLoader;
import de.anomic.http.httpClient;
import de.anomic.http.httpRemoteProxyConfig;
import de.anomic.http.httpRequestHeader;
import de.anomic.kelondro.util.FileUtils;
import de.anomic.yacy.yacyURL;
public class loaderThreads {
// global values for loader threads
protected int timeout;
protected String user;
protected String password;
protected httpRemoteProxyConfig remoteProxyConfig;
// management objects for collection of threads
Hashtable<String, Thread> threads;
int completed, failed;
public loaderThreads() {
this(10000, null, null);
}
public loaderThreads(
final int timeout,
final String user,
final String password
) {
this.timeout = timeout;
this.user = user;
this.password = password;
this.threads = new Hashtable<String, Thread>();
this.completed = 0;
this.failed = 0;
}
public void newPropLoaderThread(final String name, final yacyURL url) {
newThread(name, url, new propLoader());
}
public void newThread(final String name, final yacyURL url, final loaderProcess process) {
final Thread t = new loaderThread(url, process);
threads.put(name, t);
t.start();
}
public void terminateThread(final String name) {
final loaderThread t = (loaderThread) threads.get(name);
if (t == null) throw new RuntimeException("no such thread: " + name);
t.terminate();
}
public int threadCompleted(final String name) {
final loaderThread t = (loaderThread) threads.get(name);
if (t == null) throw new RuntimeException("no such thread: " + name);
return t.completed();
}
public int threadStatus(final String name) {
final loaderThread t = (loaderThread) threads.get(name);
if (t == null) throw new RuntimeException("no such thread: " + name);
return t.status();
}
public int completed() {
return completed;
}
public int failed() {
return failed;
}
public int count() {
return threads.size();
}
public Exception threadError(final String name) {
final loaderThread t = (loaderThread) threads.get(name);
if (t == null) throw new RuntimeException("no such thread: " + name);
return t.error();
}
protected class loaderThread extends Thread {
private final yacyURL url;
private Exception error;
private final loaderProcess process;
private byte[] page;
private boolean loaded;
public loaderThread(final yacyURL url, final loaderProcess process) {
this.url = url;
this.process = process;
this.error = null;
this.page = null;
this.loaded = false;
}
public void run() {
try {
final httpRequestHeader reqHeader = new httpRequestHeader();
reqHeader.put(httpRequestHeader.USER_AGENT, HTTPLoader.crawlerUserAgent);
page = httpClient.wget(url.toString(), reqHeader, timeout);
loaded = true;
process.feed(page);
if (process.status() == loaderCore.STATUS_FAILED) {
error = process.error();
}
if ((process.status() == loaderCore.STATUS_COMPLETED) ||
(process.status() == loaderCore.STATUS_FINALIZED)) completed++;
if ((process.status() == loaderCore.STATUS_ABORTED) ||
(process.status() == loaderCore.STATUS_FAILED)) failed++;
} catch (final Exception e) {
error = e;
failed++;
}
}
public void terminate() {
process.terminate();
}
public boolean loaded() {
return loaded;
}
public int completed() {
if (process.status() == loaderCore.STATUS_READY) return 1;
if (process.status() == loaderCore.STATUS_RUNNING) return 9 + ((process.completed() * 9) / 10);
if (process.status() == loaderCore.STATUS_COMPLETED) return 100;
return 0;
}
public int status() {
return process.status(); // see constants in loaderCore
}
public Exception error() {
return error;
}
}
public static class propLoader extends loaderCore implements loaderProcess {
public propLoader() {
this.status = STATUS_READY;
}
public synchronized void feed(final byte[] v) {
this.status = STATUS_RUNNING;
this.completion = 1;
int line = 0;
String s, key, value;
int p;
final ArrayList<String> lines = FileUtils.strings(v, "UTF-8");
try {
while ((this.run) && (line < lines.size())) {
// parse line and construct a property
s = lines.get(line);
if ((s != null) && ((p = s.indexOf('=')) > 0)) {
key = s.substring(0, p).trim();
value = s.substring(p + 1).trim();
if (key.length() > 0) result.put(key, value);
}
// update thread information
line++;
this.completion = 100 * line / lines.size();
}
if (line == lines.size()) {
this.status = STATUS_COMPLETED;
} else {
this.status = STATUS_ABORTED;
}
return;
} catch (final Exception e) {
this.status = STATUS_FAILED;
this.error = e;
return;
}
}
}
/*
public static void main(String[] args) {
httpdProxyHandler.setRemoteProxyConfig(httpRemoteProxyConfig.init("192.168.1.122", 3128));
loaderThreads loader = new loaderThreads();
try {
loader.newPropLoaderThread("load1", new yacyURL("http://www.anomic.de/superseed.txt", null));
} catch (MalformedURLException e) {
}
}
*/
}