yacy_search_server/source/net/yacy/http/ProxyCacheHandler.java

98 lines
4.1 KiB
Java
Raw Normal View History

2011-04-13 15:28:28 +02:00
//
// ProxyCacheHandler
// Copyright 2004 by Michael Peter Christen; mc@yacy.net, Frankfurt a. M., Germany
// Copyright 2011 by Florian Richter
// First released 2011 at http://yacy.net
//
// $LastChangedDate$
// $LastChangedRevision$
// $LastChangedBy$
//
// This library is free software; you can redistribute it and/or
// modify it under the terms of the GNU Lesser General Public
// License as published by the Free Software Foundation; either
// version 2.1 of the License, or (at your option) any later version.
//
// This library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
// Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public License
// along with this program in the file lgpl21.txt
// If not, see <http://www.gnu.org/licenses/>.
//
package net.yacy.http;
import java.io.IOException;
import java.util.Map.Entry;
2014-01-05 15:06:40 +01:00
import javax.servlet.ServletException;
2011-04-13 15:28:28 +02:00
import javax.servlet.http.HttpServletRequest;
import javax.servlet.http.HttpServletResponse;
2014-01-05 15:06:40 +01:00
import net.yacy.cora.document.id.DigestURL;
2011-04-13 15:28:28 +02:00
import net.yacy.cora.protocol.RequestHeader;
import net.yacy.cora.protocol.ResponseHeader;
import net.yacy.crawler.data.Cache;
import net.yacy.crawler.retrieval.Response;
import net.yacy.http.servlets.YaCyDefaultServlet;
2011-04-13 15:28:28 +02:00
import org.eclipse.jetty.server.Handler;
import org.eclipse.jetty.server.Request;
/**
* jetty http handler serves pages from cache if available and valid
2011-04-13 15:28:28 +02:00
*/
public class ProxyCacheHandler extends AbstractRemoteHandler implements Handler {
2014-01-05 15:06:40 +01:00
private void handleRequestFromCache(@SuppressWarnings("unused") HttpServletRequest request, HttpServletResponse response, ResponseHeader cachedResponseHeader, byte[] content) throws IOException {
// TODO: check if-modified
for (Entry<String, String> entry : cachedResponseHeader.entrySet()) {
response.addHeader(entry.getKey(), entry.getValue());
}
response.setStatus(HttpServletResponse.SC_NON_AUTHORITATIVE_INFORMATION);
response.getOutputStream().write(content);
2011-04-13 15:28:28 +02:00
// we handled this request, break out of handler chain
}
@Override
public void handleRemote(String target, Request baseRequest, HttpServletRequest request, HttpServletResponse response) throws IOException, ServletException {
if (request.getMethod().equals("GET")) {
String queryString = request.getQueryString() != null ? "?" + request.getQueryString() : "";
DigestURL url = new DigestURL(request.getRequestURL().toString() + queryString);
ResponseHeader cachedResponseHeader = Cache.getResponseHeader(url.hash());
2011-04-13 15:28:28 +02:00
if (cachedResponseHeader != null) {
RequestHeader proxyHeaders = ProxyHandler.convertHeaderFromJetty(request);
// TODO: this convertion is only necessary
final net.yacy.crawler.retrieval.Request yacyRequest = new net.yacy.crawler.retrieval.Request(
null,
url,
proxyHeaders.referer() == null ? null : new DigestURL(proxyHeaders.referer().toNormalform(true)).hash(),
"",
2011-05-09 18:20:34 +02:00
cachedResponseHeader.lastModified(),
sb.crawler.defaultProxyProfile.handle(),
0,
sb.crawler.defaultProxyProfile.timezoneOffset());
2011-04-13 15:28:28 +02:00
final Response cachedResponse = new Response(
yacyRequest,
proxyHeaders,
2011-04-13 15:28:28 +02:00
cachedResponseHeader,
sb.crawler.defaultProxyProfile,
2014-06-12 05:23:26 +02:00
false,
null);
byte[] cacheContent = Cache.getContent(url.hash());
2011-04-13 15:28:28 +02:00
if (cacheContent != null && cachedResponse.isFreshForProxy()) {
handleRequestFromCache(request, response, cachedResponseHeader, cacheContent);
baseRequest.setHandled(true);
2011-04-13 15:28:28 +02:00
}
}
}
}
2011-04-13 15:28:28 +02:00
}