<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "DTD/xhtml1-transitional.dtd">
<!-- This page is only XHTML 1.0 Transitional because the target attribute is used in links -->
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
  <title>YaCy '#[clientname]#': URL Database Administration</title>
  #%env/templates/metas.template%#
  <!-- Optional auto-refresh after 5 seconds; the first alternative of the reload switch is empty -->
  #(reload)#::<meta http-equiv="REFRESH" content="5; url=/IndexControlURLs_p.html" />#(/reload)#
  <!-- Live URL search: the functions below query /solr/select while the user types -->
  <script type="text/javascript">
//<![CDATA[
/**
 * Key-up handler of the URL retrieval form.
 *
 * Reads the current value of the "urlstring" field of the form with the id
 * "searchform" and passes it to search(). Does nothing when the form or the
 * field is not present in the document.
 */
function xmlhttpPost() {
    var searchform = document.getElementById('searchform');
    if (!searchform || !searchform.urlstring) {
        return;
    }
    search(searchform.urlstring.value);
}
/**
 * Sends an asynchronous GET request to /solr/select that looks for the given
 * text as an exact phrase in several URL and host related index fields, and
 * hands the response body to updatepage() once the request has completed
 * successfully.
 *
 * @param {string} query text typed by the user (a URL, a host name or a part of it)
 */
function search(query) {
    // Keep the request object local: every key-up starts a new request, and a
    // shared reference would let a later request overwrite an earlier one
    // before its completion handler has run.
    var request = null;
    if (window.XMLHttpRequest) { // Mozilla/Safari
        request = new window.XMLHttpRequest();
    } else if (window.ActiveXObject) { // IE
        request = new window.ActiveXObject("Microsoft.XMLHTTP");
    }
    if (request === null) {
        return;
    }

    // Inside a quoted Solr phrase only the backslash and the double quote need escaping.
    var phrase = '"' + String(query).replace(/(["\\])/g, '\\$1') + '"';
    var fields = [
        'sku', 'host_s', 'host_dnc_s', 'host_organization_s',
        'host_organizationdnc_s', 'host_subdomain_s',
        'url_paths_sxt', 'url_file_name_s'
    ];
    var clauses = [];
    for (var i = 0; i < fields.length; i++) {
        clauses.push(fields[i] + ':' + phrase);
    }

    // The whole q value is URL-encoded so that spaces, quotes and ampersands
    // typed by the user cannot break the query string.
    var url = '/solr/select?q=' + encodeURIComponent(clauses.join(' OR ')) +
              '&start=0&rows=100&wt=yjson';

    request.open('GET', url, true);
    request.onreadystatechange = function () {
        // readyState 4 = request finished; only successful responses are rendered
        if (request.readyState == 4 && request.status == 200) {
            updatepage(request.responseText);
        }
    };
    request.send(null);
}
/**
 * Renders the response of the live URL search into the element with the id
 * "searchresults".
 *
 * The response is expected to carry a "channels" array whose first entry has
 * a "totalResults" value and an "items" array of objects with a "link"
 * property. When there is at least one hit, a table with one row per link is
 * written; otherwise the result area is emptied. If an element with the id
 * "raw" exists, the unparsed response text is shown in it.
 *
 * @param {string} str response body of the search request
 */
function updatepage(str) {
    // Escapes the characters that are significant in HTML text and attribute values.
    function escapeHtml(text) {
        return String(text)
            .replace(/&/g, "&amp;")
            .replace(/</g, "&lt;")
            .replace(/>/g, "&gt;")
            .replace(/"/g, "&quot;")
            .replace(/'/g, "&#39;");
    }

    var raw = document.getElementById("raw");
    if (raw != null) raw.innerHTML = escapeHtml(str);

    var target = document.getElementById("searchresults");
    if (target == null) return;

    var rsp;
    try {
        // NOTE(review): eval() runs the response as script. This is only
        // acceptable because the data comes from the same server; if the
        // yjson output is strict JSON, JSON.parse should replace it - confirm.
        rsp = eval("(" + str + ")");
    } catch (e) {
        // malformed response: show no results instead of failing in the handler
        target.innerHTML = "";
        return;
    }

    var firstChannel = (rsp && rsp.channels && rsp.channels.length > 0) ? rsp.channels[0] : null;
    var items = (firstChannel && firstChannel.items) ? firstChannel.items : [];
    // Strip every thousands separator so the value compares as a number.
    var totalResults = firstChannel ? String(firstChannel.totalResults).replace(/[,.]/g, "") : "0";

    var html = "";
    if (totalResults > 0 && items.length > 0) {
        html += "<table class=\"networkTable\" border=\"0\" cellpadding=\"2\" cellspacing=\"1\" width=\"99%\">";
        html += "<tr class=\"TableHeader\" valign=\"bottom\">";
        html += "<td>URL from index (total results = " + escapeHtml(totalResults) + ")<\/td><\/tr>";
        for (var i = 0; i < items.length; i++) {
            var link = String(items[i].link);
            // The link is URL-encoded for the query parameter and HTML-escaped for display.
            html += "<tr class=\"TableCellLight\"><td align=\"left\">" +
                    "<a href=\"IndexControlURLs_p.html?urlstringsearch=&amp;urlstring=" +
                    encodeURIComponent(link) + "\">" + escapeHtml(link) + "<\/a><\/td><\/tr>";
        }
        html += "<\/table>";
    }
    target.innerHTML = html;
}
//]]>
  </script>
</head>
<body id="IndexControl">
  <!-- shared page header and the sub menu of the index control pages -->
  #%env/templates/header.template%#
  #%env/templates/submenuIndexControl.template%#
<!-- API hint box: links to the Solr HTML view and to the XML metadata of the current URL hash -->
<div id="api">
  <a href="solr/select?defType=edismax&amp;start=0&amp;rows=3&amp;core=collection1&amp;wt=html&amp;q=id:%22#[urlhash]#%22">
    <img src="env/grafics/api.png" width="60" height="40" alt="API" /></a>
  <span>These document details can be retrieved as <a href="http://www.w3.org/TR/xhtml-rdfa-primer/" target="_blank">XHTML+RDFa</a>
    document containg <a href="http://www.w3.org/RDF/" target="_blank">RDF</a> annotations in <a href="http://dublincore.org/" target="_blank">Dublin Core</a> vocabulary.
    The XHTML+RDFa data format is both a XML content format and a HTML display format and is considered as an important <a href="http://www.w3.org/2001/sw/" target="_blank">Semantic Web</a> content format.
    The same content can also be retrieved as pure <a href="api/yacydoc.xml?urlhash=#[urlhash]#">XML metadata</a> with DC tag name vocabulary.
    Click the API icon to see an example call to the search rss API.
    To see a list of all APIs, please visit the <a href="http://www.yacy-websuche.de/wiki/index.php/Dev:API" target="_blank">API wiki page</a>.</span>
</div>
<h2>URL Database Administration</h2>
<p>The local index currently contains #[ucount]# URL references</p>
<!-- URL lookup form; every key-up inside the form calls xmlhttpPost(), whose results are written into the searchresults container -->
<form action="IndexControlURLs_p.html" id="searchform" method="post" enctype="multipart/form-data" accept-charset="UTF-8" onkeyup="xmlhttpPost(); return false;">
  <fieldset><legend>URL Retrieval</legend>
    <dl>
      <dt class="TableCellDark">Retrieve by URL:</dt>
      <dd><input type="text" name="urlstring" value="#[urlstring]#" size="40" maxlength="250" />
        <input type="submit" name="urlstringsearch" value="Show Details for URL" class="btn btn-primary" style="width:240px;" /><br />
        <!-- filled by the live search script -->
        <div id="searchresults"></div>
      </dd>
      <dt class="TableCellDark">Retrieve by URL-Hash:</dt>
      <dd><input type="text" name="urlhash" value="#[urlhash]#" size="40" maxlength="12" />
        <input type="submit" name="urlhashsearch" value="Show Details for URL-Hash" class="btn btn-primary" style="width:240px;" />
      </dd>
    </dl>
  </fieldset>
</form>
<!-- Deletion form: the dependent checkboxes and the Delete button start disabled;
     the onclick handlers of the index checkboxes enable them, and the Delete button asks for confirmation -->
<form action="IndexControlURLs_p.html" method="post" enctype="multipart/form-data" accept-charset="UTF-8">
  <fieldset #(cleanup)#disabled="disabled"::#(/cleanup)#><legend>Cleanup</legend>
    <dl>
      <dt class="TableCellDark">Index Deletion</dt>
      <dd><input type="checkbox" name="deleteIndex" id="deleteIndex"
            onclick="x=document.getElementById('deleteIndex').checked;#(rwi)#::document.getElementById('deleteRWI').checked=x;#(/rwi)#document.getElementById('deleteRobots').checked=x;document.getElementById('deleteCrawlQueues').checked=x;c='disabled';if(x){c='';};document.getElementById('deletecomplete').disabled=c;document.getElementById('deleteCache').disabled=c;document.getElementById('deleteFirstSeen').disabled=c;document.getElementById('deleteRobots').disabled=c;document.getElementById('deleteCrawlQueues').disabled=c;"
        /> Delete local search index (embedded Solr and old Metadata)<br />
        #(cleanupsolr)#::<input type="checkbox" name="deleteRemoteSolr" id="deleteRemoteSolr" onclick="x=document.getElementById('deleteRemoteSolr').checked;c='disabled';if(x){c='';};document.getElementById('deletecomplete').disabled=c;" /> Delete remote solr index<br />#(/cleanupsolr)#
        #(cleanuprwi)#::<input type="checkbox" name="deleteRWI" id="deleteRWI" onclick="x=document.getElementById('deleteRWI').checked;c='disabled';if(x){c='';};document.getElementById('deletecomplete').disabled=c;" /> Delete RWI Index (DHT transmission words)<br />#(/cleanuprwi)#
        #(cleanupcitation)#::<input type="checkbox" name="deleteCitation" id="deleteCitation" onclick="x=document.getElementById('deleteCitation').checked;c='disabled';if(x){c='';};document.getElementById('deletecomplete').disabled=c;" /> Delete Citation Index (linking between URLs)<br />#(/cleanupcitation)#
        <input type="checkbox" name="deleteFirstSeen" id="deleteFirstSeen" disabled="disabled" /> Delete First-Seen Date Table<br />
        <input type="checkbox" name="deleteCache" id="deleteCache" disabled="disabled" /> Delete HTTP &amp; FTP Cache<br />
        <input type="checkbox" name="deleteCrawlQueues" id="deleteCrawlQueues" disabled="disabled" /> Stop Crawler and delete Crawl Queues<br />
        <input type="checkbox" name="deleteRobots" id="deleteRobots" disabled="disabled" /> Delete robots.txt Cache<br />
        <input type="submit" name="deletecomplete" id="deletecomplete" value="Delete" disabled="disabled" class="btn btn-danger" style="width:240px;" onclick="return confirm('Confirm Deletion')" />
      </dd>
    </dl>
  </fieldset>
</form>
<!-- Solr maintenance forms (segment merge and core restart); only the second alternative of the switch below has content -->
#(dumprestore)#::
<form action="IndexControlURLs_p.html" method="post" enctype="multipart/form-data" accept-charset="UTF-8">
  <fieldset><legend>Optimize Solr</legend>
    <dl>
      <dt></dt>
      <dd>merge to max. <input type="text" name="optimizemax" value="#[optimizemax]#" size="6" maxlength="6" /> segments
        <input type="submit" name="optimizesolr" value="Optimize Solr" class="btn btn-primary" style="width:240px;" />
      </dd>
    </dl>
  </fieldset>
</form>
<form action="IndexControlURLs_p.html" method="post" enctype="multipart/form-data" accept-charset="UTF-8">
  <fieldset><legend>Reboot Solr Core</legend>
    <dl>
      <dt></dt>
      <dd><input type="submit" name="rebootsolr" value="Shut Down and Re-Start Solr" class="btn btn-primary" style="width:240px;" />
      </dd>
    </dl>
  </fieldset>
</form>::
#(/dumprestore)#
<!-- Form that requests the top-domain statistics; the number of lines to show is submitted as "lines" -->
#(statistics)#::
<form action="IndexControlURLs_p.html" method="post" enctype="multipart/form-data" accept-charset="UTF-8">
  <fieldset><legend>Statistics about top-domains in URL Database</legend>
    <dl>
      <dt></dt>
      <dd>Show top <input type="text" name="lines" value="#[lines]#" size="6" maxlength="6" /> domains from all URLs.
        <input type="submit" name="statistics" value="Generate Statistics" class="btn btn-primary" style="width:240px;" />
      </dd>
    </dl>
  </fieldset>
</form>
#(/statistics)#
<!-- Result table of the domain statistics: one row per domain with a form that deletes all URLs of that domain -->
#(statisticslines)#::
<p><em>Statistics about the top-#[domains]# domains in the database:</em></p>
<table>
  <tr class="TableHeader">
    <td align="center"></td>
    <td><strong>Domain</strong></td>
    <td><strong>URLs</strong></td>
  </tr>
  #{domains}#
  <tr class="TableCell#(dark)#Light::Dark#(/dark)#">
    <td>
      <form action="IndexControlURLs_p.html" method="post" enctype="multipart/form-data" accept-charset="UTF-8">
        <div>
          <input type="hidden" name="domain" value="#[domain]#" />
          <input type="hidden" name="lines" value="#[lines]#" />
          <input type="submit" name="deletedomain" value="delete all" class="btn btn-danger btn-xs" style="padding: 0px 12px;" />
        </div>
      </form>
    </td>
    <td><a href="http://#[domain]#/" target="_blank">#[domain]#</a></td>
    <td>#[count]#</td>
  </tr>
  #{/domains}#
</table>
#(/statisticslines)#
<!-- Details of a single URL hash: the switch below is either empty, a "not found" message,
     or the embedded Solr view followed by the content and deletion forms -->
#(genUrlProfile)#
::No entry found for URL-hash #[urlhash]#
::<iframe src="solr/select?defType=edismax&amp;start=0&amp;rows=3&amp;core=collection1&amp;wt=html&amp;q=id:%22#[urlhash]#%22" title="Solr document view" width="100%" height="420" frameborder="0" scrolling="no"></iframe><br />
<form action="ViewFile.html" method="get" accept-charset="UTF-8">
  <input type="hidden" name="viewMode" value="parsed" />
  <input type="hidden" name="show" value="Show" />
  <input type="hidden" name="urlHash" value="#[urlhash]#" />
  <input type="submit" value="Show Content" name="showcontent" class="btn btn-primary" style="width:240px;" /><br />
</form>
<form action="IndexControlURLs_p.html" method="post" enctype="multipart/form-data" accept-charset="UTF-8">
  <input type="hidden" name="keystring" value="" />
  <input type="hidden" name="keyhash" value="" />
  <input type="hidden" name="urlstring" value="" />
  <input type="hidden" name="urlhash" value="#[urlhash]#" />
  <input type="submit" value="Delete URL" name="urlhashdelete" class="btn btn-primary" style="width:240px;" /><br />
  <span class="small">this may produce unresolved references at other word indexes but they do not harm</span><br /><br />
  <input type="submit" value="Delete URL and remove all references from words" name="urlhashdeleteall" class="btn btn-primary" style="width:240px;" /><br />
  <span class="small">delete the reference to this url at every other word where the reference exists (very extensive, but prevents unresolved references)</span><br />
</form>
#(/genUrlProfile)#
<!-- result text of the last executed action, followed by the shared page footer -->
#[result]#
#%env/templates/footer.template%#
</body>
</html>