yacy_search_server/htroot/IndexReIndexMonitor_p.html

170 lines
8.1 KiB
HTML
Raw Normal View History

<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" >
<head>
<title>YaCy '#[clientname]#': Field Re-Indexing</title>
#%env/templates/metas.template%#
</head>
<body id="IndexReindexMonitor">
#%env/templates/header.template%#
#%env/templates/submenuIndexControl.template%#
<h2>Field Re-Indexing</h2>
<p>In case that an index schema of the embedded/local index has changed, all documents with missing field entries can be indexed again with a reindex job.</p>
<form action="IndexReIndexMonitor_p.html" method="post" enctype="multipart/form-data" accept-charset="UTF-8">
<table><tr valign="top"><td>
<input type="hidden" name="transactionToken" value="#[transactionToken]#"/>
<fieldset>
<table>
<tr>
<td>Documents in current queue</td>
<td>#[querysize]#</td>
<td>#(reindexjobrunning)#::<input type="submit" value="refresh page" class="btn btn-success"/>#(/reindexjobrunning)#</td>
</tr>
<tr>
<td>Documents processed</td>
<td>#[docsprocessed]#</td>
<td></td>
</tr>
<tr>
<td>current select query </td>
<td>#[currentselectquery]#</td>
<td></td>
</tr>
<tr>
<td>&nbsp;</td>
<td></td>
<td></td>
</tr>
</table>
#(reindexjobrunning)#
<input type="submit" name="reindexnow" value="start reindex job now" class="btn btn-primary"/>
::<input type="submit" name="stopreindex" value="stop reindexing" class="btn btn-danger"/>
#(/reindexjobrunning)#
<p class="info">#[infomessage]#</p>
</fieldset>
</td><td>
#(reindexjobrunning)#::
<fieldset><legend>Remaining field list</legend>
<p>reindex documents containing these fields: </p>
<table>
<tr><th>Field</th><th>count</th></tr>
#{fieldlist}#
<tr>
<td>#[fieldname]#</td> <td align="right">#[fieldscore]#</td>
</tr>
#{/fieldlist}#
</table>
</fieldset>
#(/reindexjobrunning)#
</td></tr></table>
</form>
<h2>Re-Crawl Index Documents</h2>
<p>Searches the local index and selects documents to add to the crawler (recrawl the document).
This runs transparent as background job. Documents are added to the crawler only if no other crawls are active
and are added in small chunks.</p>
<div class="container-fluid">
<div class="row">
<form action="IndexReIndexMonitor_p.html?setup=recrawljob" method="post" enctype="multipart/form-data" accept-charset="UTF-8" class="col-md-10 col-lg-6">
<input type="hidden" name="transactionToken" value="#[transactionToken]#" />
<table><tr valign="top"><td>
#(recrawljobrunning)#
<fieldset>
#(error)#::
<div class="alert alert-danger" role="alert">Re-crawl works only with an embedded local Solr index!</div>
#(/error)#
<div class="form-group">
<label>Solr query <input type="text" name="recrawlquerytext" size="40" value="#[recrawlquerytext]#" /></label>
<input type="submit" name="simulateRecrawl" value="Simulate" class="btn btn-default" title="Check only how many documents would be selected for recrawl"/>
</div>
#(simulationResult)#
::
<div class="alert alert-success" role="alert">#[docCount]# #(showSelectLink)#document(s)::<a href="#[browseSelectedUrl]#" target="recrawlCandidates" title="Browse metadata of the #[rows]# first selected documents">document(s)</a>#(/showSelectLink)# selected for recrawl.</div>
::
<div class="alert alert-danger" role="alert">An error occurred when trying to run the selection query.</div>
::
<div class="alert alert-danger" role="alert">The Solr index is not connected. Please restart your peer.</div>
#(/simulationResult)#
<div class="form-group">
<label>Include failed URLs <input type="checkbox" name="includefailedurls" #(includefailedurls)#::checked="checked"#(/includefailedurls)# /></label>
</div>
<input type="submit" name="recrawlDefaults" value="Set defaults" class="btn btn-default" title="Reset to default values"/>
<input type="submit" name="recrawlnow" value="start recrawl job now" class="btn btn-primary"/>
to re-crawl documents selected with the given query.
</fieldset>::
#(/recrawljobrunning)#
</td>
<td>
#(recrawljobrunning)#::
<fieldset><legend>Re-Crawl Query Details</legend>
<table>
<tr>
<td>Documents to process</td><td>#[docCount]#</td>
</tr>
<tr>
<td>Current Query</td><td>#[recrawlquerytext]#</td>
</tr>
<tr>
<td>&nbsp;</td><td> </td>
</tr>
<tr>
<td>&nbsp;</td><td> </td>
</tr>
<tr>
<td>Edit Solr Query</td><td><input type="text" name="recrawlquerytext" size="40" value="#[recrawlquerytext]#" /><input type="submit" name="updquery" value="update" class="btn btn-sm btn-default"/></td>
</tr>
<tr>
<td>include failed urls</td><td><input type="checkbox" name="includefailedurls" onchange="this.form.submit()" #(includefailedurls)#::checked="checked"#(/includefailedurls)# /></td>
</tr>
</table>
<input type="submit" name="stoprecrawl" value="stop recrawl job" class="btn btn-danger"/>
</fieldset>
#(/recrawljobrunning)#
</td>
</tr></table>
</form>
#(recrawlReport)#::
<div class="col-md-10 col-lg-6">
<div class="panel panel-info">
<div class="panel-heading">
<h3 class="panel-title">#(jobStatus)#::::Last #(/jobStatus)#Re-Crawl job report</h3>
</div>
<div class="panel-body">
<table class="table">
<tbody>
<tr>
<th scope="row">Status</th>
<td>#(jobStatus)#Running::Shutdown in progress::Terminated#(/jobStatus)#</td>
</tr>
<tr>
<th scope="row">Start time</th>
<td>#[startTime]#</td>
</tr>
<tr>
<th scope="row">End time</th>
<td>#[endTime]#</td>
</tr>
<tr>
<th scope="row">Count</th>
<td>#[recrawledUrlsCount]# URLs added to the crawler queue for recrawl</td>
</tr>
</tbody>
</table>
#(jobStatus)#
<a class="btn btn-default" href="IndexReIndexMonitor_p.html" role="button"><span class="glyphicon glyphicon-refresh"></span> Refresh</a>
::
<a class="btn btn-default" href="IndexReIndexMonitor_p.html" role="button"><span class="glyphicon glyphicon-refresh"></span> Refresh</a>
::
#(/jobStatus)#
</div>
</div>
</div>
#(/recrawlReport)#
</div>
</div>
#%env/templates/footer.template%#
</body>
</html>