mirror of
https://github.com/yacy/yacy_search_server.git
synced 2024-09-21 00:00:13 +02:00
2fb6ebe88a
Background: some user report problem with connecting/crawling some sites via https which require SNI support (by default switched off in YaCy). On the other hand systems not demanding SNI support are sometimes not properly configured and due to a bug/feature in java 1.7 connection is aborted. The later is more often the case, so the default is still fine. With the java start parameter expert user can no alter the startparameter to -Djsse.enableSNIExtension=true (java default) if they crawl more hosts requiring SNI support. The alternative to let YaCy try both during https handshake (deep inside the httpclient) is not pursut at this time.
221 lines
6.2 KiB
Bash
Executable File
221 lines
6.2 KiB
Bash
Executable File
#!/usr/bin/env sh
|
|
JAVA="`which java`"
|
|
CONFIGFILE="DATA/SETTINGS/yacy.conf"
|
|
LOGFILE="yacy.log"
|
|
PIDFILE="yacy.pid"
|
|
OS="`uname`"
|
|
|
|
#get javastart args
|
|
JAVA_ARGS="-server -Djava.awt.headless=true -Dfile.encoding=UTF-8 -Djsse.enableSNIExtension=false";
|
|
#rem -Djsse.enableSNIExtension=false fix a ssl problem in Java 1.7, see http://teknosrc.com/javax-net-ssl-sslprotocolexception-handshake-alert-unrecognized_name-solved/
|
|
|
|
#JAVA_ARGS="-verbose:gc -XX:+PrintGCTimeStamps -XX:+PrintGCDetails $JAVA_ARGS";
|
|
|
|
#check if OS is Sun Solaris or one of the OpenSolaris distributions and use different version of id if necessary
|
|
if [ $OS = "SunOS" ]
|
|
then
|
|
# only this version of id supports the parameter -u
|
|
ID="/usr/xpg4/bin/id"
|
|
else
|
|
# regular id for any other case (especially Linux and OSX)
|
|
ID="id"
|
|
fi
|
|
|
|
if [ ! -x "$JAVA" ]
|
|
then
|
|
echo "The java command is not executable."
|
|
echo "Either you have not installed java or it is not in your PATH"
|
|
#Cron supports setting the path in
|
|
#echo "Has this script been invoked by CRON?"
|
|
#echo "if so, please set PATH in the crontab, or set the correct path in the variable in this script."
|
|
exit 1
|
|
fi
|
|
|
|
usage() {
|
|
cat - <<USAGE
|
|
startscript for YaCy on UNIX-like systems
|
|
Options
|
|
-h, --help show this help
|
|
-t, --tail-log show the output of "tail -f DATA/LOG/yacy00.log" after starting YaCy
|
|
-l, --logging save the output of YaCy to yacy.log
|
|
-d, --debug show the output of YaCy on the console
|
|
-p, --print-out only print the command, which would be executed to start YaCy
|
|
-g, --gui start a gui for YaCy
|
|
USAGE
|
|
}
|
|
|
|
#startup YaCy
|
|
cd "`dirname $0`"
|
|
|
|
if [ $OS = "OpenBSD" ]
|
|
then
|
|
if [ $(echo $@ | grep -o "\-\-" | wc -l) -ne 0 ]
|
|
then
|
|
echo "WARNING: Unfortunately this script does not support long options in $OS."
|
|
fi
|
|
|
|
options="`getopt hdlptg: $*`"
|
|
else
|
|
options="`getopt -n YaCy -o h,d,l,p,t,g -l help,debug,logging,print-out,tail-log,gui -- $@`"
|
|
fi
|
|
|
|
if [ $? -ne 0 ];then
|
|
|
|
exit 1;
|
|
fi
|
|
|
|
isparameter=0; #options or parameter part of getopts?
|
|
parameter="" #parameters will be collected here
|
|
|
|
LOGGING=0
|
|
DEBUG=0
|
|
PRINTONLY=0
|
|
TAILLOG=0
|
|
GUI=0
|
|
for option in $options;do
|
|
if [ $isparameter -ne 1 ];then #option
|
|
case $option in
|
|
-h|--help)
|
|
usage
|
|
exit 3
|
|
;;
|
|
-l|--logging)
|
|
LOGGING=1
|
|
if [ $DEBUG -eq 1 ];then
|
|
echo "can not combine -l and -d"
|
|
exit 1;
|
|
fi
|
|
;;
|
|
-d|--debug)
|
|
DEBUG=1
|
|
# enable asserts
|
|
JAVA_ARGS="$JAVA_ARGS -ea -Dcom.sun.management.jmxremote.port=9999 -Dcom.sun.management.jmxremote.authenticate=false -Dcom.sun.management.jmxremote.ssl=false"
|
|
if [ $LOGGING -eq 1 ];then
|
|
echo "can not combine -l and -d"
|
|
exit 1;
|
|
fi
|
|
;;
|
|
-p|--print-out)
|
|
PRINTONLY=1
|
|
;;
|
|
-t|--tail-log)
|
|
TAILLOG=1
|
|
;;
|
|
-g|--gui)
|
|
GUI=1
|
|
isparameter=1
|
|
;;
|
|
esac #case option
|
|
else #parameter
|
|
if [ x$option = "--" ];then #option / parameter separator
|
|
isparameter=1;
|
|
continue
|
|
else
|
|
parameter="$parameter $option"
|
|
fi
|
|
fi #parameter or option?
|
|
done
|
|
|
|
#echo $options;exit 0 #DEBUG for getopts
|
|
|
|
#check if Linux system supports large memory pages or if OS is Solaris which
|
|
#supports large memory pages since version 9
|
|
#(according to http://java.sun.com/javase/technologies/hotspot/largememory.jsp)
|
|
ENABLEHUGEPAGES=0;
|
|
|
|
if [ $OS = "Linux" ]
|
|
then
|
|
HUGEPAGESTOTAL="`cat /proc/meminfo | grep HugePages_Total | sed s/[^0-9]//g`"
|
|
if [ -n "$HUGEPAGESTOTAL" ] && [ $HUGEPAGESTOTAL -ne 0 ]
|
|
then
|
|
ENABLEHUGEPAGES=1
|
|
fi
|
|
# the G1 GC is on by default in Java7, so we try that here as well
|
|
# JAVA_ARGS="$JAVA_ARGS -XX:+UnlockExperimentalVMOptions -XX:+UseG1GC"
|
|
elif [ $OS = "SunOS" ]
|
|
then
|
|
# the UseConcMarkSweepGC option caused a full CPU usage - bug on Darwin.
|
|
# It was reported that the same option causes good performance on solaris.
|
|
JAVA_ARGS="$JAVA_ARGS -XX:+UseConcMarkSweepGC -XX:+CMSIncrementalMode"
|
|
ENABLEHUGEPAGES=1
|
|
fi
|
|
|
|
#turn on support for large memory pages if supported by OS
|
|
if [ $ENABLEHUGEPAGES -eq 1 ]
|
|
then
|
|
JAVA_ARGS="$JAVA_ARGS -XX:+UseLargePages"
|
|
fi
|
|
|
|
#turn on MMap for Solr if OS is a 64bit OS
|
|
if [ -n "`uname -m | grep 64`" ]; then JAVA_ARGS="$JAVA_ARGS -Dsolr.directoryFactory=solr.MMapDirectoryFactory"; fi
|
|
|
|
if [ ! -f $CONFIGFILE -a -f DATA/SETTINGS/httpProxy.conf ]
|
|
then
|
|
# old config if new does not exist
|
|
CONFIGFILE="DATA/SETTINGS/httpProxy.conf"
|
|
fi
|
|
if [ -f $CONFIGFILE ]
|
|
then
|
|
# startup memory
|
|
for i in Xmx Xms; do
|
|
j="`grep javastart_$i $CONFIGFILE | sed 's/^[^=]*=//'`";
|
|
if [ -n $j ]; then JAVA_ARGS="-$j $JAVA_ARGS"; fi;
|
|
done
|
|
|
|
# Priority
|
|
j="`grep javastart_priority $CONFIGFILE | sed 's/^[^=]*=//'`";
|
|
|
|
if [ ! -z "$j" ];then
|
|
if [ -n $j ]; then JAVA="nice -n $j $JAVA"; fi;
|
|
fi
|
|
|
|
PORT="`grep ^port= $CONFIGFILE | sed 's/^[^=]*=//'`";
|
|
|
|
# for i in `grep javastart $CONFIGFILE`;do
|
|
# i="${i#javastart_*=}";
|
|
# JAVA_ARGS="-$i $JAVA_ARGS";
|
|
# done
|
|
else
|
|
JAVA_ARGS="-Xmx600m -Xms180m $JAVA_ARGS";
|
|
PORT="8090"
|
|
fi
|
|
|
|
#echo "JAVA_ARGS: $JAVA_ARGS"
|
|
#echo "JAVA: $JAVA"
|
|
|
|
# generating the proper classpath
|
|
CLASSPATH=""
|
|
for N in lib/*.jar; do CLASSPATH="$CLASSPATH$N:"; done
|
|
CLASSPATH=".:htroot:$CLASSPATH"
|
|
|
|
cmdline="$JAVA $JAVA_ARGS -classpath $CLASSPATH net.yacy.yacy";
|
|
if [ $GUI -eq 1 ] #gui
|
|
then
|
|
cmdline="$cmdline -gui $parameter"
|
|
fi
|
|
if [ $DEBUG -eq 1 ] #debug
|
|
then
|
|
cmdline=$cmdline
|
|
elif [ $LOGGING -eq 1 ];then #logging
|
|
cmdline="$cmdline >> yacy.log & echo \$! > $PIDFILE"
|
|
else
|
|
cmdline="$cmdline >/dev/null 2>/dev/null &"
|
|
fi
|
|
if [ $PRINTONLY -eq 1 ];then
|
|
echo $cmdline
|
|
else
|
|
echo "****************** YaCy Web Crawler/Indexer & Search Engine *******************"
|
|
echo "**** (C) by Michael Peter Christen, usage granted under the GPL Version 2 ****"
|
|
echo "**** USE AT YOUR OWN RISK! Project home and releases: http://yacy.net/ ****"
|
|
echo "** LOG of YaCy: DATA/LOG/yacy00.log (and yacy<xx>.log) **"
|
|
echo "** STOP YaCy: execute stopYACY.sh and wait some seconds **"
|
|
echo "** GET HELP for YaCy: see http://wiki.yacy.net and http://forum.yacy.de **"
|
|
echo "*******************************************************************************"
|
|
echo " >> YaCy started as daemon process. Administration at http://localhost:$PORT << "
|
|
eval $cmdline
|
|
if [ "$TAILLOG" -eq "1" -a ! "$DEBUG" -eq "1" ];then
|
|
sleep 1
|
|
tail -f DATA/LOG/yacy00.log
|
|
fi
|
|
fi
|