【收藏】Linux服务器巡检的重要性,附脚本!

2022-10-27 19:09:15 浏览数 (1)

前言:

Linux服务器是系统重要的业务运行平台,对服务器进行巡检能够及时发现服务器的隐患,以便于改善和优化服务器的性能;观察服务器的运行状况,及时对设备进行调整,保证服务器的24小时不间断的工作;以及采集网内服务器信息。在此,为了便于运维人员顺利的完成服务器巡检工作,小编写了此文档,希望对Linux服务器的巡检工作起到指导、帮助的作用。

一、巡检项目

1、服务器硬件检查

2.操作系统检查

3.性能检查

4.安全检查

二、收集的脚本

巡检项信息如下(也可自行添加收集信息的模块):

1)、系统基本信息

2)、cpu信息

3)、ip网络信息

4)、cpu使用率

5)、连接数信息

6)、系统限制信息

7)、内存使用信息

8)、磁盘使用信息

9)、网络流量情况/系统资源变化

10)、cpu消耗情况前10排行

11)、cpu消耗按内存情况前10排行

12)、磁盘io情况

13)、系统定时任务列表

14)、系统定时任务脚本内容

脚本使用前注意事项

需要使用root用户执行 下载脚本:

  1. 使用说明 脚本中 ifconfig、mpstat、iostat命令有依赖,需要安装相关依赖包 yum -y install bc sysstat net-tools
  2. 执行chmod 777 oswatch.sh;然后直接sh oswatch.sh执行;
  1. 执行完巡检之后,将在脚本所在的路径下生成html巡检结果报告,如下:

脚本内容如下:

代码语言:javascript复制
#!/bin/bash
ipaddress=`ip a|grep "global"|awk '{print $2}' |awk -F/ '{print $1}'`
file_output=${ipaddress}'_os_linux_summary.html'
td_str=''
th_str=''
yum -y install bc sysstat net-tools;
sleep 10;
create_html_css(){
  echo -e "<html>
<head>
<style type="text/css">
    body        {font:12px Courier New,Helvetica,sansserif; color:black; background:White;}
    table,tr,td {font:12px Courier New,Helvetica,sansserif; color:Black; background:#FFFFCC; padding:0px 0px 0px 0px; margin:0px 0px 0px 0px;} 
    th          {font:bold 12px Courier New,Helvetica,sansserif; color:White; background:#0033FF; padding:0px 0px 0px 0px;} 
    h1          {font:bold 12pt Courier New,Helvetica,sansserif; color:Black; padding:0px 0px 0px 0px;} 
</style>
</head>
<body>"
}
create_html_head(){
echo -e "<h1>$1</h1>"
}
create_table_head1(){
  echo -e "<table width="68%" border="1" bordercolor="#000000" cellspacing="0px" style="border-collapse:collapse">"
}
create_table_head2(){
  echo -e "<table width="100%" border="1" bordercolor="#000000" cellspacing="0px" style="border-collapse:collapse">"
}
create_td(){
    td_str=`echo $1 | awk 'BEGIN{FS="|"}''{i=1; while(i<=NF) {print "<td>"$i"</td>";i  }}'`
}
create_th(){
    th_str=`echo $1|awk 'BEGIN{FS="|"}''{i=1; while(i<=NF) {print "<th>"$i"</th>";i  }}'`
}
create_tr1(){
  create_td "$1"
  echo -e "<tr>
    $td_str
  </tr>" >> $file_output
}
create_tr2(){
  create_th "$1"
  echo -e "<tr>
    $th_str
  </tr>" >> $file_output
}
create_tr3(){
  echo -e "<tr><td>
  <pre style="font-family:Courier New; word-wrap: break-word; white-space: pre-wrap; white-space: -moz-pre-wrap" >
  `cat $1`
  </pre></td></tr>" >> $file_output
}
create_table_end(){
  echo -e "</table>"
}
create_html_end(){
  echo -e "</body></html>"
}
NAME_VAL_LEN=12
name_val () {
   printf "% *s | %sn" "${NAME_VAL_LEN}" "$1" "$2"
}
get_physics(){
    name_val "巡检时间" "`date`"
    name_val "主机名" "`uname -n`"
    name_val "系统版本" "`cat /etc/{oracle,redhat,SuSE,centos}-release 2>/dev/null|sort -ru|head -n1`"
    name_val "内核版本" "`uname -r`"
    name_val "架构" "CPU=`lscpu|grep Architecture|awk -F: '{print $2}'|sed 's/^[[:space:]]*//g'`;OS=`getconf LONG_BIT`-bit"
}
get_cpuinfo () {
   file="/proc/cpuinfo"
   virtual=`grep -c ^processor "${file}"`
   physical=`grep 'physical id' "${file}" | sort -u | wc -l`
   cores=`grep 'cpu cores' "${file}" | head -n 1 | cut -d: -f2`
   model=`grep "model name" "${file}"|sort -u|awk -F: '{print $2}'`
   speed=`grep -i "cpu MHz" "${file}"|sort -u|awk -F: '{print $2}'`
   cache=`grep -i "cache size" "${file}"|sort -u|awk -F: '{print $2}'`
   SysCPUIdle=`vmstat | sed -n '$ p' | awk '{print $15}'`
   [ "${physical}" = "0" ] && physical="${virtual}"
   [ -z "${cores}" ] && cores=0
   cores=$((${cores} * ${physical}));
   htt=""
   if [ ${cores} -gt 0 -a $cores -lt $virtual ]; then htt=yes; else htt=no; fi
   name_val "线程" "physical = ${physical}, cores = ${cores}, virtual = ${virtual}, hyperthreading = ${htt}"
   name_val "cpu型号" "${physical} x ${model}"
   name_val "速度" "${virtual} x ${speed} MHz"
   name_val "缓存" "${virtual} x ${cache}"
   name_val "CPU空闲率(%)" "${SysCPUIdle}%"
}
get_netinfo(){
   echo "interface | status | ipadds     |      mtu    |  Speed     |     Duplex" >>/tmp/tmpnet_h1_`date  %y%m%d`.txt
   for ipstr in `ifconfig -a|grep ": flags"|awk  '{print $1}'|sed 's/.$//'`
   do
      ipadds=`ifconfig ${ipstr}|grep -w inet|awk '{print $2}'`
      mtu=`ifconfig ${ipstr}|grep mtu|awk '{print $NF}'`
      speed=`ethtool ${ipstr}|grep Speed|awk -F: '{print $2}'`
      duplex=`ethtool ${ipstr}|grep Duplex|awk -F: '{print $2}'`
      echo "${ipstr}"  "up" "${ipadds}" "${mtu}" "${speed}" "${duplex}"
      |awk '{print $1,"|", $2,"|", $3,"|", $4,"|", $5,"|", $6}'  >>/tmp/tmpnet1_`date  %y%m%d`.txt
   done
}
get_cpuuse(){
   echo "#######################################  cpu使用率  #######################################" >>/tmp/tmp_cpuuse_`date  %y%m%d`.txt
   mpstat -P ALL 10 8 >>/tmp/tmp_cpuuse_`date  %y%m%d`.txt
}
get_connections (){
  filemax=`cat /proc/sys/fs/file-max`
  name_val "Number of concurrent connections" "${filemax}"
}
get_ulimitinfo(){
   echo "#######################################  系统限制最大进程数  #######################################" >>/tmp/tmp_ulimitinfo_`date  %y%m%d`.txt
   ulimit -a >>/tmp/tmp_ulimitinfo_`date  %y%m%d`.txt
   echo "#######################################  env  #######################################" >>/tmp/tmp_ulimitinfo_`date  %y%m%d`.txt
   env >>/tmp/tmp_ulimitinfo_`date  %y%m%d`.txt
}
get_meminfo(){
   echo "Locator   |Size     |Speed       |Form Factor  | Type      |    Type Detail" >>/tmp/tmpmem3_h1_`date  %y%m%d`.txt
   dmidecode| grep -v "Memory Device Mapped Address"|grep -A12 -w "Memory Device" 
   |egrep "Locator:|Size:|Speed:|Form Factor:|Type:|Type Detail:" 
   |awk -F: '/Size|Type|Form.Factor|Type.Detail|^[t ] Locator/{printf("|%s", $2)}/^[t ] Speed/{print "|" $2}' 
   |grep -v "No Module Installed" 
   |awk -F"|" '{print $4,"|", $2,"|", $7,"|", $3,"|", $5,"|", $6}' >>/tmp/tmpmem3_t1_`date  %y%m%d`.txt
   free -glht >>/tmp/tmpmem2_`date  %y%m%d`.txt
   memtotal=`vmstat -s | head -1 | awk '{print $1}'`
   avm=`vmstat -s| sed -n '3p' | awk '{print $1}'`
   name_val "Mem_used_rate(%)" "`echo "100*${avm}/${memtotal}" | bc`%" >>/tmp/tmpmem1_`date  %y%m%d`.txt
  
}
get_diskinfo(){
   echo "Filesystem        |Type   |Size |  Used  | Avail | Use%  | Mounted on | Opts" >>/tmp/tmpdisk_h1_`date  %y%m%d`.txt
   df -ThP|grep -v tmpfs|sed '1d'|sort >/tmp/tmpdf1_`date  %y%m%d`.txt
   mount -l|awk '{print $1,$6}'|grep ^/|sort >/tmp/tmpdf2_`date  %y%m%d`.txt
   join /tmp/tmpdf1_`date  %y%m%d`.txt /tmp/tmpdf2_`date  %y%m%d`.txt
   |awk '{print $1,"|", $2,"|", $3,"|", $4,"|", $5,"|", $6,"|", $7,"|", $8}' >>/tmp/tmpdisk_t1_`date  %y%m%d`.txt 
   lsblk >>/tmp/tmpdisk1_`date  %y%m%d`.txt 
   for disk in `ls -l /sys/block|awk '{print $9}'|sed '/^$/d'|grep -v fd`
   do
      echo "${disk}" `cat /sys/block/${disk}/queue/scheduler`  >>/tmp/tmpdisk2_`date  %y%m%d`.txt 
   done
  echo "==========df -h============" >>/tmp/tmpdisk2_`date  %y%m%d`.txt  
  df -h >>/tmp/tmpdisk2_`date  %y%m%d`.txt 
  echo "==========mount============" >>/tmp/tmpdisk2_`date  %y%m%d`.txt  
  mount >>/tmp/tmpdisk2_`date  %y%m%d`.txt 
  echo "==========fdisk -l============" >>/tmp/tmpdisk2_`date  %y%m%d`.txt  
  fdisk -l >>/tmp/tmpdisk2_`date  %y%m%d`.txt 

   pvs >>/tmp/tmpdisk3_`date  %y%m%d`.txt
   echo "======================  =====  =====  =====  =====  =====  ==========  =======" >>/tmp/tmpdisk3_`date  %y%m%d`.txt
   vgs >>/tmp/tmpdisk3_`date  %y%m%d`.txt
   echo "======================  =====  =====  =====  =====  =====  ==========  =======" >>/tmp/tmpdisk3_`date  %y%m%d`.txt
   lvs >>/tmp/tmpdisk3_`date  %y%m%d`.txt
}
   ##xiao changge 
get_topproc(){
   #os load
   echo "#######################################  网络流量情况  #######################################" >>/tmp/tmpload_`date  %y%m%d`.txt
   sar -n DEV 10 6 >>/tmp/tmpload_`date  %y%m%d`.txt
   echo "#######################################  ip add  #######################################" >>/tmp/tmpload_`date  %y%m%d`.txt
   ip add >>/tmp/tmpload_`date  %y%m%d`.txt
   echo "#######################################  ss -t -a  #######################################" >>/tmp/tmpload_`date  %y%m%d`.txt
   ss -t -a  >>/tmp/tmpload_`date  %y%m%d`.txt
   echo "#######################################  netstat -lntp  #######################################" >>/tmp/tmpload_`date  %y%m%d`.txt
   netstat -lntp  >>/tmp/tmpload_`date  %y%m%d`.txt
   echo "#######################################  netstat -anp  #######################################" >>/tmp/tmpload_`date  %y%m%d`.txt
   netstat -anp  >>/tmp/tmpload_`date  %y%m%d`.txt
   echo "#######################################  netstat -rn  #######################################" >>/tmp/tmpload_`date  %y%m%d`.txt
   netstat -rn  >>/tmp/tmpload_`date  %y%m%d`.txt

   echo "#######################################  系统资源变化  #######################################" >>/tmp/tmptop_`date  %y%m%d`.txt
   vmstat -S M 10 6  >>/tmp/tmptop_`date  %y%m%d`.txt
   mpstat 1 5 >>/tmp/tmptop_`date  %y%m%d`.txt
   echo "#######################################  消耗CPU前十排行  #######################################" >>/tmp/tmptop_`date  %y%m%d`.txt
   ps aux|head -1 >>/tmp/tmptop_`date  %y%m%d`.txt
   ps aux|grep -v PID|sort -rn -k  3|head  >>/tmp/tmptop_`date  %y%m%d`.txt
   sleep 2;
   echo "#######################################  消耗内存前十排行  #######################################" >>/tmp/tmptop_`date  %y%m%d`.txt
   ps aux|head -1  >>/tmp/tmptop_`date  %y%m%d`.txt
   ps aux|grep -v PID|sort -rn -k  4|head  >>/tmp/tmptop_`date  %y%m%d`.txt
   sleep 2;
   echo "#######################################  TOP资源监控  #######################################" >>/tmp/tmptop_`date  %y%m%d`.txt
   top -bn1 -o "%CPU"|sed  -n '1,80p' >>/tmp/tmptop_`date  %y%m%d`.txt
   sleep 2;
  echo "#######################################  显示进程信息ps -ef  #######################################" >>/tmp/tmptop_`date  %y%m%d`.txt
   ps -ef >>/tmp/tmptop_`date  %y%m%d`.txt
   sleep 2;   
   
   #top i/o
   echo "#######################################  磁盘io情况  #######################################" >>/tmp/tmptopio_`date  %y%m%d`.txt
   iostat -k -d 10 5  >>/tmp/tmptopio_`date  %y%m%d`.txt
}
get_crontablist(){
   crontab -l >>/tmp/tmp_crontab_`date  %y%m%d`.txt
  if [ -s /tmp/tmp_crontab_`date  %y%m%d`.txt ] ; then 
    echo 'ths file is not empyt and file info'
  else
    echo '#### 无定时任务 ####' >>/tmp/tmp_crontab_`date  %y%m%d`.txt
  fi
}
get_crontab_content(){
   crontab_content_log=/tmp/tmp_crontab_content_`date  %y%m%d`.txt
   crontab -l|awk -F ' ' '{ print $NF}' >>$crontab_content_log

   contrab_num=`crontab -l|awk -F ' ' '{ print $NF}'|wc -l`
   if [ $contrab_num -ne 0 ];then
   count=1
   while [ $count -le $contrab_num ]
     do
       echo "#######################################  获取系统定时任务脚本 $count 内容开始  #######################################" >>/tmp/tmp_crontab_shellcontent_`date  %y%m%d`.txt
       cat `sed -n -e "${count}p" $crontab_content_log` >>/tmp/tmp_crontab_shellcontent_`date  %y%m%d`.txt
       echo -e "n#######################################  获取系统定时任务脚本 $count 内容结束  #######################################n" >>/tmp/tmp_crontab_shellcontent_`date  %y%m%d`.txt
     count=$[${count} 1]
     done
   else
     echo '#### 无定时执行脚本 ####' >>/tmp/tmp_crontab_shellcontent_`date  %y%m%d`.txt
   fi
}
create_html(){
  rm -rf $file_output
  touch $file_output
  create_html_css >> $file_output
  
  create_html_head "系统基本信息" >> $file_output
  create_table_head1 >> $file_output
  get_physics >>/tmp/tmpos_summ_`date  %y%m%d`.txt
  while read line
  do
    create_tr1 "$line" 
  done < /tmp/tmpos_summ_`date  %y%m%d`.txt
  create_table_end >> $file_output
  
  create_html_head "cpu信息" >> $file_output
  create_table_head1 >> $file_output
  get_cpuinfo >>/tmp/tmp_cpuinfo_`date  %y%m%d`.txt
  while read line
  do
    create_tr1 "$line" 
  done < /tmp/tmp_cpuinfo_`date  %y%m%d`.txt  
  create_table_end >> $file_output

  create_html_head "ip网络信息" >> $file_output
  create_table_head1 >> $file_output
  get_netinfo
  while read line
  do
    create_tr2 "$line" 
  done < /tmp/tmpnet_h1_`date  %y%m%d`.txt
  while read line
  do
    create_tr1 "$line" 
  done < /tmp/tmpnet1_`date  %y%m%d`.txt
  create_table_end >> $file_output

  create_html_head "cpu使用率" >> $file_output
  create_table_head1 >> $file_output
  get_cpuuse
  create_tr3 "/tmp/tmp_cpuuse_`date  %y%m%d`.txt"
  create_table_end >> $file_output

  create_html_head "连接数信息" >> $file_output
  create_table_head1 >> $file_output
  get_connections >>/tmp/tmp_connections_`date  %y%m%d`.txt
  while read line
  do
    create_tr1 "$line" 
  done < /tmp/tmp_connections_`date  %y%m%d`.txt  
  create_table_end >> $file_output

  create_html_head "系统限制信息" >> $file_output
  create_table_head1 >> $file_output
  get_ulimitinfo
  create_tr3 "/tmp/tmp_ulimitinfo_`date  %y%m%d`.txt"
  create_table_end >> $file_output  

  create_html_head "内存使用信息" >> $file_output
  create_table_head1 >> $file_output
  get_meminfo
  while read line
  do
    create_tr1 "$line" 
  done < /tmp/tmpmem1_`date  %y%m%d`.txt
  create_table_end >> $file_output
  
  create_table_head1 >> $file_output
  create_tr3 "/tmp/tmpmem2_`date  %y%m%d`.txt"
  create_table_end >> $file_output
  
  create_table_head1 >> $file_output
  while read line
  do
    create_tr2 "$line" 
  done < /tmp/tmpmem3_h1_`date  %y%m%d`.txt
  
  while read line
  do
    create_tr1 "$line" 
  done < /tmp/tmpmem3_t1_`date  %y%m%d`.txt
  create_table_end >> $file_output
  
  create_html_head "磁盘使用信息" >> $file_output
  create_table_head1 >> $file_output
  get_diskinfo
  while read line
  do
    create_tr2 "$line" 
  done < /tmp/tmpdisk_h1_`date  %y%m%d`.txt
  while read line
  do
    create_tr1 "$line" 
  done < /tmp/tmpdisk_t1_`date  %y%m%d`.txt
  create_table_end >> $file_output
  
  create_table_head1 >> $file_output
  create_tr3 "/tmp/tmpdisk1_`date  %y%m%d`.txt"
  create_table_end >> $file_output
  
  create_table_head1 >> $file_output
  create_tr3 "/tmp/tmpdisk2_`date  %y%m%d`.txt"
  create_table_end >> $file_output
  
  create_table_head1 >> $file_output
  create_tr3 "/tmp/tmpdisk3_`date  %y%m%d`.txt"
  create_table_end >> $file_output

  create_html_head "网络流量情况" >> $file_output
  create_table_head1 >> $file_output
  get_topproc
  create_tr3 "/tmp/tmpload_`date  %y%m%d`.txt"
  create_table_end >> $file_output
  
  create_html_head "性能相关监控" >> $file_output
  create_table_head1 >> $file_output
  sed -i 's/</----/g' "/tmp/tmptop_`date  %y%m%d`.txt"  >>/tmp/tmptop_`date  %y%m%d`.txt
  create_tr3 "/tmp/tmptop_`date  %y%m%d`.txt"
  create_table_end >> $file_output
  
  create_html_head "磁盘io情况" >> $file_output
  create_table_head1 >> $file_output
  create_tr3 "/tmp/tmptopio_`date  %y%m%d`.txt"
  create_table_end >> $file_output

  create_html_head "定时任务信息" >> $file_output
  create_table_head1 >> $file_output
  get_crontablist
  create_tr3 "/tmp/tmp_crontab_`date  %y%m%d`.txt"
  create_table_end >> $file_output

  create_html_head "定时任务脚本内容" >> $file_output
  create_table_head1 >> $file_output
  get_crontab_content
  create_tr3 "/tmp/tmp_crontab_shellcontent_`date  %y%m%d`.txt"
  create_table_end >> $file_output

  create_html_end >> $file_output
  sed -i 's/BORDER=1/width="68%" border="1" bordercolor="#000000" cellspacing="0px" style="border-collapse:collapse"/g' $file_output
  rm -rf /tmp/tmp*_`date  %y%m%d`.txt
}
# This script must be executed as root
RUID=`id|awk -F( '{print $1}'|awk -F= '{print $2}'`
if [ ${RUID} != "0" ];then
    echo"This script must be executed as root"
    exit 1
fi
PLATFORM=`uname`
if [ ${PLATFORM} = "HP-UX" ] ; then
    echo "This script does not support HP-UX platform for the time being"
exit 1
elif [ ${PLATFORM} = "SunOS" ] ; then
    echo "This script does not support SunOS platform for the time being"
exit 1
elif [ ${PLATFORM} = "AIX" ] ; then
    echo "This script does not support AIX platform for the time being"
exit 1
elif [ ${PLATFORM} = "Linux" ] ; then
  create_html
fi

执行完成后html展示截图:

Linux脚本链接:

https://pan.baidu.com/s/13eNUtJrVBo6DRdLenoWGDw

提取码: hm8u

0 人点赞