• Hadoop记录- Yarn Job MAX


    #!/bin/sh
    #yarn job status:NEW、NEW_SAVING、SUBMITTED、ACCEPTED、RUNNING、FINISHED、FAILED、KILLED
    nnum=$(xx/yarn application -list -appStates NEW | wc -l)
    nsnum=$(xx/yarn application -list -appStates NEW_SAVING | wc -l)
    snum=$(xx/yarn application -list -appStates SUBMITTED | wc -l)
    anum=$(xx/yarn application -list -appStates ACCEPTED | wc -l)
    rnum=$(/xx/yarn application -list -appStates RUNNING | wc -l)
    finum=$(xx/yarn application -list -appStates FINISHED | wc -l)
    fanum=$(xxx/yarn application -list -appStates FAILED | wc -l)
    knum=$(xxx/yarn application -list -appStates KILLED | wc -l)
    let nnum=nnum-2
    let nsnum=nsnum-2
    let snum=snum-2
    let anum=anum-2
    let rnum=rnum-2
    let finum=finum-2
    let fanum=fanum-2
    let knum=knum-2
    vnum=($nnum $nsnum $snum $anum $rnum $finum $fanum $knum)
    vkey=(NEW NEW_SAVING SUBMITTED ACCEPTED RUNNING FINISHED FAILED KILLED)
    url="http://xxx/monitor/report/sendReport"
    #yarn applicaiton -status application_1554987290796_77895
    for (( i = 0 ; i < ${#vnum[@]} ; i++ ))
    do
      for (( j = 0 ; j < ${#vkey[@]} ; j++ ))
      do
      if [ $i -eq $j ]
      then
      key="xx.yarn_job_state_"${vkey[$j]}"_count##xxx"
      value=${vnum[$i]}
      data="{"key":"$key","value":$value}"
      echo $data
      cmd="curl -s -X POST -H 'Content-type':'application/json' -d '${data}' ${url}"
      sh -c "$cmd"
      fi
      done
    done
    
    #!/bin/sh
    ip=xxx
    port=8088
    export HADOOP_HOME=/app/hadoop/bin
    rmstate1=$($HADOOP_HOME/yarn rmadmin -getServiceState rm1)
    rmstate2=$($HADOOP_HOME/yarn rmadmin -getServiceState rm2)
    if [[ $rmstate1 == *active* ]]
    then
       ip=xxx
    fi
    $HADOOP_HOME/yarn application -list -appStates RUNNING | awk '{print $1}' | grep -i "application" >appname.txt
    curl http://$ip:$port/ws/v1/cluster/scheduler | jq . | sed 's/"//g' > scheduler.json
    sed -i '1,5d' scheduler.json 
    sed -n -e :a -e '1,33!{P;N;D;};N;ba' scheduler.json > nscheduler.json
    cat nscheduler.json | grep -i "queueName" | awk -F ": " '{print $2}' | awk -F "," '{print $1}' > qname.txt
    cat nscheduler.json | grep -i "memory" | awk -F ": " '{print $2}' | awk -F "," '{print $1}' > memory.txt
    line=$(cat memory.txt | wc -l)
    for((j=2;j<$line;j=j+6))
    do
      sed -n '$jp' memory.txt >> maxmemory.txt  
    done
    app=($(cat appname.txt | awk '{print $1}'))
    for (( i = 0 ; i < ${#app[@]} ; i++ ))
    do
        queue=$(curl http://$ip:$port/ws/v1/cluster/apps/${app[$i]} | jq . | sed 's/"//g'  | grep -i "queue" | awk -F ":" '{print $2}')
        allocatedMB=$(curl http://$ip:$port/ws/v1/cluster/apps/${app[$i]} | jq . | sed 's/"//g'  | grep -i "allocatedMB" | awk -F ":" '{print $2}')
        nparr=($(cat nscheduler.json | grep -i "numPendingApps" | awk -F ": " '{print $2}' | awk -F "," '{print $1}'))
        for((j=0;j<=${#nparr[@]};j++))
        do
           if [${nparr[$j]} -gt 10 ]
           then
              qname=$(sed -n '$jp' qname.txt)
              mem=$(sed -n '$jp' maxmemory.txt)
              if [ $qname -eq $queue ]
              then
                     rate=$(echo "sclae=2; $allocatedMB/$mem" | bc) 
                     if [ $rate -gt 0.2 ]
                     then
                        $HADOOP_HOME/yarn application  -kill  ${app[$i]}
                     fi
              fi
            fi 
        done
    done
    #查看任务的详细信息
    #$HADOOP_HOME/yarn applicaiton -status ${app[$i]}
    curl http://$ip:$port/ws/v1/cluster/apps/application_1554987290796_688678
    #查看任务状态
    curl http://$ip:$port/ws/v1/cluster/apps/application_1409421698529_0012/state
    #kill任务
    curl -v -X PUT -d '{"state": "KILLED"}''http://$ip:$port/ws/v1/cluster/apps/application_1409421698529_0012'
    #队列资源信息
    curl http://$ip:$port/ws/v1/cluster/scheduler
    #查看指定队列的所有任务:
    curl http://$ip:$port/ws/v1/cluster/apps?queue=default
    #查看整个集群的指标
    curl http://$ip:$port/ws/v1/cluster/metrics
    #查看队列的状态
    yarn queue -status default
  • 相关阅读:
    2020第29周日
    pytest文档44-allure.dynamic动态生成用例标题
    python笔记46-史上最强大最好用的python日志模块nb_log
    pytest文档43-元数据使用(pytest-metadata)
    pytest文档42-fixture参数化params
    ASP.NET Core WebApi+EF Core入门到实战演练
    SqlParameter中的new SqlParameter("e",0)的陷阱坑,你知道?
    EF Linq中的左连接Left Join查询
    .NET Core EFCore零基础快速入门简单使用
    git报错,远程克隆和更新不下来解决方法
  • 原文地址:https://www.cnblogs.com/xinfang520/p/10725337.html
Copyright © 2020-2023  润新知