mindxdl--common--log_record.go

// Copyright (c) 2021. Huawei Technologies Co., Ltd. All rights reserved.

// Package common define common utils
package common

import (
   "bufio"
   "context"
   "errors"
   "io"
   "os"
   "path"
   "strconv"
   "strings"
   "sync"
   "time"

   "github.com/gin-gonic/gin"
   corev1 "k8s.io/api/core/v1"
   metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
   "k8s.io/apimachinery/pkg/labels"
   "k8s.io/client-go/kubernetes"

   "huawei.com/mindxdl/base/common/constants"
   "huawei.com/npu-exporter/hwlog"
)

// logChanMap holds one stop channel per started log-record goroutine, keyed by
// srcModule + "-" + svcName. StartLogRecord creates the map lazily and adds
// entries; StopLogRecord signals, closes and removes them.
// NOTE(review): no lock guards this map in this file — confirm that
// StartLogRecord/StopLogRecord are never invoked concurrently.
var logChanMap map[string]chan bool

// LogQueryResp is the payload returned by a service log query.
type LogQueryResp struct {
   // LogContent holds the selected log lines joined with "\n".
   LogContent string `json:"logContent"`
   // RowNumber is the number of log lines contained in LogContent.
   RowNumber  uint64 `json:"rowNumber"`
}

const (
   // checkServicePeriod is the pause, in seconds, between two polls of the record goroutine
   checkServicePeriod = 5
   // byteToMB is the right-shift applied to a byte count to express it in MB (size >> 20)
   byteToMB           = 20
   // maxLogSize is the largest log file size, in MB, accepted for download;
   // it is also used as the initial capacity of the line slice in logQuery
   maxLogSize         = 50
   // FileMode is the permission used when creating pod log files
   FileMode = 0640
   // FolderMode is the permission used when creating the log folder
   FolderMode      = 0750
   // runningStatus and succeededStatus are the pod phases whose logs are recorded
   runningStatus   = "Running"
   succeededStatus = "Succeeded"

   // LogFolder is the folder name, under the storage path, that holds service logs
   LogFolder = "ServiceLogs"
)

// GetLogFilePath returns the log file path of podName: the elements of elem
// joined into a directory, followed by "<podName>.log".
func GetLogFilePath(podName string, elem ...string) string {
   logDir := path.Join(elem...)
   fileName := podName + ".log"
   return path.Join(logDir, fileName)
}

// getStoragePath logs the calling component name and returns the path that
// GetUserPath yields for b.
func getStoragePath(b BaseCtx, srcModule string) string {
   hwlog.RunLog.Infof("current component is %v", srcModule)
   userPath := GetUserPath(b)
   return userPath
}

// getLogParentPath returns the directory that holds the pod log files of
// namespace: <storage path>/<LogFolder>/<namespace>.
func getLogParentPath(b BaseCtx, srcModule, namespace string) string {
   storageRoot := getStoragePath(b, srcModule)
   return path.Join(storageRoot, LogFolder, namespace)
}

// getPodLogFilePath returns the log file path of podName inside the log
// directory of namespace.
func getPodLogFilePath(b BaseCtx, srcModule, namespace, podName string) string {
   parentDir := getLogParentPath(b, srcModule, namespace)
   return GetLogFilePath(podName, parentDir)
}

// logToFile copies the pod log stream podLog into a newly created file at
// logFilePath and calls wg.Done when it returns.
//
// If the file already exists nothing is read or written. The stream itself is
// not closed here; closing it elsewhere is what ends the copy.
func logToFile(podLog io.ReadCloser, logFilePath string, wg *sync.WaitGroup) {
   defer wg.Done()

   // O_EXCL makes "create only when absent" a single atomic step instead of a
   // racy Stat followed by Open.
   logFile, err := os.OpenFile(logFilePath, os.O_CREATE|os.O_EXCL|os.O_WRONLY|os.O_APPEND, FileMode)
   if err != nil {
      if os.IsExist(err) {
         // the log of this pod is already being recorded (or was recorded before)
         return
      }
      hwlog.RunLog.Errorf("create %s log file failed, err: %v", path.Base(logFilePath), err)
      return
   }
   defer func() {
      // a failed close on a written file can mean lost data, so report it
      if closeErr := logFile.Close(); closeErr != nil {
         hwlog.RunLog.Errorf("close %s log file failed, err: %v", path.Base(logFilePath), closeErr)
      }
   }()

   logWriter := bufio.NewWriter(logFile)
   if _, err := io.Copy(logWriter, podLog); err != nil {
      hwlog.RunLog.Errorf("write log file failed, path: %v, err: %v", path.Base(logFilePath), err)
   }
   if err := logWriter.Flush(); err != nil {
      hwlog.RunLog.Errorf("flush %s log file failed, err: %v", path.Base(logFilePath), err)
   }
}

// closePodLogStream closes every log reader in podLogList and logs the name of
// each pod whose reader fails to close. The map itself is left unchanged.
func closePodLogStream(podLogList map[string]io.ReadCloser) {
   for name := range podLogList {
      closeErr := podLogList[name].Close()
      if closeErr == nil {
         continue
      }
      hwlog.RunLog.Errorf("close %s log reader failed", name)
   }
}

// deleteOldLogFile removes the log file of every pod in oldPodNameList from
// logDir. A file that does not exist is treated as already removed; any other
// failure is logged and the remaining pods are still processed.
func deleteOldLogFile(logDir string, oldPodNameList []string) {
   for _, podName := range oldPodNameList {
      err := os.Remove(GetLogFilePath(podName, logDir))
      if err == nil || os.IsNotExist(err) {
         // nothing left to delete, so asking for manual cleanup would be misleading
         continue
      }
      hwlog.RunLog.Errorf("remove log file failed, name: %v err: %v, please delete it manually",
         podName, err)
   }
}

// findFirst returns the index of the first entry of list equal to element,
// or -1 when list does not contain it.
func findFirst(element string, list []string) int {
   for idx := 0; idx < len(list); idx++ {
      if list[idx] == element {
         return idx
      }
   }
   return -1
}

// getNewPodNameList lists the pods labelled app=<svcName> in svcNamespace and
// splits them against oldPodNameList.
//
// The first result holds the names of Running/Succeeded pods that are not in
// oldPodNameList. The second result is oldPodNameList with every such pod that
// was found removed, i.e. the names that are no longer listed as
// Running/Succeeded. The removal reuses the backing array of oldPodNameList,
// so the caller must only use the returned slice afterwards.
// Both results are nil when the pod list request fails.
func getNewPodNameList(clientSet *kubernetes.Clientset, svcNamespace, svcName string,
   oldPodNameList []string) ([]string, []string) {
   selector := labels.Set(map[string]string{"app": svcName}).AsSelector().String()
   listOpts := metav1.ListOptions{LabelSelector: selector}
   pods, err := clientSet.CoreV1().Pods(svcNamespace).List(context.TODO(), listOpts)
   if err != nil {
      return nil, nil
   }

   var newPodNames []string
   for _, pod := range pods.Items {
      phase := pod.Status.Phase
      if phase != runningStatus && phase != succeededStatus {
         continue
      }
      index := findFirst(pod.Name, oldPodNameList)
      if index == -1 {
         newPodNames = append(newPodNames, pod.Name)
         continue
      }
      // still alive: drop it from the list of candidates for deletion
      oldPodNameList = append(oldPodNameList[:index], oldPodNameList[index+1:]...)
   }

   return newPodNames, oldPodNameList
}

// updatePodLogList brings podLogList in line with the latest pod listing.
//
// For every name in podNameList a follow-mode log stream is opened and stored
// in podLogList; a pod whose stream cannot be opened is logged and skipped.
// For every name in oldPodNameList the stored stream, if any, is closed and
// its entry is removed.
//
// podLogList must be non-nil: a map allocated here would be invisible to the
// caller and the streams stored in it could never be closed, so a nil map is
// rejected.
func updatePodLogList(clientSet *kubernetes.Clientset, svcNamespace string, podNameList, oldPodNameList []string,
   podLogList map[string]io.ReadCloser) {
   if podLogList == nil {
      hwlog.RunLog.Errorf("update pod log list failed: pod log list is nil")
      return
   }
   opt := &corev1.PodLogOptions{
      Follow: true,
   }
   for _, podName := range podNameList {
      logRequest := clientSet.CoreV1().Pods(svcNamespace).GetLogs(podName, opt)
      podLog, err := logRequest.Stream(context.TODO())
      if err != nil {
         hwlog.RunLog.Errorf("open %s log stream failed, err: %v", podName, err)
         continue
      }
      podLogList[podName] = podLog
   }
   for _, podName := range oldPodNameList {
      // calling Close on a missing (nil) entry would panic, so check first
      if podLog, ok := podLogList[podName]; ok && podLog != nil {
         if err := podLog.Close(); err != nil {
            hwlog.RunLog.Errorf("close %s log reader failed", podName)
         }
      }
      delete(podLogList, podName)
   }
}

// logRecordGoroutine records the logs of the pods of service svcName in
// svcNameSpace into logDir until a value is received from stopCh (or stopCh is
// closed).
//
// Every checkServicePeriod seconds it lists the pods of the service, opens a
// log stream and starts a writer goroutine for each new pod, and closes the
// stream and removes the log file of each pod that is no longer listed.
// On stop it closes all streams, waits for the writer goroutines and removes
// the log files of all pods that are still tracked.
func logRecordGoroutine(svcNameSpace, svcName, logDir string, stopCh <-chan bool) {
   var clientSet *kubernetes.Clientset
   var cliErr error
   podLogList := make(map[string]io.ReadCloser)
   var podNameList, oldPodNameList []string
   var wg sync.WaitGroup
   for {
      select {
      case <-stopCh:
         // Close the follow streams first: the writer goroutines block reading
         // them, so waiting before closing would stall until the pods exit.
         closePodLogStream(podLogList)
         wg.Wait()
         deleteOldLogFile(logDir, oldPodNameList)
         return
      default:
      }
      if clientSet == nil {
         if clientSet, cliErr = K8sClient(""); cliErr != nil {
            // back off before retrying instead of spinning on a failing client
            time.Sleep(checkServicePeriod * time.Second)
            continue
         }
      }
      podNameList, oldPodNameList = getNewPodNameList(clientSet, svcNameSpace, svcName, oldPodNameList)
      updatePodLogList(clientSet, svcNameSpace, podNameList, oldPodNameList, podLogList)
      deleteOldLogFile(logDir, oldPodNameList)
      // from here on oldPodNameList is the set of pods currently tracked
      oldPodNameList = nil
      for podName := range podLogList {
         oldPodNameList = append(oldPodNameList, podName)
      }

      for _, podName := range podNameList {
         podLog, ok := podLogList[podName]
         if !ok {
            // no stream was opened for this pod, so there is nothing to wait for
            continue
         }
         // count only goroutines that are really started, otherwise Wait never returns
         wg.Add(1)
         go logToFile(podLog, GetLogFilePath(podName, logDir), &wg)
      }
      time.Sleep(checkServicePeriod * time.Second)
   }
}

// StartLogRecord creates the log folder of svcNamespace and starts a goroutine
// that records the pod logs of service svcName into it. The stop channel of
// the goroutine is stored in logChanMap under srcModule + "-" + svcName.
// If the folder cannot be created a warning is logged and nothing is started.
// NOTE(review): the key does not contain the namespace and an existing entry
// is overwritten without being stopped — confirm callers never start the same
// key twice.
func StartLogRecord(svcNamespace, svcName, srcModule string, b BaseCtx) {
   logParentDir := getLogParentPath(b, srcModule, svcNamespace)
   mkErr := os.MkdirAll(logParentDir, FolderMode)
   if mkErr != nil {
      hwlog.OpLog.WarnfWithCtx(b.Ctx, "log record failed: create the log folder failed, %s", mkErr.Error())
      return
   }

   if logChanMap == nil {
      logChanMap = make(map[string]chan bool)
   }
   stopCh := make(chan bool, 1)
   logChanMap[srcModule+"-"+svcName] = stopCh
   hwlog.RunLog.InfofWithCtx(b.Ctx, "start to record log of service %v", svcName)
   go logRecordGoroutine(svcNamespace, svcName, logParentDir, stopCh)
}

// StopLogRecord signals the record goroutine registered under
// srcModule + "-" + svcName to stop, closes its channel and removes the entry
// from logChanMap. When no channel is registered only the log line is written.
func StopLogRecord(svcName, srcModule string, b BaseCtx) {
   mapKey := srcModule + "-" + svcName
   // a missing key yields a nil channel, so one lookup covers both checks
   if stopCh := logChanMap[mapKey]; stopCh != nil {
      stopCh <- true
      close(stopCh)
      delete(logChanMap, mapKey)
   }
   hwlog.RunLog.InfofWithCtx(b.Ctx, "stop to record log of service %v", svcName)
}

// logQuery reads up to limit lines from the file at logPath, starting at the
// zero-based line index offset.
//
// It returns the selected lines joined with "\n" together with their count.
// Reaching the end of the file early is not an error; fewer (possibly zero)
// lines are returned. An error is returned when the file cannot be opened or
// read.
func logQuery(logPath string, offset, limit uint64, b BaseCtx) (*LogQueryResp, error) {
   logFile, err := os.Open(logPath)
   if err != nil {
      hwlog.RunLog.ErrorWithCtx(b.Ctx, "Fail to get log file")
      return nil, err
   }
   defer logFile.Close()
   logReader := bufio.NewReader(logFile)
   logStrs := make([]string, 0, maxLogSize)
   var logLineByte []byte
   // line counts complete lines only; ReadLine hands back a long line in
   // several chunks (isPrefix) and those chunks must not advance the counter.
   var line uint64
   // comparing the collected count with limit avoids overflowing offset+limit
   for uint64(len(logStrs)) < limit {
      lineByte, isPrefix, err := logReader.ReadLine()
      if err != nil {
         if err != io.EOF {
            hwlog.RunLog.ErrorfWithCtx(b.Ctx, "An error occurred while reading log file: %v", err)
            return nil, err
         }
         break
      }
      wanted := line >= offset
      if wanted {
         // lines before offset are skipped without being buffered
         logLineByte = append(logLineByte, lineByte...)
      }
      if isPrefix {
         continue
      }
      if wanted {
         logStrs = append(logStrs, string(logLineByte))
         logLineByte = logLineByte[:0]
      }
      line++
   }
   logQueryResp := LogQueryResp{
      LogContent: strings.Join(logStrs, "\n"),
      RowNumber:  uint64(len(logStrs)),
   }
   return &logQueryResp, nil
}

// getOffsetAndLimit parses the offset and limit query values into unsigned
// integers and validates them with validLogLimitOffset.
//
// It returns the parsed values and Success, or zeros together with
// ParamConvert2IntegerFailed (parse failure) or ParamInvalid (validation
// failure).
// NOTE(review): the numeric base is the BaseHex constant declared elsewhere —
// confirm it matches the base clients use for these parameters.
func getOffsetAndLimit(logOffset, logLimit string, b BaseCtx) (uint64, uint64, string) {
   offset, offsetErr := strconv.ParseUint(logOffset, BaseHex, BitSize64)
   if offsetErr != nil {
      hwlog.OpLog.ErrorfWithCtx(b.Ctx, "get service log offset convert to integer failed, err: %v", offsetErr)
      return 0, 0, ParamConvert2IntegerFailed
   }

   limit, limitErr := strconv.ParseUint(logLimit, BaseHex, BitSize64)
   if limitErr != nil {
      hwlog.OpLog.ErrorfWithCtx(b.Ctx, "get service log limit convert to integer failed, err: %v", limitErr)
      return 0, 0, ParamConvert2IntegerFailed
   }

   checkErr := validLogLimitOffset(offset, limit)
   if checkErr != nil {
      hwlog.OpLog.ErrorfWithCtx(b.Ctx, "get service log param invalid: %v", checkErr)
      return 0, 0, ParamInvalid
   }
   return offset, limit, Success
}

// validPodNameNamespace checks that podName and podNamespace are valid names,
// that the pod exists, and that search accepts the service the pod belongs to
// for the user of b.
//
// The service name is read from the "dbjob-name" label when the pod carries
// the constants.TrainManageName label (whose value is passed to search as the
// service type), otherwise from the "app" label with an empty service type.
//
// It returns "" on success, GetK8sClientFailed when no client can be obtained
// and ParamInvalid for every other failure.
func validPodNameNamespace(podName, podNamespace string,
   search func(name, svcType string, uid uint64) error, b BaseCtx) string {
   if !ValidName("podName", podName, b) {
      hwlog.RunLog.ErrorWithCtx(b.Ctx, "podName invalid")
      return ParamInvalid
   }
   if !ValidName("namespace", podNamespace, b) {
      hwlog.RunLog.ErrorWithCtx(b.Ctx, "pod namespace invalid")
      return ParamInvalid
   }

   clientSet, cliErr := K8sClient("")
   if cliErr != nil {
      hwlog.RunLog.ErrorfWithCtx(b.Ctx, "Failed to get customClient err: %s", cliErr.Error())
      return GetK8sClientFailed
   }
   pod, getErr := clientSet.CoreV1().Pods(podNamespace).Get(context.Background(),
      podName, metav1.GetOptions{})
   if getErr != nil {
      hwlog.RunLog.ErrorWithCtx(b.Ctx, "the pod does not exist")
      return ParamInvalid
   }

   svcType, isTrainPod := pod.Labels[constants.TrainManageName]
   if !isTrainPod {
      // pod without the train-manage label: owned through its "app" label
      appName, found := pod.Labels["app"]
      if !found {
         hwlog.RunLog.ErrorWithCtx(b.Ctx, "failed to get service name of the pod")
         return ParamInvalid
      }
      if err := search(appName, "", b.HdInfo.UserID); err != nil {
         hwlog.RunLog.ErrorfWithCtx(b.Ctx, "the pod does not belong to task manager, %v", err)
         return ParamInvalid
      }
      return ""
   }

   jobName, found := pod.Labels["dbjob-name"]
   if !found {
      hwlog.RunLog.ErrorWithCtx(b.Ctx, "failed to get service name of the pod")
      return ParamInvalid
   }
   if err := search(jobName, svcType, b.HdInfo.UserID); err != nil {
      hwlog.RunLog.ErrorWithCtx(b.Ctx, "the pod does not belong to train manager")
      return ParamInvalid
   }
   return ""
}

// QueryServiceLog handles a request for a window of a pod log file.
//
// It reads the "offset", "limit", "podName" and "namespace" query parameters,
// validates them (search decides whether the pod's service may be accessed by
// the user of b), reads the requested lines from the pod log file of srcModule
// and answers through ConstructResp. On failure the response carries the error
// code reported by the step that failed.
func QueryServiceLog(srcModule string,
   search func(name, svcType string, uid uint64) error, b BaseCtx, c *gin.Context) {
   hwlog.OpLog.InfoWithCtx(b.Ctx, "start to query service log")
   offset, limit, errCode := getOffsetAndLimit(c.Query("offset"), c.Query("limit"), b)
   if errCode != Success {
      ConstructResp(c, errCode, "", nil)
      return
   }
   podName := c.Query("podName")
   podNamespace := c.Query("namespace")
   // forward the code of the validator so that e.g. a client failure is not
   // reported as an invalid parameter
   if errCode := validPodNameNamespace(podName, podNamespace, search, b); errCode != "" {
      ConstructResp(c, errCode, "", nil)
      return
   }
   logPath := getPodLogFilePath(b, srcModule, podNamespace, podName)
   log, err := logQuery(logPath, offset, limit, b)
   if err != nil {
      hwlog.OpLog.ErrorfWithCtx(b.Ctx, "query service pod log failed, err: %v", err)
      ConstructResp(c, QueryK8sPodLogFailed, "", nil)
      return
   }
   hwlog.OpLog.InfoWithCtx(b.Ctx, "query pod log succeed")
   ConstructResp(c, Success, "", log)
}

// downloadLogFile streams the file at logPath into writer and returns the
// number of bytes copied.
//
// An error is returned when the file cannot be opened or inspected, when its
// size in MB (size >> byteToMB) exceeds maxLogSize, or when the copy fails.
func downloadLogFile(writer io.Writer, logPath string, b BaseCtx) (int64, error) {
   logFile, err := os.Open(logPath)
   if err != nil {
      hwlog.RunLog.ErrorWithCtx(b.Ctx, "Fail to get log file")
      return 0, err
   }
   defer logFile.Close()

   // stat the opened handle so the size check applies to the file that is
   // actually streamed, not to whatever the path pointed at earlier
   fi, err := logFile.Stat()
   if err != nil {
      return 0, err
   }
   if fi.Size()>>byteToMB > maxLogSize {
      return 0, errors.New("the log file is too large, please download it by other way")
   }
   return io.Copy(writer, logFile)
}

// DownloadServiceLog handles a request to download a whole pod log file.
//
// It reads the "podName" and "namespace" query parameters, validates them
// (search decides whether the pod's service may be accessed by the user of b),
// emits the attachment headers and streams the pod log file of srcModule to
// the response. Failures are answered through ConstructResp with the error
// code of the step that failed.
// NOTE(review): ConstructResp is still called after the file was streamed, as
// before — confirm it does not append a payload to the downloaded content.
func DownloadServiceLog(srcModule string,
   search func(name, svcType string, uid uint64) error, b BaseCtx, c *gin.Context) {
   podName := c.Query("podName")
   podNamespace := c.Query("namespace")

   // validate first so that a rejected request neither gets attachment headers
   // nor has an unchecked pod name placed in a header
   if errCode := validPodNameNamespace(podName, podNamespace, search, b); errCode != "" {
      ConstructResp(c, errCode, "", nil)
      return
   }

   hwlog.OpLog.InfofWithCtx(b.Ctx, "get pod log podName(%v), namespace(%v)", podName, podNamespace)
   logPath := getPodLogFilePath(b, srcModule, podNamespace, podName)

   // Headers changed after the body has been written are not sent, so the
   // size has to be known before streaming. A failing stat keeps 0; the
   // download below then reports the real problem.
   logFileSize := int64(0)
   if fi, err := os.Stat(logPath); err == nil {
      logFileSize = fi.Size()
   }
   c.Header(ContentDisposition, "attachment; filename="+podName+".log")
   c.Header(ContentType, "application/text/plain")
   c.Header(AcceptLength, strconv.FormatInt(logFileSize, BaseHex))

   if _, err := downloadLogFile(c.Writer, logPath, b); err != nil {
      hwlog.OpLog.ErrorfWithCtx(b.Ctx, "download service pod log failed, err: %v", err)
      ConstructResp(c, DownloadPodLogFileFailed, "", nil)
      return
   }
   hwlog.OpLog.InfoWithCtx(b.Ctx, "pod log downloaded")
   ConstructResp(c, Success, "", nil)
}

mindxdl--common--log_record.go的更多相关文章

Socket聊天程序——Common
写在前面: 上一篇记录了Socket聊天程序的客户端设计,为了记录的完整性,这里还是将Socket聊天的最后一个模块--Common模块记录一下.Common的设计如下: 功能说明: Common模块 ...
angularjs 1 开发简单案例(包含common.js,service.js,controller.js,page)
common.js var app = angular.module('app', ['ngFileUpload']) .factory('SV_Common', function ($http) { ...
Common Bugs in C Programming
There are some Common Bugs in C Programming. Most of the contents are directly from or modified from ...
ANSI Common Lisp Practice - My Answers - Chatper - 3
Ok, Go ahead. 1 (a) (b) (c) (d) 2 注:union 在 Common Lisp 中的作用就是求两个集合的并集.但是这有一个前提,即给的两个列表已经满足集合的属性了.具体 ...
[LeetCode] Lowest Common Ancestor of a Binary Tree 二叉树的最小共同父节点
Given a binary tree, find the lowest common ancestor (LCA) of two given nodes in the tree. According ...
[LeetCode] Lowest Common Ancestor of a Binary Search Tree 二叉搜索树的最小共同父节点
Given a binary search tree (BST), find the lowest common ancestor (LCA) of two given nodes in the BS ...
[LeetCode] Longest Common Prefix 最长共同前缀
Write a function to find the longest common prefix string amongst an array of strings. 这道题让我们求一系列字符串 ...
48. 二叉树两结点的最低共同父结点(3种变种情况)[Get lowest common ancestor of binary tree]
[题目] 输入二叉树中的两个结点,输出这两个结点在数中最低的共同父结点. 二叉树的结点定义如下: C++ Code 123456 struct BinaryTreeNode { int ...
动态规划求最长公共子序列（Longest Common Subsequence, LCS）
1. 问题描述子串应该比较好理解,至于什么是子序列,这里给出一个例子:有两个母串 cnblogs belong 比如序列bo, bg, lg在母串cnblogs与belong中都出现过并且出现顺序与 ...
【leetcode】Longest Common Prefix
题目简述: Write a function to find the longest common prefix string amongst an array of strings. 解题思路: c ...

随机推荐

Electron学习（四）之应用程序打包
highlight: a11y-dark 写在前面人真的是会变得越来越懒的,也正是人的惰性吧,真的是很讽刺. 关于这个应用程序的开发,断更了很久,但是代码部分还算没落下吧,终于在周一.周二终把这个应 ...
django_day08_项目相关
django_day08_项目相关定义数据库表 from django.db import models # Create your models here. class User(models.M ...
校园网跨网段共享文件Samba+SSH
Introduction This tutorial contains screenshots for the English version of Windows 10. Separate inst ...
Mysqldump 的的 6 大使用场景的导出命令
Mysqldump 选项解析场景描述 1. 导出 db1.db2 两个数据库的所有数据. mysqldump -uroot -p -P8635 -h192.168.0.199 --hex-blob ...
Logstash：input plugin 介绍
Ceph 存储集群第一部分：配置和部署
内容来源于官方,经过个人实践操作整理,官方地址:http://docs.ceph.org.cn/rados/ 所有 Ceph 部署都始于 Ceph 存储集群. 基于 RADOS 的 Ceph 对象存储 ...
（编程语言界的丐帮 C#）.NET MD5 HASH 哈希加密与JAVA 互通
一.注意要点 1:输入字符串的的编码双方保持统一,如:UTF8: 2:HASH计算输出结果 byte[] 数组转String 时,编码要统一,如:转16进制小写字符串.当然也可以转Base64. 3: ...
MySQL学习(3)---MySQL常用命令
ps:此随笔基于mysql 5.7.*版本. 准备 net start mysql 启动MySQL服务 net stop mysql 关闭MySQL服务 mysql [-h<IP地址>] ...
大数据常用的Linux命令
Linux文件系统基础知识要想熟练使用命令,就先要熟练掌握Linux文件系统基础知识: 三个路径当前路径:也叫当前工作目录,就是当前状态下用户所处的位置相对路径:相对于当前工作目录开始的路径,会 ...
PyCharm安装PyQt5及其工具（Qt Designer、PyUIC、PyRcc）详细教程
摘要:Qt是常用的用户界面设计工具,而在Python中则使用PyQt这一工具包,它是Python编程语言和Qt库的成功融合.这篇博文通过图文详细介绍在PyCharm中如何完整优雅地安装配置PyQt5的 ...

mindxdl--common--log_record.go

mindxdl--common--log_record.go的更多相关文章

随机推荐

热门专题