This repository has been archived on 2025-09-14. You can view files and clone it, but cannot push or open issues or pull requests.
Files
linxin-coredump-tools/coredump-handler/coredump-handler.go

313 lines
9.3 KiB
Go
Raw Normal View History

2023-04-10 18:30:40 +08:00
package main
import (
2023-04-11 11:27:04 +08:00
"archive/zip"
2023-04-10 18:30:40 +08:00
"context"
"coredump-tools/config"
"coredump-tools/types"
"encoding/json"
2023-04-10 18:30:40 +08:00
"errors"
"flag"
2023-04-10 18:30:40 +08:00
"fmt"
"io"
"math"
2023-04-10 18:30:40 +08:00
"os"
"regexp"
"strconv"
"strings"
2023-04-10 18:30:40 +08:00
"github.com/containerd/containerd"
"github.com/containerd/containerd/namespaces"
"github.com/coreos/go-systemd/v22/journal"
"github.com/shirou/gopsutil/disk"
2023-04-10 18:30:40 +08:00
)
var coredump_config types.Coredump_config
2023-04-11 11:27:04 +08:00
func argsJudge() error {
if coredump_config.Initial_ns_pid == "" ||
coredump_config.Process_ns_pid == "" ||
coredump_config.Corepipe_config_path == "" ||
coredump_config.Timestamp == 0 ||
coredump_config.Process_exe_path == "" ||
coredump_config.GID == "" ||
coredump_config.Hostname == "" ||
coredump_config.UID == "" ||
coredump_config.Signal == -1 {
err := fmt.Sprintf("Failed to initialize command line parameters. -P=%s -p=%s -E=%s -configpath=%s -t=%d -g=%s -h=%s -s=%d -u=%s",
coredump_config.Initial_ns_pid,
coredump_config.Process_ns_pid,
coredump_config.Process_exe_path,
coredump_config.Corepipe_config_path,
coredump_config.Timestamp,
coredump_config.GID,
coredump_config.Hostname,
coredump_config.Signal,
coredump_config.UID)
return errors.New(err)
}
return nil
}
func isDiskSufficient(pipe_config types.Pipeconfig) (bool, error) {
percent, err := strconv.ParseInt(pipe_config.Total_file_mem_limit[:len(pipe_config.Total_file_mem_limit)-1], 10, 32)
2023-04-10 18:30:40 +08:00
if err != nil {
return false, err
}
// var stat syscall.Statfs_t
wd := pipe_config.Storage
2023-04-10 18:30:40 +08:00
if err != nil {
fmt.Println(err)
return false, err
}
diskinfo, err := disk.Usage(wd)
if err != nil {
return false, err
}
data, err := json.MarshalIndent(diskinfo, "", " ")
if err != nil {
info := fmt.Sprintf("diskinfo:%s", string(data))
journal.Print(journal.PriInfo, info)
}
usage := int64(math.Floor(diskinfo.UsedPercent + 0.5))
info := fmt.Sprintf("usage:%d,limited:%d", usage, percent)
journal.Print(journal.PriInfo, info)
2023-04-11 11:27:04 +08:00
if usage >= percent {
2023-04-10 18:30:40 +08:00
return false, nil
}
return true, nil
}
func createCoreDumpDir(pipe_config *types.Pipeconfig, args types.Coredump_config) error {
pipe_config.Storage = fmt.Sprintf("%s/coredump_%s_%s_%d", pipe_config.Storage, args.Initial_ns_pid, args.Process_ns_pid, args.Timestamp)
dirName := pipe_config.Storage
2023-04-10 18:30:40 +08:00
if _, err := os.Stat(dirName); os.IsNotExist(err) {
// 目录不存在,创建目录
if err := os.MkdirAll(dirName, os.ModePerm); err != nil {
return err
}
} else {
return errors.New("directory already exists")
}
return nil
}
func changeDirectory(dir string) error {
2023-04-10 18:30:40 +08:00
if err := os.Chdir(dir); err != nil {
return err
}
return nil
}
func getContainerId(pid string) (string, error) {
cgroup_path := fmt.Sprintf("/proc/%s/cgroup", pid)
content, err := os.ReadFile(cgroup_path)
2023-04-10 18:30:40 +08:00
if err != nil {
return "", err
}
re := regexp.MustCompile(`([a-f\d]{64})`)
match := re.FindStringSubmatch(string(content))
if len(match) < 2 {
return "", errors.New("failed to extract container ID from cgroup file")
}
containerID := match[1]
return containerID, nil
}
func getImageName(container_id string, sock_path string) (string, error) {
2023-04-10 18:30:40 +08:00
// 连接 containerd daemon
client, err := containerd.New(sock_path)
if err != nil {
return "", err
}
defer client.Close()
// 根据容器 ID 获取容器信息
ctx := namespaces.WithNamespace(context.Background(), "k8s.io")
container, err := client.LoadContainer(ctx, container_id)
if err != nil {
return "", err
}
// 获取容器关联的镜像信息
imageRef, err := container.Image(ctx)
if err != nil {
return "", err
}
return imageRef.Name(), nil
}
func writeCoreConfig(config types.Coredump_config) error {
filename := fmt.Sprintf("%s_%s_%d.info", config.Initial_ns_pid, config.Process_ns_pid, config.Timestamp)
2023-04-14 16:50:48 +08:00
file, err := os.Create(filename)
if err != nil {
return err
}
encoder := json.NewEncoder(file)
err = encoder.Encode(&config)
2023-04-10 18:30:40 +08:00
if err != nil {
return err
}
return nil
}
2023-04-14 16:50:48 +08:00
func writeCoreDumpToFile(config types.Coredump_config) error {
filename := fmt.Sprintf("%s_%s_%d.coredump", config.Initial_ns_pid, config.Process_ns_pid, config.Timestamp)
2023-04-14 16:50:48 +08:00
file, err := os.Create(filename)
2023-04-10 18:30:40 +08:00
if err != nil {
return err
}
defer file.Close()
// 创建一个管道
reader, writer := io.Pipe()
// 将标准输入连接到管道的写入端
go func() {
defer writer.Close()
io.Copy(writer, os.Stdin)
}()
// 从管道的读取端将内容写入文件
io.Copy(file, reader)
2023-04-10 18:30:40 +08:00
return nil
}
2023-05-09 17:36:04 +08:00
func writeMiniDumpToFile(config types.Coredump_config) error {
filename := fmt.Sprintf("%s_%s_%d.minidump", config.Initial_ns_pid, config.Process_ns_pid, config.Timestamp)
2023-05-09 17:36:04 +08:00
file, err := os.Create(filename)
if err != nil {
return err
}
defer file.Close()
// 创建一个管道
reader, writer := io.Pipe()
// 将标准输入连接到管道的写入端
go func() {
defer writer.Close()
io.Copy(writer, os.Stdin)
}()
// 从管道的读取端将内容写入文件
io.Copy(file, reader)
return nil
}
2023-04-14 16:50:48 +08:00
func compress(config types.Coredump_config) error {
2023-04-11 11:27:04 +08:00
// Create a new zip archive.
filename := fmt.Sprintf("%s_%s_%d.coredump", config.Initial_ns_pid, config.Process_ns_pid, config.Timestamp)
2023-04-14 16:50:48 +08:00
zipfile, err := os.Create(filename + ".zip")
2023-04-11 11:27:04 +08:00
if err != nil {
return err
}
defer zipfile.Close()
// Create a new zip writer.
zipwriter := zip.NewWriter(zipfile)
defer zipwriter.Close()
// Create a zip file header.
header := &zip.FileHeader{
2023-04-14 16:50:48 +08:00
Name: filename,
2023-04-11 11:27:04 +08:00
Method: zip.Deflate,
}
// Write the header to the zip file.
writer, err := zipwriter.CreateHeader(header)
if err != nil {
return err
}
io.Copy(writer, os.Stdin)
2023-04-11 11:27:04 +08:00
return nil
}
2023-04-10 18:30:40 +08:00
func main() {
info := fmt.Sprintf("start handle coredump")
journal.Print(journal.PriInfo, info)
flag.StringVar(&coredump_config.Initial_ns_pid, "P", "", "initial ns pid")
flag.StringVar(&coredump_config.Process_ns_pid, "p", "", "process ns pid")
flag.StringVar(&coredump_config.Process_exe_path, "E", "", "pathname of executable process")
flag.StringVar(&coredump_config.Corepipe_config_path, "C", "", "configfile's path")
flag.Int64Var(&coredump_config.Timestamp, "t", 0, "the time of coredump")
flag.StringVar(&coredump_config.GID, "g", "", "Numeric real GID of dumped process.")
flag.IntVar(&coredump_config.Signal, "s", -1, "Number of signal causing dump")
flag.StringVar(&coredump_config.UID, "u", "", "Numeric real UID of dumped process.")
flag.Parse()
var err error
coredump_config.Hostname, err = os.Hostname()
if err != nil {
journal.Print(journal.PriErr, err.Error())
}
info = fmt.Sprintf("initialize command line parameters. -P=%s -p=%s -E=%s -C=%s -t=%d -g=%s -h=%s -s=%d -u=%s", coredump_config.Initial_ns_pid, coredump_config.Process_ns_pid, coredump_config.Process_exe_path, coredump_config.Corepipe_config_path, coredump_config.Timestamp, coredump_config.GID, coredump_config.Hostname, coredump_config.Signal, coredump_config.UID)
2023-04-14 19:18:47 +08:00
journal.Print(journal.PriInfo, info)
coredump_config.Process_exe_path = strings.Replace(coredump_config.Process_exe_path, "!", "/", -1)
//判断参数读取是否正确
err = argsJudge()
2023-04-10 18:30:40 +08:00
if err != nil {
journal.Print(journal.PriErr, err.Error())
2023-04-10 18:30:40 +08:00
return
}
//读取config文件并初始化
pipe_config, err := config.PipeInit(coredump_config.Corepipe_config_path)
2023-04-10 18:30:40 +08:00
if err != nil {
journal.Print(journal.PriErr, err.Error())
2023-04-10 18:30:40 +08:00
return
}
if pipe_config.Storage_type == 0 {
return
}
//生成coredump存放文件夹
if _, err := os.Stat(pipe_config.Storage); os.IsNotExist(err) {
// 目录不存在,创建目录
if err := os.MkdirAll(pipe_config.Storage, os.ModePerm); err != nil {
journal.Print(journal.PriErr, err.Error())
return
}
}
//判断硬盘使用率
2023-04-12 17:52:13 +08:00
flag, err := isDiskSufficient(pipe_config)
2023-05-09 17:36:04 +08:00
if err != nil {
journal.Print(journal.PriErr, err.Error())
2023-04-10 18:30:40 +08:00
return
}
2023-05-09 17:36:04 +08:00
if !flag {
journal.Print(journal.PriErr, "Disk space exceeds limit")
return
}
//创建存储coredump内容文件夹
err = createCoreDumpDir(&pipe_config, coredump_config)
2023-04-10 18:30:40 +08:00
if err != nil {
journal.Print(journal.PriErr, err.Error())
2023-04-10 18:30:40 +08:00
return
}
coredump_config.Storage = pipe_config.Storage
//切换至存储coredump目录
err = changeDirectory(pipe_config.Storage)
2023-04-10 18:30:40 +08:00
if err != nil {
journal.Print(journal.PriErr, err.Error())
2023-04-10 18:30:40 +08:00
return
}
//查找发生coredump进程对应的container id
container_id, err := getContainerId(coredump_config.Initial_ns_pid)
//根据查找到的container id查找对应的image name
2023-04-10 18:30:40 +08:00
if err == nil && len(container_id) != 0 {
coredump_config.Image_name, err = getImageName(container_id, pipe_config.Containered_sock_path)
2023-04-10 18:30:40 +08:00
if err != nil {
journal.Print(journal.PriInfo, err.Error())
2023-04-10 18:30:40 +08:00
}
}
if coredump_config.Image_name == "" {
coredump_config.Image_name = "NULL"
}
//根据配置项选择存储coredump文件方式
if pipe_config.Compress == false {
2023-04-14 16:50:48 +08:00
err = writeCoreDumpToFile(coredump_config)
2023-04-11 11:27:04 +08:00
if err != nil {
journal.Print(journal.PriErr, err.Error())
2023-04-11 11:27:04 +08:00
}
coredump_config.Storage = fmt.Sprintf("%s/%s_%s_%d.coredump", pipe_config.Storage, coredump_config.Initial_ns_pid, coredump_config.Process_ns_pid, coredump_config.Timestamp)
} else {
2023-04-14 16:50:48 +08:00
err = compress(coredump_config)
2023-04-11 11:27:04 +08:00
if err != nil {
journal.Print(journal.PriErr, err.Error())
2023-04-11 11:27:04 +08:00
}
coredump_config.Storage = fmt.Sprintf("%s/%s_%s_%d.coredump.zip", pipe_config.Storage, coredump_config.Initial_ns_pid, coredump_config.Process_ns_pid, coredump_config.Timestamp)
}
//将image name写入coredump config
err = writeCoreConfig(coredump_config)
if err != nil {
journal.Print(journal.PriInfo, err.Error())
2023-04-10 18:30:40 +08:00
}
}