2023-04-10 18:30:40 +08:00
|
|
|
|
package main
|
|
|
|
|
|
|
|
|
|
|
|
import (
|
2023-04-11 11:27:04 +08:00
|
|
|
|
"archive/zip"
|
2023-04-10 18:30:40 +08:00
|
|
|
|
"context"
|
|
|
|
|
|
"coredump-handler/config"
|
2023-04-14 15:31:59 +08:00
|
|
|
|
"coredump-handler/types"
|
|
|
|
|
|
"encoding/json"
|
2023-04-10 18:30:40 +08:00
|
|
|
|
"errors"
|
2023-04-14 15:31:59 +08:00
|
|
|
|
"flag"
|
2023-04-10 18:30:40 +08:00
|
|
|
|
"fmt"
|
|
|
|
|
|
"io"
|
|
|
|
|
|
"os"
|
|
|
|
|
|
"regexp"
|
|
|
|
|
|
"strconv"
|
2023-04-14 15:31:59 +08:00
|
|
|
|
"strings"
|
2023-04-10 18:30:40 +08:00
|
|
|
|
"syscall"
|
|
|
|
|
|
|
|
|
|
|
|
"github.com/containerd/containerd"
|
|
|
|
|
|
"github.com/containerd/containerd/namespaces"
|
2023-04-12 16:13:21 +08:00
|
|
|
|
"github.com/coreos/go-systemd/v22/journal"
|
2023-04-10 18:30:40 +08:00
|
|
|
|
)
|
|
|
|
|
|
|
2023-04-11 11:27:04 +08:00
|
|
|
|
const chunkSize = 1024 * 1024 * 1024 // 1GB
|
2023-04-14 15:31:59 +08:00
|
|
|
|
var coredump_config types.Coredump_config
|
2023-04-11 11:27:04 +08:00
|
|
|
|
|
2023-04-14 15:31:59 +08:00
|
|
|
|
func argsJudge() error {
|
2023-04-18 15:27:42 +08:00
|
|
|
|
if coredump_config.Initial_ns_pid == "" || coredump_config.Process_ns_pid == "" || coredump_config.Corepipe_config_path == "" || coredump_config.Timestamp == 0 || coredump_config.Process_exe_path == "" || coredump_config.GID == "" || coredump_config.Hostname == "" || coredump_config.UID == "" || coredump_config.Signal == -1 {
|
|
|
|
|
|
err := fmt.Sprintf("Failed to initialize command line parameters. -P=%s -p=%s -E=%s -configpath=%s -t=%d -g=%s -h=%s -s=%d -u=%s", coredump_config.Initial_ns_pid, coredump_config.Process_ns_pid, coredump_config.Process_exe_path, coredump_config.Corepipe_config_path, coredump_config.Timestamp, coredump_config.GID, coredump_config.Hostname, coredump_config.Signal, coredump_config.UID)
|
2023-04-14 15:31:59 +08:00
|
|
|
|
return errors.New(err)
|
|
|
|
|
|
}
|
|
|
|
|
|
return nil
|
|
|
|
|
|
}
|
|
|
|
|
|
func isDiskSufficient(pipe_config types.Pipeconfig) (bool, error) {
|
2023-04-10 18:30:40 +08:00
|
|
|
|
percent, err := strconv.ParseFloat(pipe_config.Total_file_mem_limit[:len(pipe_config.Total_file_mem_limit)-1], 64)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return false, err
|
|
|
|
|
|
}
|
|
|
|
|
|
percent = percent / 100.0
|
|
|
|
|
|
var stat syscall.Statfs_t
|
|
|
|
|
|
wd, err := syscall.Getwd()
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
fmt.Println(err)
|
|
|
|
|
|
return false, err
|
|
|
|
|
|
}
|
|
|
|
|
|
syscall.Statfs(wd, &stat)
|
|
|
|
|
|
// 剩余空间的大小为块的数量 * 每个块的大小
|
|
|
|
|
|
// stat.Bfree表示可用的块的数量,stat.Bsize表示每个块的大小
|
2023-04-11 11:27:04 +08:00
|
|
|
|
usedSpace := (int64(stat.Blocks) - int64(stat.Bfree))
|
|
|
|
|
|
totalSpace := int64(stat.Blocks)
|
|
|
|
|
|
usage := float64(usedSpace) / float64(totalSpace)
|
|
|
|
|
|
if usage >= percent {
|
2023-04-10 18:30:40 +08:00
|
|
|
|
return false, nil
|
|
|
|
|
|
}
|
|
|
|
|
|
return true, nil
|
|
|
|
|
|
}
|
2023-04-14 15:31:59 +08:00
|
|
|
|
func createCoreDumpDir(pipe_config *types.Pipeconfig, args types.Coredump_config) error {
|
2023-04-27 17:20:57 +08:00
|
|
|
|
pipe_config.Storage = fmt.Sprintf("%s/%s_%s_%d_coredump", pipe_config.Storage, args.Initial_ns_pid, args.Process_ns_pid, args.Timestamp)
|
|
|
|
|
|
dirName := pipe_config.Storage
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if _, err := os.Stat(dirName); os.IsNotExist(err) {
|
|
|
|
|
|
// 目录不存在,创建目录
|
|
|
|
|
|
if err := os.MkdirAll(dirName, os.ModePerm); err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
|
|
|
|
|
} else {
|
|
|
|
|
|
return errors.New("directory already exists")
|
|
|
|
|
|
}
|
|
|
|
|
|
return nil
|
|
|
|
|
|
}
|
2023-04-11 16:47:19 +08:00
|
|
|
|
func changeDirectory(dir string) error {
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if err := os.Chdir(dir); err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
|
|
|
|
|
return nil
|
|
|
|
|
|
}
|
|
|
|
|
|
func getContainerId(pid string) (string, error) {
|
|
|
|
|
|
cgroup_path := fmt.Sprintf("/proc/%s/cgroup", pid)
|
2023-04-23 18:24:42 +08:00
|
|
|
|
content, err := os.ReadFile(cgroup_path)
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if err != nil {
|
|
|
|
|
|
return "", err
|
|
|
|
|
|
}
|
|
|
|
|
|
re := regexp.MustCompile(`([a-f\d]{64})`)
|
|
|
|
|
|
match := re.FindStringSubmatch(string(content))
|
|
|
|
|
|
if len(match) < 2 {
|
|
|
|
|
|
return "", errors.New("failed to extract container ID from cgroup file")
|
|
|
|
|
|
}
|
|
|
|
|
|
containerID := match[1]
|
|
|
|
|
|
return containerID, nil
|
|
|
|
|
|
}
|
|
|
|
|
|
func getImageId(container_id string, sock_path string) (string, error) {
|
|
|
|
|
|
// 连接 containerd daemon
|
|
|
|
|
|
client, err := containerd.New(sock_path)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return "", err
|
|
|
|
|
|
}
|
|
|
|
|
|
defer client.Close()
|
|
|
|
|
|
// 根据容器 ID 获取容器信息
|
|
|
|
|
|
ctx := namespaces.WithNamespace(context.Background(), "k8s.io")
|
|
|
|
|
|
container, err := client.LoadContainer(ctx, container_id)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return "", err
|
|
|
|
|
|
}
|
|
|
|
|
|
// 获取容器关联的镜像信息
|
|
|
|
|
|
imageRef, err := container.Image(ctx)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return "", err
|
|
|
|
|
|
}
|
|
|
|
|
|
return imageRef.Name(), nil
|
|
|
|
|
|
}
|
2023-04-14 15:31:59 +08:00
|
|
|
|
func writeCoreConfig(config types.Coredump_config) error {
|
2023-04-18 15:27:42 +08:00
|
|
|
|
filename := fmt.Sprintf("%s_%s_%d_coredump.config", config.Initial_ns_pid, config.Process_ns_pid, config.Timestamp)
|
2023-04-14 16:50:48 +08:00
|
|
|
|
file, err := os.Create(filename)
|
2023-04-14 15:31:59 +08:00
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
|
|
|
|
|
encoder := json.NewEncoder(file)
|
|
|
|
|
|
err = encoder.Encode(&config)
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
|
|
|
|
|
return nil
|
|
|
|
|
|
}
|
2023-04-14 16:50:48 +08:00
|
|
|
|
func writeCoreDumpToFile(config types.Coredump_config) error {
|
2023-04-18 15:27:42 +08:00
|
|
|
|
filename := fmt.Sprintf("%s_%s_%d_coredump.info", config.Initial_ns_pid, config.Process_ns_pid, config.Timestamp)
|
2023-04-14 16:50:48 +08:00
|
|
|
|
file, err := os.Create(filename)
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
|
|
|
|
|
defer file.Close()
|
|
|
|
|
|
|
2023-04-14 16:35:59 +08:00
|
|
|
|
// 创建一个管道
|
|
|
|
|
|
reader, writer := io.Pipe()
|
|
|
|
|
|
// 将标准输入连接到管道的写入端
|
|
|
|
|
|
go func() {
|
|
|
|
|
|
defer writer.Close()
|
|
|
|
|
|
io.Copy(writer, os.Stdin)
|
|
|
|
|
|
}()
|
|
|
|
|
|
|
|
|
|
|
|
// 从管道的读取端将内容写入文件
|
|
|
|
|
|
io.Copy(file, reader)
|
2023-04-10 18:30:40 +08:00
|
|
|
|
return nil
|
|
|
|
|
|
}
|
2023-04-14 16:50:48 +08:00
|
|
|
|
func compress(config types.Coredump_config) error {
|
2023-04-11 11:27:04 +08:00
|
|
|
|
// Create a new zip archive.
|
2023-04-18 15:27:42 +08:00
|
|
|
|
filename := fmt.Sprintf("%s_%s_%d_coredump.info", config.Initial_ns_pid, config.Process_ns_pid, config.Timestamp)
|
2023-04-14 16:50:48 +08:00
|
|
|
|
zipfile, err := os.Create(filename + ".zip")
|
2023-04-11 11:27:04 +08:00
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
|
|
|
|
|
defer zipfile.Close()
|
|
|
|
|
|
|
|
|
|
|
|
// Create a new zip writer.
|
|
|
|
|
|
zipwriter := zip.NewWriter(zipfile)
|
|
|
|
|
|
defer zipwriter.Close()
|
|
|
|
|
|
|
|
|
|
|
|
// Create a zip file header.
|
|
|
|
|
|
header := &zip.FileHeader{
|
2023-04-14 16:50:48 +08:00
|
|
|
|
Name: filename,
|
2023-04-11 11:27:04 +08:00
|
|
|
|
Method: zip.Deflate,
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// Write the header to the zip file.
|
|
|
|
|
|
writer, err := zipwriter.CreateHeader(header)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
2023-04-14 16:35:59 +08:00
|
|
|
|
io.Copy(writer, os.Stdin)
|
2023-04-11 11:27:04 +08:00
|
|
|
|
|
|
|
|
|
|
return nil
|
|
|
|
|
|
}
|
2023-04-10 18:30:40 +08:00
|
|
|
|
func main() {
|
2023-04-23 18:24:42 +08:00
|
|
|
|
info := fmt.Sprintf("start handle coredump")
|
|
|
|
|
|
journal.Print(journal.PriInfo, info)
|
2023-04-14 15:31:59 +08:00
|
|
|
|
flag.StringVar(&coredump_config.Initial_ns_pid, "P", "", "initial ns pid")
|
|
|
|
|
|
flag.StringVar(&coredump_config.Process_ns_pid, "p", "", "process ns pid")
|
|
|
|
|
|
flag.StringVar(&coredump_config.Process_exe_path, "E", "", "pathname of executable process")
|
|
|
|
|
|
flag.StringVar(&coredump_config.Corepipe_config_path, "configpath", "", "configfile's path")
|
2023-04-18 15:27:42 +08:00
|
|
|
|
flag.Int64Var(&coredump_config.Timestamp, "t", 0, "the time of coredump")
|
|
|
|
|
|
flag.StringVar(&coredump_config.GID, "g", "", "Numeric real GID of dumped process.")
|
|
|
|
|
|
flag.IntVar(&coredump_config.Signal, "s", -1, "Number of signal causing dump")
|
|
|
|
|
|
flag.StringVar(&coredump_config.UID, "u", "", "Numeric real UID of dumped process.")
|
2023-04-14 15:31:59 +08:00
|
|
|
|
flag.Parse()
|
2023-04-23 18:24:42 +08:00
|
|
|
|
var err error
|
|
|
|
|
|
coredump_config.Hostname, err = os.Hostname()
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
journal.Print(journal.PriErr, err.Error())
|
|
|
|
|
|
}
|
|
|
|
|
|
info = fmt.Sprintf("initialize command line parameters. -P=%s -p=%s -E=%s -configpath=%s -t=%d -g=%s -h=%s -s=%d -u=%s", coredump_config.Initial_ns_pid, coredump_config.Process_ns_pid, coredump_config.Process_exe_path, coredump_config.Corepipe_config_path, coredump_config.Timestamp, coredump_config.GID, coredump_config.Hostname, coredump_config.Signal, coredump_config.UID)
|
2023-04-14 19:18:47 +08:00
|
|
|
|
journal.Print(journal.PriInfo, info)
|
2023-04-14 15:31:59 +08:00
|
|
|
|
coredump_config.Process_exe_path = strings.Replace(coredump_config.Process_exe_path, "!", "/", -1)
|
|
|
|
|
|
//判断参数读取是否正确
|
2023-04-23 18:24:42 +08:00
|
|
|
|
err = argsJudge()
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if err != nil {
|
2023-04-12 16:13:21 +08:00
|
|
|
|
journal.Print(journal.PriErr, err.Error())
|
2023-04-10 18:30:40 +08:00
|
|
|
|
return
|
|
|
|
|
|
}
|
2023-04-11 16:47:19 +08:00
|
|
|
|
//读取config文件并初始化
|
2023-04-14 15:31:59 +08:00
|
|
|
|
pipe_config, err := config.PipeInit(coredump_config.Corepipe_config_path)
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if err != nil {
|
2023-04-12 16:13:21 +08:00
|
|
|
|
journal.Print(journal.PriErr, err.Error())
|
2023-04-10 18:30:40 +08:00
|
|
|
|
return
|
|
|
|
|
|
}
|
2023-04-11 16:47:19 +08:00
|
|
|
|
//判断硬盘使用率
|
2023-04-12 17:52:13 +08:00
|
|
|
|
flag, err := isDiskSufficient(pipe_config)
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if err != nil && !flag {
|
2023-04-12 16:13:21 +08:00
|
|
|
|
journal.Print(journal.PriErr, err.Error())
|
2023-04-10 18:30:40 +08:00
|
|
|
|
return
|
|
|
|
|
|
}
|
2023-04-11 16:47:19 +08:00
|
|
|
|
//创建存储coredump内容文件夹
|
2023-04-14 15:31:59 +08:00
|
|
|
|
err = createCoreDumpDir(&pipe_config, coredump_config)
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if err != nil {
|
2023-04-12 16:13:21 +08:00
|
|
|
|
journal.Print(journal.PriErr, err.Error())
|
2023-04-10 18:30:40 +08:00
|
|
|
|
return
|
|
|
|
|
|
}
|
2023-04-27 17:20:57 +08:00
|
|
|
|
coredump_config.Storage = pipe_config.Storage
|
2023-04-11 16:47:19 +08:00
|
|
|
|
//切换至存储coredump目录
|
2023-04-27 17:20:57 +08:00
|
|
|
|
err = changeDirectory(pipe_config.Storage)
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if err != nil {
|
2023-04-12 16:13:21 +08:00
|
|
|
|
journal.Print(journal.PriErr, err.Error())
|
2023-04-10 18:30:40 +08:00
|
|
|
|
return
|
|
|
|
|
|
}
|
2023-04-11 16:47:19 +08:00
|
|
|
|
//查找发生coredump进程对应的container id
|
2023-04-14 15:31:59 +08:00
|
|
|
|
container_id, err := getContainerId(coredump_config.Initial_ns_pid)
|
2023-04-11 16:47:19 +08:00
|
|
|
|
//根据查找到的container id查找对应的image name
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if err == nil && len(container_id) != 0 {
|
2023-04-14 15:31:59 +08:00
|
|
|
|
coredump_config.Image_id, err = getImageId(container_id, pipe_config.Containered_sock_path)
|
2023-04-10 18:30:40 +08:00
|
|
|
|
if err != nil {
|
2023-04-12 16:13:21 +08:00
|
|
|
|
journal.Print(journal.PriInfo, err.Error())
|
2023-04-10 18:30:40 +08:00
|
|
|
|
}
|
|
|
|
|
|
}
|
2023-04-27 17:20:57 +08:00
|
|
|
|
if coredump_config.Image_id == "" {
|
|
|
|
|
|
coredump_config.Image_id = "NULL"
|
|
|
|
|
|
}
|
2023-04-11 16:47:19 +08:00
|
|
|
|
//根据配置项选择存储coredump文件方式
|
2023-04-27 17:20:57 +08:00
|
|
|
|
if pipe_config.Compress == false {
|
2023-04-14 16:50:48 +08:00
|
|
|
|
err = writeCoreDumpToFile(coredump_config)
|
2023-04-11 11:27:04 +08:00
|
|
|
|
if err != nil {
|
2023-04-12 16:13:21 +08:00
|
|
|
|
journal.Print(journal.PriErr, err.Error())
|
2023-04-11 11:27:04 +08:00
|
|
|
|
}
|
2023-04-27 17:20:57 +08:00
|
|
|
|
coredump_config.Storage = fmt.Sprintf("%s/%s_%s_%d_coredump.info", pipe_config.Storage, coredump_config.Initial_ns_pid, coredump_config.Process_ns_pid, coredump_config.Timestamp)
|
|
|
|
|
|
} else if pipe_config.Compress == true {
|
2023-04-14 16:50:48 +08:00
|
|
|
|
err = compress(coredump_config)
|
2023-04-11 11:27:04 +08:00
|
|
|
|
if err != nil {
|
2023-04-12 16:13:21 +08:00
|
|
|
|
journal.Print(journal.PriErr, err.Error())
|
2023-04-11 11:27:04 +08:00
|
|
|
|
}
|
2023-04-27 17:20:57 +08:00
|
|
|
|
coredump_config.Storage = fmt.Sprintf("%s/%s_%s_%d_coredump.info.zip", pipe_config.Storage, coredump_config.Initial_ns_pid, coredump_config.Process_ns_pid, coredump_config.Timestamp)
|
2023-04-23 18:24:42 +08:00
|
|
|
|
}
|
|
|
|
|
|
//将image name写入coredump config
|
|
|
|
|
|
err = writeCoreConfig(coredump_config)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
journal.Print(journal.PriInfo, err.Error())
|
2023-04-10 18:30:40 +08:00
|
|
|
|
}
|
|
|
|
|
|
}
|