155 lines
4.9 KiB
Go
155 lines
4.9 KiB
Go
package mime
|
||
|
||
import (
|
||
"b612.me/starlog"
|
||
"b612.me/staros"
|
||
"encoding/csv"
|
||
"github.com/gabriel-vasile/mimetype"
|
||
"github.com/spf13/cobra"
|
||
"io"
|
||
"os"
|
||
"path/filepath"
|
||
"strings"
|
||
)
|
||
|
||
// Command-line options of the mime command. Each one is bound to a flag in
// init and read while the command runs.
var (
	// recursive makes a folder argument be scanned including its sub-folders.
	recursive bool
	// verbose switches Detect to its multi-line log format.
	verbose bool
	// repair renames files whose extension disagrees with the detected type.
	repair bool
	// appendOldName makes repair append the detected extension to the full
	// old name instead of replacing the old extension.
	appendOldName bool
	// onlyShowNotMatch suppresses the log line for files that match.
	onlyShowNotMatch bool
	// secondExt also compares the second-to-last extension of the file name.
	secondExt bool

	// outputCsvPath is where the CSV report is written; empty disables it.
	outputCsvPath string

	// fromSize is the byte offset at which detection starts; a negative value
	// is measured from the end of the file.
	fromSize int
)
|
||
|
||
func init() {
|
||
Cmd.Flags().BoolVarP(&recursive, "recursive", "r", false, "递归检测文件夹中的所有文件")
|
||
Cmd.Flags().BoolVarP(&verbose, "verbose", "v", false, "详细模式,输出更多日志")
|
||
Cmd.Flags().BoolVarP(&repair, "repair", "R", false, "修复文件类型,尝试将文件类型修复为正确的类型")
|
||
Cmd.Flags().BoolVarP(&appendOldName, "append-mode", "a", false, "在修复文件名时,追加旧文件名后缀")
|
||
Cmd.Flags().StringVarP(&outputCsvPath, "output-csv", "o", "", "输出CSV文件路径,若不指定则不输出CSV")
|
||
Cmd.Flags().IntVarP(&fromSize, "from-size", "s", 0, "需要检测的地址偏移量,单位为字节,默认从0开始检测,负数表示从文件末尾开始计算偏移量")
|
||
Cmd.Flags().BoolVarP(&onlyShowNotMatch, "only-show-not-match", "m", false, "只显示文件类型不匹配的文件")
|
||
Cmd.Flags().BoolVarP(&secondExt, "second-ext", "S", false, "使用第二个扩展名进行匹配,适用于某些文件类型(如 .tar.gz .7z.001)")
|
||
}
|
||
|
||
var Cmd = &cobra.Command{
|
||
Use: "mime",
|
||
Short: "文件类型检测",
|
||
Long: `mime - 文件类型检测`,
|
||
Run: func(cmd *cobra.Command, args []string) {
|
||
var c *csv.Writer
|
||
if len(args) == 0 {
|
||
starlog.Errorf("请指定文件路径\n")
|
||
os.Exit(1)
|
||
}
|
||
if outputCsvPath != "" {
|
||
file, err := os.Create(outputCsvPath)
|
||
if err != nil {
|
||
starlog.Errorf("创建CSV文件 %s 失败: %v\n", outputCsvPath, err)
|
||
os.Exit(1)
|
||
}
|
||
defer file.Close()
|
||
c = csv.NewWriter(file)
|
||
c.Write([]string{"File Path", "Extension", "Detect File Type", "Detect File Extension", "Match"})
|
||
defer c.Flush()
|
||
}
|
||
for _, path := range args {
|
||
if staros.IsFolder(path) {
|
||
for _, file := range getFiles(path, recursive) {
|
||
Detect(c, file, fromSize, onlyShowNotMatch)
|
||
}
|
||
} else {
|
||
Detect(c, path, fromSize, onlyShowNotMatch)
|
||
}
|
||
}
|
||
},
|
||
}
|
||
|
||
func getFiles(folder string, recurring bool) []string {
|
||
files := make([]string, 0)
|
||
err := filepath.Walk(folder, func(path string, info os.FileInfo, err error) error {
|
||
if err != nil {
|
||
starlog.Errorf("walk folder %s error: %v", folder, err)
|
||
return err
|
||
}
|
||
if info.IsDir() {
|
||
if recurring {
|
||
return nil // 继续递归
|
||
}
|
||
return filepath.SkipDir // 不递归子目录
|
||
}
|
||
files = append(files, path)
|
||
return nil
|
||
})
|
||
if err != nil {
|
||
starlog.Errorf("walk folder %s error: %v", folder, err)
|
||
}
|
||
return files
|
||
}
|
||
|
||
func Detect(c *csv.Writer, path string, fromSize int, onlyShowNotMatch bool) {
|
||
f, err := os.Open(path)
|
||
if err != nil {
|
||
starlog.Errorf("open file %s error: %v\n", path, err)
|
||
os.Exit(1)
|
||
}
|
||
if fromSize > 0 {
|
||
f.Seek(int64(fromSize), io.SeekStart)
|
||
} else if fromSize < 0 {
|
||
f.Seek(int64(fromSize), io.SeekEnd)
|
||
}
|
||
tp, err := mimetype.DetectReader(f)
|
||
f.Close()
|
||
if err != nil {
|
||
starlog.Errorf("detect file type error: %v\n", err)
|
||
os.Exit(1)
|
||
}
|
||
ext := strings.ToLower(filepath.Ext(path))
|
||
ext2 := strings.ToLower(filepath.Ext(strings.TrimRight(path, ext)))
|
||
if verbose {
|
||
starlog.Infof("file path: %s\n", path)
|
||
starlog.Infof("file type: %s\n", tp.String())
|
||
starlog.Infof("file ext: %s\n", tp.Extension())
|
||
if ext2 == tp.Extension() && secondExt {
|
||
if !onlyShowNotMatch {
|
||
starlog.Infof("file type %s match extension %s\n", tp.String(), ext2)
|
||
}
|
||
} else if ext != tp.Extension() && tp.Extension() != "" {
|
||
starlog.Warningf("file type %s not match extension %s\n", tp.String(), ext)
|
||
} else if !onlyShowNotMatch {
|
||
starlog.Infof("file type %s match extension %s\n", tp.String(), ext)
|
||
}
|
||
} else {
|
||
if ext2 == tp.Extension() && secondExt {
|
||
if !onlyShowNotMatch {
|
||
starlog.Infof("%s: %s (%s) matched %s\n", path, tp.String(), tp.Extension(), ext2)
|
||
}
|
||
} else if ext != tp.Extension() && tp.Extension() != "" {
|
||
starlog.Warningf("%s: %s (%s) not match %s\n", path, tp.String(), tp.Extension(), ext)
|
||
} else if !onlyShowNotMatch {
|
||
starlog.Infof("%s: %s (%s) matched %s\n", path, tp.String(), tp.Extension(), ext)
|
||
}
|
||
}
|
||
if c != nil {
|
||
match := "false"
|
||
if ext == tp.Extension() {
|
||
match = "true"
|
||
}
|
||
err = c.Write([]string{path, ext, tp.String(), tp.Extension(), match})
|
||
if err != nil {
|
||
starlog.Errorf("write csv file %s error: %v\n", outputCsvPath, err)
|
||
}
|
||
}
|
||
if repair && ext != tp.Extension() && tp.Extension() != "" {
|
||
newPath := path[:len(path)-len(ext)] + tp.Extension()
|
||
if appendOldName {
|
||
newPath = path + tp.Extension()
|
||
}
|
||
err = os.Rename(path, newPath)
|
||
if err != nil {
|
||
starlog.Errorf("rename file %s to %s error: %v", path, newPath, err)
|
||
os.Exit(1)
|
||
}
|
||
if verbose {
|
||
starlog.Infof("file %s renamed to %s\n", path, newPath)
|
||
} else {
|
||
starlog.Infof("renamed: %s -> %s\n", path, newPath)
|
||
}
|
||
}
|
||
}
|