Implement type sussination

This commit is contained in:
2025-03-08 11:01:23 +01:00
parent fff7e62cd1
commit 1d0517ab66

65
main.go
View File

@@ -1,6 +1,8 @@
package main package main
import ( import (
"bufio"
"flag"
"fmt" "fmt"
"log" "log"
"os" "os"
@@ -27,14 +29,71 @@ func init() {
} }
func main() { func main() {
flag.Parse()
dir := flag.Arg(0)
if dir == "" {
dir = "."
}
dir = NormalizePath(dir)
log.Printf("Scanning directory: %s", dir)
files := make(chan string, 10000) files := make(chan string, 10000)
status := make(chan error) status := make(chan error)
go GetSyncFilesRecursively(".", files, status) go GetSyncFilesRecursively(dir, files, status)
typeByExtension := sync.Map{}
countByExtension := sync.Map{}
wg := sync.WaitGroup{}
for file := range files { for file := range files {
log.Println(file) wg.Add(1)
go func(file string) {
defer wg.Done()
f, err := os.Open(file)
if err != nil {
log.Printf("Error opening file %s: %v", file, err)
return
} }
scanner := bufio.NewScanner(f)
if scanner.Scan() {
ext := filepath.Ext(file)
count, _ := countByExtension.LoadOrStore(ext, 0)
if IsStringBinary(scanner.Text()) {
log.Printf("Binary file: %s (%s)", file, ext)
typeByExtension.Store(ext, "binary")
countByExtension.Store(ext, count.(int)+1)
} else {
log.Printf("Text file: %s (%s)", file, ext)
typeByExtension.Store(ext, "text")
countByExtension.Store(ext, count.(int)+1)
}
} else if err := scanner.Err(); err != nil {
log.Printf("Error reading line from file %s: %v", file, err)
}
f.Close()
}(file)
}
wg.Wait()
countByExtension.Range(func(key, value any) bool {
typ, ok := typeByExtension.Load(key)
if !ok {
typ = "unknown"
}
log.Printf("Extension: %s, Type: %s, Count: %d", key, typ, value.(int))
return true
})
}
func IsStringBinary(s string) bool {
for _, c := range s {
if c < ' ' || c > '~' {
return true
}
}
return false
} }
func GetSyncFilesRecursively(input string, output chan string, status chan error) { func GetSyncFilesRecursively(input string, output chan string, status chan error) {
@@ -141,7 +200,7 @@ func processDirectory(directory string, directories chan<- string, output chan<-
} }
} }
func NormalizePath(input, workdir string) string { func NormalizePath(input string) string {
input = filepath.Clean(input) input = filepath.Clean(input)
input = filepath.ToSlash(input) input = filepath.ToSlash(input)
input = strings.ReplaceAll(input, "\"", "") input = strings.ReplaceAll(input, "\"", "")