-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathprocess.go
116 lines (100 loc) · 1.93 KB
/
process.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
package main
import (
"bytes"
"fmt"
"io"
"os"
"sync"
)
func groupByHash(files []string, workers uint) (map[string][]string, error) {
type hashResult struct {
hash string
file string
err error
}
hashChan := make(chan string, len(files))
resultChan := make(chan hashResult, len(files))
var wg sync.WaitGroup
for range workers {
wg.Add(1)
go func() {
defer wg.Done()
for file := range hashChan {
h, err := createFileHash(file)
resultChan <- hashResult{h, file, err}
}
}()
}
go func() {
for _, file := range files {
hashChan <- file
}
close(hashChan)
}()
go func() {
wg.Wait()
close(resultChan)
}()
m := make(map[string][]string)
for res := range resultChan {
if res.err != nil {
return nil, res.err
}
m[res.hash] = append(m[res.hash], res.file)
}
mm := make(map[string][]string)
for k, v := range m {
if len(v) > 1 {
mm[k] = v
}
}
return mm, nil
}
// filesAreEqual reports whether the files at file1 and file2 have identical
// contents. Both files are opened and compared chunk by chunk, so memory use
// is constant regardless of file size.
//
// It returns an error if either file cannot be opened or if a read fails for
// any reason other than reaching the end of the file. A read failure is
// always reported as an error, never as "files differ".
func filesAreEqual(file1, file2 string) (bool, error) {
	f1, err := os.Open(file1)
	if err != nil {
		return false, err
	}
	defer f1.Close()

	f2, err := os.Open(file2)
	if err != nil {
		return false, err
	}
	defer f2.Close()

	const chunkSize = 4096
	buf1 := make([]byte, chunkSize)
	buf2 := make([]byte, chunkSize)

	for {
		// io.ReadFull keeps reading until the buffer is full or the stream
		// ends. A plain Read may legally return fewer bytes than requested,
		// which would make the two sides drift out of step and report
		// identical files as different.
		n1, err1 := io.ReadFull(f1, buf1)
		n2, err2 := io.ReadFull(f2, buf2)

		// io.EOF (nothing read) and io.ErrUnexpectedEOF (partial chunk) both
		// just mean "this was the last chunk"; anything else is a failure.
		done1 := err1 == io.EOF || err1 == io.ErrUnexpectedEOF
		if err1 != nil && !done1 {
			return false, fmt.Errorf("reading %q: %w", file1, err1)
		}
		done2 := err2 == io.EOF || err2 == io.ErrUnexpectedEOF
		if err2 != nil && !done2 {
			return false, fmt.Errorf("reading %q: %w", file2, err2)
		}

		// bytes.Equal also compares lengths, so a size difference shows up
		// here as a mismatch in the final chunk.
		if !bytes.Equal(buf1[:n1], buf2[:n2]) {
			return false, nil
		}
		if done1 || done2 {
			return done1 && done2, nil
		}
	}
}
// partitionIntoEqualGroups splits files into groups using filesAreEqual.
// Each file is compared against the first member of every existing group, in
// order, and joins the first group for which filesAreEqual reports true. A
// file that matches no group starts a new one. Groups appear in the order
// their first member occurs in files.
//
// The first error returned by filesAreEqual aborts the partitioning and is
// returned with a nil result.
func partitionIntoEqualGroups(files []string) ([][]string, error) {
	var groups [][]string

nextFile:
	for _, candidate := range files {
		for idx := range groups {
			// The first member acts as the representative of its group.
			same, err := filesAreEqual(groups[idx][0], candidate)
			if err != nil {
				return nil, err
			}
			if same {
				groups[idx] = append(groups[idx], candidate)
				continue nextFile
			}
		}
		// No existing group matched: candidate starts its own.
		groups = append(groups, []string{candidate})
	}

	return groups, nil
}