-
Notifications
You must be signed in to change notification settings - Fork 1
/
scan.go
92 lines (83 loc) · 1.91 KB
/
scan.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
package main
import (
"errors"
"fmt"
"github.com/spf13/viper"
"io"
"io/ioutil"
"net/http"
"os"
"os/exec"
"path/filepath"
"strings"
)
const mapping = `
{
"mappings": {
"file": {
"properties": {
"path": {
"type": "keyword"
},
"user": {
"type": "keyword"
},
"group": {
"type": "keyword"
},
"size": {
"type": "long"
},
"alloc_size": {
"type": "long"
},
"type": {
"type": "keyword"
},
"mtime": {
"type": "date"
},
"atime": {
"type": "date"
}
}
}
},
"settings": {
"number_of_shards": "10",
"number_of_replicas": "0"
}
}
`
const maxTikaSize = 65536
var client = &http.Client{Transport: &http.Transport{
MaxIdleConnsPerHost: 24,
}}
func sendFileToTika(filename string) (string, error) {
inp, _ := os.Open(filename)
request, _ := http.NewRequest("PUT", viper.GetString("tika_url"), &io.LimitedReader{R: inp, N: maxTikaSize})
request.Header.Add("Content-Disposition", fmt.Sprintf("attachment; filename=%s", strings.Replace(filepath.Base(filename), ":", "", -1)))
response, err := client.Do(request)
if err != nil {
return "", err
}
defer response.Body.Close()
contents, err := ioutil.ReadAll(response.Body)
if err != nil {
return "", err
}
return string(contents), nil
}
func getFileType(path string) (string, error) {
if viper.IsSet("tika_jar") {
retType, err := exec.Command("java", "-jar", viper.GetString("tika_jar"), "-d", path).Output()
retTypeStr := strings.TrimSpace(string(retType))
return retTypeStr, err
}
if viper.IsSet("tika_url") {
contentType, err := sendFileToTika(path)
retTypeStr := strings.TrimSpace(contentType)
return retTypeStr, err
}
return "", errors.New("Tika settings not set")
}