2023-06-15 01:08:09 +00:00
|
|
|
package search
|
|
|
|
|
|
|
|
import (
|
|
|
|
"log"
|
|
|
|
"os"
|
|
|
|
"path/filepath"
|
2023-06-18 15:04:31 +00:00
|
|
|
"sort"
|
2023-06-15 01:08:09 +00:00
|
|
|
"strings"
|
2023-06-16 17:29:43 +00:00
|
|
|
"sync"
|
2023-06-15 01:08:09 +00:00
|
|
|
"time"
|
2023-07-04 23:55:15 +00:00
|
|
|
"mime"
|
2023-06-15 01:08:09 +00:00
|
|
|
)
|
|
|
|
|
2023-06-16 17:29:43 +00:00
|
|
|
// Package-level state shared by the indexing and search functions in this file.
var (
	// rootPath is the directory the index is built from.
	rootPath = "/srv"

	// indexes holds the indexed paths; this file stores them under the
	// "dirs" and "files" keys.
	indexes = make(map[string][]string)

	// mutex guards indexes: addToIndex takes the write lock and
	// SearchAllIndexes takes the read lock.
	mutex sync.RWMutex

	// lastIndexed is the start time of the most recent indexing pass that
	// was recorded; indexFiles skips directories modified before it.
	lastIndexed time.Time
)
|
2023-06-15 01:08:09 +00:00
|
|
|
|
2023-06-15 15:30:49 +00:00
|
|
|
func InitializeIndex(intervalMinutes uint32) {
|
2023-06-15 01:08:09 +00:00
|
|
|
// Initialize the indexes map
|
2023-06-16 17:29:43 +00:00
|
|
|
indexes = make(map[string][]string)
|
2023-07-13 02:23:29 +00:00
|
|
|
indexes["dirs"] = []string{}
|
|
|
|
indexes["files"] = []string{}
|
2023-06-16 17:29:43 +00:00
|
|
|
var numFiles, numDirs int
|
2023-06-15 15:30:49 +00:00
|
|
|
log.Println("Indexing files...")
|
2023-06-16 17:29:43 +00:00
|
|
|
lastIndexedStart := time.Now()
|
2023-06-15 01:08:09 +00:00
|
|
|
// Call the function to index files and directories
|
2023-06-18 15:04:31 +00:00
|
|
|
totalNumFiles, totalNumDirs, err := indexFiles(rootPath, &numFiles, &numDirs)
|
2023-06-15 01:08:09 +00:00
|
|
|
if err != nil {
|
|
|
|
log.Fatal(err)
|
|
|
|
}
|
2023-06-16 17:29:43 +00:00
|
|
|
lastIndexed = lastIndexedStart
|
2023-06-15 15:30:49 +00:00
|
|
|
go indexingScheduler(intervalMinutes)
|
|
|
|
log.Println("Successfully indexed files.")
|
2023-06-18 15:04:31 +00:00
|
|
|
log.Println("Files found :", totalNumFiles)
|
|
|
|
log.Println("Directories found :", totalNumDirs)
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
|
|
|
|
2023-06-15 15:30:49 +00:00
|
|
|
func indexingScheduler(intervalMinutes uint32) {
|
2023-06-18 15:04:31 +00:00
|
|
|
log.Printf("Indexing scheduler will run every %v minutes", intervalMinutes)
|
2023-06-15 15:30:49 +00:00
|
|
|
for {
|
|
|
|
time.Sleep(time.Duration(intervalMinutes) * time.Minute)
|
2023-06-16 17:29:43 +00:00
|
|
|
var numFiles, numDirs int
|
|
|
|
lastIndexedStart := time.Now()
|
2023-06-18 15:04:31 +00:00
|
|
|
totalNumFiles, totalNumDirs, err := indexFiles(rootPath, &numFiles, &numDirs)
|
2023-06-15 15:30:49 +00:00
|
|
|
if err != nil {
|
|
|
|
log.Fatal(err)
|
|
|
|
}
|
2023-06-16 17:29:43 +00:00
|
|
|
lastIndexed = lastIndexedStart
|
|
|
|
if totalNumFiles+totalNumDirs > 0 {
|
|
|
|
log.Println("re-indexing found changes and updated the index.")
|
|
|
|
}
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Define a function to recursively index files and directories
|
2023-06-18 15:04:31 +00:00
|
|
|
func indexFiles(path string, numFiles *int, numDirs *int) (int, int, error) {
|
2023-06-15 01:08:09 +00:00
|
|
|
// Check if the current directory has been modified since last indexing
|
|
|
|
dir, err := os.Open(path)
|
|
|
|
if err != nil {
|
|
|
|
// directory must have been deleted, remove from index
|
|
|
|
delete(indexes, path)
|
|
|
|
}
|
|
|
|
defer dir.Close()
|
|
|
|
dirInfo, err := dir.Stat()
|
|
|
|
if err != nil {
|
2023-06-18 15:04:31 +00:00
|
|
|
return *numFiles, *numDirs, err
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
|
|
|
// Compare the last modified time of the directory with the last indexed time
|
2023-06-16 17:29:43 +00:00
|
|
|
if dirInfo.ModTime().Before(lastIndexed) {
|
2023-06-18 15:04:31 +00:00
|
|
|
return *numFiles, *numDirs, nil
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
|
|
|
// Read the directory contents
|
|
|
|
files, err := dir.Readdir(-1)
|
|
|
|
if err != nil {
|
2023-06-18 15:04:31 +00:00
|
|
|
return *numFiles, *numDirs, err
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
|
|
|
// Iterate over the files and directories
|
|
|
|
for _, file := range files {
|
|
|
|
if file.IsDir() {
|
2023-06-16 17:29:43 +00:00
|
|
|
*numDirs++
|
2023-07-13 02:23:29 +00:00
|
|
|
addToIndex(path, file.Name(), true)
|
|
|
|
indexFiles(path+"/"+file.Name(), numFiles, numDirs) // recursive
|
|
|
|
} else {
|
|
|
|
*numFiles++
|
|
|
|
addToIndex(path, file.Name(), false)
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
|
|
|
}
|
2023-06-18 15:04:31 +00:00
|
|
|
return *numFiles, *numDirs, nil
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
|
|
|
|
2023-07-13 02:23:29 +00:00
|
|
|
func addToIndex(path string, fileName string, isDir bool) {
|
2023-06-16 17:29:43 +00:00
|
|
|
mutex.Lock()
|
|
|
|
defer mutex.Unlock()
|
2023-06-18 15:04:31 +00:00
|
|
|
path = strings.TrimPrefix(path, rootPath+"/")
|
|
|
|
path = strings.TrimSuffix(path, "/")
|
2023-07-13 02:23:29 +00:00
|
|
|
adjustedPath := path + "/" + fileName
|
2023-06-16 17:29:43 +00:00
|
|
|
if path == rootPath {
|
2023-07-13 02:23:29 +00:00
|
|
|
adjustedPath = fileName
|
2023-06-16 17:29:43 +00:00
|
|
|
}
|
2023-07-13 02:23:29 +00:00
|
|
|
if isDir {
|
|
|
|
indexes["dirs"] = append(indexes["dirs"], adjustedPath)
|
|
|
|
}else{
|
|
|
|
indexes["files"] = append(indexes["files"], adjustedPath)
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-17 05:17:52 +00:00
|
|
|
func SearchAllIndexes(search string, scope string) ([]string, map[string]map[string]bool) {
|
2023-06-18 15:04:31 +00:00
|
|
|
searchOptions := ParseSearch(search)
|
2023-06-16 17:29:43 +00:00
|
|
|
mutex.RLock()
|
|
|
|
defer mutex.RUnlock()
|
2023-07-13 02:23:29 +00:00
|
|
|
fileListTypes := make(map[string]map[string]bool)
|
2023-07-17 05:17:52 +00:00
|
|
|
var matching []string
|
2023-07-13 02:23:29 +00:00
|
|
|
maximum := 125
|
|
|
|
|
2023-06-18 15:04:31 +00:00
|
|
|
for _, searchTerm := range searchOptions.Terms {
|
2023-07-04 23:55:15 +00:00
|
|
|
if searchTerm == "" {
|
|
|
|
continue
|
|
|
|
}
|
2023-07-13 02:23:29 +00:00
|
|
|
count := 0
|
2023-06-18 15:04:31 +00:00
|
|
|
// Iterate over the indexes
|
2023-07-13 02:23:29 +00:00
|
|
|
for _, dirName := range indexes["dirs"] {
|
2023-06-18 15:04:31 +00:00
|
|
|
if count > maximum {
|
|
|
|
break
|
|
|
|
}
|
2023-07-13 02:23:29 +00:00
|
|
|
pathName := scopedPathNameFilter(dirName, scope)
|
|
|
|
if pathName == "" {
|
|
|
|
continue
|
2023-06-16 17:29:43 +00:00
|
|
|
}
|
2023-07-17 05:17:52 +00:00
|
|
|
matches, fileType := containsSearchTerm(pathName, searchTerm, searchOptions.Conditions, true)
|
2023-07-13 02:23:29 +00:00
|
|
|
if !matches {
|
2023-06-15 15:30:49 +00:00
|
|
|
continue
|
|
|
|
}
|
2023-07-13 02:23:29 +00:00
|
|
|
count++
|
2023-07-17 05:17:52 +00:00
|
|
|
matching = append(matching, pathName+"/")
|
|
|
|
fileListTypes[pathName+"/"] = fileType
|
2023-07-13 02:23:29 +00:00
|
|
|
}
|
|
|
|
count = 0
|
|
|
|
for _, fileName := range indexes["files"] {
|
|
|
|
if count > maximum {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
pathName := scopedPathNameFilter(fileName, scope)
|
2023-06-15 15:30:49 +00:00
|
|
|
if pathName == "" {
|
|
|
|
continue
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
2023-07-13 02:23:29 +00:00
|
|
|
// Check if the path name contains the search term
|
2023-07-17 05:17:52 +00:00
|
|
|
matches, fileType := containsSearchTerm(pathName, searchTerm, searchOptions.Conditions, false)
|
2023-07-13 02:23:29 +00:00
|
|
|
if !matches {
|
|
|
|
continue
|
|
|
|
}
|
2023-07-17 05:17:52 +00:00
|
|
|
matching = append(matching, pathName)
|
2023-07-13 02:23:29 +00:00
|
|
|
fileListTypes[pathName] = fileType
|
2023-06-18 15:04:31 +00:00
|
|
|
count++
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
|
|
|
}
|
2023-06-16 17:29:43 +00:00
|
|
|
// Sort the strings based on the number of elements after splitting by "/"
|
2023-07-17 05:17:52 +00:00
|
|
|
sort.Slice(matching, func(i, j int) bool {
|
|
|
|
parts1 := strings.Split(matching[i], "/")
|
|
|
|
parts2 := strings.Split(matching[j], "/")
|
2023-06-16 17:29:43 +00:00
|
|
|
return len(parts1) < len(parts2)
|
|
|
|
})
|
2023-07-17 05:17:52 +00:00
|
|
|
return matching, fileListTypes
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
|
|
|
|
2023-06-15 15:30:49 +00:00
|
|
|
// scopedPathNameFilter restricts pathName to scope.
//
// A leading "/" is removed from scope first. If pathName starts with the
// resulting prefix, the remainder of pathName after that prefix is returned;
// otherwise the empty string is returned. A pathName equal to the prefix
// therefore also yields the empty string.
func scopedPathNameFilter(pathName string, scope string) string {
	prefix := strings.TrimPrefix(scope, "/")
	if !strings.HasPrefix(pathName, prefix) {
		return ""
	}
	return pathName[len(prefix):]
}
|
|
|
|
|
2023-07-17 05:17:52 +00:00
|
|
|
func containsSearchTerm(pathName string, searchTerm string, conditions map[string]bool, isDir bool) (bool, map[string]bool) {
|
2023-07-13 02:23:29 +00:00
|
|
|
path := getLastPathComponent(pathName)
|
|
|
|
fileTypes := map[string]bool{}
|
|
|
|
matchesCondition := false
|
|
|
|
extension := filepath.Ext(strings.ToLower(path))
|
|
|
|
mimetype := mime.TypeByExtension(extension)
|
|
|
|
fileTypes["audio"] = strings.HasPrefix(mimetype, "audio")
|
|
|
|
fileTypes["image"] = strings.HasPrefix(mimetype, "image")
|
|
|
|
fileTypes["video"] = strings.HasPrefix(mimetype, "video")
|
|
|
|
fileTypes["doc"] = isDoc(extension)
|
|
|
|
fileTypes["archive"] = isArchive(extension)
|
2023-07-17 05:17:52 +00:00
|
|
|
fileTypes["dir"] = isDir
|
|
|
|
anyFilter := false
|
|
|
|
for t,v := range conditions {
|
|
|
|
if t == "exact" {
|
|
|
|
continue
|
2023-07-13 02:23:29 +00:00
|
|
|
}
|
2023-07-17 05:17:52 +00:00
|
|
|
matchesCondition = v == fileTypes[t]
|
|
|
|
anyFilter = true
|
2023-07-13 02:23:29 +00:00
|
|
|
}
|
|
|
|
if !anyFilter {
|
|
|
|
matchesCondition = true
|
|
|
|
}
|
2023-07-04 23:55:15 +00:00
|
|
|
if !conditions["exact"] {
|
|
|
|
path = strings.ToLower(path)
|
|
|
|
searchTerm = strings.ToLower(searchTerm)
|
|
|
|
}
|
2023-07-13 02:23:29 +00:00
|
|
|
return strings.Contains(path, searchTerm) && matchesCondition, fileTypes
|
|
|
|
}
|
|
|
|
|
|
|
|
func isDoc(extension string) bool {
|
|
|
|
for _, typefile := range documentTypes {
|
|
|
|
if extension == typefile {
|
|
|
|
return true
|
2023-07-04 23:55:15 +00:00
|
|
|
}
|
2023-07-13 02:23:29 +00:00
|
|
|
}
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
func isArchive(extension string) bool {
|
|
|
|
for _, typefile := range compressedFile {
|
|
|
|
if extension == typefile {
|
|
|
|
return true
|
2023-07-04 23:55:15 +00:00
|
|
|
}
|
2023-07-13 02:23:29 +00:00
|
|
|
}
|
|
|
|
return false
|
2023-06-15 01:08:09 +00:00
|
|
|
}
|
2023-06-18 15:04:31 +00:00
|
|
|
|
2023-06-15 01:08:09 +00:00
|
|
|
// getLastPathComponent returns the final element of path, as computed by
// filepath.Base.
func getLastPathComponent(path string) string {
	last := filepath.Base(path)
	return last
}
|