1
Fork 0
photoview/api/scanner/scanner.go

274 lines
6.4 KiB
Go
Raw Normal View History

2020-02-01 17:58:45 +01:00
package scanner
import (
"container/list"
"database/sql"
"fmt"
"io/ioutil"
"log"
"os"
"path"
2020-02-12 18:10:52 +01:00
"strconv"
"strings"
2020-02-01 17:58:45 +01:00
"github.com/h2non/filetype"
"github.com/viktorstrate/photoview/api/graphql/models"
)
2020-02-09 14:21:53 +01:00
type scanner_cache map[string]interface{}
func (cache *scanner_cache) insert_photo_type(path string, content_type string) {
(*cache)["photo_type/"+path] = content_type
}
func (cache *scanner_cache) get_photo_type(path string) *string {
result := (*cache)["photo_type/"+path]
if result == nil {
return nil
}
photo_type := result.(string)
return &photo_type
}
2020-02-09 21:25:33 +01:00
func ScanUser(database *sql.DB, userId int) error {
2020-02-01 17:58:45 +01:00
row := database.QueryRow("SELECT * FROM user WHERE user_id = ?", userId)
user, err := models.NewUserFromRow(row)
if err != nil {
log.Printf("Could not find user to scan: %s\n", err.Error())
return err
}
log.Printf("Starting scan for user '%s'\n", user.Username)
go scan(database, user)
return nil
}
func scan(database *sql.DB, user *models.User) {
2020-02-12 18:10:52 +01:00
// Start scanning
2020-02-09 14:21:53 +01:00
scanner_cache := make(scanner_cache)
2020-02-12 18:10:52 +01:00
album_paths_scanned := make([]interface{}, 0)
2020-02-09 14:21:53 +01:00
2020-02-01 17:58:45 +01:00
type scanInfo struct {
path string
parentId *int
}
scanQueue := list.New()
scanQueue.PushBack(scanInfo{
path: user.RootPath,
parentId: nil,
})
for scanQueue.Front() != nil {
albumInfo := scanQueue.Front().Value.(scanInfo)
scanQueue.Remove(scanQueue.Front())
albumPath := albumInfo.path
albumParentId := albumInfo.parentId
2020-02-12 18:10:52 +01:00
album_paths_scanned = append(album_paths_scanned, albumPath)
2020-02-01 17:58:45 +01:00
// Read path
dirContent, err := ioutil.ReadDir(albumPath)
if err != nil {
log.Printf("Could not read directory: %s\n", err.Error())
return
}
tx, err := database.Begin()
if err != nil {
log.Printf("ERROR: Could not begin database transaction: %s\n", err)
return
}
log.Printf("Scanning directory: %s", albumPath)
// Make album if not exists
albumTitle := path.Base(albumPath)
_, err = tx.Exec("INSERT IGNORE INTO album (title, parent_album, owner_id, path) VALUES (?, ?, ?, ?)", albumTitle, albumParentId, user.UserID, albumPath)
if err != nil {
fmt.Printf("ERROR: Could not insert album into database: %s\n", err)
tx.Rollback()
return
}
row := tx.QueryRow("SELECT album_id FROM album WHERE path = ?", albumPath)
var albumId int
if err := row.Scan(&albumId); err != nil {
fmt.Printf("ERROR: Could not get id of album: %s\n", err)
tx.Rollback()
return
}
2020-02-02 18:18:38 +01:00
// Commit album transaction
if err := tx.Commit(); err != nil {
log.Printf("ERROR: Could not commit database transaction: %s\n", err)
return
}
2020-02-01 17:58:45 +01:00
// Scan for photos
for _, item := range dirContent {
photoPath := path.Join(albumPath, item.Name())
2020-02-09 14:21:53 +01:00
if !item.IsDir() && isPathImage(photoPath, &scanner_cache) {
2020-02-02 18:18:38 +01:00
tx, err := database.Begin()
if err != nil {
log.Printf("ERROR: Could not begin database transaction for image %s: %s\n", photoPath, err)
return
}
2020-02-09 14:21:53 +01:00
content_type := scanner_cache.get_photo_type(photoPath)
if content_type == nil {
log.Println("Content type not found from cache")
return
}
if err := ProcessImage(tx, photoPath, albumId, *content_type); err != nil {
2020-02-02 18:18:38 +01:00
log.Printf("ERROR: processing image %s: %s", photoPath, err)
2020-02-02 00:29:42 +01:00
tx.Rollback()
return
}
2020-02-01 17:58:45 +01:00
2020-02-02 18:18:38 +01:00
tx.Commit()
}
2020-02-01 17:58:45 +01:00
}
// Scan for sub-albums
for _, item := range dirContent {
subalbumPath := path.Join(albumPath, item.Name())
2020-02-09 14:21:53 +01:00
if item.IsDir() && directoryContainsPhotos(subalbumPath, &scanner_cache) {
2020-02-01 17:58:45 +01:00
scanQueue.PushBack(scanInfo{
path: subalbumPath,
parentId: &albumId,
})
}
}
}
2020-02-12 18:10:52 +01:00
cleanupCache(database, album_paths_scanned)
2020-02-01 17:58:45 +01:00
log.Println("Done scanning")
}
2020-02-09 14:21:53 +01:00
func directoryContainsPhotos(rootPath string, cache *scanner_cache) bool {
2020-02-01 17:58:45 +01:00
scanQueue := list.New()
scanQueue.PushBack(rootPath)
for scanQueue.Front() != nil {
dirPath := scanQueue.Front().Value.(string)
scanQueue.Remove(scanQueue.Front())
dirContent, err := ioutil.ReadDir(dirPath)
if err != nil {
log.Printf("Could not read directory: %s\n", err.Error())
return false
}
for _, fileInfo := range dirContent {
filePath := path.Join(dirPath, fileInfo.Name())
if fileInfo.IsDir() {
scanQueue.PushBack(filePath)
} else {
2020-02-09 14:21:53 +01:00
if isPathImage(filePath, cache) {
2020-02-01 17:58:45 +01:00
return true
}
}
}
}
return false
}
2020-02-10 12:05:58 +01:00
var SupportedMimetypes = [...]string{
2020-02-01 17:58:45 +01:00
"image/jpeg",
"image/png",
2020-02-02 21:44:09 +01:00
"image/tiff",
"image/webp",
"image/x-canon-cr2",
2020-02-01 17:58:45 +01:00
"image/bmp",
}
2020-02-10 12:05:58 +01:00
var WebMimetypes = [...]string{
"image/jpeg",
"image/png",
"image/webp",
"image/bmp",
}
2020-02-09 14:21:53 +01:00
func isPathImage(path string, cache *scanner_cache) bool {
if cache.get_photo_type(path) != nil {
log.Printf("Image cache hit: %s\n", path)
return true
}
2020-02-01 17:58:45 +01:00
file, err := os.Open(path)
if err != nil {
log.Printf("Could not open file %s: %s\n", path, err)
return false
}
2020-02-02 18:18:38 +01:00
defer file.Close()
2020-02-01 17:58:45 +01:00
head := make([]byte, 261)
if _, err := file.Read(head); err != nil {
log.Printf("Could not read file %s: %s\n", path, err)
return false
}
imgType, err := filetype.Image(head)
if err != nil {
return false
}
2020-02-10 12:05:58 +01:00
for _, supported_mime := range SupportedMimetypes {
2020-02-01 17:58:45 +01:00
if supported_mime == imgType.MIME.Value {
2020-02-09 14:21:53 +01:00
cache.insert_photo_type(path, supported_mime)
2020-02-01 17:58:45 +01:00
return true
}
}
log.Printf("Unsupported image %s of type %s\n", path, imgType.MIME.Value)
return false
}
2020-02-12 18:10:52 +01:00
func cleanupCache(database *sql.DB, scanned_albums []interface{}) {
if len(scanned_albums) == 0 {
return
}
albums_questions := strings.Repeat("?,", len(scanned_albums))[:len(scanned_albums)*2-1]
rows, err := database.Query("SELECT album_id FROM album WHERE path NOT IN ("+albums_questions+")", scanned_albums...)
if err != nil {
log.Printf("ERROR: Could not get albums from database: %s\n", err)
return
}
deleted_albums := 0
deleted_ids := make([]interface{}, 0)
for rows.Next() {
var album_id int
rows.Scan(&album_id)
deleted_ids = append(deleted_ids, album_id)
cache_path := path.Join("./image-cache", strconv.Itoa(album_id))
err := os.RemoveAll(cache_path)
if err != nil {
log.Printf("ERROR: Could not delete unused cache folder: %s\n%s\n", cache_path, err)
} else {
deleted_albums++
}
}
if len(deleted_ids) > 0 {
albums_questions = strings.Repeat("?,", len(deleted_ids))[:len(deleted_ids)*2-1]
if _, err := database.Exec("DELETE FROM album WHERE album_id IN ("+albums_questions+")", deleted_ids...); err != nil {
log.Printf("ERROR: Could not delete old albums from database:\n%s\n", err)
}
}
log.Printf("Deleted %d unused albums from cache", deleted_albums)
}