2021-04-11 23:04:40 +00:00
|
|
|
package utils
|
|
|
|
|
|
|
|
import (
|
|
|
|
"strconv"
|
|
|
|
|
|
|
|
"github.com/corona10/goimagehash"
|
2022-07-13 06:30:54 +00:00
|
|
|
"github.com/stashapp/stash/pkg/sliceutil/intslice"
|
2021-04-11 23:04:40 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
// Phash is one perceptual-hash record together with the scratch state that
// FindDuplicates uses while grouping similar scenes.
type Phash struct {
	// SceneID is the ID of the scene this hash belongs to; it is populated
	// from the "id" database column.
	SceneID int `db:"id"`
	// Hash is the 64-bit perceptual hash, stored signed and populated from the
	// "phash" database column. Its bits are reinterpreted as a uint64 when
	// hashes are compared.
	Hash int64 `db:"phash"`
	// Neighbors holds indices into the slice handed to FindDuplicates, one per
	// entry found to be within the requested distance of this one.
	Neighbors []int
	// Bucket is the group number assigned by FindDuplicates. The value -1 marks
	// an entry that has not been assigned to a group yet.
	Bucket int
}
|
|
|
|
|
|
|
|
func FindDuplicates(hashes []*Phash, distance int) [][]int {
|
|
|
|
for i, scene := range hashes {
|
|
|
|
sceneHash := goimagehash.NewImageHash(uint64(scene.Hash), goimagehash.PHash)
|
|
|
|
for j, neighbor := range hashes {
|
2022-07-13 06:30:54 +00:00
|
|
|
if i != j && scene.SceneID != neighbor.SceneID {
|
2021-04-11 23:04:40 +00:00
|
|
|
neighborHash := goimagehash.NewImageHash(uint64(neighbor.Hash), goimagehash.PHash)
|
|
|
|
neighborDistance, _ := sceneHash.Distance(neighborHash)
|
|
|
|
if neighborDistance <= distance {
|
|
|
|
scene.Neighbors = append(scene.Neighbors, j)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
var buckets [][]int
|
|
|
|
for _, scene := range hashes {
|
|
|
|
if len(scene.Neighbors) > 0 && scene.Bucket == -1 {
|
|
|
|
bucket := len(buckets)
|
|
|
|
scenes := []int{scene.SceneID}
|
|
|
|
scene.Bucket = bucket
|
|
|
|
findNeighbors(bucket, scene.Neighbors, hashes, &scenes)
|
2022-07-13 06:30:54 +00:00
|
|
|
|
|
|
|
if len(scenes) > 1 {
|
|
|
|
buckets = append(buckets, scenes)
|
|
|
|
}
|
2021-04-11 23:04:40 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return buckets
|
|
|
|
}
|
|
|
|
|
|
|
|
func findNeighbors(bucket int, neighbors []int, hashes []*Phash, scenes *[]int) {
|
|
|
|
for _, id := range neighbors {
|
|
|
|
hash := hashes[id]
|
|
|
|
if hash.Bucket == -1 {
|
|
|
|
hash.Bucket = bucket
|
2022-07-13 06:30:54 +00:00
|
|
|
*scenes = intslice.IntAppendUnique(*scenes, hash.SceneID)
|
2021-04-11 23:04:40 +00:00
|
|
|
findNeighbors(bucket, hash.Neighbors, hashes, scenes)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// PhashToString renders phash as lowercase hexadecimal. The value's bits are
// reinterpreted as an unsigned 64-bit integer first, so negative inputs yield
// their two's-complement form rather than a leading minus sign. The output is
// not zero-padded.
func PhashToString(phash int64) string {
	const hexBase = 16

	bits := uint64(phash)
	return strconv.FormatUint(bits, hexBase)
}
|
2021-06-22 23:10:20 +00:00
|
|
|
|
|
|
|
// StringToPhash parses s as an unsigned 64-bit hexadecimal number and returns
// its bits reinterpreted as an int64, making it the inverse of PhashToString.
// When s cannot be parsed, the strconv error is returned unchanged together
// with a zero hash.
func StringToPhash(s string) (int64, error) {
	const (
		hexBase = 16
		bitSize = 64
	)

	bits, err := strconv.ParseUint(s, hexBase, bitSize)
	if err != nil {
		return 0, err
	}

	hash := int64(bits)
	return hash, nil
}
|