2021-08-22 16:14:34 +02:00
|
|
|
package photoprism
|
|
|
|
|
|
|
|
import (
|
|
|
|
"github.com/montanaflynn/stats"
|
|
|
|
"github.com/photoprism/photoprism/internal/query"
|
|
|
|
)
|
|
|
|
|
2021-08-28 15:26:26 +02:00
|
|
|
// Stats shows statistics on face embeddings.
|
|
|
|
func (w *Faces) Stats() (err error) {
|
2021-08-29 13:26:05 +02:00
|
|
|
if embeddings, err := query.Embeddings(true, false, 0, 0); err != nil {
|
2021-08-22 16:14:34 +02:00
|
|
|
return err
|
|
|
|
} else if samples := len(embeddings); samples == 0 {
|
2021-10-05 18:42:39 +02:00
|
|
|
log.Infof("faces: found no samples")
|
2021-08-22 16:14:34 +02:00
|
|
|
} else {
|
|
|
|
log.Infof("faces: computing distance of %d samples", samples)
|
|
|
|
|
|
|
|
distMin := make([]float64, samples)
|
|
|
|
distMax := make([]float64, samples)
|
|
|
|
|
|
|
|
for i := 0; i < samples; i++ {
|
|
|
|
min := -1.0
|
|
|
|
max := -1.0
|
|
|
|
|
|
|
|
for j := 0; j < samples; j++ {
|
|
|
|
if i == j {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
2022-04-03 17:25:37 +02:00
|
|
|
d := embeddings[i].Dist(embeddings[j])
|
2021-08-22 16:14:34 +02:00
|
|
|
|
|
|
|
if min < 0 || d < min {
|
|
|
|
min = d
|
|
|
|
}
|
|
|
|
|
|
|
|
if max < 0 || d > max {
|
|
|
|
max = d
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
distMin[i] = min
|
|
|
|
distMax[i] = max
|
|
|
|
}
|
|
|
|
|
|
|
|
minMedian, _ := stats.Median(distMin)
|
|
|
|
minMin, _ := stats.Min(distMin)
|
|
|
|
minMax, _ := stats.Max(distMin)
|
|
|
|
|
|
|
|
log.Infof("faces: min Ø %f < median %f < %f", minMin, minMedian, minMax)
|
|
|
|
|
|
|
|
maxMedian, _ := stats.Median(distMax)
|
|
|
|
maxMin, _ := stats.Min(distMax)
|
|
|
|
maxMax, _ := stats.Max(distMax)
|
|
|
|
|
|
|
|
log.Infof("faces: max Ø %f < median %f < %f", maxMin, maxMedian, maxMax)
|
|
|
|
}
|
|
|
|
|
2023-02-21 04:49:06 +01:00
|
|
|
if faces, err := query.Faces(true, false, false, false); err != nil {
|
2021-08-22 16:14:34 +02:00
|
|
|
log.Errorf("faces: %s", err)
|
|
|
|
} else if samples := len(faces); samples > 0 {
|
|
|
|
log.Infof("faces: computing distance of faces matching to the same person")
|
|
|
|
|
|
|
|
dist := make(map[string][]float64)
|
|
|
|
|
|
|
|
for i := 0; i < samples; i++ {
|
|
|
|
f1 := faces[i]
|
|
|
|
|
|
|
|
e1 := f1.Embedding()
|
|
|
|
min := -1.0
|
|
|
|
max := -1.0
|
|
|
|
|
2021-09-17 14:26:12 +02:00
|
|
|
if k, ok := dist[f1.SubjUID]; ok {
|
2021-08-22 16:14:34 +02:00
|
|
|
min = k[0]
|
|
|
|
max = k[1]
|
|
|
|
}
|
|
|
|
|
|
|
|
for j := 0; j < samples; j++ {
|
|
|
|
if i == j {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
f2 := faces[j]
|
|
|
|
|
2021-09-17 14:26:12 +02:00
|
|
|
if f1.SubjUID != f2.SubjUID {
|
2021-08-22 16:14:34 +02:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
2022-04-03 17:25:37 +02:00
|
|
|
d := e1.Dist(f2.Embedding())
|
2021-08-22 16:14:34 +02:00
|
|
|
|
|
|
|
if min < 0 || d < min {
|
|
|
|
min = d
|
|
|
|
}
|
|
|
|
|
|
|
|
if max < 0 || d > max {
|
|
|
|
max = d
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if max > 0 {
|
2021-09-17 14:26:12 +02:00
|
|
|
dist[f1.SubjUID] = []float64{min, max}
|
2021-08-22 16:14:34 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if l := len(dist); l == 0 {
|
2021-10-05 18:42:39 +02:00
|
|
|
log.Infof("faces: analyzed %d clusters, found no matches", samples)
|
2021-08-22 16:14:34 +02:00
|
|
|
} else {
|
|
|
|
log.Infof("faces: %d faces match to the same person", l)
|
|
|
|
}
|
|
|
|
|
|
|
|
for subj, d := range dist {
|
|
|
|
log.Infof("faces: %s Ø min %f, max %f", subj, d[0], d[1])
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|