182 lines
4.4 KiB
Go
182 lines
4.4 KiB
Go
/*

Package face provides face landmark detection.

Copyright (c) 2018 - 2021 Michael Mayer <hello@photoprism.org>

This program is free software: you can redistribute it and/or modify
it under the terms of the GNU Affero General Public License as published
by the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU Affero General Public License for more details.

You should have received a copy of the GNU Affero General Public License
along with this program. If not, see <https://www.gnu.org/licenses/>.

PhotoPrism® is a registered trademark of Michael Mayer. You may use it as required
to describe our software, run your own server, for educational purposes, but not for
offering commercial goods, products, or services without prior written permission.
In other words, please ask.

Feel free to send an e-mail to hello@photoprism.org if you have questions,
want to support our work, or just want to say hello.

Additional information can be found in our Developer Guide:
https://docs.photoprism.org/developer-guide/

*/
|
|
|
|
package face
|
|
|
|
import (
|
|
"encoding/json"
|
|
|
|
"github.com/photoprism/photoprism/internal/event"
|
|
)
|
|
|
|
// Package-level tuning parameters. They are exported variables, so other
// packages may read or override them; their consumers are not part of this file.
var (
	// ClusterCore defaults to 3.
	// NOTE(review): presumably the minimum number of samples that form a
	// cluster core — confirm against the clustering code.
	ClusterCore = 3

	// ClusterRadius defaults to 0.66.
	// NOTE(review): presumably the maximum distance between embeddings of
	// the same cluster — confirm against the clustering code.
	ClusterRadius = 0.66

	// SampleThreshold defaults to 25.
	// NOTE(review): presumably the minimum number of samples required
	// before clustering is attempted — confirm against callers.
	SampleThreshold = 25
)
|
|
|
|
// log is the package-wide logger; it is an alias for the shared event.Log.
var log = event.Log
|
|
|
|
// Faces is a list of face detection results.
|
|
type Faces []Face
|
|
|
|
// Count returns the number of faces detected.
|
|
func (faces Faces) Count() int {
|
|
return len(faces)
|
|
}
|
|
|
|
// Uncertainty return the max face detection uncertainty in percent.
|
|
func (faces Faces) Uncertainty() int {
|
|
if len(faces) < 1 {
|
|
return 100
|
|
}
|
|
|
|
maxScore := 0
|
|
|
|
for _, f := range faces {
|
|
if f.Score > maxScore {
|
|
maxScore = f.Score
|
|
}
|
|
}
|
|
|
|
switch {
|
|
case maxScore > 300:
|
|
return 1
|
|
case maxScore > 200:
|
|
return 5
|
|
case maxScore > 100:
|
|
return 10
|
|
case maxScore > 80:
|
|
return 15
|
|
case maxScore > 65:
|
|
return 20
|
|
case maxScore > 50:
|
|
return 25
|
|
case maxScore > 40:
|
|
return 30
|
|
case maxScore > 30:
|
|
return 35
|
|
case maxScore > 20:
|
|
return 40
|
|
case maxScore > 10:
|
|
return 45
|
|
}
|
|
|
|
return 50
|
|
}
|
|
|
|
// Face represents a face detection result.
|
|
type Face struct {
|
|
Rows int `json:"rows,omitempty"`
|
|
Cols int `json:"cols,omitempty"`
|
|
Score int `json:"score,omitempty"`
|
|
Face Point `json:"face,omitempty"`
|
|
Eyes Points `json:"eyes,omitempty"`
|
|
Landmarks Points `json:"landmarks,omitempty"`
|
|
Embeddings [][]float32 `json:"embeddings,omitempty"`
|
|
}
|
|
|
|
// Dim returns the max number of rows and cols as float32 to calculate relative coordinates.
|
|
func (f *Face) Dim() float32 {
|
|
if f.Cols > 0 {
|
|
return float32(f.Cols)
|
|
}
|
|
|
|
return float32(1)
|
|
}
|
|
|
|
// Marker returns the relative position on the image.
|
|
func (f *Face) Marker() Marker {
|
|
marker := f.Face.Marker(Point{}, float32(f.Rows), float32(f.Cols))
|
|
midpoint := f.EyesMidpoint().Marker(Point{}, float32(f.Rows), float32(f.Cols))
|
|
marker.X = midpoint.X
|
|
marker.Y = midpoint.Y
|
|
|
|
return marker
|
|
}
|
|
|
|
// EyesMidpoint returns the point in between the eyes.
|
|
func (f *Face) EyesMidpoint() Point {
|
|
if len(f.Eyes) != 2 {
|
|
return Point{
|
|
Name: "midpoint",
|
|
Row: f.Face.Row,
|
|
Col: f.Face.Col,
|
|
Scale: f.Face.Scale,
|
|
}
|
|
}
|
|
|
|
return Point{
|
|
Name: "midpoint",
|
|
Row: (f.Eyes[0].Row + f.Eyes[1].Row) / 2,
|
|
Col: (f.Eyes[0].Col + f.Eyes[1].Col) / 2,
|
|
Scale: (f.Eyes[0].Scale + f.Eyes[1].Scale) / 2,
|
|
}
|
|
}
|
|
|
|
// RelativeLandmarks returns detected relative marker positions.
|
|
func (f *Face) RelativeLandmarks() Markers {
|
|
p := f.EyesMidpoint()
|
|
|
|
m := f.Landmarks.Markers(p, float32(f.Rows), float32(f.Cols))
|
|
m = append(m, f.Eyes.Markers(p, float32(f.Rows), float32(f.Cols))...)
|
|
|
|
return m
|
|
}
|
|
|
|
// RelativeLandmarksJSON returns detected relative marker positions as JSON.
|
|
func (f *Face) RelativeLandmarksJSON() (b []byte) {
|
|
var noResult = []byte("")
|
|
|
|
l := f.RelativeLandmarks()
|
|
|
|
if len(l) < 1 {
|
|
return noResult
|
|
}
|
|
|
|
if result, err := json.Marshal(l); err != nil {
|
|
log.Errorf("faces: %s", err)
|
|
return noResult
|
|
} else {
|
|
return result
|
|
}
|
|
}
|
|
|
|
// EmbeddingsJSON returns detected face embeddings as JSON array.
|
|
func (f *Face) EmbeddingsJSON() (b []byte) {
|
|
var noResult = []byte("")
|
|
|
|
if result, err := json.Marshal(f.Embeddings); err != nil {
|
|
return noResult
|
|
} else {
|
|
return result
|
|
}
|
|
}
|