photoprism/internal/face/face.go

190 lines
4.6 KiB
Go

/*
Package face provides facial recognition.
Copyright (c) 2018 - 2021 Michael Mayer <hello@photoprism.org>
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU Affero General Public License as published
by the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU Affero General Public License for more details.
You should have received a copy of the GNU Affero General Public License
along with this program. If not, see <https://www.gnu.org/licenses/>.
PhotoPrism® is a registered trademark of Michael Mayer. You may use it as required
to describe our software, run your own server, for educational purposes, but not for
offering commercial goods, products, or services without prior written permission.
In other words, please ask.
Feel free to send an e-mail to hello@photoprism.org if you have questions,
want to support our work, or just want to say hello.
Additional information can be found in our Developer Guide:
https://docs.photoprism.org/developer-guide/
*/
package face
import (
"encoding/json"
"github.com/photoprism/photoprism/internal/event"
)
// Tunable package defaults for face cropping and clustering. They are declared
// as variables rather than constants, so other code is able to override them.
// NOTE(review): units and exact semantics are not visible in this file —
// confirm against the detection and clustering code before changing a value.
var (
	CropSize        = 160
	ClusterCore     = 4
	ClusterRadius   = 0.6
	ClusterMinScore = 30
	ClusterMinSize  = CropSize        // initialized to the value of CropSize
	SampleThreshold = 2 * ClusterCore // initialized to twice ClusterCore
)

// log is the package logger, taken from the event package.
var log = event.Log
// Faces is a list of face detection results, holding one Face per detection.
type Faces []Face
// Count reports how many faces the list contains.
func (faces Faces) Count() int {
	total := len(faces)

	return total
}
// Uncertainty returns the face detection uncertainty in percent, derived from
// the highest score found in the list. An empty list yields 100; otherwise the
// result ranges from 50 (best score of 10 or less) down to 1 (best score above 300).
func (faces Faces) Uncertainty() int {
	if len(faces) == 0 {
		return 100
	}

	// Determine the best score; the search starts at zero, so negative
	// scores count like zero.
	best := 0

	for i := range faces {
		if score := faces[i].Score; score > best {
			best = score
		}
	}

	// Thresholds are listed in descending order, so the first one exceeded wins.
	levels := [...]struct{ above, percent int }{
		{300, 1},
		{200, 5},
		{100, 10},
		{80, 15},
		{65, 20},
		{50, 25},
		{40, 30},
		{30, 35},
		{20, 40},
		{10, 45},
	}

	for _, level := range levels {
		if best > level.above {
			return level.percent
		}
	}

	return 50
}
// Face represents a face detection result.
//
// Rows and Cols are passed along whenever the Face, Eyes, and Landmarks areas
// are converted to relative markers (presumably the dimensions of the analyzed
// image — TODO confirm). Score is the detection score evaluated by
// Faces.Uncertainty. Face is the detected face area, whose Scale is reported by
// Size. Eyes and Landmarks hold further detected areas; EyesMidpoint only
// averages the eyes if there are exactly two of them. Embeddings holds the face
// embeddings serialized by EmbeddingsJSON. Thumb is excluded from JSON output.
type Face struct {
Rows int `json:"rows,omitempty"`
Cols int `json:"cols,omitempty"`
Score int `json:"score,omitempty"`
Face Area `json:"face,omitempty"`
Eyes Areas `json:"eyes,omitempty"`
Landmarks Areas `json:"landmarks,omitempty"`
Embeddings [][]float32 `json:"embeddings,omitempty"`
Thumb string `json:"-"`
}
// Size returns the scale of the detected face area, which serves as the
// absolute face size in pixels.
func (f *Face) Size() int {
	area := f.Face

	return area.Scale
}
// Dim returns the number of columns as float32 for calculating relative
// coordinates, or 1 if the number of columns is not positive.
// NOTE(review): the earlier comment promised the max of rows and cols, but only
// Cols is consulted — confirm which of the two is intended.
func (f *Face) Dim() float32 {
	if f.Cols <= 0 {
		return 1
	}

	return float32(f.Cols)
}
// Marker returns the relative position of the face on the image. The marker is
// built from the face area, with its X and Y replaced by those of the marker
// built from the eyes midpoint.
func (f *Face) Marker() Marker {
	rows, cols := float32(f.Rows), float32(f.Cols)

	result := f.Face.Marker(Area{}, rows, cols)
	center := f.EyesMidpoint().Marker(Area{}, rows, cols)

	result.X, result.Y = center.X, center.Y

	return result
}
// EyesMidpoint returns the point in between the eyes as an area named
// "midpoint". Unless exactly two eyes are present, the row, column, and scale
// of the face area are used instead.
func (f *Face) EyesMidpoint() Area {
	// Start with the fallback derived from the face area.
	mid := Area{
		Name:  "midpoint",
		Row:   f.Face.Row,
		Col:   f.Face.Col,
		Scale: f.Face.Scale,
	}

	// With two eyes available, average their positions and scales instead.
	if len(f.Eyes) == 2 {
		first, second := f.Eyes[0], f.Eyes[1]

		mid.Row = (first.Row + second.Row) / 2
		mid.Col = (first.Col + second.Col) / 2
		mid.Scale = (first.Scale + second.Scale) / 2
	}

	return mid
}
// RelativeLandmarks returns the detected relative marker positions: the markers
// of the landmarks first, followed by those of the eyes. Both sets are created
// with the eyes midpoint and the Rows and Cols of the face.
func (f *Face) RelativeLandmarks() Markers {
	rows, cols := float32(f.Rows), float32(f.Cols)
	origin := f.EyesMidpoint()

	landmarks := f.Landmarks.Markers(origin, rows, cols)
	eyes := f.Eyes.Markers(origin, rows, cols)

	return append(landmarks, eyes...)
}
// RelativeLandmarksJSON returns the detected relative marker positions encoded
// as JSON. The result is an empty byte slice if there are no markers, or if
// encoding them fails, in which case the error is logged.
func (f *Face) RelativeLandmarksJSON() (b []byte) {
	empty := []byte("")

	markers := f.RelativeLandmarks()

	if len(markers) == 0 {
		return empty
	}

	encoded, err := json.Marshal(markers)

	if err != nil {
		log.Errorf("faces: %s", err)
		return empty
	}

	return encoded
}
// EmbeddingsJSON returns the detected face embeddings as a JSON array.
//
// If the embeddings cannot be encoded, for example because they contain a NaN
// or infinite value, the error is logged and an empty byte slice is returned.
// Note that nil embeddings are encoded as JSON "null" rather than as an empty
// result.
func (f *Face) EmbeddingsJSON() (b []byte) {
	result, err := json.Marshal(f.Embeddings)

	if err != nil {
		// Report the failure the same way RelativeLandmarksJSON does instead
		// of silently dropping it.
		log.Errorf("faces: %s", err)
		return []byte("")
	}

	return result
}