AI: Add Vision API service endpoint for image classification #127 #1090

This is a proof of concept that is still under development. Apart from
image classification, the other Vision API endpoints are stubs for
testing and are not yet functional.

Signed-off-by: Michael Mayer <michael@photoprism.app>
This commit is contained in:
Michael Mayer
2025-04-07 12:19:39 +02:00
parent 907850cb80
commit f3e066af45
12 changed files with 308 additions and 102 deletions

View File

@@ -1,19 +1,24 @@
package api
import (
"net/http"
"github.com/gin-gonic/gin"
"github.com/photoprism/photoprism/internal/ai/vision"
"github.com/photoprism/photoprism/internal/auth/acl"
)
// PostVisionCaption returns a suitable caption for an image.
//
// @Summary returns a suitable caption for an image
// @Id PostVisionCaption
// @Tags Vision
// @Produce json
// @Failure 401,403,404,429,501 {object} i18n.Response
// @Router /api/v1/vision/caption [post]
// @Summary returns a suitable caption for an image
// @Id PostVisionCaption
// @Tags Vision
// @Produce json
// @Success 200 {object} vision.ApiResponse
// @Failure 401,403,404,429,501 {object} i18n.Response
// @Param images body vision.ApiRequest true "list of image file urls"
// @Router /api/v1/vision/caption [post]
func PostVisionCaption(router *gin.RouterGroup) {
// Register the handler for POST requests to "/vision/caption" on the given router group.
router.POST("/vision/caption", func(c *gin.Context) {
// Auth is called with the Vision resource and the AccessAll permission.
// NOTE(review): the check performed on s lies in lines hidden by the hunk
// boundary below — confirm against the full file.
s := Auth(c, acl.ResourceVision, acl.AccessAll)
@@ -23,6 +28,21 @@ func PostVisionCaption(router *gin.RouterGroup) {
return
}
// NOTE(review): in this diff view, the following call appears to be the line
// removed by the commit and replaced by the statements after it — confirm
// against the raw patch before treating both as live code.
AbortNotImplemented(c)
var request vision.ApiRequest
// Bind the JSON request body to request; if binding fails, AbortBadRequest is
// called and the handler returns without generating a response body below.
if err := c.BindJSON(&request); err != nil {
AbortBadRequest(c)
return
}
// Generate Vision API service response.
// The model metadata, caption text, and confidence are hard-coded placeholder
// values; only the Id is taken from the incoming request.
response := vision.ApiResponse{
Id: request.GetId(),
Model: &vision.Model{Name: "Caption", Version: "Test", Resolution: 224},
Result: &vision.ApiResult{Caption: &vision.CaptionResult{Text: "Lorem Ipsum is simply dummy text of the printing and typesetting industry.", Confidence: 0.42424}},
}
// Send the placeholder response as JSON with HTTP status 200.
c.JSON(http.StatusOK, response)
})
}