controller.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385
  1. package embedding
  2. import (
  3. "bytes"
  4. "encoding/json"
  5. "errors"
  6. "fmt"
  7. "github.com/ente-io/museum/pkg/utils/array"
  8. "strconv"
  9. "sync"
  10. "github.com/aws/aws-sdk-go/aws"
  11. "github.com/aws/aws-sdk-go/service/s3"
  12. "github.com/aws/aws-sdk-go/service/s3/s3manager"
  13. "github.com/ente-io/museum/ente"
  14. "github.com/ente-io/museum/pkg/controller"
  15. "github.com/ente-io/museum/pkg/controller/access"
  16. "github.com/ente-io/museum/pkg/repo"
  17. "github.com/ente-io/museum/pkg/repo/embedding"
  18. "github.com/ente-io/museum/pkg/utils/auth"
  19. "github.com/ente-io/museum/pkg/utils/network"
  20. "github.com/ente-io/museum/pkg/utils/s3config"
  21. "github.com/ente-io/museum/pkg/utils/time"
  22. "github.com/ente-io/stacktrace"
  23. "github.com/gin-gonic/gin"
  24. log "github.com/sirupsen/logrus"
  25. )
  26. type Controller struct {
  27. Repo *embedding.Repository
  28. AccessCtrl access.Controller
  29. ObjectCleanupController *controller.ObjectCleanupController
  30. S3Config *s3config.S3Config
  31. QueueRepo *repo.QueueRepository
  32. TaskLockingRepo *repo.TaskLockRepository
  33. FileRepo *repo.FileRepository
  34. CollectionRepo *repo.CollectionRepository
  35. HostName string
  36. cleanupCronRunning bool
  37. }
  38. func (c *Controller) InsertOrUpdate(ctx *gin.Context, req ente.InsertOrUpdateEmbeddingRequest) (*ente.Embedding, error) {
  39. userID := auth.GetUserID(ctx.Request.Header)
  40. err := c.AccessCtrl.VerifyFileOwnership(ctx, &access.VerifyFileOwnershipParams{
  41. ActorUserId: userID,
  42. FileIDs: []int64{req.FileID},
  43. })
  44. if err != nil {
  45. return nil, stacktrace.Propagate(err, "User does not own file")
  46. }
  47. count, err := c.CollectionRepo.GetCollectionCount(req.FileID)
  48. if err != nil {
  49. return nil, stacktrace.Propagate(err, "")
  50. }
  51. if count < 1 {
  52. return nil, stacktrace.Propagate(ente.ErrNotFound, "")
  53. }
  54. version := 1
  55. if req.Version != nil {
  56. version = *req.Version
  57. }
  58. obj := ente.EmbeddingObject{
  59. Version: version,
  60. EncryptedEmbedding: req.EncryptedEmbedding,
  61. DecryptionHeader: req.DecryptionHeader,
  62. Client: network.GetPrettyUA(ctx.GetHeader("User-Agent")) + "/" + ctx.GetHeader("X-Client-Version"),
  63. }
  64. size, uploadErr := c.uploadObject(obj, c.getObjectKey(userID, req.FileID, req.Model))
  65. if uploadErr != nil {
  66. log.Error(uploadErr)
  67. return nil, stacktrace.Propagate(uploadErr, "")
  68. }
  69. embedding, err := c.Repo.InsertOrUpdate(ctx, userID, req, size)
  70. if err != nil {
  71. return nil, stacktrace.Propagate(err, "")
  72. }
  73. return &embedding, nil
  74. }
  75. func (c *Controller) GetDiff(ctx *gin.Context, req ente.GetEmbeddingDiffRequest) ([]ente.Embedding, error) {
  76. userID := auth.GetUserID(ctx.Request.Header)
  77. if req.Model == "" {
  78. req.Model = ente.GgmlClip
  79. }
  80. embeddings, err := c.Repo.GetDiff(ctx, userID, req.Model, *req.SinceTime, req.Limit)
  81. if err != nil {
  82. return nil, stacktrace.Propagate(err, "")
  83. }
  84. // Collect object keys for embeddings with missing data
  85. var objectKeys []string
  86. for i := range embeddings {
  87. if embeddings[i].EncryptedEmbedding == "" {
  88. objectKey := c.getObjectKey(userID, embeddings[i].FileID, embeddings[i].Model)
  89. objectKeys = append(objectKeys, objectKey)
  90. }
  91. }
  92. // Fetch missing embeddings in parallel
  93. if len(objectKeys) > 0 {
  94. embeddingObjects, err := c.getEmbeddingObjectsParallel(objectKeys)
  95. if err != nil {
  96. return nil, stacktrace.Propagate(err, "")
  97. }
  98. // Populate missing data in embeddings from fetched objects
  99. for i, obj := range embeddingObjects {
  100. for j := range embeddings {
  101. if embeddings[j].EncryptedEmbedding == "" && c.getObjectKey(userID, embeddings[j].FileID, embeddings[j].Model) == objectKeys[i] {
  102. embeddings[j].EncryptedEmbedding = obj.EncryptedEmbedding
  103. embeddings[j].DecryptionHeader = obj.DecryptionHeader
  104. }
  105. }
  106. }
  107. }
  108. return embeddings, nil
  109. }
  110. func (c *Controller) GetFilesEmbedding(ctx *gin.Context, req ente.GetFilesEmbeddingRequest) (*ente.GetFilesEmbeddingResponse, error) {
  111. userID := auth.GetUserID(ctx.Request.Header)
  112. if err := c._validateGetFileEmbeddingsRequest(ctx, userID, req); err != nil {
  113. return nil, stacktrace.Propagate(err, "")
  114. }
  115. userFileEmbeddings, err := c.Repo.GetFilesEmbedding(ctx, userID, req.Model, req.FileIDs)
  116. if err != nil {
  117. return nil, stacktrace.Propagate(err, "")
  118. }
  119. dbFileIds := make([]int64, 0)
  120. for _, embedding := range userFileEmbeddings {
  121. dbFileIds = append(dbFileIds, embedding.FileID)
  122. }
  123. missingFileIds := array.FindMissingElementsInSecondList(req.FileIDs, dbFileIds)
  124. errFileIds := make([]int64, 0)
  125. // Fetch missing userFileEmbeddings in parallel
  126. embeddingObjects, err := c.getEmbeddingObjectsParallelV2(userID, userFileEmbeddings)
  127. if err != nil {
  128. return nil, stacktrace.Propagate(err, "")
  129. }
  130. fetchedEmbeddings := make([]ente.Embedding, 0)
  131. // Populate missing data in userFileEmbeddings from fetched objects
  132. for _, obj := range embeddingObjects {
  133. if obj.err != nil {
  134. errFileIds = append(errFileIds, obj.dbEmbeddingRow.FileID)
  135. } else {
  136. fetchedEmbeddings = append(fetchedEmbeddings, ente.Embedding{
  137. FileID: obj.dbEmbeddingRow.FileID,
  138. Model: obj.dbEmbeddingRow.Model,
  139. EncryptedEmbedding: obj.embeddingObject.EncryptedEmbedding,
  140. DecryptionHeader: obj.embeddingObject.DecryptionHeader,
  141. UpdatedAt: obj.dbEmbeddingRow.UpdatedAt,
  142. Client: obj.dbEmbeddingRow.Client,
  143. })
  144. }
  145. }
  146. return &ente.GetFilesEmbeddingResponse{
  147. Embeddings: fetchedEmbeddings,
  148. NoDataFileIDs: missingFileIds,
  149. ErrFileIDs: errFileIds,
  150. }, nil
  151. }
  152. func (c *Controller) DeleteAll(ctx *gin.Context) error {
  153. userID := auth.GetUserID(ctx.Request.Header)
  154. err := c.Repo.DeleteAll(ctx, userID)
  155. if err != nil {
  156. return stacktrace.Propagate(err, "")
  157. }
  158. return nil
  159. }
  160. // CleanupDeletedEmbeddings clears all embeddings for deleted files from the object store
  161. func (c *Controller) CleanupDeletedEmbeddings() {
  162. log.Info("Cleaning up deleted embeddings")
  163. if c.cleanupCronRunning {
  164. log.Info("Skipping CleanupDeletedEmbeddings cron run as another instance is still running")
  165. return
  166. }
  167. c.cleanupCronRunning = true
  168. defer func() {
  169. c.cleanupCronRunning = false
  170. }()
  171. items, err := c.QueueRepo.GetItemsReadyForDeletion(repo.DeleteEmbeddingsQueue, 200)
  172. if err != nil {
  173. log.WithError(err).Error("Failed to fetch items from queue")
  174. return
  175. }
  176. for _, i := range items {
  177. c.deleteEmbedding(i)
  178. }
  179. }
  180. func (c *Controller) deleteEmbedding(qItem repo.QueueItem) {
  181. lockName := fmt.Sprintf("Embedding:%s", qItem.Item)
  182. lockStatus, err := c.TaskLockingRepo.AcquireLock(lockName, time.MicrosecondsAfterHours(1), c.HostName)
  183. ctxLogger := log.WithField("item", qItem.Item).WithField("queue_id", qItem.Id)
  184. if err != nil || !lockStatus {
  185. ctxLogger.Warn("unable to acquire lock")
  186. return
  187. }
  188. defer func() {
  189. err = c.TaskLockingRepo.ReleaseLock(lockName)
  190. if err != nil {
  191. ctxLogger.Errorf("Error while releasing lock %s", err)
  192. }
  193. }()
  194. ctxLogger.Info("Deleting all embeddings")
  195. fileID, _ := strconv.ParseInt(qItem.Item, 10, 64)
  196. ownerID, err := c.FileRepo.GetOwnerID(fileID)
  197. if err != nil {
  198. ctxLogger.WithError(err).Error("Failed to fetch ownerID")
  199. return
  200. }
  201. prefix := c.getEmbeddingObjectPrefix(ownerID, fileID)
  202. err = c.ObjectCleanupController.DeleteAllObjectsWithPrefix(prefix, c.S3Config.GetHotDataCenter())
  203. if err != nil {
  204. ctxLogger.WithError(err).Error("Failed to delete all objects")
  205. return
  206. }
  207. err = c.Repo.Delete(fileID)
  208. if err != nil {
  209. ctxLogger.WithError(err).Error("Failed to remove from db")
  210. return
  211. }
  212. err = c.QueueRepo.DeleteItem(repo.DeleteEmbeddingsQueue, qItem.Item)
  213. if err != nil {
  214. ctxLogger.WithError(err).Error("Failed to remove item from the queue")
  215. return
  216. }
  217. ctxLogger.Info("Successfully deleted all embeddings")
  218. }
  219. func (c *Controller) getObjectKey(userID int64, fileID int64, model string) string {
  220. return c.getEmbeddingObjectPrefix(userID, fileID) + model + ".json"
  221. }
  222. func (c *Controller) getEmbeddingObjectPrefix(userID int64, fileID int64) string {
  223. return strconv.FormatInt(userID, 10) + "/ml-data/" + strconv.FormatInt(fileID, 10) + "/"
  224. }
  225. // uploadObject uploads the embedding object to the object store and returns the object size
  226. func (c *Controller) uploadObject(obj ente.EmbeddingObject, key string) (int, error) {
  227. embeddingObj, _ := json.Marshal(obj)
  228. uploader := s3manager.NewUploaderWithClient(c.S3Config.GetHotS3Client())
  229. up := s3manager.UploadInput{
  230. Bucket: c.S3Config.GetHotBucket(),
  231. Key: &key,
  232. Body: bytes.NewReader(embeddingObj),
  233. }
  234. result, err := uploader.Upload(&up)
  235. if err != nil {
  236. log.Error(err)
  237. return -1, stacktrace.Propagate(err, "")
  238. }
  239. log.Infof("Uploaded to bucket %s", result.Location)
  240. return len(embeddingObj), nil
  241. }
  // globalFetchSemaphore bounds the number of embedding object downloads that
  // are in flight at once across all requests: a slot is taken by sending on the
  // channel before a fetch goroutine starts and given back by receiving from it
  // when the goroutine finishes. Its capacity (300) is the concurrency limit.
  var (
  	globalFetchSemaphore = make(chan struct{}, 300)
  )
  243. func (c *Controller) getEmbeddingObjectsParallel(objectKeys []string) ([]ente.EmbeddingObject, error) {
  244. var wg sync.WaitGroup
  245. var errs []error
  246. embeddingObjects := make([]ente.EmbeddingObject, len(objectKeys))
  247. downloader := s3manager.NewDownloaderWithClient(c.S3Config.GetHotS3Client())
  248. for i, objectKey := range objectKeys {
  249. wg.Add(1)
  250. globalFetchSemaphore <- struct{}{} // Acquire from global semaphore
  251. go func(i int, objectKey string) {
  252. defer wg.Done()
  253. defer func() { <-globalFetchSemaphore }() // Release back to global semaphore
  254. obj, err := c.getEmbeddingObject(objectKey, downloader)
  255. if err != nil {
  256. errs = append(errs, err)
  257. log.Error("error fetching embedding object: "+objectKey, err)
  258. } else {
  259. embeddingObjects[i] = obj
  260. }
  261. }(i, objectKey)
  262. }
  263. wg.Wait()
  264. if len(errs) > 0 {
  265. return nil, stacktrace.Propagate(errors.New("failed to fetch some objects"), "")
  266. }
  267. return embeddingObjects, nil
  268. }
  269. type embeddingObjectResult struct {
  270. embeddingObject ente.EmbeddingObject
  271. dbEmbeddingRow ente.Embedding
  272. err error
  273. }
  274. func (c *Controller) getEmbeddingObjectsParallelV2(userID int64, dbEmbeddingRows []ente.Embedding) ([]embeddingObjectResult, error) {
  275. var wg sync.WaitGroup
  276. embeddingObjects := make([]embeddingObjectResult, len(dbEmbeddingRows))
  277. downloader := s3manager.NewDownloaderWithClient(c.S3Config.GetHotS3Client())
  278. for i, dbEmbeddingRow := range dbEmbeddingRows {
  279. wg.Add(1)
  280. globalFetchSemaphore <- struct{}{} // Acquire from global semaphore
  281. go func(i int, dbEmbeddingRow ente.Embedding) {
  282. defer wg.Done()
  283. defer func() { <-globalFetchSemaphore }() // Release back to global semaphore
  284. objectKey := c.getObjectKey(userID, dbEmbeddingRow.FileID, dbEmbeddingRow.Model)
  285. obj, err := c.getEmbeddingObject(objectKey, downloader)
  286. if err != nil {
  287. log.Error("error fetching embedding object: "+objectKey, err)
  288. embeddingObjects[i] = embeddingObjectResult{
  289. err: err,
  290. dbEmbeddingRow: dbEmbeddingRow,
  291. }
  292. } else {
  293. embeddingObjects[i] = embeddingObjectResult{
  294. embeddingObject: obj,
  295. dbEmbeddingRow: dbEmbeddingRow,
  296. }
  297. }
  298. }(i, dbEmbeddingRow)
  299. }
  300. wg.Wait()
  301. return embeddingObjects, nil
  302. }
  303. func (c *Controller) getEmbeddingObject(objectKey string, downloader *s3manager.Downloader) (ente.EmbeddingObject, error) {
  304. var obj ente.EmbeddingObject
  305. buff := &aws.WriteAtBuffer{}
  306. _, err := downloader.Download(buff, &s3.GetObjectInput{
  307. Bucket: c.S3Config.GetHotBucket(),
  308. Key: &objectKey,
  309. })
  310. if err != nil {
  311. log.Error(err)
  312. return obj, stacktrace.Propagate(err, "")
  313. }
  314. err = json.Unmarshal(buff.Bytes(), &obj)
  315. if err != nil {
  316. log.Error(err)
  317. return obj, stacktrace.Propagate(err, "")
  318. }
  319. return obj, nil
  320. }
  321. func (c *Controller) _validateGetFileEmbeddingsRequest(ctx *gin.Context, userID int64, req ente.GetFilesEmbeddingRequest) error {
  322. if req.Model == "" {
  323. return ente.NewBadRequestWithMessage("model is required")
  324. }
  325. if len(req.FileIDs) == 0 {
  326. return ente.NewBadRequestWithMessage("fileIDs are required")
  327. }
  328. if len(req.FileIDs) > 100 {
  329. return ente.NewBadRequestWithMessage("fileIDs should be less than or equal to 100")
  330. }
  331. if err := c.AccessCtrl.VerifyFileOwnership(ctx, &access.VerifyFileOwnershipParams{
  332. ActorUserId: userID,
  333. FileIDs: req.FileIDs,
  334. }); err != nil {
  335. return stacktrace.Propagate(err, "User does not own some file(s)")
  336. }
  337. return nil
  338. }