mirror of
https://github.com/penpot/penpot.git
synced 2026-05-23 17:03:41 +00:00
221 lines
7.9 KiB
Clojure
221 lines
7.9 KiB
Clojure
;; This Source Code Form is subject to the terms of the Mozilla Public
|
|
;; License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
;; file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
;;
|
|
;; Copyright (c) KALEIDOS INC
|
|
|
|
(ns app.storage.gc-touched
|
|
"This task is part of the garbage collection process of storage
|
|
objects and is responsible on analyzing the touched objects and mark
|
|
them for deletion if corresponds.
|
|
|
|
For example: when file_media_object is deleted, the depending
|
|
storage_object are marked as touched. This means that some files
|
|
that depend on a concrete storage_object are no longer exists and
|
|
maybe this storage_object is no longer necessary and can be eligible
|
|
for elimination. This task periodically analyzes touched objects and
|
|
mark them as freeze (means that has other references and the object
|
|
is still valid) or deleted (no more references to this object so is
|
|
ready to be deleted)."
|
|
(:require
|
|
[app.common.data :as d]
|
|
[app.common.data.macros :as dm]
|
|
[app.common.exceptions :as ex]
|
|
[app.common.logging :as l]
|
|
[app.common.time :as ct]
|
|
[app.config :as cf]
|
|
[app.db :as db]
|
|
[app.storage :as sto]
|
|
[app.storage.impl :as impl]
|
|
[integrant.core :as ig]))
|
|
|
|
(def ^:private sql:has-team-font-variant-refs
|
|
"SELECT ((SELECT EXISTS (SELECT 1 FROM team_font_variant WHERE woff1_file_id = ?)) OR
|
|
(SELECT EXISTS (SELECT 1 FROM team_font_variant WHERE woff2_file_id = ?)) OR
|
|
(SELECT EXISTS (SELECT 1 FROM team_font_variant WHERE otf_file_id = ?)) OR
|
|
(SELECT EXISTS (SELECT 1 FROM team_font_variant WHERE ttf_file_id = ?))) AS has_refs")
|
|
|
|
(defn- has-team-font-variant-refs?
|
|
[conn {:keys [id]}]
|
|
(-> (db/exec-one! conn [sql:has-team-font-variant-refs id id id id])
|
|
(get :has-refs)))
|
|
|
|
(def ^:private
|
|
sql:has-file-media-object-refs
|
|
"SELECT ((SELECT EXISTS (SELECT 1 FROM file_media_object WHERE media_id = ?)) OR
|
|
(SELECT EXISTS (SELECT 1 FROM file_media_object WHERE thumbnail_id = ?))) AS has_refs")
|
|
|
|
(defn- has-file-media-object-refs?
|
|
[conn {:keys [id]}]
|
|
(-> (db/exec-one! conn [sql:has-file-media-object-refs id id])
|
|
(get :has-refs)))
|
|
|
|
(def ^:private sql:has-profile-refs
|
|
"SELECT ((SELECT EXISTS (SELECT 1 FROM profile WHERE photo_id = ?)) OR
|
|
(SELECT EXISTS (SELECT 1 FROM team WHERE photo_id = ?))) AS has_refs")
|
|
|
|
(defn- has-profile-refs?
|
|
[conn {:keys [id]}]
|
|
(-> (db/exec-one! conn [sql:has-profile-refs id id])
|
|
(get :has-refs)))
|
|
|
|
(def ^:private
|
|
sql:has-file-object-thumbnail-refs
|
|
"SELECT EXISTS (SELECT 1 FROM file_tagged_object_thumbnail WHERE media_id = ?) AS has_refs")
|
|
|
|
(defn- has-file-object-thumbnails-refs?
|
|
[conn {:keys [id]}]
|
|
(-> (db/exec-one! conn [sql:has-file-object-thumbnail-refs id])
|
|
(get :has-refs)))
|
|
|
|
(def ^:private
|
|
sql:has-file-thumbnail-refs
|
|
"SELECT EXISTS (SELECT 1 FROM file_thumbnail WHERE media_id = ?) AS has_refs")
|
|
|
|
(defn- has-file-thumbnails-refs?
|
|
[conn {:keys [id]}]
|
|
(-> (db/exec-one! conn [sql:has-file-thumbnail-refs id])
|
|
(get :has-refs)))
|
|
|
|
(def sql:exists-file-data-refs
|
|
"SELECT EXISTS (
|
|
SELECT 1 FROM file_data
|
|
WHERE file_id = ?
|
|
AND id = ?
|
|
AND metadata->>'storage-ref-id' = ?::text
|
|
) AS has_refs")
|
|
|
|
(defn- has-file-data-refs?
|
|
[conn sobject]
|
|
(let [{:keys [file-id id]} (:metadata sobject)]
|
|
(-> (db/exec-one! conn [sql:exists-file-data-refs file-id id (:id sobject)])
|
|
(get :has-refs))))
|
|
|
|
(def ^:private sql:mark-freeze-in-bulk
|
|
"UPDATE storage_object
|
|
SET touched_at = NULL
|
|
WHERE id = ANY(?::uuid[])")
|
|
|
|
(defn- mark-freeze-in-bulk!
|
|
[conn ids]
|
|
(let [ids (db/create-array conn "uuid" ids)]
|
|
(db/exec-one! conn [sql:mark-freeze-in-bulk ids])))
|
|
|
|
(def ^:private sql:mark-delete-in-bulk
|
|
"UPDATE storage_object
|
|
SET deleted_at = ?,
|
|
touched_at = NULL
|
|
WHERE id = ANY(?::uuid[])")
|
|
|
|
(defn- mark-delete-in-bulk!
|
|
[conn deletion-delay ids]
|
|
(let [ids (db/create-array conn "uuid" ids)
|
|
now (ct/plus (ct/now) deletion-delay)]
|
|
(db/exec-one! conn [sql:mark-delete-in-bulk now ids])))
|
|
|
|
;; NOTE: A getter that retrieves the key which will be used for group
|
|
;; ids; previously we have no value, then we introduced the
|
|
;; `:reference` prop, and then it is renamed to `:bucket` and now is
|
|
;; string instead. This is implemented in this way for backward
|
|
;; comaptibilty.
|
|
|
|
;; NOTE: we use the "file-media-object" as default value for
|
|
;; backward compatibility because when we deploy it we can
|
|
;; have old backend instances running in the same time as
|
|
;; the new one and we can still have storage-objects created
|
|
;; without bucket value. And we know that if it does not
|
|
;; have value, it means :file-media-object.
|
|
|
|
(defn- lookup-bucket
|
|
[{:keys [metadata]}]
|
|
(or (some-> metadata :bucket)
|
|
(some-> metadata :reference d/name)
|
|
sto/default-bucket))
|
|
|
|
(defn- process-objects!
|
|
[conn has-refs? bucket objects]
|
|
(loop [to-freeze #{}
|
|
to-delete #{}
|
|
objects (seq objects)]
|
|
(if-let [{:keys [id] :as object} (first objects)]
|
|
(if (has-refs? conn object)
|
|
(do
|
|
(l/dbg :id (str id)
|
|
:status "freeze"
|
|
:bucket bucket)
|
|
(recur (conj to-freeze id) to-delete (rest objects)))
|
|
(do
|
|
(l/dbg :id (str id)
|
|
:status "delete"
|
|
:bucket bucket)
|
|
(recur to-freeze (conj to-delete id) (rest objects))))
|
|
(let [deletion-delay (if (= bucket "tempfile")
|
|
(ct/duration {:hours 2})
|
|
(cf/get-deletion-delay))]
|
|
(some->> (seq to-freeze) (mark-freeze-in-bulk! conn))
|
|
(some->> (seq to-delete) (mark-delete-in-bulk! conn deletion-delay))
|
|
[(count to-freeze) (count to-delete)]))))
|
|
|
|
(defn- process-bucket!
|
|
[conn bucket objects]
|
|
(case bucket
|
|
"file-media-object" (process-objects! conn has-file-media-object-refs? bucket objects)
|
|
"team-font-variant" (process-objects! conn has-team-font-variant-refs? bucket objects)
|
|
"file-object-thumbnail" (process-objects! conn has-file-object-thumbnails-refs? bucket objects)
|
|
"file-thumbnail" (process-objects! conn has-file-thumbnails-refs? bucket objects)
|
|
"profile" (process-objects! conn has-profile-refs? bucket objects)
|
|
"file-data" (process-objects! conn has-file-data-refs? bucket objects)
|
|
"tempfile" (process-objects! conn (constantly false) bucket objects)
|
|
(ex/raise :type :internal
|
|
:code :unexpected-unknown-reference
|
|
:hint (dm/fmt "unknown reference '%'" bucket))))
|
|
|
|
(defn process-chunk!
|
|
[{:keys [::db/conn]} chunk]
|
|
(reduce-kv (fn [[nfo ndo] bucket objects]
|
|
(let [[nfo' ndo'] (process-bucket! conn bucket objects)]
|
|
[(+ nfo nfo')
|
|
(+ ndo ndo')]))
|
|
[0 0]
|
|
(d/group-by lookup-bucket identity #{} chunk)))
|
|
|
|
(def ^:private sql:get-touched-storage-objects
|
|
"SELECT so.*
|
|
FROM storage_object AS so
|
|
WHERE so.touched_at IS NOT NULL
|
|
AND so.touched_at <= ?
|
|
ORDER BY touched_at ASC
|
|
FOR UPDATE
|
|
SKIP LOCKED
|
|
LIMIT 10")
|
|
|
|
(defn get-chunk
|
|
[conn timestamp]
|
|
(->> (db/exec! conn [sql:get-touched-storage-objects timestamp])
|
|
(map impl/decode-row)
|
|
(not-empty)))
|
|
|
|
(defn- process-touched!
|
|
[{:keys [::db/pool ::timestamp] :as cfg}]
|
|
(loop [freezed 0
|
|
deleted 0]
|
|
(if-let [chunk (get-chunk pool timestamp)]
|
|
(let [[nfo ndo] (db/tx-run! cfg process-chunk! chunk)]
|
|
(recur (long (+ freezed nfo))
|
|
(long (+ deleted ndo))))
|
|
{:freeze freezed :delete deleted})))
|
|
|
|
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
;; HANDLER
|
|
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
|
|
(defmethod ig/assert-key ::handler
|
|
[_ params]
|
|
(assert (db/pool? (::db/pool params)) "expect valid storage"))
|
|
|
|
(defmethod ig/init-key ::handler
|
|
[_ cfg]
|
|
(fn [_]
|
|
(process-touched! (assoc cfg ::timestamp (ct/now)))))
|
|
|