(ns metabase.task.persist-refresh (:require [clojure.string :as str] [clojurewerkz.quartzite.conversion :as qc] [clojurewerkz.quartzite.jobs :as jobs] [clojurewerkz.quartzite.schedule.cron :as cron] [clojurewerkz.quartzite.triggers :as triggers] [medley.core :as m] [metabase.db :as mdb] [metabase.driver :as driver] [metabase.driver.ddl.interface :as ddl.i] [metabase.driver.sql.query-processor :as sql.qp] [metabase.email.messages :as messages] [metabase.models.card :refer [Card]] [metabase.models.database :refer [Database]] [metabase.models.persisted-info :as persisted-info] [metabase.models.task-history :as task-history] [metabase.public-settings :as public-settings] [metabase.query-processor.middleware.limit :as limit] [metabase.query-processor.timezone :as qp.timezone] [metabase.task :as task] [metabase.util :as u] [metabase.util.log :as log] [potemkin.types :as p] [toucan2.core :as t2]) (:import (java.util TimeZone) (org.quartz ObjectAlreadyExistsException Trigger))) | |
(set! *warn-on-reflection* true) | |
(defn- job-context->job-type
  "Convert the Quartz `job-context` to its job-data map and keep only the entries this namespace reads:
  \"db-id\", \"persisted-id\" and \"type\"."
  [job-context]
  (-> job-context
      qc/from-job-data
      (select-keys ["db-id" "persisted-id" "type"])))
(p/defprotocol+ Refresher
  "Thin wrapper around the [[metabase.driver.ddl.interface]] multimethods that makes testing easier. Rather than
  defining multimethods on fake engine types, code in this namespace works against this protocol: the default
  implementation dispatches to `ddl.interface` normally, while tests can supply an implementation with custom,
  easy-to-control behavior."
  ;; The fourth argument is the whole card, not just its query: the caller in this namespace passes the Card it
  ;; selected, and the dispatching implementation reads `:dataset_query` from it.
  (refresh! [this database definition card]
    "Refresh a persisted model. Returns a map with :state that is :success or :error. If :state is :error, includes a
    key :error with a string message. See [[metabase.driver.ddl.interface/refresh!]] for more information.")
  (unpersist! [this database persisted-info]
    "Unpersist the model described by `persisted-info` in `database`. See
    [[metabase.driver.ddl.interface/unpersist!]] for more information."))
(def ^:private dispatching-refresher
  "Refresher implementation that dispatches to the multimethods in [[metabase.driver.ddl.interface]], keyed on the
  database's `:engine`."
  (reify Refresher
    (refresh! [_ database definition card]
      (let [engine (:engine database)]
        ;; Persisted substitution is switched off while the refresh query is built and run.
        (binding [persisted-info/*allow-persisted-substitution* false]
          (->> (:dataset_query card)
               limit/disable-max-results
               (ddl.i/refresh! engine database definition)))))
    (unpersist! [_ db info]
      (ddl.i/unpersist! (:engine db) db info))))
(defn- refresh-with-stats!
  "Reducing step that refreshes one persisted model and folds the outcome into `stats`.

  `refresher` is a [[Refresher]], `database` the Database the model lives in, `stats` a map with at least numeric
  `:success` and `:error` counters, and `persisted-info` the PersistedInfo row to refresh.

  Returns the updated `stats`: `:success` is incremented on success; on failure `:error` is incremented and a
  `{:persisted-info-id … :error …}` map is conj'd onto `:error-details`. If the row is no longer in a refreshable
  state, `stats` is returned unchanged. It must never return nil, because this function is used as the reducing
  function over many models and a nil accumulator would make the next step throw."
  [refresher database stats persisted-info]
  ;; Since this could be long running, double check state just before refreshing
  (if-not (contains? (persisted-info/refreshable-states)
                     (t2/select-one-fn :state :model/PersistedInfo :id (:id persisted-info)))
    ;; State changed underneath us: skip this model but keep the running totals intact.
    stats
    (do
      (log/infof "Attempting to refresh persisted model %s." (:card_id persisted-info))
      (let [card       (t2/select-one Card :id (:card_id persisted-info))
            definition (persisted-info/metadata->definition (:result_metadata card)
                                                            (:table_name persisted-info))
            ;; Mark the row as in-progress before handing off to the (possibly slow) refresher.
            _          (t2/update! :model/PersistedInfo (u/the-id persisted-info)
                                   {:definition      definition,
                                    :query_hash      (persisted-info/query-hash (:dataset_query card))
                                    :active          false,
                                    :refresh_begin   :%now,
                                    :refresh_end     nil,
                                    :state           "refreshing"
                                    :state_change_at :%now})
            ;; Exceptions from the refresher are converted into the same {:state :error} shape it returns itself.
            {:keys [state error]} (try
                                    (refresh! refresher database definition card)
                                    (catch Exception e
                                      (log/infof e "Error refreshing persisting model with card-id %s"
                                                 (:card_id persisted-info))
                                      {:state :error :error (ex-message e)}))]
        (t2/update! :model/PersistedInfo (u/the-id persisted-info)
                    {:active          (= state :success),
                     :refresh_end     :%now,
                     :state           (if (= state :success) "persisted" "error")
                     :state_change_at :%now
                     :error           (when (= state :error) error)})
        (if (= :success state)
          (update stats :success inc)
          (-> stats
              (update :error-details conj {:persisted-info-id (:id persisted-info) :error error})
              (update :error inc)))))))
(defn- error-details
  "Return the `:error-details` of `results` as a seq, or nil when `results` is nil or has no error details."
  [results]
  (seq (:error-details results)))
(defn- send-persist-refresh-email-if-error!
  "Send an email to the admin about the errors recorded in `task-details` for the persisted model refresh task of
  database `db-id`. Each failing PersistedInfo is loaded, hydrated and tagged with its `:error` message. Any exception
  raised while building or sending the email is logged and swallowed."
  [db-id task-details]
  (try
    (let [id->details (m/index-by :persisted-info-id (error-details task-details))
          failed-ids  (keys id->details)
          with-error  (fn [info]
                        (assoc info :error (get-in id->details [(:id info) :error])))
          infos       (-> (t2/select :model/PersistedInfo :id [:in failed-ids])
                          (t2/hydrate [:card :collection] :database))]
      (messages/send-persistent-model-error-email! db-id (map with-error infos) (:trigger task-details)))
    (catch Exception e
      (log/error e "Error sending persist refresh email"))))
(defn- save-task-history!
  "Run `thunk` inside [[task-history/with-task-history]] so a task history entry is recorded for it. `:task` will be
  `task-type`, `:db_id` will be `db-id` (callers may pass nil), and `:task_details` will be the result of `thunk`.
  The entry's `:status` is `:failed` when the result carries error details and `:success` otherwise; for the
  \"persist-refresh\" task type an error email is also sent in the failure case."
  [task-type db-id thunk]
  (letfn [(on-success [_update-map task-details]
            (let [errors (error-details task-details)]
              (when (and errors (= "persist-refresh" task-type))
                (send-persist-refresh-email-if-error! db-id task-details))
              {:task_details task-details
               :status       (if errors :failed :success)}))]
    (task-history/with-task-history {:task            task-type
                                     :db_id           db-id
                                     :on-success-info on-success}
      (thunk))))
(defn- prune-deletables!
  "Seam for tests to pass in specific deletables to drop.

  For each PersistedInfo in `deletables`, re-checks its current state and card, and unpersists it through `refresher`
  when the state is prunable, the card is archived, or the card is not of type `:model`. The row itself is deleted
  unless its state is \"off\". The whole run is recorded as an \"unpersist-tables\" task whose details are a map of
  `:success`, `:error` and `:skipped` counts. Does nothing when `deletables` is empty."
  [refresher deletables]
  (when (seq deletables)
    (let [databases (t2/select Database :id [:in (map :database_id deletables)])
          id->db    (m/index-by :id databases)]
      (letfn [(prune-one [stats info]
                ;; Since this could be long running, double check state just before deleting
                (let [state  (t2/select-one-fn :state :model/PersistedInfo :id (:id info))
                      card   (t2/select-one [Card :archived :type] :id (:card_id info))
                      prune? (or (contains? (persisted-info/prunable-states) state)
                                 (:archived card)
                                 (not= (:type card) :model))]
                  (if-not prune?
                    (update stats :skipped inc)
                    (let [database (get id->db (:database_id info))]
                      (log/infof "Unpersisting model with card-id %s" (:card_id info))
                      (try
                        (unpersist! refresher database info)
                        (when-not (= "off" state)
                          (t2/delete! :model/PersistedInfo :id (:id info)))
                        (update stats :success inc)
                        (catch Exception e
                          (log/infof e "Error unpersisting model with card-id %s" (:card_id info))
                          (update stats :error inc)))))))
              (prune-all []
                (reduce prune-one {:success 0, :error 0, :skipped 0} deletables))]
        (save-task-history! "unpersist-tables" nil prune-all)))))
(defn- deletable-models
  "Returns persisted info records that can be unpersisted. Selects records that moved into a prunable state more than
  an hour ago (the delay ensures no queries are running against them and allows changing one's mind), records whose
  card has type \"question\" or is archived, and records whose `card_id` is null."
  []
  (let [prunable-states    (persisted-info/prunable-states)
        ;; Buffer deletions for an hour if the prune job happens soon after setting state.
        ;; 1. so that people have a chance to change their mind.
        ;; 2. if a query is running against the cache, it doesn't get ripped out.
        cutoff             (sql.qp/add-interval-honeysql-form (mdb/db-type) :%now -1 :hour)
        stale-and-prunable [:and
                            [:in :state prunable-states]
                            [:< :state_change_at cutoff]]]
    (t2/select :model/PersistedInfo
               {:select    [:p.*]
                :from      [[:persisted_info :p]]
                :left-join [[:report_card :c] [:= :c.id :p.card_id]]
                :where     [:or
                            stale-and-prunable
                            [:= :c.type "question"]
                            [:= :c.archived true]
                            ;; card_id is set to null when the corresponding card is deleted
                            [:= :p.card_id nil]]})))
(defn- refreshable-models
  "Returns refreshable models for a database id: PersistedInfo rows for `database-id` in a refreshable state whose
  card is still of type \"model\" and not archived. Each row also carries the card's `type`, `archived` and `name`."
  [database-id]
  (let [still-a-live-model [:and
                            [:= :p.database_id database-id]
                            [:in :p.state (persisted-info/refreshable-states)]
                            [:= :c.archived false]
                            [:= :c.type "model"]]]
    (t2/select :model/PersistedInfo
               {:select    [:p.* :c.type :c.archived :c.name]
                :from      [[:persisted_info :p]]
                :left-join [[:report_card :c] [:= :c.id :p.card_id]]
                :where     still-a-live-model})))
(defn- prune-all-deletable!
  "Prunes all deletable PersistedInfos. Should not be called from tests, as it will orphan cache tables if the
  refresher is replaced."
  [refresher]
  (prune-deletables! refresher (deletable-models)))
(defn- refresh-tables!
  "Refresh tables backing the persisted models. Refreshes every refreshable model (see [[refreshable-models]]) of the
  database with id `database-id` through `refresher`, records the run as a \"persist-refresh\" task with trigger
  \"Scheduled\", and logs the success and error counts."
  [database-id refresher]
  (log/infof "Starting persisted model refresh task for Database %s." database-id)
  (persisted-info/ready-unpersisted-models! database-id)
  (let [database    (t2/select-one Database :id database-id)
        models      (refreshable-models database-id)
        refresh-one (fn [stats info]
                      (refresh-with-stats! refresher database stats info))
        run-all     (fn []
                      (reduce refresh-one {:success 0, :error 0, :trigger "Scheduled"} models))
        result      (save-task-history! "persist-refresh" database-id run-all)]
    (log/infof "Finished persisted model refresh task for Database %s with %s successes and %s errors."
               database-id
               (:success result)
               (:error result))))
(defn- refresh-individual!
  "Refresh an individual model based on [[PersistedInfo]]. Looks up the PersistedInfo with id `persisted-info-id` and
  its Database; when both exist, refreshes the model through `refresher` inside a \"persist-refresh\" task with
  trigger \"Manual\". Otherwise only logs that the refresh could not be done."
  [persisted-info-id refresher]
  (let [info     (t2/select-one :model/PersistedInfo :id persisted-info-id)
        database (when info
                   (t2/select-one Database :id (:database_id info)))]
    (if-not (and info database)
      (log/infof "Unable to refresh model with card-id %s" (:card_id info))
      (let [initial-stats {:success 0 :error 0, :trigger "Manual"}]
        (save-task-history! "persist-refresh"
                            (u/the-id database)
                            (fn [] (refresh-with-stats! refresher database initial-stats info)))
        (log/infof "Finished updated model-id %s from persisted-info %s."
                   (:card_id info)
                   (u/the-id info))))))
(defn- refresh-job-fn!
  "Refresh tables. Reads the payload from the job context and dispatches on its \"type\": \"database\" calls
  [[refresh-tables!]] with the \"db-id\", \"individual\" calls [[refresh-individual!]] with the \"persisted-id\".
  Any other type is only logged."
  [job-context]
  (let [payload  (job-context->job-type job-context)
        job-type (get payload "type")]
    (case job-type
      "database"   (refresh-tables! (get payload "db-id") dispatching-refresher)
      "individual" (refresh-individual! (get payload "persisted-id") dispatching-refresher)
      (log/infof "Unknown payload type %s" job-type))))
;; Body of the prune job: ignores the job context and prunes every deletable PersistedInfo using the default
;; `dispatching-refresher`.
(defn- prune-job-fn! [_job-context]
  (prune-all-deletable! dispatching-refresher))
;; Quartz job class for refreshing persisted tables. The metadata map must hold complete key/value pairs: the
;; `DisallowConcurrentExecution` annotation and the job's `:doc` string.
(jobs/defjob ^{org.quartz.DisallowConcurrentExecution true
               :doc                                   "Refresh persisted tables job"}
  PersistenceRefresh [job-context]
  (refresh-job-fn! job-context))
;; Quartz job class for removing deletable persisted tables. The metadata map must hold complete key/value pairs:
;; the `DisallowConcurrentExecution` annotation and the job's `:doc` string.
(jobs/defjob ^{org.quartz.DisallowConcurrentExecution true
               :doc                                   "Remove deletable persisted tables"}
  PersistencePrune [job-context]
  (prune-job-fn! job-context))
(def ^:private refresh-job-key
  "Job key string for the refresh job. Call `(jobs/key refresh-job-key)` if you need the Quartz job key object
  rather than the string."
  "metabase.task.PersistenceRefresh.job")
(def ^:private prune-job-key
  "Job key string for the prune job. Call `(jobs/key prune-job-key)` if you need the Quartz job key object rather
  than the string."
  "metabase.task.PersistencePrune.job")
;; Quartz job definition for the refresh job: runs `PersistenceRefresh`, is identified by `refresh-job-key`, and is
;; stored durably.
(def ^:private refresh-job
  (jobs/build
   (jobs/with-description "Persisted Model refresh task")
   (jobs/of-type PersistenceRefresh)
   (jobs/with-identity (jobs/key refresh-job-key))
   (jobs/store-durably)))
;; Quartz job definition for the prune job: runs `PersistencePrune`, is identified by `prune-job-key`, and is stored
;; durably.
(def ^:private prune-job
  (jobs/build
   (jobs/with-description "Persisted Model prune task")
   (jobs/of-type PersistencePrune)
   (jobs/with-identity (jobs/key prune-job-key))
   (jobs/store-durably)))
;; Trigger key of the recurring (scheduled) prune trigger.
(def ^:private prune-scheduled-trigger-key
  (triggers/key "metabase.task.PersistencePrune.scheduled.trigger"))
;; Trigger key of the one-off prune trigger.
(def ^:private prune-once-trigger-key
  (triggers/key "metabase.task.PersistencePrune.once.trigger"))
(defn- database-trigger-key
  "Trigger key for the refresh trigger of `database`; the key name ends with `(u/the-id database)`."
  [database]
  (let [db-id (u/the-id database)]
    (triggers/key (format "metabase.task.PersistenceRefresh.database.trigger.%d" db-id))))
(defn- individual-trigger-key
  "Trigger key for the one-off refresh trigger of `persisted-info`; the key name ends with
  `(u/the-id persisted-info)`."
  [persisted-info]
  (let [info-id (u/the-id persisted-info)]
    (triggers/key (format "metabase.task.PersistenceRefresh.individual.trigger.%d" info-id))))
(defn- cron-schedule
  "Return a cron schedule that fires according to the cron expression string `cron-spec`. The schedule runs in the
  report timezone, falling back to the system timezone and then to \"UTC\", and uses the do-nothing misfire
  instruction."
  [cron-spec]
  (let [tz-id (or (driver/report-timezone)
                  (qp.timezone/system-timezone-id)
                  "UTC")
        tz    (TimeZone/getTimeZone tz-id)]
    (cron/schedule
     (cron/cron-schedule cron-spec)
     (cron/in-time-zone tz)
     (cron/with-misfire-handling-instruction-do-nothing))))
;; REPL scratch (never evaluated at load time): builds a cron expression string from an "HH:mm" start time and an
;; interval in hours. With hours = 24 the hour field is just the start hour; otherwise it is `start-hour/hours`.
(comment
  (let [[start-hour start-minute] (map parse-long (str/split "00:00" #":"))
        hours 1]
    (if (= 24 hours)
      (format "0 %d %d * * ? *" start-minute start-hour)
      (format "0 %d %d/%d * * ? *" start-minute start-hour hours))))
;; Recurring trigger for the prune job. The cron expression "0 0 0/1 * * ? *" fires at the top of every hour.
(def ^:private prune-scheduled-trigger
  (triggers/build
   (triggers/with-description "Prune deletable PersistInfo once per hour")
   (triggers/with-identity prune-scheduled-trigger-key)
   (triggers/for-job (jobs/key prune-job-key))
   (triggers/start-now)
   (triggers/with-schedule
    (cron-schedule "0 0 0/1 * * ? *"))))
;; One-off trigger for the prune job: starts now and has no schedule attached.
(def ^:private prune-once-trigger
  (triggers/build
   (triggers/with-description "Prune deletable PersistInfo now")
   (triggers/with-identity prune-once-trigger-key)
   (triggers/for-job (jobs/key prune-job-key))
   (triggers/start-now)))
(defn- database-trigger
  "Build the cron trigger that refreshes the models of `database` on the schedule given by the cron expression
  `cron-spec`. The trigger targets the refresh job and carries the job data `{\"db-id\" <id> \"type\" \"database\"}`."
  ^org.quartz.CronTrigger [database cron-spec]
  (let [db-id    (u/the-id database)
        job-data {"db-id" db-id
                  "type"  "database"}]
    (triggers/build
     (triggers/with-description (format "Refresh models for database %d" db-id))
     (triggers/with-identity (database-trigger-key database))
     (triggers/using-job-data job-data)
     (triggers/for-job (jobs/key refresh-job-key))
     (triggers/start-now)
     (triggers/with-schedule
      (cron-schedule cron-spec)))))
(defn- individual-trigger
  "Build a start-now trigger that refreshes the single model behind `persisted-info`. The trigger targets the refresh
  job and carries the job data `{\"persisted-id\" <id> \"type\" \"individual\"}`."
  [persisted-info]
  (let [info-id  (u/the-id persisted-info)
        job-data {"persisted-id" info-id
                  "type"         "individual"}]
    (triggers/build
     (triggers/with-description (format "Refresh model %d: persisted-info %d"
                                        (:card_id persisted-info)
                                        info-id))
     (triggers/with-identity (individual-trigger-key persisted-info))
     (triggers/using-job-data job-data)
     (triggers/for-job (jobs/key refresh-job-key))
     (triggers/start-now))))
(defn schedule-persistence-for-database!
  "Schedule a database for persistence refreshing. Builds the cron trigger for `database` from `cron-spec`, readies
  the database's persisted infos, and adds the trigger. If the trigger already exists, that is logged rather than
  treated as an error."
  [database cron-spec]
  (let [db-id        (u/the-id database)
        tggr         (database-trigger database cron-spec)
        trigger-name (.. ^Trigger tggr getKey getName)]
    (log/info
     (u/format-color 'green "Scheduling persistence refreshes for database %d: trigger: %s" db-id trigger-name))
    (persisted-info/ready-database! db-id)
    (try
      (task/add-trigger! tggr)
      (catch ObjectAlreadyExistsException _e
        (log/info
         (u/format-color 'green "Persistence already present for database %d: trigger: %s" db-id trigger-name))))))
(defn schedule-refresh-for-individual!
  "Schedule a refresh of an individual [[PersistedInfo record]]. Done through quartz for locking purposes. If a
  trigger for this record already exists, that is logged rather than treated as an error."
  [persisted-info]
  (let [card-id      (:card_id persisted-info)
        tggr         (individual-trigger persisted-info)
        trigger-name (.. ^Trigger tggr getKey getName)]
    (log/info (u/format-color 'green "Scheduling refresh for model: %d" card-id))
    (try
      (task/add-trigger! tggr)
      (catch ObjectAlreadyExistsException _e
        (log/info
         (u/format-color :green "Persistence already present for model %d %s" card-id trigger-name))))))
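Open question: should errors other than ObjectAlreadyExistsException also be handled when adding the individual refresh trigger? | |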
(defn job-info-by-db-id
  "Fetch the triggers of the refresh job, indexed by the \"db-id\" found in each trigger's job data. Returns nil when
  there is no job info or it has no `:triggers`."
  []
  (when-some [job-info (task/job-info refresh-job-key)]
    (when-some [job-triggers (:triggers job-info)]
      (m/index-by (fn [trigger] (get (:data trigger) "db-id"))
                  job-triggers))))
(defn unschedule-persistence-for-database!
  "Stop refreshing tables for a given database by deleting its refresh trigger. Should only be called when marking
  the database as not persisting. Tables will be left over; cleaning them up is the caller's responsibility."
  [database]
  (-> database
      database-trigger-key
      task/delete-trigger!))
(defn- unschedule-all-refresh-triggers!
  "Unschedule all triggers attached to the job identified by `job-key`."
  [job-key]
  (doseq [{trigger-key-name :key} (:triggers (task/job-info job-key))]
    (task/delete-trigger! (triggers/key trigger-key-name))))
(defn reschedule-refresh!
  "Reschedule refresh for all enabled databases. Removes all existing refresh triggers, and schedules refresh for
  databases with `:persist-models-enabled` in their settings, using the cron schedule from
  [[public-settings/persisted-model-refresh-cron-schedule]]."
  []
  (let [persisting? (fn [db] (:persist-models-enabled (:settings db)))
        enabled-dbs (filter persisting? (t2/select Database))
        cron-spec   (public-settings/persisted-model-refresh-cron-schedule)]
    (unschedule-all-refresh-triggers! refresh-job-key)
    (run! #(schedule-persistence-for-database! % cron-spec) enabled-dbs)))
(defn enable-persisting!
  "Enable persisting
  - The prune job is scheduled anew.
  - Refresh jobs are added when persist is enabled on a db."
  []
  ;; Despite the helper's name, this clears the existing triggers of the *prune* job before re-adding its schedule.
  (unschedule-all-refresh-triggers! prune-job-key)
  (task/add-trigger! prune-scheduled-trigger))
(defn disable-persisting!
  "Disable persisting
  - All PersistedInfo are marked for deletion.
  - Refresh job triggers are removed.
  - Prune scheduled job trigger is removed.
  - The prune job is triggered to run immediately."
  []
  (persisted-info/mark-for-pruning! {})
  (unschedule-all-refresh-triggers! refresh-job-key)
  (task/delete-trigger! prune-scheduled-trigger-key)
  ;; ensure we clean up marked for deletion
  (task/add-trigger! prune-once-trigger))
;; Register the refresh job with the scheduler.
(defn- job-init! []
  (task/add-job! refresh-job))
;; Task initialization for persisted-model refreshing: register the refresh job, then rebuild the per-database
;; refresh triggers.
(defmethod task/init! ::PersistRefresh
  [_]
  (job-init!)
  (reschedule-refresh!))
;; Task initialization for pruning: always register the prune job, but only schedule it when persisted models are
;; enabled in the public settings.
(defmethod task/init! ::PersistPrune
  [_]
  (task/add-job! prune-job)
  (when (public-settings/persisted-models-enabled)
    (enable-persisting!)))