cache.rs 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307
  1. use crate::{
  2. errors::{internal_error, DocError, DocResult},
  3. services::doc::revision::{
  4. cache::{disk::RevisionDiskCache, memory::RevisionMemoryCache},
  5. RevisionRecord,
  6. RevisionServer,
  7. },
  8. sql_tables::RevTableSql,
  9. };
  10. use flowy_collaboration::entities::doc::Doc;
  11. use flowy_database::ConnectionPool;
  12. use lib_infra::future::FutureResult;
  13. use lib_ot::{
  14. core::{Operation, OperationTransformable},
  15. revision::{RevState, RevType, Revision, RevisionRange},
  16. rich_text::RichTextDelta,
  17. };
  18. use std::{sync::Arc, time::Duration};
  19. use tokio::{
  20. sync::{mpsc, RwLock},
  21. task::{spawn_blocking, JoinHandle},
  22. };
  23. pub trait RevisionIterator: Send + Sync {
  24. fn next(&self) -> FutureResult<Option<RevisionRecord>, DocError>;
  25. }
  26. type DocRevisionDeskCache = dyn RevisionDiskCache<Error = DocError>;
  27. pub struct RevisionCache {
  28. user_id: String,
  29. doc_id: String,
  30. dish_cache: Arc<DocRevisionDeskCache>,
  31. memory_cache: Arc<RevisionMemoryCache>,
  32. defer_save: RwLock<Option<JoinHandle<()>>>,
  33. server: Arc<dyn RevisionServer>,
  34. }
  35. impl RevisionCache {
  36. pub fn new(
  37. user_id: &str,
  38. doc_id: &str,
  39. pool: Arc<ConnectionPool>,
  40. server: Arc<dyn RevisionServer>,
  41. ) -> RevisionCache {
  42. let doc_id = doc_id.to_owned();
  43. let dish_cache = Arc::new(Persistence::new(user_id, pool));
  44. let memory_cache = Arc::new(RevisionMemoryCache::new());
  45. Self {
  46. user_id: user_id.to_owned(),
  47. doc_id,
  48. dish_cache,
  49. memory_cache,
  50. defer_save: RwLock::new(None),
  51. server,
  52. }
  53. }
  54. #[tracing::instrument(level = "debug", skip(self, revision))]
  55. pub async fn add_local_revision(&self, revision: Revision) -> DocResult<()> {
  56. if self.memory_cache.contains(&revision.rev_id) {
  57. return Err(DocError::duplicate_rev().context(format!("Duplicate revision id: {}", revision.rev_id)));
  58. }
  59. let record = RevisionRecord {
  60. revision,
  61. state: RevState::StateLocal,
  62. };
  63. self.memory_cache.add_revision(record).await?;
  64. self.save_revisions().await;
  65. Ok(())
  66. }
  67. #[tracing::instrument(level = "debug", skip(self, revision))]
  68. pub async fn add_remote_revision(&self, revision: Revision) -> DocResult<()> {
  69. if self.memory_cache.contains(&revision.rev_id) {
  70. return Err(DocError::duplicate_rev().context(format!("Duplicate revision id: {}", revision.rev_id)));
  71. }
  72. let record = RevisionRecord {
  73. revision,
  74. state: RevState::StateLocal,
  75. };
  76. self.memory_cache.add_revision(record).await?;
  77. self.save_revisions().await;
  78. Ok(())
  79. }
  80. #[tracing::instrument(level = "debug", skip(self, rev_id), fields(rev_id = %rev_id))]
  81. pub async fn ack_revision(&self, rev_id: i64) {
  82. self.memory_cache.ack_revision(&rev_id).await;
  83. self.save_revisions().await;
  84. }
  85. pub async fn query_revision(&self, doc_id: &str, rev_id: i64) -> Option<RevisionRecord> {
  86. match self.memory_cache.query_revision(&rev_id).await {
  87. None => match self.dish_cache.read_revision(doc_id, rev_id) {
  88. Ok(revision) => revision,
  89. Err(e) => {
  90. log::error!("query_revision error: {:?}", e);
  91. None
  92. },
  93. },
  94. Some(record) => Some(record),
  95. }
  96. }
  97. async fn save_revisions(&self) {
  98. if let Some(handler) = self.defer_save.write().await.take() {
  99. handler.abort();
  100. }
  101. if self.memory_cache.is_empty() {
  102. return;
  103. }
  104. let memory_cache = self.memory_cache.clone();
  105. let disk_cache = self.dish_cache.clone();
  106. *self.defer_save.write().await = Some(tokio::spawn(async move {
  107. tokio::time::sleep(Duration::from_millis(300)).await;
  108. let (ids, records) = memory_cache.revisions();
  109. match disk_cache.create_revisions(records) {
  110. Ok(_) => {
  111. memory_cache.remove_revisions(ids);
  112. },
  113. Err(e) => log::error!("Save revision failed: {:?}", e),
  114. }
  115. }));
  116. }
  117. pub async fn revisions_in_range(&self, range: RevisionRange) -> DocResult<Vec<Revision>> {
  118. let revs = self.memory_cache.revisions_in_range(&range).await?;
  119. if revs.len() == range.len() as usize {
  120. Ok(revs)
  121. } else {
  122. let doc_id = self.doc_id.clone();
  123. let disk_cache = self.dish_cache.clone();
  124. let records = spawn_blocking(move || disk_cache.revisions_in_range(&doc_id, &range))
  125. .await
  126. .map_err(internal_error)??;
  127. let revisions = records
  128. .into_iter()
  129. .map(|record| record.revision)
  130. .collect::<Vec<Revision>>();
  131. Ok(revisions)
  132. }
  133. }
  134. pub async fn load_document(&self) -> DocResult<Doc> {
  135. // Loading the document from disk and it will be sync with server.
  136. let result = load_from_disk(&self.doc_id, self.memory_cache.clone(), self.dish_cache.clone()).await;
  137. if result.is_ok() {
  138. return result;
  139. }
  140. // The document doesn't exist in local. Try load from server
  141. let doc = self.server.fetch_document(&self.doc_id).await?;
  142. let delta_data = doc.data.as_bytes();
  143. let revision = Revision::new(
  144. doc.base_rev_id,
  145. doc.rev_id,
  146. delta_data.to_owned(),
  147. &doc.id,
  148. RevType::Remote,
  149. self.user_id.clone(),
  150. );
  151. self.add_remote_revision(revision).await?;
  152. Ok(doc)
  153. }
  154. }
  155. impl RevisionIterator for RevisionCache {
  156. fn next(&self) -> FutureResult<Option<RevisionRecord>, DocError> {
  157. let memory_cache = self.memory_cache.clone();
  158. let disk_cache = self.dish_cache.clone();
  159. let doc_id = self.doc_id.clone();
  160. FutureResult::new(async move {
  161. match memory_cache.front_local_revision().await {
  162. None => {
  163. //
  164. match memory_cache.front_local_rev_id().await {
  165. None => Ok(None),
  166. Some(rev_id) => match disk_cache.read_revision(&doc_id, rev_id)? {
  167. None => Ok(None),
  168. Some(record) => Ok(Some(record)),
  169. },
  170. }
  171. },
  172. Some((_, record)) => Ok(Some(record)),
  173. }
  174. })
  175. }
  176. }
  177. async fn load_from_disk(
  178. doc_id: &str,
  179. memory_cache: Arc<RevisionMemoryCache>,
  180. disk_cache: Arc<DocRevisionDeskCache>,
  181. ) -> DocResult<Doc> {
  182. let doc_id = doc_id.to_owned();
  183. let (tx, mut rx) = mpsc::channel(2);
  184. let doc = spawn_blocking(move || {
  185. let records = disk_cache.read_revisions(&doc_id)?;
  186. if records.is_empty() {
  187. return Err(DocError::doc_not_found().context("Local doesn't have this document"));
  188. }
  189. let (base_rev_id, rev_id) = records.last().unwrap().revision.pair_rev_id();
  190. let mut delta = RichTextDelta::new();
  191. for (_, record) in records.into_iter().enumerate() {
  192. // Opti: revision's clone may cause memory issues
  193. match RichTextDelta::from_bytes(record.revision.clone().delta_data) {
  194. Ok(local_delta) => {
  195. delta = delta.compose(&local_delta)?;
  196. match tx.blocking_send(record) {
  197. Ok(_) => {},
  198. Err(e) => tracing::error!("❌Load document from disk error: {}", e),
  199. }
  200. },
  201. Err(e) => {
  202. tracing::error!("Deserialize delta from revision failed: {}", e);
  203. },
  204. }
  205. }
  206. correct_delta_if_need(&mut delta);
  207. Result::<Doc, DocError>::Ok(Doc {
  208. id: doc_id,
  209. data: delta.to_json(),
  210. rev_id,
  211. base_rev_id,
  212. })
  213. })
  214. .await
  215. .map_err(internal_error)?;
  216. while let Some(record) = rx.recv().await {
  217. match memory_cache.add_revision(record).await {
  218. Ok(_) => {},
  219. Err(e) => log::error!("{:?}", e),
  220. }
  221. }
  222. doc
  223. }
  224. fn correct_delta_if_need(delta: &mut RichTextDelta) {
  225. if delta.ops.last().is_none() {
  226. return;
  227. }
  228. let data = delta.ops.last().as_ref().unwrap().get_data();
  229. if !data.ends_with('\n') {
  230. log::error!("❌The op must end with newline. Correcting it by inserting newline op");
  231. delta.ops.push(Operation::Insert("\n".into()));
  232. }
  233. }
  234. pub(crate) struct Persistence {
  235. user_id: String,
  236. pub(crate) pool: Arc<ConnectionPool>,
  237. }
  238. impl RevisionDiskCache for Persistence {
  239. type Error = DocError;
  240. fn create_revisions(&self, revisions: Vec<RevisionRecord>) -> Result<(), Self::Error> {
  241. let conn = &*self.pool.get().map_err(internal_error)?;
  242. conn.immediate_transaction::<_, DocError, _>(|| {
  243. let _ = RevTableSql::create_rev_table(revisions, conn)?;
  244. Ok(())
  245. })
  246. }
  247. fn revisions_in_range(&self, doc_id: &str, range: &RevisionRange) -> Result<Vec<RevisionRecord>, Self::Error> {
  248. let conn = &*self.pool.get().map_err(internal_error).unwrap();
  249. let revisions = RevTableSql::read_rev_tables_with_range(&self.user_id, doc_id, range.clone(), conn)?;
  250. Ok(revisions)
  251. }
  252. fn read_revision(&self, doc_id: &str, rev_id: i64) -> Result<Option<RevisionRecord>, Self::Error> {
  253. let conn = self.pool.get().map_err(internal_error)?;
  254. let some = RevTableSql::read_rev_table(&self.user_id, doc_id, &rev_id, &*conn)?;
  255. Ok(some)
  256. }
  257. fn read_revisions(&self, doc_id: &str) -> Result<Vec<RevisionRecord>, Self::Error> {
  258. let conn = self.pool.get().map_err(internal_error)?;
  259. let some = RevTableSql::read_rev_tables(&self.user_id, doc_id, &*conn)?;
  260. Ok(some)
  261. }
  262. }
  263. impl Persistence {
  264. pub(crate) fn new(user_id: &str, pool: Arc<ConnectionPool>) -> Self {
  265. Self {
  266. user_id: user_id.to_owned(),
  267. pool,
  268. }
  269. }
  270. }
  271. #[cfg(feature = "flowy_unit_test")]
  272. impl RevisionCache {
  273. pub fn dish_cache(&self) -> Arc<DocRevisionDeskCache> { self.dish_cache.clone() }
  274. pub fn memory_cache(&self) -> Arc<RevisionMemoryCache> { self.memory_cache.clone() }
  275. }