tdbPCache.c 11.6 KB
Newer Older
H
refact  
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
H
Hongze Cheng 已提交
15 16
#include "tdbInt.h"

H
Hongze Cheng 已提交
17 18
// #include <sys/types.h>
// #include <unistd.h>
H
Hongze Cheng 已提交
19

H
more  
Hongze Cheng 已提交
20
// Page cache state: a pool of cache-owned ("local") pages together with the
// hash table, free list and LRU list used to look them up and recycle them.
struct SPCache {
  int         szPage;       // page size passed to tdbPageCreate()
  int         nPages;       // number of slots in aPage (cacheSize given at open)
  SPage     **aPage;        // cache-owned pages; slot i holds the page whose id is i
  tdb_mutex_t mutex;        // taken by the fetch/release/alter entry points
  int         nFree;        // number of pages on the free list
  SPage      *pFree;        // head of the free list, linked through pFreeNext
  int         nPage;        // number of pages currently in the hash table
  int         nHash;        // number of buckets in pgHash
  SPage     **pgHash;       // hash buckets, chained through pHashNext
  int         nRecyclable;  // number of pages on the LRU list
  SPage       lru;          // anchor node of the circular LRU list
};

wafwerar's avatar
wafwerar 已提交
34 35 36
// Hash a page id into a 32-bit value.
//
// Sums the first 24 bytes of the file id, read as six native-endian 32-bit
// words, together with the page number. Callers reduce the result modulo the
// bucket count.
//
// The words are copied out with memcpy() rather than read through a casted
// pointer, so the result does not depend on the alignment of `fileid` and the
// access does not violate strict aliasing.
static inline uint32_t tdbPCachePageHash(const SPgid *pPgid) {
  uint32_t t[6];

  memcpy(t, pPgid->fileid, sizeof(t));
  return (uint32_t)(t[0] + t[1] + t[2] + t[3] + t[4] + t[5] + pPgid->pgno);
}
H
Hongze Cheng 已提交
38

H
refact  
Hongze Cheng 已提交
39
static int    tdbPCacheOpenImpl(SPCache *pCache);
H
Hongze Cheng 已提交
40
static SPage *tdbPCacheFetchImpl(SPCache *pCache, const SPgid *pPgid, TXN *pTxn);
H
Hongze Cheng 已提交
41 42 43 44
static void   tdbPCachePinPage(SPCache *pCache, SPage *pPage);
static void   tdbPCacheRemovePageFromHash(SPCache *pCache, SPage *pPage);
static void   tdbPCacheAddPageToHash(SPCache *pCache, SPage *pPage);
static void   tdbPCacheUnpinPage(SPCache *pCache, SPage *pPage);
H
Hongze Cheng 已提交
45 46 47 48 49 50
static int    tdbPCacheCloseImpl(SPCache *pCache);

// Initialize the cache mutex with default attributes.
static void tdbPCacheInitLock(SPCache *pCache) {
  tdbMutexInit(&pCache->mutex, NULL);
}
// Destroy the cache mutex.
static void tdbPCacheDestroyLock(SPCache *pCache) {
  tdbMutexDestroy(&pCache->mutex);
}
// Acquire the cache mutex.
static void tdbPCacheLock(SPCache *pCache) {
  tdbMutexLock(&pCache->mutex);
}
// Release the cache mutex.
static void tdbPCacheUnlock(SPCache *pCache) {
  tdbMutexUnlock(&pCache->mutex);
}
H
Hongze Cheng 已提交
51

H
Hongze Cheng 已提交
52
// Create a page cache holding `cacheSize` pages created with size `pageSize`.
//
// On success the new cache is stored in *ppCache and 0 is returned. If an
// allocation or tdbPCacheOpenImpl() fails, -1 is returned and *ppCache is
// left untouched.
int tdbPCacheOpen(int pageSize, int cacheSize, SPCache **ppCache) {
  SPCache *pCache;

  // The page table lives in its own allocation (aPage below), so the header
  // needs no trailing space.
  pCache = (SPCache *)tdbOsCalloc(1, sizeof(*pCache));
  if (pCache == NULL) {
    return -1;
  }

  pCache->szPage = pageSize;
  pCache->nPages = cacheSize;
  pCache->aPage = (SPage **)tdbOsCalloc(cacheSize, sizeof(SPage *));
  if (pCache->aPage == NULL) {
    tdbOsFree(pCache);
    return -1;
  }

  if (tdbPCacheOpenImpl(pCache) < 0) {
    // The page table was allocated here, so it must be released here as
    // well; freeing only the header would leak it.
    tdbOsFree(pCache->aPage);
    tdbOsFree(pCache);
    return -1;
  }

  *ppCache = pCache;
  return 0;
}

H
Hongze Cheng 已提交
79
// Tear down a cache created by tdbPCacheOpen(). Passing NULL is a no-op.
// Always returns 0.
int tdbPCacheClose(SPCache *pCache) {
  if (pCache == NULL) return 0;

  // Pages, hash table and lock go first, then the page table, and finally
  // the cache header itself.
  tdbPCacheCloseImpl(pCache);
  tdbOsFree(pCache->aPage);
  tdbOsFree(pCache);

  return 0;
}

H
Hongze Cheng 已提交
88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153
// TODO:
// if (pPage->id >= pCache->nPages) {
//   free(pPage);
//   pCache->aPage[pPage->id] = NULL;
// } else {
//   add to free list
// }

// Resize the cache to `nPage` cache-owned pages. Called by tdbPCacheAlter()
// with the cache lock held.
//
// Growing allocates a larger page table, creates the additional pages and
// pushes them onto the free list. If any allocation fails, the cache is left
// exactly as it was and -1 is returned.
//
// Shrinking is not implemented (see the TODO comment preceding this
// function): pages whose id is at or beyond `nPage` would have to be
// destroyed as they are released. Until that exists, a smaller `nPage` is
// accepted but leaves the cache unchanged. Lowering nPages alone would make
// tdbPCacheCloseImpl() skip, and therefore leak, the pages past the new
// limit.
//
// Returns 0 on success, -1 on allocation failure.
static int tdbPCacheAlterImpl(SPCache *pCache, int32_t nPage) {
  int32_t nOld = pCache->nPages;

  if (nPage <= nOld) {
    return 0;
  }

  SPage **aPage = tdbOsCalloc(nPage, sizeof(SPage *));
  if (aPage == NULL) {
    return -1;
  }

  // Create every new page before touching the cache, so that a failure can
  // be rolled back without having to unlink anything.
  for (int32_t iPage = nOld; iPage < nPage; iPage++) {
    if (tdbPageCreate(pCache->szPage, &aPage[iPage], tdbDefaultMalloc, NULL) < 0) {
      for (int32_t jPage = nOld; jPage < iPage; jPage++) {
        tdbPageDestroy(aPage[jPage], tdbDefaultFree, NULL);
      }
      tdbOsFree(aPage);
      return -1;
    }
  }

  // Carry the existing pages over; the slot index is the page id.
  for (int32_t iPage = 0; iPage < nOld; iPage++) {
    aPage[iPage] = pCache->aPage[iPage];
  }

  // Initialize the new pages and put them on the free list.
  for (int32_t iPage = nOld; iPage < nPage; iPage++) {
    SPage *pPage = aPage[iPage];

    // pPage->pgid = 0;
    pPage->isAnchor = 0;
    pPage->isLocal = 1;
    pPage->nRef = 0;
    pPage->pHashNext = NULL;
    pPage->pLruNext = NULL;
    pPage->pLruPrev = NULL;
    pPage->pDirtyNext = NULL;
    pPage->id = iPage;

    pPage->pFreeNext = pCache->pFree;
    pCache->pFree = pPage;
    pCache->nFree++;
  }

  tdbOsFree(pCache->aPage);
  pCache->aPage = aPage;
  pCache->nPages = nPage;
  return 0;
}

// Resize the cache to `nPage` pages while holding the cache lock.
// Returns the result of tdbPCacheAlterImpl().
int tdbPCacheAlter(SPCache *pCache, int32_t nPage) {
  tdbPCacheLock(pCache);
  int rc = tdbPCacheAlterImpl(pCache, nPage);
  tdbPCacheUnlock(pCache);

  return rc;
}

H
Hongze Cheng 已提交
154
// Fetch the page identified by `pPgid` on behalf of `pTxn` and take a
// reference on it. The lookup and the reference are done under the cache
// lock.
//
// Returns the page. If tdbPCacheFetchImpl() yields no page, ASSERT fires;
// should ASSERT not abort in this build, NULL is returned to the caller.
SPage *tdbPCacheFetch(SPCache *pCache, const SPgid *pPgid, TXN *pTxn) {
  SPage *pPage;
  i32    nRef = 0;  // stays 0 when no page was obtained

  tdbPCacheLock(pCache);

  pPage = tdbPCacheFetchImpl(pCache, pPgid, pTxn);
  if (pPage) {
    nRef = tdbRefPage(pPage);
  }

  ASSERT(pPage);

  tdbPCacheUnlock(pCache);

  // The trace dereferences the page, so it must be skipped when the fetch
  // produced nothing.
  if (pPage) {
    tdbDebug("pcache/fetch page %p/%d/%d/%d", pPage, TDB_PAGE_PGNO(pPage), pPage->id, nRef);
  }
  return pPage;
}

H
Hongze Cheng 已提交
176
// Drop one reference to `pPage`, under the cache lock.
//
// When the reference count reaches zero:
//   - a cache-owned (isLocal) page is unpinned, i.e. put on the LRU list;
//   - any other page is destroyed with the transaction's free callback,
//     after being removed from the hash table if `pTxn` is a write
//     transaction.
void tdbPCacheRelease(SPCache *pCache, SPage *pPage, TXN *pTxn) {
  ASSERT(pTxn);

  tdbPCacheLock(pCache);

  i32 nRef = tdbUnrefPage(pPage);
  tdbDebug("pcache/release page %p/%d/%d/%d", pPage, TDB_PAGE_PGNO(pPage), pPage->id, nRef);

  if (nRef == 0 && pPage->isLocal) {
    tdbPCacheUnpinPage(pCache, pPage);
  } else if (nRef == 0) {
    if (TDB_TXN_IS_WRITE(pTxn)) {
      tdbPCacheRemovePageFromHash(pCache, pPage);
    }
    tdbPageDestroy(pPage, pTxn->xFree, pTxn->xArg);
  }

  tdbPCacheUnlock(pCache);
}

H
Hongze Cheng 已提交
209
// Return the page size this cache was opened with.
int tdbPCacheGetPageSize(SPCache *pCache) {
  return pCache->szPage;
}
H
more  
Hongze Cheng 已提交
210

H
Hongze Cheng 已提交
211
// Find or materialize the page `pPgid` for `pTxn`. Called by
// tdbPCacheFetch() with the cache lock held; does not touch the reference
// count.
//
// A hash hit is returned directly (after pinning) when the page is
// cache-owned or the transaction is a write transaction. Otherwise a page is
// taken from the free list, recycled from the LRU tail, or created with the
// transaction's allocator, in that order, and then initialized:
//   - if a read transaction hit a non-local page, the new page becomes a
//     private copy of that page and is not hashed;
//   - if there was no hit, the new page gets the requested id and is hashed
//     only when it is cache-owned or the transaction is a write transaction.
//
// Returns the page, or NULL if a new page could not be created.
static SPage *tdbPCacheFetchImpl(SPCache *pCache, const SPgid *pPgid, TXN *pTxn) {
  int    ret = 0;
  SPage *pPage = NULL;
  SPage *pPageH = NULL;

  ASSERT(pTxn);

  // 1. Search the hash table
  pPage = pCache->pgHash[tdbPCachePageHash(pPgid) % pCache->nHash];
  while (pPage) {
    if (pPage->pgid.pgno == pPgid->pgno && memcmp(pPage->pgid.fileid, pPgid->fileid, TDB_FILE_ID_LEN) == 0) break;
    pPage = pPage->pHashNext;
  }

  if (pPage) {
    if (pPage->isLocal || TDB_TXN_IS_WRITE(pTxn)) {
      tdbPCachePinPage(pCache, pPage);
      return pPage;
    }
  }

  // From here on, either
  //   a. nothing was found (pPage == NULL), or
  //   b. a read txn hit a non-local page:
  //      pPage && pPage->isLocal == 0 && !TDB_TXN_IS_WRITE(pTxn)
  // In case b. the hit is remembered in pPageH and copied further down.
  pPageH = pPage;
  pPage = NULL;

  // 2. Try to allocate a new page from the free list
  if (pCache->pFree) {
    pPage = pCache->pFree;
    pCache->pFree = pPage->pFreeNext;
    pCache->nFree--;
    pPage->pLruNext = NULL;
  }

  // 3. Try to recycle the page at the tail of the LRU list
  if (!pPage && !pCache->lru.pLruPrev->isAnchor) {
    pPage = pCache->lru.pLruPrev;
    tdbPCacheRemovePageFromHash(pCache, pPage);
    tdbPCachePinPage(pCache, pPage);
  }

  // 4. Try to create a new page
  if (!pPage) {
    ret = tdbPageCreate(pCache->szPage, &pPage, pTxn->xMalloc, pTxn->xArg);
    if (ret < 0) {
      // TODO
      ASSERT(0);
      return NULL;
    }

    // init the page fields
    pPage->isAnchor = 0;
    pPage->isLocal = 0;
    pPage->nRef = 0;
    pPage->id = -1;
  }

  // 5. The page here was just taken from the free list, recycled, or
  // freshly allocated, so it still needs to be initialized
  if (pPage) {
    if (pPageH) {
      // copy the page content
      memcpy(&(pPage->pgid), pPgid, sizeof(*pPgid));

      // Wait until the hit page has a pager attached.
      // NOTE(review): this spins while the cache lock is held and reads
      // pPager with a plain load -- confirm that whoever sets pPager does
      // not need this lock and that the store is guaranteed to become
      // visible here.
      for (int nLoops = 0;;) {
        if (pPageH->pPager) break;
        if (++nLoops > 1000) {
          sched_yield();
          nLoops = 0;
        }
      }

      pPage->pLruNext = NULL;
      pPage->pPager = pPageH->pPager;

      memcpy(pPage->pData, pPageH->pData, pPage->pageSize);
      // The header offset is a pointer difference; convert it explicitly so
      // the argument matches the %d conversion.
      tdbDebug("pcache/pPageH: %p %d %p %p %d", pPageH, (int)(pPageH->pPageHdr - pPageH->pData), pPageH->xCellSize,
               pPage, TDB_PAGE_PGNO(pPageH));
      tdbPageInit(pPage, pPageH->pPageHdr - pPageH->pData, pPageH->xCellSize);
      pPage->kLen = pPageH->kLen;
      pPage->vLen = pPageH->vLen;
      pPage->maxLocal = pPageH->maxLocal;
      pPage->minLocal = pPageH->minLocal;
    } else {
      memcpy(&(pPage->pgid), pPgid, sizeof(*pPgid));
      pPage->pLruNext = NULL;
      pPage->pPager = NULL;

      if (pPage->isLocal || TDB_TXN_IS_WRITE(pTxn)) {
        tdbPCacheAddPageToHash(pCache, pPage);
      }
    }
  }

  return pPage;
}

H
Hongze Cheng 已提交
309
// Take `pPage` off the LRU list so that it is no longer a recycling
// candidate. A page that is not on the list (pLruNext == NULL) is left
// untouched.
static void tdbPCachePinPage(SPCache *pCache, SPage *pPage) {
  if (pPage->pLruNext == NULL) return;

  ASSERT(tdbGetPageRef(pPage) == 0);

  // Unlink from the doubly linked list; a NULL pLruNext marks "not listed".
  SPage *pBefore = pPage->pLruPrev;
  SPage *pAfter = pPage->pLruNext;
  pBefore->pLruNext = pAfter;
  pAfter->pLruPrev = pBefore;
  pPage->pLruNext = NULL;

  pCache->nRecyclable--;

  tdbDebug("pcache/pin page %p/%d/%d", pPage, TDB_PAGE_PGNO(pPage), pPage->id);
}

H
Hongze Cheng 已提交
324 325
// Put `pPage` at the head of the LRU list, making it a recycling candidate
// (recycling takes pages from the other end of the list).
//
// The page must be cache-owned, clean, unreferenced and not already on the
// list; each of these is asserted.
static void tdbPCacheUnpinPage(SPCache *pCache, SPage *pPage) {
  ASSERT(pPage->isLocal);
  ASSERT(!pPage->isDirty);
  ASSERT(tdbGetPageRef(pPage) == 0);

  ASSERT(pPage->pLruNext == NULL);

  // Link in directly after the anchor node.
  pPage->pLruPrev = &(pCache->lru);
  pPage->pLruNext = pCache->lru.pLruNext;
  pCache->lru.pLruNext->pLruPrev = pPage;
  pCache->lru.pLruNext = pPage;

  pCache->nRecyclable++;

  tdbDebug("pcache/unpin page %p/%d/%d", pPage, TDB_PAGE_PGNO(pPage), pPage->id);
}

H
Hongze Cheng 已提交
344
// Unlink `pPage` from its hash bucket and decrement the hashed-page count.
// If the page is not found in the bucket, nothing is changed. The debug
// trace is emitted either way.
static void tdbPCacheRemovePageFromHash(SPCache *pCache, SPage *pPage) {
  uint32_t h = tdbPCachePageHash(&(pPage->pgid)) % pCache->nHash;

  // Walk the chain by link address so the head and interior nodes are
  // handled the same way.
  SPage **ppLink = &pCache->pgHash[h];
  while (*ppLink != NULL && *ppLink != pPage) {
    ppLink = &(*ppLink)->pHashNext;
  }

  if (*ppLink != NULL) {
    *ppLink = pPage->pHashNext;
    pCache->nPage--;
  }

  tdbDebug("pcache/remove page %p/%d/%d from hash %" PRIu32, pPage, TDB_PAGE_PGNO(pPage), pPage->id, h);
}

H
Hongze Cheng 已提交
360
// Insert `pPage` at the front of the hash bucket selected by its page id and
// increment the hashed-page count.
static void tdbPCacheAddPageToHash(SPCache *pCache, SPage *pPage) {
  uint32_t h = tdbPCachePageHash(&(pPage->pgid)) % pCache->nHash;
  SPage  **ppBucket = &pCache->pgHash[h];

  pPage->pHashNext = *ppBucket;
  *ppBucket = pPage;
  pCache->nPage++;

  tdbDebug("pcache/add page %p/%d/%d to hash %" PRIu32, pPage, TDB_PAGE_PGNO(pPage), pPage->id, h);
}

// Populate a cache whose szPage, nPages and aPage have already been set:
// initialize the lock, create nPages cache-owned pages (all placed on the
// free list and recorded in aPage), allocate the hash table and set up the
// empty LRU list.
//
// Returns 0 on success. On failure returns -1 after destroying every page
// created so far and the lock, so the caller only has to release what it
// allocated itself.
static int tdbPCacheOpenImpl(SPCache *pCache) {
  SPage *pPage;
  int    nCreated = 0;

  tdbPCacheInitLock(pCache);

  // Open the free list
  pCache->nFree = 0;
  pCache->pFree = NULL;
  for (int i = 0; i < pCache->nPages; i++) {
    if (tdbPageCreate(pCache->szPage, &pPage, tdbDefaultMalloc, NULL) < 0) {
      goto _err;
    }

    // pPage->pgid = 0;
    pPage->isAnchor = 0;
    pPage->isLocal = 1;
    pPage->nRef = 0;
    pPage->pHashNext = NULL;
    pPage->pLruNext = NULL;
    pPage->pLruPrev = NULL;
    pPage->pDirtyNext = NULL;

    // add page to free list
    pPage->pFreeNext = pCache->pFree;
    pCache->pFree = pPage;
    pCache->nFree++;

    // add to local list
    pPage->id = i;
    pCache->aPage[i] = pPage;
    nCreated = i + 1;
  }

  // Open the hash table (at least 8 buckets)
  pCache->nPage = 0;
  pCache->nHash = pCache->nPages < 8 ? 8 : pCache->nPages;
  pCache->pgHash = (SPage **)tdbOsCalloc(pCache->nHash, sizeof(SPage *));
  if (pCache->pgHash == NULL) {
    goto _err;
  }

  // Open LRU list: an anchor node linked to itself
  pCache->nRecyclable = 0;
  pCache->lru.isAnchor = 1;
  pCache->lru.pLruNext = &(pCache->lru);
  pCache->lru.pLruPrev = &(pCache->lru);

  return 0;

_err:
  // Roll back: destroy the pages created so far, empty the free list that
  // pointed at them, and destroy the lock initialized above.
  for (int i = 0; i < nCreated; i++) {
    tdbPageDestroy(pCache->aPage[i], tdbDefaultFree, NULL);
    pCache->aPage[i] = NULL;
  }
  pCache->nFree = 0;
  pCache->pFree = NULL;
  tdbPCacheDestroyLock(pCache);
  return -1;
}

H
Hongze Cheng 已提交
426
// Release what tdbPCacheOpenImpl() set up: destroy every page recorded in
// the first nPages slots of aPage, free the hash table and destroy the lock.
// The aPage array itself and the cache header are left to the caller.
// Always returns 0.
static int tdbPCacheCloseImpl(SPCache *pCache) {
  for (i32 iPage = 0; iPage < pCache->nPages; iPage++) {
    SPage *pPage = pCache->aPage[iPage];
    if (pPage == NULL) continue;

    tdbPageDestroy(pPage, tdbDefaultFree, NULL);
    pCache->aPage[iPage] = NULL;
  }

  tdbOsFree(pCache->pgHash);
  tdbPCacheDestroyLock(pCache);

  return 0;
}