tdbPCache.c 7.3 KB
Newer Older
H
refact  
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
H
Hongze Cheng 已提交
15 16
#include "tdbInt.h"

H
more  
Hongze Cheng 已提交
17 18 19 20
struct SPCache {
  int             pageSize;
  int             cacheSize;
  pthread_mutex_t mutex;
H
more  
Hongze Cheng 已提交
21
  int             nFree;
H
Hongze Cheng 已提交
22
  SPage          *pFree;
H
more  
Hongze Cheng 已提交
23 24
  int             nPage;
  int             nHash;
H
Hongze Cheng 已提交
25
  SPage         **pgHash;
H
more  
Hongze Cheng 已提交
26
  int             nRecyclable;
H
refact  
Hongze Cheng 已提交
27
  SPage           lru;
H
Hongze Cheng 已提交
28 29
};

H
more  
Hongze Cheng 已提交
30 31 32 33 34 35
// Hash of a page id: the sum of the six 32-bit words of `fileid` plus `pgno`.
// The words are copied out with memcpy() rather than read through a casted
// u32 pointer, so the macro does not depend on the alignment of `fileid` and
// does not violate the strict-aliasing rule. Note that `pPgid` is evaluated
// more than once.
#define PCACHE_PAGE_HASH(pPgid)                              \
  ({                                                         \
    u32 t[6];                                                \
    memcpy(t, (pPgid)->fileid, sizeof(t));                   \
    t[0] + t[1] + t[2] + t[3] + t[4] + t[5] + (pPgid)->pgno; \
  })
// A page is pinned when it is not linked into the LRU list.
#define PAGE_IS_PINNED(pPage) ((pPage)->pLruNext == NULL)
H
Hongze Cheng 已提交
36

H
Hongze Cheng 已提交
37 38 39 40 41 42 43 44 45 46 47 48
// For page ref
// Helpers that manipulate the reference count stored in the page's nRef field.
#define TDB_INIT_PAGE_REF(pPage) ((pPage)->nRef = 0)
#if 0
// Plain, non-atomic variants; currently compiled out.
#define TDB_REF_PAGE(pPage)     (++(pPage)->nRef)
#define TDB_UNREF_PAGE(pPage)   (--(pPage)->nRef)
#define TDB_GET_PAGE_REF(pPage) ((pPage)->nRef)
#else
// Atomic variants. tdbPCacheRelease() treats the value of TDB_UNREF_PAGE as
// the count after the decrement (presumably what atomic_sub_fetch_32 returns
// -- confirm against its definition).
#define TDB_REF_PAGE(pPage)     atomic_add_fetch_32(&((pPage)->nRef), 1)
#define TDB_UNREF_PAGE(pPage)   atomic_sub_fetch_32(&((pPage)->nRef), 1)
#define TDB_GET_PAGE_REF(pPage) atomic_load_32(&((pPage)->nRef))
#endif

H
refact  
Hongze Cheng 已提交
49 50 51 52 53 54 55
// Construction
static int tdbPCacheOpenImpl(SPCache *pCache);

// Mutex wrappers
static void tdbPCacheInitLock(SPCache *pCache);
static void tdbPCacheClearLock(SPCache *pCache);
static void tdbPCacheLock(SPCache *pCache);
static void tdbPCacheUnlock(SPCache *pCache);
static bool tdbPCacheLocked(SPCache *pCache);

// Lookup / allocation
static SPage *tdbPCacheFetchImpl(SPCache *pCache, const SPgid *pPgid, bool alcNewPage);

// LRU list and hash table maintenance
static void tdbPCachePinPage(SPCache *pCache, SPage *pPage);
static void tdbPCacheUnpinPage(SPCache *pCache, SPage *pPage);
static void tdbPCacheAddPageToHash(SPCache *pCache, SPage *pPage);
static void tdbPCacheRemovePageFromHash(SPCache *pCache, SPage *pPage);
H
Hongze Cheng 已提交
60

H
Hongze Cheng 已提交
61
/*
 * Create a page cache.
 *
 * pageSize  - size of each page, forwarded to the page allocator
 * cacheSize - number of pages to pre-create
 * ppCache   - receives the new cache on success; left untouched on failure
 *
 * Returns 0 on success, -1 if the cache object cannot be allocated or
 * tdbPCacheOpenImpl() fails.
 */
int tdbPCacheOpen(int pageSize, int cacheSize, SPCache **ppCache) {
  SPCache *pCache;

  pCache = (SPCache *)calloc(1, sizeof(*pCache));
  if (pCache == NULL) {
    return -1;
  }

  pCache->pageSize = pageSize;
  pCache->cacheSize = cacheSize;

  if (tdbPCacheOpenImpl(pCache) < 0) {
    free(pCache);
    return -1;
  }

  *ppCache = pCache;
  return 0;
}

H
Hongze Cheng 已提交
83
/*
 * Close a page cache. Not implemented yet: nothing is released and the
 * function always reports success.
 */
int tdbPCacheClose(SPCache *pCache) {
  /* TODO */
  (void)pCache;
  return 0;
}

H
refact  
Hongze Cheng 已提交
88 89
/*
 * Look up the page identified by pPgid and take a reference on it. The whole
 * operation runs under the cache mutex.
 *
 * alcNewPage - forwarded to tdbPCacheFetchImpl(); when true a page may be
 *              taken from the free list or recycled if the id is not cached
 *
 * Returns the page with its reference count incremented, or NULL when
 * tdbPCacheFetchImpl() yields no page.
 */
SPage *tdbPCacheFetch(SPCache *pCache, const SPgid *pPgid, bool alcNewPage) {
  tdbPCacheLock(pCache);

  SPage *pFetched = tdbPCacheFetchImpl(pCache, pPgid, alcNewPage);
  if (pFetched != NULL) {
    TDB_REF_PAGE(pFetched);
  }

  tdbPCacheUnlock(pCache);
  return pFetched;
}

H
Hongze Cheng 已提交
103
/*
 * Drop one reference on pPage. When the count reaches zero the page is handed
 * to tdbPCacheUnpinPage() so it can become recyclable.
 */
void tdbPCacheRelease(SPCache *pCache, SPage *pPage) {
  i32 remaining = TDB_UNREF_PAGE(pPage);
  ASSERT(remaining >= 0);

  if (remaining != 0) {
    // Still referenced elsewhere; nothing more to do.
    return;
  }

  if (1 /*TODO: page still clean*/) {
    tdbPCacheUnpinPage(pCache, pPage);
  } else {
    // TODO
    ASSERT(0);
  }
}

H
more  
Hongze Cheng 已提交
119 120 121 122
// Initialize the cache mutex with default attributes.
static void tdbPCacheInitLock(SPCache *pCache) {
  pthread_mutex_init(&(pCache->mutex), NULL);
}

// Destroy the cache mutex.
static void tdbPCacheClearLock(SPCache *pCache) {
  pthread_mutex_destroy(&(pCache->mutex));
}

H
Hongze Cheng 已提交
123 124 125 126 127 128 129 130
// Acquire the cache mutex.
static void tdbPCacheLock(SPCache *pCache) {
  pthread_mutex_lock(&(pCache->mutex));
}

// Release the cache mutex.
static void tdbPCacheUnlock(SPCache *pCache) {
  pthread_mutex_unlock(&(pCache->mutex));
}

// Intended to report whether the cache mutex is held. Not implemented: the
// function asserts unconditionally and otherwise returns true.
static bool tdbPCacheLocked(SPCache *pCache) {
  // TODO
  assert(0);
  return true;
}

H
refact  
Hongze Cheng 已提交
133 134
/*
 * Find the page for pPgid, optionally claiming a page for it when it is not
 * cached. Does not take the cache mutex itself and does not touch the
 * reference count; tdbPCacheFetch() does both around this call.
 *
 * Returns the page (pinned, i.e. not on the LRU list), or NULL when the id is
 * not cached and either alcNewPage is false or no page could be obtained.
 */
static SPage *tdbPCacheFetchImpl(SPCache *pCache, const SPgid *pPgid, bool alcNewPage) {
  SPage *pPage;

  // 1. Walk the hash chain for this page id
  for (pPage = pCache->pgHash[PCACHE_PAGE_HASH(pPgid) % pCache->nHash]; pPage != NULL; pPage = pPage->pHashNext) {
    if (TDB_IS_SAME_PAGE(&(pPage->pgid), pPgid)) break;
  }

  if (pPage != NULL) {
    // Cache hit: make sure the page is off the LRU list before handing it out
    tdbPCachePinPage(pCache, pPage);
    return pPage;
  }

  if (!alcNewPage) {
    return NULL;
  }

  if (pCache->pFree != NULL) {
    // 2. Pop a page off the free list
    pPage = pCache->pFree;
    pCache->pFree = pPage->pFreeNext;
    pCache->nFree--;
    pPage->pLruNext = NULL;
  } else if (!pCache->lru.pLruPrev->isAnchor) {
    // 3. Recycle the page at the tail of the LRU list
    pPage = pCache->lru.pLruPrev;
    tdbPCacheRemovePageFromHash(pCache, pPage);
    tdbPCachePinPage(pCache, pPage);
  }

  // 4. Try a stress allocation (TODO)

  if (pPage == NULL) {
    return NULL;
  }

  // 5. The page came from the free list or from recycling (or, later, from a
  // stress allocation): bind it to the requested id and publish it in the
  // hash table
  memcpy(&(pPage->pgid), pPgid, sizeof(*pPgid));
  pPage->pLruNext = NULL;
  pPage->pPager = NULL;
  tdbPCacheAddPageToHash(pCache, pPage);

  return pPage;
}

H
Hongze Cheng 已提交
180
/*
 * Take pPage off the LRU list if it is on it, and decrement the recyclable
 * count. A page that is already pinned is left untouched.
 */
static void tdbPCachePinPage(SPCache *pCache, SPage *pPage) {
  if (PAGE_IS_PINNED(pPage)) {
    return;
  }

  SPage *pBefore = pPage->pLruPrev;
  SPage *pAfter = pPage->pLruNext;

  // Unlink from the doubly linked list
  pBefore->pLruNext = pAfter;
  pAfter->pLruPrev = pBefore;

  // A NULL pLruNext is what marks the page as pinned
  pPage->pLruNext = NULL;

  pCache->nRecyclable--;
}

H
Hongze Cheng 已提交
190 191
/*
 * Make pPage recyclable by linking it at the head of the LRU list, under the
 * cache mutex.
 *
 * The caller dropped its reference before taking the mutex, so by the time we
 * hold it another thread may have fetched the page again (count no longer
 * zero) or may even have fetched, released and linked it already. The page is
 * therefore linked only when it is unreferenced and not yet on the list, and
 * nRecyclable is bumped only when a link actually happens so the counter
 * stays equal to the number of pages on the list.
 */
static void tdbPCacheUnpinPage(SPCache *pCache, SPage *pPage) {
  i32 nRef;

  tdbPCacheLock(pCache);

  nRef = TDB_GET_PAGE_REF(pPage);
  ASSERT(nRef >= 0);
  if (nRef == 0 && pPage->pLruNext == NULL) {
    // Add the page to LRU list
    pPage->pLruPrev = &(pCache->lru);
    pPage->pLruNext = pCache->lru.pLruNext;
    pCache->lru.pLruNext->pLruPrev = pPage;
    pCache->lru.pLruNext = pPage;

    pCache->nRecyclable++;
  }

  tdbPCacheUnlock(pCache);
}

H
Hongze Cheng 已提交
212 213 214
/*
 * Unlink pPage from its hash chain and decrement the cached-page count.
 *
 * The bucket index is computed exactly as in tdbPCacheAddPageToHash(): the
 * modulo is applied to the unsigned hash value before it is stored in an int.
 * Storing the raw hash in an int first could make it negative, and a negative
 * remainder would index before the start of pgHash.
 */
static void tdbPCacheRemovePageFromHash(SPCache *pCache, SPage *pPage) {
  SPage **ppPage;
  int     h;

  h = PCACHE_PAGE_HASH(&(pPage->pgid)) % pCache->nHash;

  // Stop at the end of the chain instead of dereferencing NULL when the page
  // is unexpectedly absent
  for (ppPage = &(pCache->pgHash[h]); *ppPage != NULL && *ppPage != pPage; ppPage = &((*ppPage)->pHashNext))
    ;
  ASSERT(*ppPage == pPage);
  if (*ppPage != pPage) {
    return;
  }

  *ppPage = pPage->pHashNext;

  pCache->nPage--;
}

H
Hongze Cheng 已提交
225 226
/*
 * Push pPage onto the front of the hash chain selected by its page id and
 * increment the cached-page count.
 */
static void tdbPCacheAddPageToHash(SPCache *pCache, SPage *pPage) {
  int     bucket = PCACHE_PAGE_HASH(&(pPage->pgid)) % pCache->nHash;
  SPage **ppHead = &(pCache->pgHash[bucket]);

  pPage->pHashNext = *ppHead;
  *ppHead = pPage;

  pCache->nPage++;
}

/*
 * Build the internal structures of a cache whose pageSize and cacheSize are
 * already set: the hash table, the free list of pre-created pages, the empty
 * LRU list and the mutex.
 *
 * Returns 0 on success, -1 when cacheSize is not positive, the hash table
 * cannot be allocated, or a page cannot be created.
 */
static int tdbPCacheOpenImpl(SPCache *pCache) {
  SPage *pPage;
  int    ret;

  // nHash is set from cacheSize and is used as a modulus on every lookup, so
  // a non-positive size can never yield a usable cache
  if (pCache->cacheSize <= 0) {
    return -1;
  }

  // Open the hash table (done first so that a failure here has nothing to
  // undo)
  pCache->nPage = 0;
  pCache->nHash = pCache->cacheSize;
  pCache->pgHash = (SPage **)calloc(pCache->nHash, sizeof(SPage *));
  if (pCache->pgHash == NULL) {
    return -1;
  }

  // Open the free list
  pCache->nFree = 0;
  pCache->pFree = NULL;
  for (int i = 0; i < pCache->cacheSize; i++) {
    ret = tdbPageCreate(pCache->pageSize, &pPage, NULL, NULL);
    if (ret < 0) {
      // TODO: pages already placed on the free list are not released here;
      // the matching page-destroy routine needs to be called for each of them
      free(pCache->pgHash);
      pCache->pgHash = NULL;
      return -1;
    }

    // pPage->pgid = 0;
    pPage->isAnchor = 0;
    pPage->isLocalPage = 1;
    TDB_INIT_PAGE_REF(pPage);
    pPage->pHashNext = NULL;
    pPage->pLruNext = NULL;
    pPage->pLruPrev = NULL;
    pPage->pDirtyNext = NULL;

    pPage->pFreeNext = pCache->pFree;
    pCache->pFree = pPage;
    pCache->nFree++;
  }

  // Open LRU list: an empty circular list whose anchor points at itself
  pCache->nRecyclable = 0;
  pCache->lru.isAnchor = 1;
  pCache->lru.pLruNext = &(pCache->lru);
  pCache->lru.pLruPrev = &(pCache->lru);

  // Initialize the mutex last so that no failure path above leaves an
  // initialized mutex behind
  tdbPCacheInitLock(pCache);

  return 0;
}

H
Hongze Cheng 已提交
286
// Return the page size the cache was opened with.
int tdbPCacheGetPageSize(SPCache *pCache) {
  return pCache->pageSize;
}