mirror of https://gitee.com/bigwinds/arangodb
1711 lines
57 KiB
C++
1711 lines
57 KiB
C++
////////////////////////////////////////////////////////////////////////////////
|
|
/// DISCLAIMER
|
|
///
|
|
/// Copyright 2014-2016 ArangoDB GmbH, Cologne, Germany
|
|
/// Copyright 2004-2014 triAGENS GmbH, Cologne, Germany
|
|
///
|
|
/// Licensed under the Apache License, Version 2.0 (the "License");
|
|
/// you may not use this file except in compliance with the License.
|
|
/// You may obtain a copy of the License at
|
|
///
|
|
/// http://www.apache.org/licenses/LICENSE-2.0
|
|
///
|
|
/// Unless required by applicable law or agreed to in writing, software
|
|
/// distributed under the License is distributed on an "AS IS" BASIS,
|
|
/// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
/// See the License for the specific language governing permissions and
|
|
/// limitations under the License.
|
|
///
|
|
/// Copyright holder is ArangoDB GmbH, Cologne, Germany
|
|
///
|
|
/// @author Dr. Frank Celler
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
#include "collection.h"
|
|
|
|
#include <regex.h>
|
|
|
|
#include "Basics/conversions.h"
|
|
#include "Basics/files.h"
|
|
#include "Basics/FileUtils.h"
|
|
#include "Basics/hashes.h"
|
|
#include "Basics/json.h"
|
|
#include "Basics/JsonHelper.h"
|
|
#include "Basics/Logger.h"
|
|
#include "Basics/random.h"
|
|
#include "Basics/tri-strings.h"
|
|
#include "Basics/memory-map.h"
|
|
#include "Basics/VelocyPackHelper.h"
|
|
#include "Cluster/ClusterInfo.h"
|
|
#include "VocBase/document-collection.h"
|
|
#include "VocBase/server.h"
|
|
#include "VocBase/vocbase.h"
|
|
|
|
#include <velocypack/Collection.h>
|
|
#include <velocypack/velocypack-aliases.h>
|
|
|
|
using namespace arangodb;
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief extract the numeric part from a filename
|
|
/// the filename must look like this: /.*type-abc\.ending$/, where abc is
|
|
/// a number, and type and ending are arbitrary letters
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
static uint64_t GetNumericFilenamePart(char const* filename) {
|
|
char const* pos1 = strrchr(filename, '.');
|
|
|
|
if (pos1 == nullptr) {
|
|
return 0;
|
|
}
|
|
|
|
char const* pos2 = strrchr(filename, '-');
|
|
|
|
if (pos2 == nullptr || pos2 > pos1) {
|
|
return 0;
|
|
}
|
|
|
|
return TRI_UInt64String2(pos2 + 1, pos1 - pos2 - 1);
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief compare two filenames, based on the numeric part contained in
|
|
/// the filename. this is used to sort datafile filenames on startup
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
static int FilenameComparator(const void* lhs, const void* rhs) {
|
|
char const* l = *((char**)lhs);
|
|
char const* r = *((char**)rhs);
|
|
|
|
uint64_t const numLeft = GetNumericFilenamePart(l);
|
|
uint64_t const numRight = GetNumericFilenamePart(r);
|
|
|
|
if (numLeft != numRight) {
|
|
return numLeft < numRight ? -1 : 1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief compare two datafiles, based on the numeric part contained in
|
|
/// the filename
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
static int DatafileComparator(const void* lhs, const void* rhs) {
|
|
TRI_datafile_t* l = *((TRI_datafile_t**)lhs);
|
|
TRI_datafile_t* r = *((TRI_datafile_t**)rhs);
|
|
|
|
uint64_t const numLeft =
|
|
(l->_filename != nullptr ? GetNumericFilenamePart(l->_filename) : 0);
|
|
uint64_t const numRight =
|
|
(r->_filename != nullptr ? GetNumericFilenamePart(r->_filename) : 0);
|
|
|
|
if (numLeft != numRight) {
|
|
return numLeft < numRight ? -1 : 1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief sort a vector of filenames, using the numeric parts contained in
/// the filenames
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Sorts the strings of `files` in place with FilenameComparator.
///
/// @param files  string vector to sort; vectors with fewer than two entries
///               are left untouched
static void SortFilenames(TRI_vector_string_t* files) {
  // nothing to order for zero or one entry
  if (files->_length > 1) {
    qsort(files->_buffer, files->_length, sizeof(char*), &FilenameComparator);
  }
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief sort a vector of datafiles, using the numeric parts contained in
/// their filenames
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Sorts the datafile pointers of `files` in place with DatafileComparator.
///
/// @param files  pointer vector holding `TRI_datafile_t*` entries; vectors
///               with fewer than two entries are left untouched
static void SortDatafiles(TRI_vector_pointer_t* files) {
  // nothing to order for zero or one entry
  if (files->_length > 1) {
    qsort(files->_buffer, files->_length, sizeof(TRI_datafile_t*),
          &DatafileComparator);
  }
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief initializes a new collection
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Fills in the basic fields of an already allocated collection object.
///
/// @param vocbase     database stored in the collection's `_vocbase`
/// @param collection  collection to initialize; must not be nullptr
/// @param directory   collection directory; a copy is stored in `_directory`
/// @param info        collection properties copied via `_info.update()`
static void InitCollection(TRI_vocbase_t* vocbase, TRI_collection_t* collection,
                           std::string const& directory,
                           VocbaseCollectionInfo const& info) {
  TRI_ASSERT(collection != nullptr);

  collection->_info.update(info);

  // file containers start out empty
  TRI_InitVectorPointer(&collection->_datafiles, TRI_UNKNOWN_MEM_ZONE);
  TRI_InitVectorPointer(&collection->_journals, TRI_UNKNOWN_MEM_ZONE);
  TRI_InitVectorPointer(&collection->_compactors, TRI_UNKNOWN_MEM_ZONE);
  TRI_InitVectorString(&collection->_indexFiles, TRI_CORE_MEM_ZONE);

  // NOTE(review): the copy is taken from TRI_UNKNOWN_MEM_ZONE while
  // TRI_DestroyCollection releases `_directory` with TRI_CORE_MEM_ZONE --
  // confirm that the two zones are interchangeable for freeing
  collection->_directory = TRI_DuplicateString(
      TRI_UNKNOWN_MEM_ZONE, directory.c_str(), directory.size());

  // scalar state
  collection->_vocbase = vocbase;
  collection->_state = TRI_COL_STATE_WRITE;
  collection->_tickMax = 0;
  collection->_lastError = 0;
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief scans a collection and locates all files
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Scans the directory `path` and sorts the files found there into the
/// vectors of the returned structure.
///
/// Only names of the form `<type>-<number>.<db|json>[.dead]` are looked at;
/// everything else is skipped without a message. While scanning, the
/// function also cleans up:
///   - `.dead` files and `temp-*.db` files are unlinked,
///   - `compaction-N.db` is unlinked when `datafile-N.db` exists, otherwise
///     it is renamed to `datafile-N.db` and reported as a datafile.
///
/// @param path  directory of the collection
/// @return the structure with its journals, datafiles and indexes vectors
///         filled and sorted by the numeric filename part. The vectors are
///         initialized even when compiling the regular expression fails, in
///         which case they are returned empty.
static TRI_col_file_structure_t ScanCollectionDirectory(char const* path) {
  TRI_col_file_structure_t structure;
  regex_t re;

  TRI_InitVectorString(&structure._journals, TRI_CORE_MEM_ZONE);
  TRI_InitVectorString(&structure._compactors, TRI_CORE_MEM_ZONE);
  TRI_InitVectorString(&structure._datafiles, TRI_CORE_MEM_ZONE);
  TRI_InitVectorString(&structure._indexes, TRI_CORE_MEM_ZONE);

  if (regcomp(&re,
              "^(temp|compaction|journal|datafile|index|compactor)-([0-9][0-9]*"
              ")\\.(db|json)(\\.dead)?$",
              REG_EXTENDED) != 0) {
    LOG(ERR) << "unable to compile regular expression";

    return structure;
  }

  // check files within the directory
  std::vector<std::string> files = TRI_FilesDirectory(path);

  for (auto const& file : files) {
    regmatch_t matches[5];

    if (regexec(&re, file.c_str(), sizeof(matches) / sizeof(matches[0]),
                matches, 0) != 0) {
      // not one of our files, skip it
      continue;
    }

    // file type: (temp|compaction|journal|datafile|index|compactor)
    char const* first = file.c_str() + matches[1].rm_so;
    size_t firstLen = matches[1].rm_eo - matches[1].rm_so;

    // extension
    char const* third = file.c_str() + matches[3].rm_so;
    size_t thirdLen = matches[3].rm_eo - matches[3].rm_so;

    // isdead? (an unmatched group has rm_so == rm_eo, i.e. length 0)
    size_t fourthLen = matches[4].rm_eo - matches[4].rm_so;

    // .........................................................................
    // file is dead
    // .........................................................................

    if (fourthLen > 0) {
      char* filename = TRI_Concatenate2File(path, file.c_str());

      if (filename != nullptr) {
        LOG(TRACE) << "removing .dead file '" << filename << "'";
        TRI_UnlinkFile(filename);
        TRI_FreeString(TRI_CORE_MEM_ZONE, filename);
      }
    }

    // .........................................................................
    // file is an index
    // .........................................................................

    else if (TRI_EqualString("index", first, firstLen) &&
             TRI_EqualString("json", third, thirdLen)) {
      // the allocated name is handed over to the vector
      char* filename = TRI_Concatenate2File(path, file.c_str());
      TRI_PushBackVectorString(&structure._indexes, filename);
    }

    // .........................................................................
    // file is a journal or datafile
    // .........................................................................

    else if (TRI_EqualString("db", third, thirdLen)) {
      // TRI_Concatenate2File hands back an allocated C string. Copy it into a
      // std::string and release the buffer right away; constructing the
      // std::string directly from the call would leak the buffer and would be
      // undefined behavior for a nullptr result.
      char* rawName = TRI_Concatenate2File(path, file.c_str());

      if (rawName == nullptr) {
        LOG(ERR) << "unable to build filename for '" << file.c_str() << "'";
        continue;
      }

      std::string const filename(rawName);
      TRI_FreeString(TRI_CORE_MEM_ZONE, rawName);

      // file is a journal
      if (TRI_EqualString("journal", first, firstLen)) {
        TRI_PushBackVectorString(&structure._journals,
                                 TRI_DuplicateString(filename.c_str()));
      }

      // file is a datafile
      else if (TRI_EqualString("datafile", first, firstLen)) {
        TRI_PushBackVectorString(&structure._datafiles,
                                 TRI_DuplicateString(filename.c_str()));
      }

      // file is a left-over compaction file. rename it back
      else if (TRI_EqualString("compaction", first, firstLen)) {
        char* relName = TRI_Concatenate2String(
            "datafile-", file.c_str() + strlen("compaction-"));
        char* newName = TRI_Concatenate2File(path, relName);
        TRI_FreeString(TRI_CORE_MEM_ZONE, relName);

        if (TRI_ExistsFile(newName)) {
          // we have a compaction-xxxx and a datafile-xxxx file. we'll keep
          // the datafile
          TRI_UnlinkFile(filename.c_str());

          LOG(WARN) << "removing left-over compaction file '" << filename.c_str() << "'";

          TRI_FreeString(TRI_CORE_MEM_ZONE, newName);
          continue;
        } else {
          // this should fail, but shouldn't do any harm either...
          TRI_UnlinkFile(newName);

          // rename the compactor to a datafile
          int res = TRI_RenameFile(filename.c_str(), newName);

          if (res != TRI_ERROR_NO_ERROR) {
            LOG(ERR) << "unable to rename compaction file '" << filename.c_str() << "'";

            TRI_FreeString(TRI_CORE_MEM_ZONE, newName);

            continue;
          }
        }

        // the allocated name is handed over to the vector
        TRI_PushBackVectorString(&structure._datafiles, newName);
      }

      // temporary file, we can delete it!
      else if (TRI_EqualString("temp", first, firstLen)) {
        LOG(WARN) << "found temporary file '" << filename.c_str() << "', which is probably a left-over. deleting it";
        TRI_UnlinkFile(filename.c_str());
      }

      // ups, what kind of file is that
      // (this is also where "compactor-*.db" files end up)
      else {
        LOG(ERR) << "unknown datafile type '" << file.c_str() << "'";
      }
    } else {
      LOG(ERR) << "unknown datafile type '" << file.c_str() << "'";
    }
  }

  regfree(&re);

  // now sort the files in the structures that we created.
  // the sorting allows us to iterate the files in the correct order
  SortFilenames(&structure._journals);
  SortFilenames(&structure._compactors);
  SortFilenames(&structure._datafiles);
  SortFilenames(&structure._indexes);

  return structure;
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief checks a collection
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Opens and validates all files found in the collection's directory and
/// attaches them to the collection.
///
/// For every file whose name matches
/// `<type>-<number>.<db|json>[.dead]`:
///   - `.dead` and `temp-*` files are unlinked,
///   - `index-*.json` names are appended to `collection->_indexFiles`,
///   - `compaction-N.db` is unlinked when `datafile-N.db` exists, otherwise
///     renamed to `datafile-N.db` and treated as a datafile,
///   - every remaining `.db` file is opened and its collection header marker
///     is checked against `collection->_info.id()`.
/// Sealed journals are renamed to `datafile-<fid>.db` afterwards.
///
/// @param collection    collection whose `_directory` is scanned
/// @param ignoreErrors  forwarded to TRI_OpenDatafile
/// @return true when everything could be opened; `_datafiles`, `_journals`
///         and `_compactors` are then replaced by the sorted results.
///         false on any error; all datafiles opened so far are closed and
///         freed, and no temporary vector is left allocated.
static bool CheckCollection(TRI_collection_t* collection, bool ignoreErrors) {
  TRI_datafile_t* datafile;
  TRI_vector_pointer_t all;
  TRI_vector_pointer_t compactors;
  TRI_vector_pointer_t datafiles;
  TRI_vector_pointer_t journals;
  TRI_vector_pointer_t sealed;
  regex_t re;

  if (regcomp(&re,
              "^(temp|compaction|journal|datafile|index|compactor)-([0-9][0-9]*"
              ")\\.(db|json)(\\.dead)?$",
              REG_EXTENDED) != 0) {
    LOG(ERR) << "unable to compile regular expression";

    return false;
  }

  // set as soon as an error is found; triggers the cleanup path below
  bool stop = false;

  // check files within the directory
  std::vector<std::string> files = TRI_FilesDirectory(collection->_directory);

  TRI_InitVectorPointer(&journals, TRI_UNKNOWN_MEM_ZONE);
  TRI_InitVectorPointer(&compactors, TRI_UNKNOWN_MEM_ZONE);
  TRI_InitVectorPointer(&datafiles, TRI_UNKNOWN_MEM_ZONE);
  TRI_InitVectorPointer(&sealed, TRI_UNKNOWN_MEM_ZONE);
  TRI_InitVectorPointer(&all, TRI_UNKNOWN_MEM_ZONE);

  for (auto const& file : files) {
    regmatch_t matches[5];

    if (regexec(&re, file.c_str(), sizeof(matches) / sizeof(matches[0]),
                matches, 0) != 0) {
      // not one of our files, skip it
      continue;
    }

    // file type
    char const* first = file.c_str() + matches[1].rm_so;
    size_t firstLen = matches[1].rm_eo - matches[1].rm_so;

    // extension
    char const* third = file.c_str() + matches[3].rm_so;
    size_t thirdLen = matches[3].rm_eo - matches[3].rm_so;

    // length of the optional ".dead" suffix
    size_t fourthLen = matches[4].rm_eo - matches[4].rm_so;

    // check for temporary & dead files

    if (fourthLen > 0 || TRI_EqualString("temp", first, firstLen)) {
      // found a temporary file. we can delete it!
      char* filename =
          TRI_Concatenate2File(collection->_directory, file.c_str());

      LOG(TRACE) << "found temporary file '" << filename << "', which is probably a left-over. deleting it";
      TRI_UnlinkFile(filename);
      TRI_Free(TRI_CORE_MEM_ZONE, filename);
      continue;
    }

    // .........................................................................
    // file is an index, just store the filename
    // .........................................................................

    if (TRI_EqualString("index", first, firstLen) &&
        TRI_EqualString("json", third, thirdLen)) {
      char* filename =
          TRI_Concatenate2File(collection->_directory, file.c_str());
      TRI_PushBackVectorString(&collection->_indexFiles, filename);
    }

    // .........................................................................
    // file is a journal or datafile, open the datafile
    // .........................................................................

    else if (TRI_EqualString("db", third, thirdLen)) {
      char* filename;
      char* ptr;
      TRI_col_header_marker_t* cm;

      if (TRI_EqualString("compaction", first, firstLen)) {
        // found a compaction file. now rename it back
        char* relName;
        char* newName;

        filename = TRI_Concatenate2File(collection->_directory, file.c_str());
        relName = TRI_Concatenate2String(
            "datafile-", file.c_str() + strlen("compaction-"));
        newName = TRI_Concatenate2File(collection->_directory, relName);

        TRI_FreeString(TRI_CORE_MEM_ZONE, relName);

        if (TRI_ExistsFile(newName)) {
          // we have a compaction-xxxx and a datafile-xxxx file. we'll keep
          // the datafile
          LOG(WARN) << "removing unfinished compaction file '" << filename << "'";
          TRI_UnlinkFile(filename);

          TRI_FreeString(TRI_CORE_MEM_ZONE, newName);
          TRI_FreeString(TRI_CORE_MEM_ZONE, filename);
          continue;
        } else {
          int res = TRI_RenameFile(filename, newName);

          if (res != TRI_ERROR_NO_ERROR) {
            LOG(ERR) << "unable to rename compaction file '" << filename << "' to '" << newName << "'";
            TRI_FreeString(TRI_CORE_MEM_ZONE, newName);
            TRI_FreeString(TRI_CORE_MEM_ZONE, filename);
            stop = true;
            break;
          }
        }

        TRI_Free(TRI_CORE_MEM_ZONE, filename);
        // reuse newName
        filename = newName;
      } else {
        filename = TRI_Concatenate2File(collection->_directory, file.c_str());
      }

      TRI_ASSERT(filename != nullptr);
      datafile = TRI_OpenDatafile(filename, ignoreErrors);

      if (datafile == nullptr) {
        collection->_lastError = TRI_errno();
        LOG(ERR) << "cannot open datafile '" << filename << "': " << TRI_last_error();

        TRI_FreeString(TRI_CORE_MEM_ZONE, filename);
        stop = true;
        break;
      }

      // remember every opened datafile so that the failure path can close it
      TRI_PushBackVectorPointer(&all, datafile);

      // check the document header
      ptr = datafile->_data;
      // skip the datafile header
      ptr += TRI_DF_ALIGN_BLOCK(sizeof(TRI_df_header_marker_t));
      cm = (TRI_col_header_marker_t*)ptr;

      if (cm->base._type != TRI_COL_MARKER_HEADER) {
        LOG(ERR) << "collection header mismatch in file '" << filename << "', expected TRI_COL_MARKER_HEADER, found " << cm->base._type;

        TRI_FreeString(TRI_CORE_MEM_ZONE, filename);
        stop = true;
        break;
      }

      if (cm->_cid != collection->_info.id()) {
        LOG(ERR) << "collection identifier mismatch, expected " << collection->_info.id() << ", found " << cm->_cid;

        TRI_FreeString(TRI_CORE_MEM_ZONE, filename);
        stop = true;
        break;
      }

      // file is a journal
      if (TRI_EqualString("journal", first, firstLen)) {
        if (datafile->_isSealed) {
          if (datafile->_state != TRI_DF_STATE_READ) {
            LOG(WARN) << "strange, journal '" << filename << "' is already sealed; must be a left over; will use it as datafile";
          }

          TRI_PushBackVectorPointer(&sealed, datafile);
        } else {
          TRI_PushBackVectorPointer(&journals, datafile);
        }
      }

      // file is a compactor
      else if (TRI_EqualString("compactor", first, firstLen)) {
        // ignore
        // NOTE(review): the datafile was opened above and is only referenced
        // by `all`; on the success path `all` is destroyed without closing
        // it -- confirm whether the compactor should be closed and freed here
      }

      // file is a datafile (or was a compaction file)
      else if (TRI_EqualString("datafile", first, firstLen) ||
               TRI_EqualString("compaction", first, firstLen)) {
        if (!datafile->_isSealed) {
          LOG(ERR) << "datafile '" << filename << "' is not sealed, this should never happen";

          collection->_lastError =
              TRI_set_errno(TRI_ERROR_ARANGO_CORRUPTED_DATAFILE);
          TRI_FreeString(TRI_CORE_MEM_ZONE, filename);
          stop = true;
          break;
        } else {
          TRI_PushBackVectorPointer(&datafiles, datafile);
        }
      }

      else {
        LOG(ERR) << "unknown datafile '" << file.c_str() << "'";
      }

      TRI_FreeString(TRI_CORE_MEM_ZONE, filename);
    } else {
      LOG(ERR) << "unknown datafile '" << file.c_str() << "'";
    }
  }

  regfree(&re);

  // convert the sealed journals into datafiles
  if (!stop) {
    size_t const numSealed = sealed._length;

    for (size_t i = 0; i < numSealed; ++i) {
      datafile = static_cast<TRI_datafile_t*>(sealed._buffer[i]);

      char* number = TRI_StringUInt64(datafile->_fid);
      char* dname = TRI_Concatenate3String("datafile-", number, ".db");
      char* filename = TRI_Concatenate2File(collection->_directory, dname);

      TRI_FreeString(TRI_CORE_MEM_ZONE, dname);
      TRI_FreeString(TRI_CORE_MEM_ZONE, number);

      bool const ok = TRI_RenameDatafile(datafile, filename);

      if (ok) {
        TRI_PushBackVectorPointer(&datafiles, datafile);
        LOG(DEBUG) << "renamed sealed journal to '" << filename << "'";
      } else {
        collection->_lastError = datafile->_lastError;
        stop = true;
        LOG(ERR) << "cannot rename sealed log-file to " << filename << ", this should not happen: " << TRI_last_error();
      }

      // release the name on both outcomes; leaving the loop before this
      // point would leak it
      TRI_FreeString(TRI_CORE_MEM_ZONE, filename);

      if (!ok) {
        break;
      }
    }
  }

  TRI_DestroyVectorPointer(&sealed);

  // stop if necessary
  if (stop) {
    size_t const numOpened = all._length;

    for (size_t i = 0; i < numOpened; ++i) {
      datafile = static_cast<TRI_datafile_t*>(all._buffer[i]);

      LOG(TRACE) << "closing datafile '" << datafile->_filename << "'";

      TRI_CloseDatafile(datafile);
      TRI_FreeDatafile(datafile);
    }

    // the datafiles themselves were released through `all`; the vectors
    // below only hold pointers but their storage must be released as well
    TRI_DestroyVectorPointer(&all);
    TRI_DestroyVectorPointer(&datafiles);
    TRI_DestroyVectorPointer(&journals);
    TRI_DestroyVectorPointer(&compactors);

    return false;
  }

  TRI_DestroyVectorPointer(&all);

  // sort the datafiles.
  // this allows us to iterate them in the correct order
  SortDatafiles(&datafiles);
  SortDatafiles(&journals);
  SortDatafiles(&compactors);

  // add the datafiles and journals
  collection->_datafiles = datafiles;
  collection->_journals = journals;
  collection->_compactors = compactors;

  return true;
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief free all datafiles in a vector
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Frees every datafile referenced by `vector` and then destroys the vector
/// itself.
///
/// @param vector  pointer vector of `TRI_datafile_t*`; must not be nullptr
///                and must not contain nullptr entries
static void FreeDatafilesVector(TRI_vector_pointer_t* vector) {
  TRI_ASSERT(vector != nullptr);

  for (size_t idx = 0, count = vector->_length; idx < count; ++idx) {
    auto* df = static_cast<TRI_datafile_t*>(vector->_buffer[idx]);

    LOG(TRACE) << "freeing collection datafile";

    TRI_ASSERT(df != nullptr);
    TRI_FreeDatafile(df);
  }

  // the entries are gone, now release the container
  TRI_DestroyVectorPointer(vector);
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief iterate over all datafiles in a vector
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
static bool IterateDatafilesVector(const TRI_vector_pointer_t* const files,
|
|
bool (*iterator)(TRI_df_marker_t const*,
|
|
void*, TRI_datafile_t*),
|
|
void* data) {
|
|
TRI_ASSERT(iterator != nullptr);
|
|
|
|
size_t const n = files->_length;
|
|
|
|
for (size_t i = 0; i < n; ++i) {
|
|
TRI_datafile_t* datafile =
|
|
static_cast<TRI_datafile_t*>(TRI_AtVectorPointer(files, i));
|
|
|
|
LOG(TRACE) << "iterating over datafile '" << datafile->getName(datafile) << "', fid " << datafile->_fid;
|
|
|
|
if (!TRI_IterateDatafile(datafile, iterator, data)) {
|
|
return false;
|
|
}
|
|
|
|
if (datafile->isPhysical(datafile) && datafile->_isSealed) {
|
|
TRI_MMFileAdvise(datafile->_data, datafile->_maximalSize,
|
|
TRI_MADVISE_RANDOM);
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief closes the datafiles passed in the vector
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
static bool CloseDataFiles(const TRI_vector_pointer_t* const files) {
|
|
bool result = true;
|
|
|
|
size_t const n = files->_length;
|
|
|
|
for (size_t i = 0; i < n; ++i) {
|
|
TRI_datafile_t* datafile = static_cast<TRI_datafile_t*>(files->_buffer[i]);
|
|
|
|
TRI_ASSERT(datafile != nullptr);
|
|
|
|
result &= TRI_CloseDatafile(datafile);
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief iterate over a set of datafiles, identified by filenames
|
|
/// note: the files will be opened and closed
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Opens each file named in `vector`, runs `iterator` over its markers and
/// closes and frees it again.
///
/// Files that cannot be opened are skipped, and the result of
/// TRI_IterateDatafile is not evaluated.
///
/// @param vector    string vector with the filenames to visit
/// @param iterator  callback handed to TRI_IterateDatafile; must not be
///                  nullptr
/// @param data      opaque pointer passed through to the callback
/// @return always true
static bool IterateFiles(TRI_vector_string_t* vector,
                         bool (*iterator)(TRI_df_marker_t const*, void*,
                                          TRI_datafile_t*),
                         void* data) {
  TRI_ASSERT(iterator != nullptr);

  for (size_t idx = 0, count = vector->_length; idx < count; ++idx) {
    char* name = TRI_AtVectorString(vector, idx);
    LOG(DEBUG) << "iterating over collection journal file '" << name << "'";

    // open with ignoreErrors = true
    TRI_datafile_t* df = TRI_OpenDatafile(name, true);

    if (df == nullptr) {
      continue;
    }

    TRI_IterateDatafile(df, iterator, data);
    TRI_CloseDatafile(df);
    TRI_FreeDatafile(df);
  }

  return true;
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief get the full directory name for a collection
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
static std::string GetCollectionDirectory(char const* path, char const* name,
|
|
TRI_voc_cid_t cid) {
|
|
TRI_ASSERT(path != nullptr);
|
|
TRI_ASSERT(name != nullptr);
|
|
|
|
std::string filename("collection-");
|
|
filename.append(std::to_string(cid));
|
|
filename.push_back('-');
|
|
filename.append(std::to_string(TRI_UInt32Random()));
|
|
|
|
return arangodb::basics::FileUtils::buildFilename(path, filename);
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief creates a new collection
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Creates the on-disk directory for a new collection and initializes the
/// in-memory collection object.
///
/// The directory is first created as `<dirname>.tmp`, gets an empty `.tmp`
/// file and is then renamed to its final name, so that no empty collection
/// directory is left behind when a step fails.
///
/// @param vocbase     database the collection belongs to
/// @param collection  object to initialize, or nullptr to have a new
///                    TRI_collection_t allocated
/// @param path        existing parent directory
/// @param parameters  collection properties (name, id, maximal size, ...)
/// @return the initialized collection, or nullptr on failure. The error code
///         is set via TRI_set_errno when the maximal size is too small,
///         `path` is not a directory or the target directory already exists.
TRI_collection_t* TRI_CreateCollection(
    TRI_vocbase_t* vocbase, TRI_collection_t* collection, char const* path,
    arangodb::VocbaseCollectionInfo const& parameters) {
  // sanity check
  if (sizeof(TRI_df_header_marker_t) + sizeof(TRI_df_footer_marker_t) >
      parameters.maximalSize()) {
    TRI_set_errno(TRI_ERROR_ARANGO_DATAFILE_FULL);

    LOG(ERR) << "cannot create datafile '" << parameters.namec_str() << "' in '" << path << "', maximal size '" << static_cast<unsigned int>(parameters.maximalSize()) << "' is too small";

    return nullptr;
  }

  if (!TRI_IsDirectory(path)) {
    TRI_set_errno(TRI_ERROR_ARANGO_DATADIR_INVALID);

    LOG(ERR) << "cannot create collection '" << path << "', path is not a directory";

    return nullptr;
  }

  std::string const dirname = GetCollectionDirectory(
      path, parameters.namec_str(), parameters.id());

  // directory must not exist
  if (TRI_ExistsFile(dirname.c_str())) {
    TRI_set_errno(TRI_ERROR_ARANGO_COLLECTION_DIRECTORY_ALREADY_EXISTS);

    LOG(ERR) << "cannot create collection '" << parameters.namec_str() << "' in directory '" << dirname.c_str() << "': directory already exists";

    return nullptr;
  }

  // use a temporary directory first. this saves us from leaving an empty
  // directory behind, and the server refusing to start
  std::string const tmpname = dirname + ".tmp";

  // create directory
  std::string errorMessage;
  // must start out defined: it is also streamed into the log messages of the
  // later write/rename failures, where nothing has written to it
  long systemError = 0;
  int res = TRI_CreateDirectory(tmpname.c_str(), systemError, errorMessage);

  if (res != TRI_ERROR_NO_ERROR) {
    LOG(ERR) << "cannot create collection '" << parameters.namec_str() << "' in directory '" << path << "': " << TRI_errno_string(res) << " - " << systemError << " - " << errorMessage.c_str();

    return nullptr;
  }

  TRI_IF_FAILURE("CreateCollection::tempDirectory") {
    return nullptr;
  }

  // create a temporary file
  std::string const tmpfile(
      arangodb::basics::FileUtils::buildFilename(tmpname.c_str(), ".tmp"));
  res = TRI_WriteFile(tmpfile.c_str(), "", 0);

  TRI_IF_FAILURE("CreateCollection::tempFile") {
    return nullptr;
  }

  if (res != TRI_ERROR_NO_ERROR) {
    LOG(ERR) << "cannot create collection '" << parameters.namec_str() << "' in directory '" << path << "': " << TRI_errno_string(res) << " - " << systemError << " - " << errorMessage.c_str();
    TRI_RemoveDirectory(tmpname.c_str());

    return nullptr;
  }

  TRI_IF_FAILURE("CreateCollection::renameDirectory") {
    return nullptr;
  }

  res = TRI_RenameFile(tmpname.c_str(), dirname.c_str());

  if (res != TRI_ERROR_NO_ERROR) {
    LOG(ERR) << "cannot create collection '" << parameters.namec_str() << "' in directory '" << path << "': " << TRI_errno_string(res) << " - " << systemError << " - " << errorMessage.c_str();
    TRI_RemoveDirectory(tmpname.c_str());

    return nullptr;
  }

  // now we have the collection directory in place with the correct name and a
  // .tmp file in it

  // create collection structure
  if (collection == nullptr) {
    try {
      collection = new TRI_collection_t(parameters);
    } catch (std::exception&) {
      collection = nullptr;
    }

    if (collection == nullptr) {
      LOG(ERR) << "cannot create collection '" << path << "': out of memory";

      return nullptr;
    }
  }

  InitCollection(vocbase, collection, dirname, parameters);
  /* PANAIA: 1) the parameter file if it exists must be removed
             2) if collection
  */

  return collection;
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief frees the memory allocated, but does not free the pointer
|
|
///
|
|
/// Note that the collection must be closed first.
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Releases everything the collection object owns (key options, datafile,
/// journal and compactor vectors, index file names, directory string)
/// without freeing the object itself.
///
/// @param collection  collection to tear down; must not be nullptr
void TRI_DestroyCollection(TRI_collection_t* collection) {
  TRI_ASSERT(collection);
  collection->_info.clearKeyOptions();

  // free the datafile objects together with their containers
  FreeDatafilesVector(&collection->_datafiles);
  FreeDatafilesVector(&collection->_journals);
  FreeDatafilesVector(&collection->_compactors);

  TRI_DestroyVectorString(&collection->_indexFiles);

  if (collection->_directory == nullptr) {
    return;
  }

  // NOTE(review): InitCollection duplicates the directory string from
  // TRI_UNKNOWN_MEM_ZONE while it is released with TRI_CORE_MEM_ZONE here --
  // confirm that the two zones are interchangeable for freeing
  TRI_FreeString(TRI_CORE_MEM_ZONE, collection->_directory);
  collection->_directory = nullptr;
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief frees the memory allocated and frees the pointer
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Destroys the collection's contents via TRI_DestroyCollection and then
/// deletes the object itself.
///
/// @param collection  collection to free; must not be nullptr
void TRI_FreeCollection(TRI_collection_t* collection) {
  TRI_ASSERT(collection);

  // release owned resources first, then the object
  TRI_DestroyCollection(collection);

  delete collection;
}
|
|
|
|
/// Builds the collection properties from a CollectionInfo object.
///
/// Type, id, journal size, index buckets and the boolean flags are copied
/// from `other`; the revision is set to 0 and the initial count to -1. The
/// name is copied into the fixed-size `_name` buffer and truncated if it
/// does not fit. Key options, if present, are converted from JSON to
/// VelocyPack.
///
/// @param other  source description of the collection
VocbaseCollectionInfo::VocbaseCollectionInfo(CollectionInfo const& other)
    : _version(TRI_COL_VERSION),
      _type(other.type()),
      _revision(0),      // not known in the cluster case on the coordinator
      _cid(other.id()),  // this is on the coordinator and describes a
                         // cluster-wide collection, for safety reasons,
                         // we also set _cid
      _planId(other.id()),
      _maximalSize(other.journalSize()),
      _initialCount(-1),
      _indexBuckets(other.indexBuckets()),
      _keyOptions(nullptr),
      _isSystem(other.isSystem()),
      _deleted(other.deleted()),
      _doCompact(other.doCompact()),
      _isVolatile(other.isVolatile()),
      _waitForSync(other.waitForSync()) {
  std::string const name = other.name();
  memset(_name, 0, sizeof(_name));

  // never copy more than the buffer can hold and keep the final byte as the
  // terminating NUL; an unbounded copy would overflow `_name` for long names
  size_t const capacity = sizeof(_name) - 1;
  size_t const length = (name.size() < capacity) ? name.size() : capacity;
  memcpy(_name, name.c_str(), length);

  std::unique_ptr<TRI_json_t> otherOpts(other.keyOptions());
  if (otherOpts != nullptr) {
    std::shared_ptr<arangodb::velocypack::Builder> builder =
        arangodb::basics::JsonHelper::toVelocyPack(otherOpts.get());
    _keyOptions = builder->steal();
  }
}
|
|
|
|
/// Builds the collection properties from explicit values.
///
/// `_waitForSync` is taken from the database settings; the remaining flags
/// get fixed defaults (not system, not deleted, compaction on, not
/// volatile).
///
/// @param vocbase      database providing the default settings; must not be
///                     nullptr
/// @param name         collection name; copied into the fixed-size `_name`
///                     buffer (at most sizeof(_name) - 1 characters). A
///                     nullptr or empty name leaves `_name` empty.
/// @param type         collection type
/// @param maximalSize  requested journal size; rounded down to a multiple of
///                     PageSize, but a non-zero request never ends up below
///                     one page
/// @param keyOptions   key generator options; stored unless the slice is
///                     None
VocbaseCollectionInfo::VocbaseCollectionInfo(TRI_vocbase_t* vocbase,
                                             char const* name,
                                             TRI_col_type_e type,
                                             TRI_voc_size_t maximalSize,
                                             VPackSlice const& keyOptions)
    : _version(TRI_COL_VERSION),
      _type(type),
      _revision(0),
      _cid(0),
      _planId(0),
      _maximalSize(vocbase->_settings.defaultMaximalSize),
      _initialCount(-1),
      _indexBuckets(TRI_DEFAULT_INDEX_BUCKETS),
      _keyOptions(nullptr),
      _isSystem(false),
      _deleted(false),
      _doCompact(true),
      _isVolatile(false),
      _waitForSync(vocbase->_settings.defaultWaitForSync) {
  // align the requested size to whole pages
  _maximalSize =
      static_cast<TRI_voc_size_t>((maximalSize / PageSize) * PageSize);
  if (_maximalSize == 0 && maximalSize != 0) {
    _maximalSize = static_cast<TRI_voc_size_t>(PageSize);
  }

  memset(_name, 0, sizeof(_name));

  // same guard as the options-based constructor: do not hand a nullptr (or an
  // empty name) to TRI_CopyString
  if (name != nullptr && *name != '\0') {
    TRI_CopyString(_name, name, sizeof(_name) - 1);
  }

  if (!keyOptions.isNone()) {
    VPackBuilder builder;
    builder.add(keyOptions);
    _keyOptions = builder.steal();
  }
}
|
|
|
|
/// Convenience constructor: delegates to the (vocbase, name, type, options)
/// constructor with TRI_COL_TYPE_DOCUMENT as the collection type.
///
/// @param vocbase  database forwarded to the delegated constructor
/// @param name     collection name
/// @param options  collection options forwarded unchanged
VocbaseCollectionInfo::VocbaseCollectionInfo(TRI_vocbase_t* vocbase,
                                             char const* name,
                                             VPackSlice const& options)
    : VocbaseCollectionInfo(vocbase, name, TRI_COL_TYPE_DOCUMENT, options) {
}
|
|
|
|
// Builds a collection info block from a VelocyPack options object.
//
// Members start out with their defaults (partly taken from the vocbase
// settings). If `options` is an object, the attributes "journalSize" /
// "maximalSize", "doCompact", "waitForSync", "isVolatile", "indexBuckets",
// "type", "name", "cid", "isSystem", "planId", "id", "keyOptions" and
// "deleted" are read from it. Afterwards the resulting combination is
// validated; invalid values raise an ArangoDB exception
// (TRI_ERROR_BAD_PARAMETER or TRI_ERROR_ARANGO_ILLEGAL_NAME).
VocbaseCollectionInfo::VocbaseCollectionInfo(TRI_vocbase_t* vocbase,
                                             char const* name,
                                             TRI_col_type_e type,
                                             VPackSlice const& options)
    : _version(TRI_COL_VERSION),
      _type(type),
      _revision(0),
      _cid(0),
      _planId(0),
      _maximalSize(vocbase->_settings.defaultMaximalSize),
      _initialCount(-1),
      _indexBuckets(TRI_DEFAULT_INDEX_BUCKETS),
      _keyOptions(nullptr),
      _isSystem(false),
      _deleted(false),
      _doCompact(true),
      _isVolatile(false),
      _waitForSync(vocbase->_settings.defaultWaitForSync) {
  memset(_name, 0, sizeof(_name));

  bool const haveName = (name != nullptr && *name != '\0');
  if (haveName) {
    TRI_CopyString(_name, name, sizeof(_name) - 1);
  }

  if (options.isObject()) {
    // "journalSize" takes precedence over "maximalSize"
    char const* sizeAttribute =
        options.hasKey("journalSize") ? "journalSize" : "maximalSize";
    TRI_voc_size_t const requestedSize =
        arangodb::basics::VelocyPackHelper::getNumericValue<TRI_voc_size_t>(
            options, sizeAttribute, vocbase->_settings.defaultMaximalSize);

    // round down to whole pages, but never to zero for a non-zero request
    _maximalSize =
        static_cast<TRI_voc_size_t>((requestedSize / PageSize) * PageSize);
    if (requestedSize != 0 && _maximalSize == 0) {
      _maximalSize = static_cast<TRI_voc_size_t>(PageSize);
    }

    _doCompact = arangodb::basics::VelocyPackHelper::getBooleanValue(
        options, "doCompact", true);
    _waitForSync = arangodb::basics::VelocyPackHelper::getBooleanValue(
        options, "waitForSync", vocbase->_settings.defaultWaitForSync);
    _isVolatile = arangodb::basics::VelocyPackHelper::getBooleanValue(
        options, "isVolatile", false);
    _indexBuckets =
        arangodb::basics::VelocyPackHelper::getNumericValue<uint32_t>(
            options, "indexBuckets", TRI_DEFAULT_INDEX_BUCKETS);
    _type = static_cast<TRI_col_type_e>(
        arangodb::basics::VelocyPackHelper::getNumericValue<size_t>(
            options, "type", _type));

    // a non-empty "name" attribute overrides the name parameter
    std::string nameFromOptions =
        arangodb::basics::VelocyPackHelper::getStringValue(options, "name", "");
    if (!nameFromOptions.empty()) {
      TRI_CopyString(_name, nameFromOptions.c_str(), sizeof(_name) - 1);
    }

    std::string cidFromOptions =
        arangodb::basics::VelocyPackHelper::getStringValue(options, "cid", "");
    if (!cidFromOptions.empty()) {
      // note: this may throw
      _cid = std::stoull(cidFromOptions);
    }

    if (!options.hasKey("isSystem")) {
      _isSystem = false;
    } else {
      VPackSlice systemFlag = options.get("isSystem");
      if (systemFlag.isBoolean()) {
        _isSystem = systemFlag.getBoolean();
      }
    }

    // an explicitly specified journal size must not be below the minimum
    if (options.hasKey("journalSize")) {
      VPackSlice journalSizeSlice = options.get("journalSize");
      TRI_voc_size_t journalSize =
          journalSizeSlice.getNumericValue<TRI_voc_size_t>();
      if (journalSize < TRI_JOURNAL_MINIMAL_SIZE) {
        THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_BAD_PARAMETER,
                                       "journalSize is too small");
      }
    }

    // "planId" may be given as a number or as a numeric string
    VPackSlice const planIdSlice = options.get("planId");
    TRI_voc_cid_t parsedPlanId = 0;
    if (planIdSlice.isNumber()) {
      parsedPlanId = planIdSlice.getNumericValue<TRI_voc_cid_t>();
    } else if (planIdSlice.isString()) {
      std::string text = planIdSlice.copyString();
      parsedPlanId = static_cast<TRI_voc_cid_t>(
          TRI_UInt64String2(text.c_str(), text.length()));
    }
    if (parsedPlanId > 0) {
      _planId = parsedPlanId;
    }

    // "id" (number or numeric string) overrides a previously read "cid"
    VPackSlice const idSlice = options.get("id");
    if (idSlice.isNumber()) {
      _cid = idSlice.getNumericValue<TRI_voc_cid_t>();
    } else if (idSlice.isString()) {
      std::string text = idSlice.copyString();
      _cid = static_cast<TRI_voc_cid_t>(
          TRI_UInt64String2(text.c_str(), text.length()));
    }

    if (options.hasKey("keyOptions")) {
      // keep a private copy of the key options
      VPackSlice const keyOptionsSlice = options.get("keyOptions");
      VPackBuilder copy;
      copy.add(keyOptionsSlice);
      _keyOptions = copy.steal();
    }

    if (options.hasKey("deleted")) {
      VPackSlice const deletedSlice = options.get("deleted");
      if (deletedSlice.isBoolean()) {
        _deleted = deletedSlice.getBoolean();
      }
    }
  }

#ifndef TRI_HAVE_ANONYMOUS_MMAP
  if (_isVolatile) {
    THROW_ARANGO_EXCEPTION_MESSAGE(
        TRI_ERROR_BAD_PARAMETER,
        "volatile collections are not supported on this platform");
  }
#endif

  if (_waitForSync && _isVolatile) {
    // the combination of waitForSync and isVolatile makes no sense
    THROW_ARANGO_EXCEPTION_MESSAGE(
        TRI_ERROR_BAD_PARAMETER,
        "volatile collections do not support the waitForSync option");
  }

  // NOTE(review): only the range is checked here, not whether the value
  // actually is a power of two as the message suggests
  if (_indexBuckets > 1024 || _indexBuckets < 1) {
    THROW_ARANGO_EXCEPTION_MESSAGE(
        TRI_ERROR_BAD_PARAMETER,
        "indexBuckets must be a two-power between 1 and 1024");
  }

  if (!TRI_IsAllowedNameCollection(_isSystem, _name)) {
    THROW_ARANGO_EXCEPTION(TRI_ERROR_ARANGO_ILLEGAL_NAME);
  }

  // fix _isSystem value if mis-specified by user
  _isSystem = (_name[0] == '_');
}
|
|
|
|
// Creates a collection info block from the parameter file found in the
// collection directory `path`.
//
// The file content must be a VelocyPack/JSON object. An "isSystem" attribute
// is derived from the stored name (leading underscore) and merged into the
// object before it is handed to the options-based constructor together with
// `collectionName`. If `versionWarning` is set, a warning is logged for named
// collections whose version is older than TRI_COL_VERSION_20.
//
// Throws TRI_ERROR_OUT_OF_MEMORY if the filename cannot be built and
// TRI_ERROR_ARANGO_ILLEGAL_PARAMETER_FILE if the file is missing or is not an
// object; exceptions raised while reading/parsing are passed through.
VocbaseCollectionInfo VocbaseCollectionInfo::fromFile(
    char const* path, TRI_vocbase_t* vocbase, char const* collectionName,
    bool versionWarning) {
  // find parameter file
  char* filename = TRI_Concatenate2File(path, TRI_VOC_PARAMETER_FILE);

  if (filename == nullptr) {
    LOG(ERR) << "cannot load parameter info for collection '" << path << "', out of memory";
    THROW_ARANGO_EXCEPTION(TRI_ERROR_OUT_OF_MEMORY);
  }

  // hand the C string to a guard so that it is released on every exit path,
  // including exceptions thrown while reading or parsing the file
  auto releaseFilename = [](char* ptr) {
    TRI_FreeString(TRI_CORE_MEM_ZONE, ptr);
  };
  std::unique_ptr<char, decltype(releaseFilename)> filenameGuard(
      filename, releaseFilename);

  if (!TRI_ExistsFile(filename)) {
    THROW_ARANGO_EXCEPTION(TRI_ERROR_ARANGO_ILLEGAL_PARAMETER_FILE);
  }

  std::string const filePath(filename);
  std::shared_ptr<VPackBuilder> content =
      arangodb::basics::VelocyPackHelper::velocyPackFromFile(filePath);
  VPackSlice slice = content->slice();
  if (!slice.isObject()) {
    LOG(ERR) << "cannot open '" << filename << "', collection parameters are not readable";
    THROW_ARANGO_EXCEPTION(TRI_ERROR_ARANGO_ILLEGAL_PARAMETER_FILE);
  }

  // fiddle "isSystem" value, which is not contained in the JSON file
  bool isSystemValue = false;
  if (slice.hasKey("name")) {
    auto name = slice.get("name").copyString();
    if (!name.empty()) {
      isSystemValue = name[0] == '_';
    }
  }

  VPackBuilder bx;
  bx.openObject();
  bx.add("isSystem", VPackValue(isSystemValue));
  bx.close();
  VPackSlice isSystem = bx.slice();
  // b2 owns the merged object; `content` and `b2` both stay alive until the
  // info object has been constructed from the slice
  VPackBuilder b2 = VPackCollection::merge(slice, isSystem, false);
  slice = b2.slice();

  VocbaseCollectionInfo info(vocbase, collectionName, slice);

  // warn about an outdated collection version, but only for collections that
  // actually carry a name
  if (versionWarning && info.version() < TRI_COL_VERSION_20) {
    if (*info.namec_str() != '\0') {
      LOG(WARN) << "collection '" << info.namec_str() << "' has an old version and needs to be upgraded.";
    }
  }
  return info;
}
|
|
|
|
// collection version
|
|
TRI_col_version_t VocbaseCollectionInfo::version() const { return _version; }
|
|
|
|
// collection type
|
|
TRI_col_type_e VocbaseCollectionInfo::type() const { return _type; }
|
|
|
|
// local collection identifier
|
|
TRI_voc_cid_t VocbaseCollectionInfo::id() const { return _cid; }
|
|
|
|
// cluster-wide collection identifier
|
|
TRI_voc_cid_t VocbaseCollectionInfo::planId() const { return _planId; }
|
|
|
|
// last revision id written
|
|
TRI_voc_rid_t VocbaseCollectionInfo::revision() const { return _revision; }
|
|
|
|
// maximal size of memory mapped file
|
|
TRI_voc_size_t VocbaseCollectionInfo::maximalSize() const {
|
|
return _maximalSize;
|
|
}
|
|
|
|
// initial count, used when loading a collection
|
|
int64_t VocbaseCollectionInfo::initialCount() const { return _initialCount; }
|
|
|
|
// number of buckets used in hash tables for indexes
|
|
uint32_t VocbaseCollectionInfo::indexBuckets() const { return _indexBuckets; }
|
|
|
|
// name of the collection
|
|
std::string VocbaseCollectionInfo::name() const { return std::string(_name); }
|
|
|
|
// name of the collection as c string
|
|
char const* VocbaseCollectionInfo::namec_str() const { return _name; }
|
|
|
|
// options for key creation
|
|
std::shared_ptr<arangodb::velocypack::Buffer<uint8_t> const>
|
|
VocbaseCollectionInfo::keyOptions() const {
|
|
return _keyOptions;
|
|
}
|
|
|
|
// If true, collection has been deleted
|
|
bool VocbaseCollectionInfo::deleted() const { return _deleted; }
|
|
|
|
// If true, collection will be compacted
|
|
bool VocbaseCollectionInfo::doCompact() const { return _doCompact; }
|
|
|
|
// If true, collection is a system collection
|
|
bool VocbaseCollectionInfo::isSystem() const { return _isSystem; }
|
|
|
|
// If true, collection is memory-only
|
|
bool VocbaseCollectionInfo::isVolatile() const { return _isVolatile; }
|
|
|
|
// If true waits for mysnc
|
|
bool VocbaseCollectionInfo::waitForSync() const { return _waitForSync; }
|
|
|
|
/// @brief overwrites the stored collection version
void VocbaseCollectionInfo::setVersion(TRI_col_version_t version) { _version = version; }
|
|
|
|
/// @brief replaces the collection name; at most sizeof(_name) - 1 characters
/// are handed to TRI_CopyString
void VocbaseCollectionInfo::rename(char const* name) {
  size_t const maxLength = sizeof(_name) - 1;
  TRI_CopyString(_name, name, maxLength);
}
|
|
|
|
/// @brief updates the revision id; without `force` the stored revision only
/// ever moves forward
void VocbaseCollectionInfo::setRevision(TRI_voc_rid_t rid, bool force) {
  if (!force && rid <= _revision) {
    // not newer than what we have and not forced: keep the current value
    return;
  }
  _revision = rid;
}
|
|
|
|
/// @brief overwrites the local collection identifier
void VocbaseCollectionInfo::setCollectionId(TRI_voc_cid_t cid) {
  _cid = cid;
}
|
|
|
|
/// @brief stores `size` as the initial count of the collection
void VocbaseCollectionInfo::updateCount(size_t size) {
  _initialCount = size;
}
|
|
|
|
/// @brief overwrites the cluster-wide collection identifier
void VocbaseCollectionInfo::setPlanId(TRI_voc_cid_t planId) { _planId = planId; }
|
|
|
|
/// @brief sets or clears the deleted flag
void VocbaseCollectionInfo::setDeleted(bool deleted) {
  _deleted = deleted;
}
|
|
|
|
/// @brief drops this object's reference to the key options buffer
void VocbaseCollectionInfo::clearKeyOptions() {
  _keyOptions.reset();
}
|
|
|
|
int VocbaseCollectionInfo::saveToFile(char const* path, bool forceSync) const {
|
|
char* filename = TRI_Concatenate2File(path, TRI_VOC_PARAMETER_FILE);
|
|
|
|
TRI_json_t* json = TRI_CreateJsonCollectionInfo(*this);
|
|
|
|
if (json == nullptr) {
|
|
LOG(ERR) << "cannot save collection properties file '" << filename << "': " << TRI_errno_string(TRI_ERROR_OUT_OF_MEMORY);
|
|
TRI_FreeString(TRI_CORE_MEM_ZONE, filename);
|
|
return TRI_ERROR_OUT_OF_MEMORY;
|
|
}
|
|
|
|
// save json info to file
|
|
bool ok = TRI_SaveJson(filename, json, forceSync);
|
|
|
|
int res;
|
|
if (!ok) {
|
|
res = TRI_errno();
|
|
LOG(ERR) << "cannot save collection properties file '" << filename << "': " << TRI_last_error();
|
|
} else {
|
|
res = TRI_ERROR_NO_ERROR;
|
|
}
|
|
|
|
TRI_FreeJson(TRI_UNKNOWN_MEM_ZONE, json);
|
|
TRI_FreeString(TRI_CORE_MEM_ZONE, filename);
|
|
return res;
|
|
}
|
|
|
|
/// @brief updates doCompact, waitForSync, the journal size and indexBuckets
/// from a VelocyPack slice
///
/// The value used for an attribute that is missing in `slice` depends on the
/// mode:
/// - preferDefaults == false: the current value of the member is kept
/// - preferDefaults == true and vocbase != nullptr: the vocbase settings are
///   used for waitForSync and the journal size
/// - preferDefaults == true and vocbase == nullptr: the built-in defaults
///   (false / TRI_JOURNAL_DEFAULT_MAXIMAL_SIZE) are used
/// doCompact and indexBuckets fall back to true / TRI_DEFAULT_INDEX_BUCKETS
/// whenever preferDefaults is set. The journal size is read from
/// "journalSize" if present, otherwise from "maximalSize", and is always
/// read as TRI_voc_size_t.
void VocbaseCollectionInfo::update(VPackSlice const& slice, bool preferDefaults,
                                   TRI_vocbase_t const* vocbase) {
  // the following collection properties are intentionally not updated as
  // updating them would be very complicated:
  // - _cid
  // - _name
  // - _type
  // - _isSystem
  // - _isVolatile
  // ... probably a few others missing here ...

  // step 1: pick the fallback values for attributes missing in the slice
  bool doCompactFallback = _doCompact;
  bool waitForSyncFallback = _waitForSync;
  TRI_voc_size_t maximalSizeFallback = _maximalSize;
  uint32_t indexBucketsFallback = _indexBuckets;

  if (preferDefaults) {
    doCompactFallback = true;
    indexBucketsFallback = TRI_DEFAULT_INDEX_BUCKETS;

    if (vocbase != nullptr) {
      waitForSyncFallback = vocbase->_settings.defaultWaitForSync;
      maximalSizeFallback = vocbase->_settings.defaultMaximalSize;
    } else {
      waitForSyncFallback = false;
      maximalSizeFallback = TRI_JOURNAL_DEFAULT_MAXIMAL_SIZE;
    }
  }

  // step 2: read the attributes, in the same order for every mode
  _doCompact = arangodb::basics::VelocyPackHelper::getBooleanValue(
      slice, "doCompact", doCompactFallback);
  _waitForSync = arangodb::basics::VelocyPackHelper::getBooleanValue(
      slice, "waitForSync", waitForSyncFallback);

  // "journalSize" takes precedence over "maximalSize"
  char const* sizeAttribute =
      slice.hasKey("journalSize") ? "journalSize" : "maximalSize";
  _maximalSize =
      arangodb::basics::VelocyPackHelper::getNumericValue<TRI_voc_size_t>(
          slice, sizeAttribute, maximalSizeFallback);

  _indexBuckets =
      arangodb::basics::VelocyPackHelper::getNumericValue<uint32_t>(
          slice, "indexBuckets", indexBucketsFallback);
}
|
|
|
|
/// @brief overwrites all members of this info block with the values obtained
/// from the accessors of `other`
void VocbaseCollectionInfo::update(VocbaseCollectionInfo const& other) {
  // identity and versioning
  _version = other.version();
  _type = other.type();
  _cid = other.id();
  _planId = other.planId();
  _revision = other.revision();

  // sizing
  _maximalSize = other.maximalSize();
  _initialCount = other.initialCount();
  _indexBuckets = other.indexBuckets();

  // name and key options (the key options buffer is shared, not copied)
  size_t const maxNameLength = sizeof(_name) - 1;
  TRI_CopyString(_name, other.namec_str(), maxNameLength);
  _keyOptions = other.keyOptions();

  // flags
  _deleted = other.deleted();
  _doCompact = other.doCompact();
  _isSystem = other.isSystem();
  _isVolatile = other.isVolatile();
  _waitForSync = other.waitForSync();
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief jsonify a parameter info block
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
// Only temporary
|
|
TRI_json_t* TRI_CreateJsonCollectionInfo(
|
|
arangodb::VocbaseCollectionInfo const& info) {
|
|
try {
|
|
VPackBuilder builder;
|
|
builder.openObject();
|
|
TRI_CreateVelocyPackCollectionInfo(info, builder);
|
|
builder.close();
|
|
return arangodb::basics::VelocyPackHelper::velocyPackToJson(
|
|
builder.slice());
|
|
} catch (...) {
|
|
return nullptr;
|
|
}
|
|
}
|
|
|
|
// Returns a freshly allocated, closed builder that holds `info` as a
// VelocyPack object. This function might throw.
std::shared_ptr<VPackBuilder> TRI_CreateVelocyPackCollectionInfo(
    arangodb::VocbaseCollectionInfo const& info) {
  std::shared_ptr<VPackBuilder> result = std::make_shared<VPackBuilder>();

  VPackBuilder& object = *result;
  object.openObject();
  TRI_CreateVelocyPackCollectionInfo(info, object);
  object.close();

  return result;
}
|
|
|
|
// Adds the attributes of `info` to `builder`, which must contain an open
// (not yet closed) object. "planId" is only written when it is greater than
// zero, "count" only when the initial count is non-negative, and
// "keyOptions" only when key options are present. This function might throw.
void TRI_CreateVelocyPackCollectionInfo(
    arangodb::VocbaseCollectionInfo const& info, VPackBuilder& builder) {
  TRI_ASSERT(!builder.isClosed());

  // ids are written as strings
  std::string const idAsString = std::to_string(info.id());
  std::string const planIdAsString = std::to_string(info.planId());

  builder.add("version", VPackValue(info.version()));
  builder.add("type", VPackValue(info.type()));
  builder.add("cid", VPackValue(idAsString));

  if (info.planId() > 0) {
    builder.add("planId", VPackValue(planIdAsString));
  }

  if (info.initialCount() >= 0) {
    builder.add("count", VPackValue(info.initialCount()));
  }

  builder.add("indexBuckets", VPackValue(info.indexBuckets()));
  builder.add("deleted", VPackValue(info.deleted()));
  builder.add("doCompact", VPackValue(info.doCompact()));
  builder.add("maximalSize", VPackValue(info.maximalSize()));
  builder.add("name", VPackValue(info.name()));
  builder.add("isVolatile", VPackValue(info.isVolatile()));
  builder.add("waitForSync", VPackValue(info.waitForSync()));

  auto keyOptionsBuffer = info.keyOptions();
  if (keyOptionsBuffer != nullptr) {
    // interpret the buffer content as a slice and embed it
    VPackSlice const keyOptionsSlice(keyOptionsBuffer->data());
    builder.add("keyOptions", keyOptionsSlice);
  }
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief updates the parameter info block
|
|
///
|
|
/// You must hold the @ref TRI_WRITE_LOCK_STATUS_VOCBASE_COL when calling this
|
|
/// function.
|
|
/// Note: the parameter pointer might be 0 when a collection gets unloaded!!!!
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
int TRI_UpdateCollectionInfo(TRI_vocbase_t* vocbase,
|
|
TRI_collection_t* collection,
|
|
VPackSlice const& slice, bool doSync) {
|
|
if (!slice.isNone()) {
|
|
TRI_LOCK_JOURNAL_ENTRIES_DOC_COLLECTION(
|
|
(TRI_document_collection_t*)collection);
|
|
try {
|
|
collection->_info.update(slice, false, vocbase);
|
|
} catch (...) {
|
|
TRI_UNLOCK_JOURNAL_ENTRIES_DOC_COLLECTION(
|
|
(TRI_document_collection_t*)collection);
|
|
return TRI_ERROR_INTERNAL;
|
|
}
|
|
TRI_UNLOCK_JOURNAL_ENTRIES_DOC_COLLECTION(
|
|
(TRI_document_collection_t*)collection);
|
|
}
|
|
return collection->_info.saveToFile(collection->_directory, doSync);
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief renames a collection
|
|
///
|
|
/// You must hold the @ref TRI_WRITE_LOCK_STATUS_VOCBASE_COL when calling this
|
|
/// function.
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
int TRI_RenameCollection(TRI_collection_t* collection, char const* name) {
|
|
// Save name for rollback
|
|
std::string oldName = collection->_info.name();
|
|
collection->_info.rename(name);
|
|
|
|
int res = collection->_info.saveToFile(collection->_directory, true);
|
|
if (res != TRI_ERROR_NO_ERROR) {
|
|
// Rollback
|
|
collection->_info.rename(oldName.c_str());
|
|
}
|
|
|
|
return res;
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief iterates over a collection
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
bool TRI_IterateCollection(TRI_collection_t* collection,
|
|
bool (*iterator)(TRI_df_marker_t const*, void*,
|
|
TRI_datafile_t*),
|
|
void* data) {
|
|
TRI_ASSERT(iterator != nullptr);
|
|
|
|
TRI_vector_pointer_t* datafiles =
|
|
TRI_CopyVectorPointer(TRI_UNKNOWN_MEM_ZONE, &collection->_datafiles);
|
|
|
|
if (datafiles == nullptr) {
|
|
TRI_set_errno(TRI_ERROR_OUT_OF_MEMORY);
|
|
|
|
return false;
|
|
}
|
|
|
|
TRI_vector_pointer_t* journals =
|
|
TRI_CopyVectorPointer(TRI_UNKNOWN_MEM_ZONE, &collection->_journals);
|
|
|
|
if (journals == nullptr) {
|
|
TRI_FreeVectorPointer(TRI_UNKNOWN_MEM_ZONE, datafiles);
|
|
TRI_set_errno(TRI_ERROR_OUT_OF_MEMORY);
|
|
|
|
return false;
|
|
}
|
|
|
|
TRI_vector_pointer_t* compactors =
|
|
TRI_CopyVectorPointer(TRI_UNKNOWN_MEM_ZONE, &collection->_compactors);
|
|
|
|
if (compactors == nullptr) {
|
|
TRI_FreeVectorPointer(TRI_UNKNOWN_MEM_ZONE, datafiles);
|
|
TRI_FreeVectorPointer(TRI_UNKNOWN_MEM_ZONE, journals);
|
|
TRI_set_errno(TRI_ERROR_OUT_OF_MEMORY);
|
|
|
|
return false;
|
|
}
|
|
|
|
bool result;
|
|
if (!IterateDatafilesVector(datafiles, iterator, data) ||
|
|
!IterateDatafilesVector(compactors, iterator, data) ||
|
|
!IterateDatafilesVector(journals, iterator, data)) {
|
|
result = false;
|
|
} else {
|
|
result = true;
|
|
}
|
|
|
|
TRI_FreeVectorPointer(TRI_UNKNOWN_MEM_ZONE, datafiles);
|
|
TRI_FreeVectorPointer(TRI_UNKNOWN_MEM_ZONE, journals);
|
|
TRI_FreeVectorPointer(TRI_UNKNOWN_MEM_ZONE, compactors);
|
|
|
|
return result;
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief removes an index file from the indexFiles vector
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
int TRI_RemoveFileIndexCollection(TRI_collection_t* collection,
|
|
TRI_idx_iid_t iid) {
|
|
size_t const n = collection->_indexFiles._length;
|
|
|
|
for (size_t i = 0; i < n; ++i) {
|
|
char const* filename = collection->_indexFiles._buffer[i];
|
|
|
|
if (GetNumericFilenamePart(filename) == iid) {
|
|
// found
|
|
TRI_RemoveVectorString(&collection->_indexFiles, i);
|
|
return true;
|
|
}
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief iterates over all index files of a collection
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
void TRI_IterateIndexCollection(TRI_collection_t* collection,
|
|
bool (*iterator)(char const* filename, void*),
|
|
void* data) {
|
|
// iterate over all index files
|
|
size_t const n = collection->_indexFiles._length;
|
|
|
|
for (size_t i = 0; i < n; ++i) {
|
|
char const* filename = collection->_indexFiles._buffer[i];
|
|
bool ok = iterator(filename, data);
|
|
|
|
if (!ok) {
|
|
LOG(ERR) << "cannot load index '" << filename << "' for collection '" << collection->_info.namec_str() << "'";
|
|
}
|
|
}
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief opens an existing collection
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
TRI_collection_t* TRI_OpenCollection(TRI_vocbase_t* vocbase,
|
|
TRI_collection_t* collection,
|
|
char const* path, bool ignoreErrors) {
|
|
TRI_ASSERT(collection != nullptr);
|
|
|
|
if (!TRI_IsDirectory(path)) {
|
|
TRI_set_errno(TRI_ERROR_ARANGO_DATADIR_INVALID);
|
|
|
|
LOG(ERR) << "cannot open '" << path << "', not a directory or not found";
|
|
|
|
return nullptr;
|
|
}
|
|
|
|
try {
|
|
// read parameters, no need to lock as we are opening the collection
|
|
VocbaseCollectionInfo info =
|
|
VocbaseCollectionInfo::fromFile(path, vocbase,
|
|
"", // Name will be set later on
|
|
true);
|
|
InitCollection(vocbase, collection, std::string(path), info);
|
|
|
|
double start = TRI_microtime();
|
|
|
|
LOG_TOPIC(TRACE, Logger::PERFORMANCE) <<
|
|
"open-collection { collection: " << vocbase->_name << "/" << collection->_info.name();
|
|
|
|
// check for journals and datafiles
|
|
bool ok = CheckCollection(collection, ignoreErrors);
|
|
|
|
if (!ok) {
|
|
LOG(DEBUG) << "cannot open '" << collection->_directory << "', check failed";
|
|
|
|
if (collection->_directory != nullptr) {
|
|
TRI_FreeString(TRI_CORE_MEM_ZONE, collection->_directory);
|
|
collection->_directory = nullptr;
|
|
}
|
|
|
|
return nullptr;
|
|
}
|
|
|
|
LOG_TOPIC(TRACE, Logger::PERFORMANCE) << "[timer] " << Logger::DURATION(TRI_microtime() - start) << " s, open-collection { collection: " << vocbase->_name << "/" << collection->_info.name() << " }";
|
|
|
|
return collection;
|
|
} catch (...) {
|
|
LOG(ERR) << "cannot load collection parameter file '" << path << "': " << TRI_last_error();
|
|
return nullptr;
|
|
}
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief closes an open collection
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
int TRI_CloseCollection(TRI_collection_t* collection) {
|
|
// close compactor files
|
|
CloseDataFiles(&collection->_compactors);
|
|
|
|
// close journal files
|
|
CloseDataFiles(&collection->_journals);
|
|
|
|
// close datafiles
|
|
CloseDataFiles(&collection->_datafiles);
|
|
|
|
return TRI_ERROR_NO_ERROR;
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief returns information about the collection files
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
TRI_col_file_structure_t TRI_FileStructureCollectionDirectory(
|
|
char const* path) {
|
|
return ScanCollectionDirectory(path);
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief frees the information
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
void TRI_DestroyFileStructureCollection(TRI_col_file_structure_t* info) {
|
|
TRI_DestroyVectorString(&info->_journals);
|
|
TRI_DestroyVectorString(&info->_compactors);
|
|
TRI_DestroyVectorString(&info->_datafiles);
|
|
TRI_DestroyVectorString(&info->_indexes);
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief iterate over the markers in a collection's datafiles
|
|
///
|
|
/// this function may be called on server startup for all collections, in order
|
|
/// to get the last tick value used
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
bool TRI_IterateTicksCollection(char const* const path,
|
|
bool (*iterator)(TRI_df_marker_t const*, void*,
|
|
TRI_datafile_t*),
|
|
void* data) {
|
|
TRI_ASSERT(iterator != nullptr);
|
|
|
|
TRI_col_file_structure_t structure = ScanCollectionDirectory(path);
|
|
LOG(TRACE) << "iterating ticks of journal '" << path << "'";
|
|
|
|
bool result;
|
|
|
|
if (structure._journals._length == 0) {
|
|
// no journal found for collection. should not happen normally, but if
|
|
// it does, we need to grab the ticks from the datafiles, too
|
|
result = IterateFiles(&structure._datafiles, iterator, data);
|
|
} else {
|
|
// compactor files don't need to be iterated... they just contain data
|
|
// copied
|
|
// from other files, so their tick values will never be any higher
|
|
result = IterateFiles(&structure._journals, iterator, data);
|
|
}
|
|
|
|
TRI_DestroyFileStructureCollection(&structure);
|
|
|
|
return result;
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief determine whether a collection name is a system collection name
///
/// A name is a system name if it starts with an underscore; a nullptr is
/// never a system name.
////////////////////////////////////////////////////////////////////////////////

bool TRI_IsSystemNameCollection(char const* name) {
  return name != nullptr && name[0] == '_';
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
/// @brief checks if a collection name is allowed
|
|
///
|
|
/// Returns true if the name is allowed and false otherwise
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
bool TRI_IsAllowedNameCollection(bool allowSystem, char const* name) {
|
|
bool ok;
|
|
char const* ptr;
|
|
size_t length = 0;
|
|
|
|
// check allow characters: must start with letter or underscore if system is
|
|
// allowed
|
|
for (ptr = name; *ptr; ++ptr) {
|
|
if (length == 0) {
|
|
if (allowSystem) {
|
|
ok = (*ptr == '_') || ('a' <= *ptr && *ptr <= 'z') ||
|
|
('A' <= *ptr && *ptr <= 'Z');
|
|
} else {
|
|
ok = ('a' <= *ptr && *ptr <= 'z') || ('A' <= *ptr && *ptr <= 'Z');
|
|
}
|
|
} else {
|
|
ok = (*ptr == '_') || (*ptr == '-') || ('0' <= *ptr && *ptr <= '9') ||
|
|
('a' <= *ptr && *ptr <= 'z') || ('A' <= *ptr && *ptr <= 'Z');
|
|
}
|
|
|
|
if (!ok) {
|
|
return false;
|
|
}
|
|
|
|
++length;
|
|
}
|
|
|
|
// invalid name length
|
|
if (length == 0 || length > TRI_COL_NAME_LENGTH) {
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|