2016-07-27 15:22:59 -04:00
|
|
|
#include "util/rsdir.h"
|
2016-08-06 13:04:54 -04:00
|
|
|
#include "rsserver/p3face.h"
|
2016-08-09 09:07:02 -04:00
|
|
|
#include "pqi/authssl.h"
|
2016-07-27 15:22:59 -04:00
|
|
|
#include "hash_cache.h"
|
2016-08-09 09:07:02 -04:00
|
|
|
#include "filelist_io.h"
|
2016-09-02 15:49:43 -04:00
|
|
|
#include "file_sharing_defaults.h"
|
2016-07-27 15:22:59 -04:00
|
|
|
|
|
|
|
#define HASHSTORAGE_DEBUG 1
|
|
|
|
|
2016-08-09 09:07:02 -04:00
|
|
|
static const uint32_t DEFAULT_INACTIVITY_SLEEP_TIME = 50*1000;
|
|
|
|
static const uint32_t MAX_INACTIVITY_SLEEP_TIME = 2*1000*1000;
|
|
|
|
|
2016-07-27 15:22:59 -04:00
|
|
|
HashStorage::HashStorage(const std::string& save_file_name)
|
|
|
|
: mFilePath(save_file_name), mHashMtx("Hash Storage mutex")
|
|
|
|
{
|
2016-08-16 07:46:55 -04:00
|
|
|
mInactivitySleepTime = DEFAULT_INACTIVITY_SLEEP_TIME;
|
2016-07-27 18:48:28 -04:00
|
|
|
mRunning = false ;
|
2016-09-02 15:49:43 -04:00
|
|
|
mLastSaveTime = 0 ;
|
2016-08-16 07:46:55 -04:00
|
|
|
|
2016-09-02 15:49:43 -04:00
|
|
|
{
|
|
|
|
RS_STACK_MUTEX(mHashMtx) ;
|
|
|
|
locked_load() ;
|
|
|
|
}
|
2016-07-27 15:22:59 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
void HashStorage::data_tick()
|
|
|
|
{
|
|
|
|
FileHashJob job;
|
2016-07-27 18:48:28 -04:00
|
|
|
RsFileHash hash;
|
|
|
|
uint64_t size ;
|
2016-07-27 15:22:59 -04:00
|
|
|
|
|
|
|
{
|
2016-08-12 13:30:19 -04:00
|
|
|
bool empty ;
|
|
|
|
uint32_t st ;
|
2016-07-27 15:22:59 -04:00
|
|
|
|
2016-09-02 16:08:27 -04:00
|
|
|
{
|
|
|
|
RS_STACK_MUTEX(mHashMtx) ;
|
|
|
|
if(mChanged && mLastSaveTime + MIN_INTERVAL_BETWEEN_HASH_CACHE_SAVE < time(NULL))
|
|
|
|
{
|
|
|
|
locked_save();
|
|
|
|
mLastSaveTime = time(NULL) ;
|
|
|
|
mChanged = false ;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-05 16:37:40 -04:00
|
|
|
{
|
2016-08-12 13:30:19 -04:00
|
|
|
RS_STACK_MUTEX(mHashMtx) ;
|
2016-08-05 16:37:40 -04:00
|
|
|
|
2016-08-12 13:30:19 -04:00
|
|
|
empty = mFilesToHash.empty();
|
|
|
|
st = mInactivitySleepTime ;
|
|
|
|
}
|
|
|
|
|
|
|
|
// sleep off mutex!
|
|
|
|
if(empty)
|
|
|
|
{
|
|
|
|
std::cerr << "nothing to hash. Sleeping for " << st << " us" << std::endl;
|
|
|
|
|
|
|
|
usleep(st); // when no files to hash, just wait for 2 secs. This avoids a dramatic loop.
|
2016-08-06 13:04:54 -04:00
|
|
|
|
2016-08-12 13:30:19 -04:00
|
|
|
if(st > MAX_INACTIVITY_SLEEP_TIME)
|
|
|
|
{
|
|
|
|
RS_STACK_MUTEX(mHashMtx) ;
|
2016-08-09 09:07:02 -04:00
|
|
|
|
2016-08-12 13:30:19 -04:00
|
|
|
mInactivitySleepTime = MAX_INACTIVITY_SLEEP_TIME;
|
|
|
|
|
2016-09-02 15:49:43 -04:00
|
|
|
if(!mChanged) // otherwise it might prevent from saving the hash cache
|
|
|
|
{
|
|
|
|
std::cerr << "Stopping hashing thread." << std::endl;
|
|
|
|
shutdown();
|
|
|
|
mRunning = false ;
|
|
|
|
std::cerr << "done." << std::endl;
|
|
|
|
}
|
2016-08-12 13:30:19 -04:00
|
|
|
|
|
|
|
RsServer::notify()->notifyHashingInfo(NOTIFY_HASHTYPE_FINISH, "") ;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
RS_STACK_MUTEX(mHashMtx) ;
|
|
|
|
mInactivitySleepTime = 2*st ;
|
|
|
|
}
|
2016-08-09 09:07:02 -04:00
|
|
|
|
2016-07-27 15:22:59 -04:00
|
|
|
return ;
|
2016-08-05 16:37:40 -04:00
|
|
|
}
|
2016-08-09 09:07:02 -04:00
|
|
|
mInactivitySleepTime = DEFAULT_INACTIVITY_SLEEP_TIME;
|
2016-07-27 15:22:59 -04:00
|
|
|
|
2016-08-16 07:46:55 -04:00
|
|
|
{
|
|
|
|
RS_STACK_MUTEX(mHashMtx) ;
|
|
|
|
job = mFilesToHash.begin()->second ;
|
|
|
|
mFilesToHash.erase(mFilesToHash.begin()) ;
|
|
|
|
}
|
2016-07-27 15:22:59 -04:00
|
|
|
|
2016-07-27 18:48:28 -04:00
|
|
|
std::cerr << "Hashing file " << job.full_path << "..." ; std::cerr.flush();
|
2016-07-27 15:22:59 -04:00
|
|
|
|
2016-08-06 13:04:54 -04:00
|
|
|
std::string tmpout;
|
|
|
|
//rs_sprintf(tmpout, "%lu/%lu (%s - %d%%) : %s", cnt+1, n_files, friendlyUnit(size).c_str(), int(size/double(total_size)*100.0), fe.name.c_str()) ;
|
|
|
|
|
|
|
|
RsServer::notify()->notifyHashingInfo(NOTIFY_HASHTYPE_HASH_FILE, job.full_path) ;
|
2016-07-27 15:22:59 -04:00
|
|
|
|
2016-07-27 18:48:28 -04:00
|
|
|
if(!RsDirUtil::getFileHash(job.full_path, hash,size, this))
|
|
|
|
std::cerr << "ERROR: cannot hash file " << job.full_path << std::endl;
|
|
|
|
else
|
|
|
|
std::cerr << "done."<< std::endl;
|
2016-07-27 15:22:59 -04:00
|
|
|
|
2016-07-28 04:49:49 -04:00
|
|
|
// store the result
|
|
|
|
|
2016-09-02 16:08:27 -04:00
|
|
|
{
|
|
|
|
RS_STACK_MUTEX(mHashMtx) ;
|
|
|
|
HashStorageInfo& info(mFiles[job.full_path]);
|
2016-07-28 04:49:49 -04:00
|
|
|
|
2016-09-02 16:08:27 -04:00
|
|
|
info.filename = job.full_path ;
|
|
|
|
info.size = size ;
|
|
|
|
info.modf_stamp = job.ts ;
|
|
|
|
info.time_stamp = time(NULL);
|
|
|
|
info.hash = hash;
|
2016-09-02 15:49:43 -04:00
|
|
|
|
2016-09-02 16:08:27 -04:00
|
|
|
mChanged = true ;
|
|
|
|
}
|
2016-07-27 18:48:28 -04:00
|
|
|
}
|
2016-07-27 15:22:59 -04:00
|
|
|
// call the client
|
|
|
|
|
2016-07-27 18:48:28 -04:00
|
|
|
if(!hash.isNull())
|
|
|
|
job.client->hash_callback(job.client_param, job.full_path, hash, size);
|
2016-09-02 15:49:43 -04:00
|
|
|
|
2016-07-27 15:22:59 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
bool HashStorage::requestHash(const std::string& full_path,uint64_t size,time_t mod_time,RsFileHash& known_hash,HashStorageClient *c,uint32_t client_param)
|
|
|
|
{
|
|
|
|
// check if the hash is up to date w.r.t. cache.
|
|
|
|
|
2016-07-28 04:49:49 -04:00
|
|
|
#ifdef HASHSTORAGE_DEBUG
|
|
|
|
std::cerr << "HASH Requested for file " << full_path << ": ";
|
|
|
|
#endif
|
2016-07-27 15:22:59 -04:00
|
|
|
RS_STACK_MUTEX(mHashMtx) ;
|
|
|
|
|
|
|
|
time_t now = time(NULL) ;
|
|
|
|
std::map<std::string,HashStorageInfo>::iterator it = mFiles.find(full_path) ;
|
|
|
|
|
|
|
|
if(it != mFiles.end() && (uint64_t)mod_time == it->second.modf_stamp && size == it->second.size)
|
|
|
|
{
|
|
|
|
it->second.time_stamp = now ;
|
2016-07-28 04:49:49 -04:00
|
|
|
known_hash = it->second.hash;
|
|
|
|
#ifdef HASHSTORAGE_DEBUG
|
2016-07-27 15:22:59 -04:00
|
|
|
std::cerr << "Found in cache." << std::endl ;
|
|
|
|
#endif
|
|
|
|
return true ;
|
|
|
|
}
|
2016-07-28 04:49:49 -04:00
|
|
|
#ifdef HASHSTORAGE_DEBUG
|
2016-08-29 15:30:56 -04:00
|
|
|
std::cerr << "Not in cache. Scheduling for re-hash." << std::endl ;
|
2016-07-28 04:49:49 -04:00
|
|
|
#endif
|
2016-07-27 15:22:59 -04:00
|
|
|
|
|
|
|
// we need to schedule a re-hashing
|
|
|
|
|
|
|
|
if(mFilesToHash.find(full_path) != mFilesToHash.end())
|
|
|
|
return false ;
|
|
|
|
|
|
|
|
FileHashJob job ;
|
|
|
|
|
|
|
|
job.client = c ;
|
|
|
|
job.client_param = client_param ;
|
|
|
|
job.full_path = full_path ;
|
2016-07-28 04:49:49 -04:00
|
|
|
job.ts = mod_time ;
|
2016-07-27 15:22:59 -04:00
|
|
|
|
|
|
|
mFilesToHash[full_path] = job;
|
|
|
|
|
2016-07-27 18:48:28 -04:00
|
|
|
if(!mRunning)
|
2016-07-27 15:22:59 -04:00
|
|
|
{
|
2016-07-27 18:48:28 -04:00
|
|
|
mRunning = true ;
|
2016-07-27 15:22:59 -04:00
|
|
|
std::cerr << "Starting hashing thread." << std::endl;
|
|
|
|
start() ;
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
void HashStorage::clean()
|
|
|
|
{
|
2016-09-02 16:08:27 -04:00
|
|
|
RS_STACK_MUTEX(mHashMtx) ;
|
|
|
|
|
2016-07-27 15:22:59 -04:00
|
|
|
#ifdef HASHSTORAGE_DEBUG
|
|
|
|
std::cerr << "Cleaning HashStorage..." << std::endl ;
|
|
|
|
#endif
|
|
|
|
time_t now = time(NULL) ;
|
|
|
|
time_t duration = mMaxStorageDurationDays * 24 * 3600 ; // seconds
|
|
|
|
|
|
|
|
#ifdef HASHSTORAGE_DEBUG
|
|
|
|
std::cerr << "cleaning hash cache." << std::endl ;
|
|
|
|
#endif
|
|
|
|
|
|
|
|
for(std::map<std::string,HashStorageInfo>::iterator it(mFiles.begin());it!=mFiles.end();)
|
|
|
|
if(it->second.time_stamp + duration < (uint64_t)now)
|
|
|
|
{
|
|
|
|
#ifdef HASHSTORAGE_DEBUG
|
|
|
|
std::cerr << " Entry too old: " << it->first << ", ts=" << it->second.time_stamp << std::endl ;
|
|
|
|
#endif
|
|
|
|
std::map<std::string,HashStorageInfo>::iterator tmp(it) ;
|
|
|
|
++tmp ;
|
|
|
|
mFiles.erase(it) ;
|
|
|
|
it=tmp ;
|
|
|
|
mChanged = true ;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
++it ;
|
|
|
|
|
|
|
|
#ifdef HASHSTORAGE_DEBUG
|
|
|
|
std::cerr << "Done." << std::endl;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2016-09-02 15:49:43 -04:00
|
|
|
void HashStorage::locked_load()
|
2016-08-09 09:07:02 -04:00
|
|
|
{
|
|
|
|
uint64_t file_size ;
|
|
|
|
|
|
|
|
if(!RsDirUtil::checkFile( mFilePath,file_size,false ) )
|
|
|
|
{
|
|
|
|
std::cerr << "Encrypted hash cache file not present." << std::endl;
|
|
|
|
return ;
|
|
|
|
}
|
|
|
|
|
|
|
|
// read the binary stream into memory.
|
|
|
|
//
|
|
|
|
void *buffer = rs_malloc(file_size) ;
|
|
|
|
|
|
|
|
if(buffer == NULL)
|
|
|
|
return ;
|
|
|
|
|
|
|
|
FILE *F = fopen( mFilePath.c_str(),"rb") ;
|
|
|
|
if (!F)
|
|
|
|
{
|
|
|
|
std::cerr << "Cannot open file for reading encrypted file cache, filename " << mFilePath << std::endl;
|
|
|
|
free(buffer);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if(fread(buffer,1,file_size,F) != file_size)
|
|
|
|
{
|
|
|
|
std::cerr << "Cannot read from file " + mFilePath << ": something's wrong." << std::endl;
|
|
|
|
free(buffer) ;
|
|
|
|
fclose(F) ;
|
|
|
|
return ;
|
|
|
|
}
|
|
|
|
fclose(F) ;
|
|
|
|
|
|
|
|
// now decrypt
|
|
|
|
void *decrypted_data =NULL;
|
|
|
|
int decrypted_data_size =0;
|
|
|
|
|
|
|
|
if(!AuthSSL::getAuthSSL()->decrypt(decrypted_data, decrypted_data_size, buffer, file_size))
|
|
|
|
{
|
|
|
|
std::cerr << "Cannot decrypt encrypted file cache. Something's wrong." << std::endl;
|
|
|
|
free(buffer) ;
|
|
|
|
return ;
|
|
|
|
}
|
|
|
|
free(buffer) ;
|
|
|
|
|
|
|
|
#ifdef HASHSTORAGE_DEBUG
|
|
|
|
std::cerr << "Loading HashCache from file " << mFilePath << std::endl ;
|
|
|
|
int n=0 ;
|
|
|
|
#endif
|
|
|
|
unsigned char *data = (unsigned char*)decrypted_data ;
|
|
|
|
uint32_t offset = 0 ;
|
|
|
|
HashStorageInfo info ;
|
|
|
|
|
|
|
|
while(offset < decrypted_data_size)
|
|
|
|
if(readHashStorageInfo(data,decrypted_data_size,offset,info))
|
|
|
|
{
|
|
|
|
#ifdef HASHSTORAGE_DEBUG
|
|
|
|
std::cerr << info << std::endl;
|
|
|
|
++n ;
|
|
|
|
#endif
|
|
|
|
mFiles[info.filename] = info ;
|
|
|
|
}
|
|
|
|
|
|
|
|
free(decrypted_data) ;
|
|
|
|
#ifdef HASHSTORAGE_DEBUG
|
|
|
|
std::cerr << n << " entries loaded." << std::endl ;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2016-09-02 15:49:43 -04:00
|
|
|
void HashStorage::locked_save()
|
2016-08-09 09:07:02 -04:00
|
|
|
{
|
|
|
|
#ifdef HASHSTORAGE_DEBUG
|
|
|
|
std::cerr << "Saving Hash Cache to file " << mFilePath << "..." << std::endl ;
|
|
|
|
#endif
|
|
|
|
|
|
|
|
unsigned char *data = NULL ;
|
|
|
|
uint32_t offset = 0 ;
|
|
|
|
uint32_t total_size = 0;
|
|
|
|
|
|
|
|
for(std::map<std::string,HashStorageInfo>::const_iterator it(mFiles.begin());it!=mFiles.end();++it)
|
2016-08-12 09:20:23 -04:00
|
|
|
writeHashStorageInfo(data,total_size,offset,it->second) ;
|
2016-08-09 09:07:02 -04:00
|
|
|
|
|
|
|
void *encryptedData = NULL ;
|
|
|
|
int encDataLen = 0 ;
|
|
|
|
|
|
|
|
if(!AuthSSL::getAuthSSL()->encrypt( encryptedData, encDataLen, data,offset, AuthSSL::getAuthSSL()->OwnId()))
|
|
|
|
{
|
|
|
|
std::cerr << "Cannot encrypt hash cache. Something's wrong." << std::endl;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
FILE *F = fopen( (mFilePath+".tmp").c_str(),"wb" ) ;
|
|
|
|
|
|
|
|
if(!F)
|
|
|
|
{
|
|
|
|
std::cerr << "Cannot open encrypted file cache for writing: " << mFilePath+".tmp" << std::endl;
|
|
|
|
goto save_free;
|
|
|
|
}
|
|
|
|
if(fwrite(encryptedData,1,encDataLen,F) != (uint32_t)encDataLen)
|
|
|
|
{
|
|
|
|
std::cerr << "Could not write entire encrypted hash cache file. Out of disc space??" << std::endl;
|
|
|
|
fclose(F) ;
|
|
|
|
goto save_free;
|
|
|
|
}
|
|
|
|
|
|
|
|
fclose(F) ;
|
|
|
|
|
|
|
|
RsDirUtil::renameFile(mFilePath+".tmp",mFilePath) ;
|
|
|
|
#ifdef FIM_DEBUG
|
|
|
|
std::cerr << "done." << std::endl ;
|
|
|
|
#endif
|
2016-09-02 16:08:27 -04:00
|
|
|
std::cerr << mFiles.size() << " Entries saved." << std::endl;
|
2016-08-09 09:07:02 -04:00
|
|
|
|
|
|
|
save_free:
|
|
|
|
free(encryptedData);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool HashStorage::readHashStorageInfo(const unsigned char *data,uint32_t total_size,uint32_t& offset,HashStorageInfo& info) const
|
|
|
|
{
|
|
|
|
unsigned char *section_data = NULL ;
|
|
|
|
uint32_t section_size = 0;
|
2016-08-12 09:20:23 -04:00
|
|
|
uint32_t section_offset = 0;
|
2016-08-09 09:07:02 -04:00
|
|
|
|
2016-08-12 13:30:19 -04:00
|
|
|
// This way, the entire section is either read or skipped. That avoids the risk of being stuck somewhere in the middle
|
|
|
|
// of a section because of some unknown field, etc.
|
|
|
|
|
2016-08-09 09:07:02 -04:00
|
|
|
if(!FileListIO::readField(data,total_size,offset,FILE_LIST_IO_TAG_HASH_STORAGE_ENTRY,section_data,section_size))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if(!FileListIO::readField(section_data,section_size,section_offset,FILE_LIST_IO_TAG_FILE_NAME ,info.filename )) return false ;
|
|
|
|
if(!FileListIO::readField(section_data,section_size,section_offset,FILE_LIST_IO_TAG_FILE_SIZE ,info.size )) return false ;
|
|
|
|
if(!FileListIO::readField(section_data,section_size,section_offset,FILE_LIST_IO_TAG_UPDATE_TS ,info.time_stamp)) return false ;
|
|
|
|
if(!FileListIO::readField(section_data,section_size,section_offset,FILE_LIST_IO_TAG_MODIF_TS ,info.modf_stamp)) return false ;
|
|
|
|
if(!FileListIO::readField(section_data,section_size,section_offset,FILE_LIST_IO_TAG_FILE_SHA1_HASH,info.hash )) return false ;
|
|
|
|
|
|
|
|
free(section_data);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool HashStorage::writeHashStorageInfo(unsigned char *& data,uint32_t& total_size,uint32_t& offset,const HashStorageInfo& info) const
|
|
|
|
{
|
|
|
|
unsigned char *section_data = NULL ;
|
|
|
|
uint32_t section_offset = 0 ;
|
|
|
|
uint32_t section_size = 0;
|
|
|
|
|
|
|
|
if(!FileListIO::writeField(section_data,section_size,section_offset,FILE_LIST_IO_TAG_FILE_NAME ,info.filename )) return false ;
|
|
|
|
if(!FileListIO::writeField(section_data,section_size,section_offset,FILE_LIST_IO_TAG_FILE_SIZE ,info.size )) return false ;
|
|
|
|
if(!FileListIO::writeField(section_data,section_size,section_offset,FILE_LIST_IO_TAG_UPDATE_TS ,info.time_stamp)) return false ;
|
|
|
|
if(!FileListIO::writeField(section_data,section_size,section_offset,FILE_LIST_IO_TAG_MODIF_TS ,info.modf_stamp)) return false ;
|
|
|
|
if(!FileListIO::writeField(section_data,section_size,section_offset,FILE_LIST_IO_TAG_FILE_SHA1_HASH,info.hash )) return false ;
|
|
|
|
|
|
|
|
// now write the whole string into a single section in the file
|
|
|
|
|
|
|
|
if(!FileListIO::writeField(data,total_size,offset,FILE_LIST_IO_TAG_HASH_STORAGE_ENTRY,section_data,section_offset)) return false ;
|
|
|
|
|
|
|
|
free(section_data) ;
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
std::ostream& operator<<(std::ostream& o,const HashStorage::HashStorageInfo& info)
|
|
|
|
{
|
|
|
|
return o << info.hash << " " << info.size << " " << info.filename ;
|
|
|
|
}
|