2023-05-31 17:04:01 -04:00
# ifndef GPTJ_H_I_KNOW_WHAT_I_AM_DOING_WHEN_INCLUDING_THIS_FILE
# error This file is NOT meant to be included outside of gptj.cpp. Doing so is DANGEROUS. Be sure to know what you are doing before proceeding to #define GPTJ_H_I_KNOW_WHAT_I_AM_DOING_WHEN_INCLUDING_THIS_FILE
# endif
2023-04-08 23:28:39 -04:00
# ifndef GPTJ_H
# define GPTJ_H
2024-05-31 16:34:54 -04:00
# include "llmodel.h"
2023-04-08 23:28:39 -04:00
# include <functional>
2024-05-31 16:34:54 -04:00
# include <string>
2023-04-10 15:04:40 -04:00
# include <vector>
2023-04-08 23:28:39 -04:00
2023-05-31 17:04:01 -04:00
struct GPTJPrivate ;
2023-04-13 22:15:40 -04:00
class GPTJ : public LLModel {
2023-04-08 23:28:39 -04:00
public :
GPTJ ( ) ;
~ GPTJ ( ) ;
2023-07-09 11:32:51 -04:00
bool supportsEmbedding ( ) const override { return false ; }
bool supportsCompletion ( ) const override { return true ; }
2024-01-31 14:17:44 -05:00
bool loadModel ( const std : : string & modelPath , int n_ctx , int ngl ) override ;
2023-04-13 22:15:40 -04:00
bool isModelLoaded ( ) const override ;
2024-01-31 14:17:44 -05:00
size_t requiredMem ( const std : : string & modelPath , int n_ctx , int ngl ) override ;
2023-05-05 10:00:05 -04:00
size_t stateSize ( ) const override ;
size_t saveState ( uint8_t * dest ) const override ;
size_t restoreState ( const uint8_t * src ) override ;
2023-04-18 09:46:03 -04:00
void setThreadCount ( int32_t n_threads ) override ;
2023-05-21 16:45:29 -04:00
int32_t threadCount ( ) const override ;
2023-04-08 23:28:39 -04:00
private :
GPTJPrivate * d_ptr ;
2023-06-04 08:59:24 -04:00
protected :
2024-02-21 15:45:32 -05:00
std : : vector < Token > tokenize ( PromptContext & ctx , const std : : string & str , bool special ) const override ;
2023-06-04 08:59:24 -04:00
Token sampleToken ( PromptContext & ctx ) const override ;
2024-02-21 15:45:32 -05:00
std : : string tokenToString ( Token id ) const override ;
2023-06-04 08:59:24 -04:00
bool evalTokens ( PromptContext & ctx , const std : : vector < int32_t > & tokens ) const override ;
int32_t contextLength ( ) const override ;
2024-02-21 15:45:32 -05:00
const std : : vector < Token > & endTokens ( ) const override ;
bool shouldAddBOS ( ) const override { return false ; }
2023-04-08 23:28:39 -04:00
} ;
2023-04-18 09:46:03 -04:00
# endif // GPTJ_H