main : allow empty --prompt-cache file (#5176)

author divinity76 <redacted>

Tue, 30 Jan 2024 09:18:02 +0000 (10:18 +0100)

committer GitHub <redacted>

Tue, 30 Jan 2024 09:18:02 +0000 (11:18 +0200)
author divinity76 <redacted>
Tue, 30 Jan 2024 09:18:02 +0000 (10:18 +0100)
committer GitHub <redacted>
Tue, 30 Jan 2024 09:18:02 +0000 (11:18 +0200)
diff --git a/examples/main/main.cpp b/examples/main/main.cpp

index 58b7f807a9ccaa856d0659f0dd972fb196b60128..1c6138d2364eaae595ea58791027b9e4f37b293d 100644 (file)
--- a/examples/main/main.cpp
+++ b/examples/main/main.cpp
@@ -39,6 +39,17 @@ static std::ostringstream       * g_output_ss;
  static std::vector<llama_token> * g_output_tokens;
  static bool is_interacting = false;
  
+static bool file_exists(const std::string &path) { // reports whether `path` can be opened for reading
+    std::ifstream f(path.c_str()); // attempt to open the file in the default (input) mode
+    return f.good(); // good() is false when the open failed, e.g. because the file is missing
+}
+
+static bool file_is_empty(const std::string &path) { // reports whether the file at `path` has a size of zero bytes
+    std::ifstream f; // constructed unopened so that exceptions can be enabled before open()
+    f.exceptions(std::ifstream::failbit | std::ifstream::badbit); // make stream failures throw std::ios_base::failure
+    f.open(path.c_str(), std::ios::in | std::ios::binary | std::ios::ate); // ios::ate seeks to the end on open; a failed open throws here
+    return f.tellg() == 0; // the read position at end-of-file is the file size, so 0 means empty
+}
  
  static void write_logfile(
      const llama_context * ctx, const gpt_params & params, const llama_model * model,
@@ -215,12 +226,12 @@ int main(int argc, char ** argv) {
  
      if (!path_session.empty()) {
          LOG_TEE("%s: attempting to load saved session from '%s'\n", __func__, path_session.c_str());
-
-        // fopen to check for existing session
-        FILE * fp = std::fopen(path_session.c_str(), "rb");
-        if (fp != NULL) {
-            std::fclose(fp);
-
+        if (!file_exists(path_session)) {
+            LOG_TEE("%s: session file does not exist, will create.\n", __func__);
+        } else if (file_is_empty(path_session)) {
+            LOG_TEE("%s: The session file is empty. A new session will be initialized.\n", __func__);
+        } else {
+            // The file exists and is not empty
              session_tokens.resize(n_ctx);
              size_t n_token_count_out = 0;
              if (!llama_load_session_file(ctx, path_session.c_str(), session_tokens.data(), session_tokens.capacity(), &n_token_count_out)) {
@@ -229,10 +240,7 @@ int main(int argc, char ** argv) {
              }
              session_tokens.resize(n_token_count_out);
              llama_set_rng_seed(ctx, params.seed);
-
-            LOG_TEE("%s: loaded a session with prompt size of %d tokens\n", __func__, (int) session_tokens.size());
-        } else {
-            LOG_TEE("%s: session file does not exist, will create\n", __func__);
+            LOG_TEE("%s: loaded a session with prompt size of %d tokens\n", __func__, (int)session_tokens.size());
          }
      }
author	divinity76 <redacted>
	Tue, 30 Jan 2024 09:18:02 +0000 (10:18 +0100)
committer	GitHub <redacted>
	Tue, 30 Jan 2024 09:18:02 +0000 (11:18 +0200)