ggml-org
diff --git a/‎examples/gguf-hash/gguf-hash.cpp
Lines changed: 60 additions & 2 deletions b/‎examples/gguf-hash/gguf-hash.cpp
Lines changed: 60 additions & 2 deletions
diff --git a/‎ggml/include/ggml-rpc.h
Lines changed: 8 additions & 2 deletions b/‎ggml/include/ggml-rpc.h
Lines changed: 8 additions & 2 deletions
@@ -55,6 +55,7 @@ typedef enum {
 
 struct hash_params {
     std::string input;
+    bool fnv = false;
     bool xxh64 = false;
     bool sha1 = false;
     bool sha256 = false;
@@ -103,6 +104,7 @@ static void hash_print_usage(const char * executable) {
     printf("\n");
     printf("options:\n");
     printf("  -h, --help              show this help message and exit\n");
+    printf("      --fnv               use FNV-1a hash\n");
     printf("      --xxh64             use xxh64 hash\n");
     printf("      --sha1              use sha1 hash\n");
     printf("      --sha256            use sha256 hash\n");
@@ -131,6 +133,11 @@ static void hash_params_parse_ex(int argc, const char ** argv, hash_params & par
             exit(0);
         }
 
+        if (arg == "--fnv") {
+            arg_found = true;
+            params.fnv = true;
+        }
+
         if (arg == "--xxh64") {
             arg_found = true;
             params.xxh64 = true;
@@ -188,6 +195,26 @@ static void hash_params_parse_ex(int argc, const char ** argv, hash_params & par
     params.input = argv[arg_idx++];
 }
 
+struct fnv_ctx { // running state of the streaming 64-bit FNV-1a hash selected by --fnv
+    uint64_t hash; // current hash value: seeded by fnv_init, folded by fnv_update, read by fnv_final
+};
+
+// Put ctx into its starting state by storing the 64-bit seed constant.
+// Must run before the first fnv_update() on a context.
+static void fnv_init(fnv_ctx * ctx) {
+    const uint64_t fnv_seed = 0xcbf29ce484222325ULL;
+    ctx->hash = fnv_seed;
+}
+
+// Fold `len` bytes starting at `data` into the running hash held in ctx.
+// Each byte is XORed into the hash first and the result is then multiplied
+// by the prime (the XOR-then-multiply order of FNV-1a). A zero `len` leaves
+// ctx untouched and never dereferences `data`.
+static void fnv_update(fnv_ctx * ctx, const uint8_t * data, size_t len) {
+    const uint64_t prime = 0x100000001b3ULL;
+    const uint8_t * cursor = data;
+    // Count down instead of indexing; the hash is written back on every byte.
+    for (size_t remaining = len; remaining != 0; --remaining, ++cursor) {
+        ctx->hash = (ctx->hash ^ *cursor) * prime;
+    }
+}
+
+// Hand the accumulated hash back through `digest`.
+// ctx is only read, so it still holds the same value afterwards.
+static void fnv_final(fnv_ctx * ctx, uint64_t * digest) {
+    const uint64_t result = ctx->hash;
+    *digest = result;
+}
+
 static bool hash_params_parse(int argc, const char ** argv, hash_params & params) {
     bool result = true;
     try {
@@ -306,6 +333,12 @@ static hash_exit_code_t gguf_hash(const hash_params & hash_params) {
         }
     }
 
+    // FNV init
+    fnv_ctx fnv_model_hash_ctx;
+    if (hash_params.fnv) {
+        fnv_init(&fnv_model_hash_ctx);
+    }
+
     // sha1 init
     SHA1_CTX sha1_model_hash_ctx;
     if (hash_params.sha1) {
@@ -326,7 +359,11 @@ static hash_exit_code_t gguf_hash(const hash_params & hash_params) {
         SHA1Update( &sha1_for_uuid_ctx, (unsigned char const *)uuidv5_namespace, sizeof(uuidv5_namespace));
     }
 
+    struct gguf_context * ctx_out = gguf_init_empty();
     struct gguf_context * ctx = gguf_init_from_file(fname.c_str(), params);
+
+    gguf_set_kv(ctx_out, ctx);
+
     const int n_tensors = gguf_get_n_tensors(ctx);
     bool tensor_layer_in_manifest = false;
     bool model_in_manifest = false;
@@ -335,10 +372,16 @@ static hash_exit_code_t gguf_hash(const hash_params & hash_params) {
     for (int i = 0; i < n_tensors; ++i) {
         const char * name = gguf_get_tensor_name(ctx, i);
         struct ggml_tensor * cur = ggml_get_tensor(ctx_data, name);
+        gguf_add_tensor(ctx_out, cur);
         auto n_bytes = ggml_nbytes(cur);
         auto *raw_data = cur->data;
         const std::string tensor_layer_name = fname + ":" + name;
 
+        if (hash_params.fnv) {
+            // Overall Model Hash
+            fnv_update(&fnv_model_hash_ctx, (const uint8_t *)raw_data, n_bytes);
+        }
+
         if (hash_params.xxh64) {
 
             if (!hash_params.no_layer) {
@@ -455,6 +498,18 @@ static hash_exit_code_t gguf_hash(const hash_params & hash_params) {
         }
     }
 
+    if (hash_params.fnv) {
+        uint64_t hash;
+        fnv_final(&fnv_model_hash_ctx, &hash);
+        char hex_result[17];
+        for (int  offset = 0; offset < 8; offset++) {
+            unsigned int shift_bits_by = (8 * (8 - offset - 1));
+            snprintf( ( hex_result + (2*offset)), sizeof(hex_result) - (2*offset), "%02x", (unsigned char) (hash >> shift_bits_by)&0xff);
+        }
+        printf("%-8s  %-s  %s\n", "fnv", hex_result, fname.c_str());
+        gguf_set_val_u64(ctx_out, "model_hash", hash);
+    }
+
     if (hash_params.xxh64) {
         XXH64_hash_t const hash = XXH64_digest(xxh64_model_hash_state);
 
@@ -580,6 +635,9 @@ static hash_exit_code_t gguf_hash(const hash_params & hash_params) {
         }
     }
 
+    auto fname_out = fname + ".rpc";
+    gguf_write_to_file(ctx_out, fname_out.c_str(), false);
+    gguf_free(ctx_out);
 
     ggml_free(ctx_data);
     gguf_free(ctx);
@@ -663,7 +721,7 @@ int main(int argc, const char ** argv) {
 
         // Autoselect the highest security hash if manifest is provided but
         // the user has not specifically defined the hash they care about
-        if (!params.xxh64 && !params.sha1 && !params.uuid && !params.sha256) {
+        if (!params.fnv && !params.xxh64 && !params.sha1 && !params.uuid && !params.sha256) {
             // User has not selected a specific value, pick most secure hash
             if (manifest_check.sha256) {
                 params.sha256 = true;
@@ -680,7 +738,7 @@ int main(int argc, const char ** argv) {
     }
 
     // By default if no swich argument provided, assume xxh64
-    if (!params.xxh64 && !params.sha1 && !params.uuid && !params.sha256) {
+    if (!params.fnv && !params.xxh64 && !params.sha1 && !params.uuid && !params.sha256) {
         params.xxh64 = true;
     }
 
 
@@ -8,7 +8,7 @@ extern "C" {
 #endif
 
 #define RPC_PROTO_MAJOR_VERSION    2
-#define RPC_PROTO_MINOR_VERSION    0
+#define RPC_PROTO_MINOR_VERSION    1
 #define RPC_PROTO_PATCH_VERSION    0
 #define GGML_RPC_MAX_SERVERS       16
 
@@ -21,12 +21,18 @@ GGML_BACKEND_API ggml_backend_buffer_type_t ggml_backend_rpc_buffer_type(const c
 GGML_BACKEND_API void ggml_backend_rpc_get_device_memory(const char * endpoint, size_t * free, size_t * total);
 
 GGML_BACKEND_API void ggml_backend_rpc_start_server(ggml_backend_t backend, const char * endpoint,
-                                                    const char * cache_dir,
+                                                    const char * model_file, const char * cache_dir,
                                                     size_t free_mem, size_t total_mem);
 
 GGML_BACKEND_API ggml_backend_reg_t ggml_backend_rpc_reg(void);
 
 GGML_BACKEND_API ggml_backend_dev_t ggml_backend_rpc_add_device(const char * endpoint);
+// Load tensor data from a file into a tensor that lives in `buffer`.
+// NOTE(review): the implementation is not visible from this header; the
+// parameter descriptions below are inferred from the names - confirm them.
+//   buffer        - buffer that owns `tensor` (presumably an RPC buffer)
+//   tensor        - destination tensor
+//   path          - path of the file to read from
+//   file_offset   - presumably the byte offset in the file where reading starts
+//   tensor_offset - presumably the byte offset inside the tensor data to write at
+//   size          - presumably the number of bytes to load
+// Returns a bool; presumably true on success - confirm against the definition.
+// The tensor type is spelled `struct ggml_tensor` so that this prototype also
+// compiles when the header is included from C (it sits inside extern "C").
+GGML_BACKEND_API bool ggml_backend_rpc_buffer_load_tensor(ggml_backend_buffer_t buffer,
+                                                          struct ggml_tensor * tensor,
+                                                          const char * path,
+                                                          size_t file_offset,
+                                                          size_t tensor_offset,
+                                                          size_t size);
 
 #ifdef  __cplusplus
 }