mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-25 19:08:44 +01:00
metal : support default.metallib load & reuse code for swift package (#3522)
* metal : support load default.metallib & reuse code for swift package * metal : use SWIFT_PACKAGE def instead of define GGML_SWIFT
This commit is contained in:
parent
0e797c2fc5
commit
c26765a0a1
1
.gitignore
vendored
1
.gitignore
vendored
@ -10,6 +10,7 @@
|
|||||||
*.gcno
|
*.gcno
|
||||||
*.gcda
|
*.gcda
|
||||||
*.dot
|
*.dot
|
||||||
|
*.metallib
|
||||||
.DS_Store
|
.DS_Store
|
||||||
.build/
|
.build/
|
||||||
.cache/
|
.cache/
|
||||||
|
@ -10,15 +10,18 @@ let platforms: [SupportedPlatform]? = [
|
|||||||
.tvOS(.v14)
|
.tvOS(.v14)
|
||||||
]
|
]
|
||||||
let exclude: [String] = []
|
let exclude: [String] = []
|
||||||
let additionalSources: [String] = ["ggml-metal.m", "ggml-metal.metal"]
|
let resources: [Resource] = [
|
||||||
|
.process("ggml-metal.metal")
|
||||||
|
]
|
||||||
|
let additionalSources: [String] = ["ggml-metal.m"]
|
||||||
let additionalSettings: [CSetting] = [
|
let additionalSettings: [CSetting] = [
|
||||||
.unsafeFlags(["-fno-objc-arc"]),
|
.unsafeFlags(["-fno-objc-arc"]),
|
||||||
.define("GGML_SWIFT"),
|
|
||||||
.define("GGML_USE_METAL")
|
.define("GGML_USE_METAL")
|
||||||
]
|
]
|
||||||
#else
|
#else
|
||||||
let platforms: [SupportedPlatform]? = nil
|
let platforms: [SupportedPlatform]? = nil
|
||||||
let exclude: [String] = ["ggml-metal.metal"]
|
let exclude: [String] = ["ggml-metal.metal"]
|
||||||
|
let resources: [Resource] = []
|
||||||
let additionalSources: [String] = []
|
let additionalSources: [String] = []
|
||||||
let additionalSettings: [CSetting] = []
|
let additionalSettings: [CSetting] = []
|
||||||
#endif
|
#endif
|
||||||
@ -40,6 +43,7 @@ let package = Package(
|
|||||||
"ggml-alloc.c",
|
"ggml-alloc.c",
|
||||||
"k_quants.c",
|
"k_quants.c",
|
||||||
] + additionalSources,
|
] + additionalSources,
|
||||||
|
resources: resources,
|
||||||
publicHeadersPath: "spm-headers",
|
publicHeadersPath: "spm-headers",
|
||||||
cSettings: [
|
cSettings: [
|
||||||
.unsafeFlags(["-Wno-shorten-64-to-32"]),
|
.unsafeFlags(["-Wno-shorten-64-to-32"]),
|
||||||
|
66
ggml-metal.m
66
ggml-metal.m
@ -185,56 +185,44 @@ struct ggml_metal_context * ggml_metal_init(int n_cb) {
|
|||||||
|
|
||||||
ctx->d_queue = dispatch_queue_create("ggml-metal", DISPATCH_QUEUE_CONCURRENT);
|
ctx->d_queue = dispatch_queue_create("ggml-metal", DISPATCH_QUEUE_CONCURRENT);
|
||||||
|
|
||||||
#ifdef GGML_SWIFT
|
// load library
|
||||||
// load the default.metallib file
|
|
||||||
{
|
{
|
||||||
NSError * error = nil;
|
NSBundle * bundle = nil;
|
||||||
|
#ifdef SWIFT_PACKAGE
|
||||||
NSBundle * bundle = [NSBundle bundleForClass:[GGMLMetalClass class]];
|
bundle = SWIFTPM_MODULE_BUNDLE;
|
||||||
NSString * llamaBundlePath = [bundle pathForResource:@"llama_llama" ofType:@"bundle"];
|
|
||||||
NSBundle * llamaBundle = [NSBundle bundleWithPath:llamaBundlePath];
|
|
||||||
NSString * libPath = [llamaBundle pathForResource:@"default" ofType:@"metallib"];
|
|
||||||
NSURL * libURL = [NSURL fileURLWithPath:libPath];
|
|
||||||
|
|
||||||
// Load the metallib file into a Metal library
|
|
||||||
ctx->library = [ctx->device newLibraryWithURL:libURL error:&error];
|
|
||||||
|
|
||||||
if (error) {
|
|
||||||
GGML_METAL_LOG_ERROR("%s: error: %s\n", __func__, [[error description] UTF8String]);
|
|
||||||
return NULL;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
#else
|
#else
|
||||||
UNUSED(msl_library_source);
|
bundle = [NSBundle bundleForClass:[GGMLMetalClass class]];
|
||||||
|
#endif
|
||||||
// read the source from "ggml-metal.metal" into a string and use newLibraryWithSource
|
|
||||||
{
|
|
||||||
NSError * error = nil;
|
NSError * error = nil;
|
||||||
|
NSString * libPath = [bundle pathForResource:@"default" ofType:@"metallib"];
|
||||||
|
if (libPath != nil) {
|
||||||
|
NSURL * libURL = [NSURL fileURLWithPath:libPath];
|
||||||
|
GGML_METAL_LOG_INFO("%s: loading '%s'\n", __func__, [libPath UTF8String]);
|
||||||
|
ctx->library = [ctx->device newLibraryWithURL:libURL error:&error];
|
||||||
|
} else {
|
||||||
|
GGML_METAL_LOG_INFO("%s: default.metallib not found, loading from source\n", __func__);
|
||||||
|
|
||||||
//NSString * path = [[NSBundle mainBundle] pathForResource:@"../../examples/metal/metal" ofType:@"metal"];
|
NSString * sourcePath = [bundle pathForResource:@"ggml-metal" ofType:@"metal"];
|
||||||
NSBundle * bundle = [NSBundle bundleForClass:[GGMLMetalClass class]];
|
GGML_METAL_LOG_INFO("%s: loading '%s'\n", __func__, [sourcePath UTF8String]);
|
||||||
NSString * path = [bundle pathForResource:@"ggml-metal" ofType:@"metal"];
|
NSString * src = [NSString stringWithContentsOfFile:sourcePath encoding:NSUTF8StringEncoding error:&error];
|
||||||
GGML_METAL_LOG_INFO("%s: loading '%s'\n", __func__, [path UTF8String]);
|
if (error) {
|
||||||
|
GGML_METAL_LOG_ERROR("%s: error: %s\n", __func__, [[error description] UTF8String]);
|
||||||
NSString * src = [NSString stringWithContentsOfFile:path encoding:NSUTF8StringEncoding error:&error];
|
return NULL;
|
||||||
if (error) {
|
}
|
||||||
GGML_METAL_LOG_ERROR("%s: error: %s\n", __func__, [[error description] UTF8String]);
|
|
||||||
return NULL;
|
|
||||||
}
|
|
||||||
|
|
||||||
|
MTLCompileOptions* options = nil;
|
||||||
#ifdef GGML_QKK_64
|
#ifdef GGML_QKK_64
|
||||||
MTLCompileOptions* options = [MTLCompileOptions new];
|
options = [MTLCompileOptions new];
|
||||||
options.preprocessorMacros = @{ @"QK_K" : @(64) };
|
options.preprocessorMacros = @{ @"QK_K" : @(64) };
|
||||||
ctx->library = [ctx->device newLibraryWithSource:src options:options error:&error];
|
|
||||||
#else
|
|
||||||
ctx->library = [ctx->device newLibraryWithSource:src options:nil error:&error];
|
|
||||||
#endif
|
#endif
|
||||||
|
ctx->library = [ctx->device newLibraryWithSource:src options:options error:&error];
|
||||||
|
}
|
||||||
|
|
||||||
if (error) {
|
if (error) {
|
||||||
GGML_METAL_LOG_ERROR("%s: error: %s\n", __func__, [[error description] UTF8String]);
|
GGML_METAL_LOG_ERROR("%s: error: %s\n", __func__, [[error description] UTF8String]);
|
||||||
return NULL;
|
return NULL;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
#endif
|
|
||||||
|
|
||||||
// load kernels
|
// load kernels
|
||||||
{
|
{
|
||||||
@ -437,7 +425,7 @@ static id<MTLBuffer> ggml_metal_get_buffer(struct ggml_metal_context * ctx, stru
|
|||||||
for (int i = 0; i < ctx->n_buffers; ++i) {
|
for (int i = 0; i < ctx->n_buffers; ++i) {
|
||||||
const int64_t ioffs = (int64_t) t->data - (int64_t) ctx->buffers[i].data;
|
const int64_t ioffs = (int64_t) t->data - (int64_t) ctx->buffers[i].data;
|
||||||
|
|
||||||
//metal_printf("ioffs = %10ld, tsize = %10ld, sum = %10ld, ctx->buffers[%d].size = %10ld, name = %s\n", ioffs, tsize, ioffs + tsize, i, ctx->buffers[i].size, ctx->buffers[i].name);
|
//GGML_METAL_LOG_INFO("ioffs = %10ld, tsize = %10ld, sum = %10ld, ctx->buffers[%d].size = %10ld, name = %s\n", ioffs, tsize, ioffs + tsize, i, ctx->buffers[i].size, ctx->buffers[i].name);
|
||||||
if (ioffs >= 0 && ioffs + tsize <= (int64_t) ctx->buffers[i].size) {
|
if (ioffs >= 0 && ioffs + tsize <= (int64_t) ctx->buffers[i].size) {
|
||||||
*offs = (size_t) ioffs;
|
*offs = (size_t) ioffs;
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user