Skip to content

Commit a6367a8

Browse files
committed
Skip config.json when loading tokenizers
1 parent 46cd5ab commit a6367a8

File tree

2 files changed

+10
-6
lines changed

2 files changed

+10
-6
lines changed

Sources/Hub/Hub.swift

Lines changed: 8 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -80,7 +80,8 @@ public final class LanguageModelConfigurationFromHub: Sendable {
8080
public init(
8181
modelName: String,
8282
revision: String = "main",
83-
hubApi: HubApi = .shared
83+
hubApi: HubApi = .shared,
84+
skipModelConfig: Bool = false
8485
) {
8586
configPromise = Task.init {
8687
try await Self.loadConfig(modelName: modelName, revision: revision, hubApi: hubApi)
@@ -89,7 +90,8 @@ public final class LanguageModelConfigurationFromHub: Sendable {
8990

9091
public init(
9192
modelFolder: URL,
92-
hubApi: HubApi = .shared
93+
hubApi: HubApi = .shared,
94+
skipModelConfig: Bool = false
9395
) {
9496
configPromise = Task {
9597
try await Self.loadConfig(modelFolder: modelFolder, hubApi: hubApi)
@@ -142,9 +144,11 @@ public final class LanguageModelConfigurationFromHub: Sendable {
142144
static func loadConfig(
143145
modelName: String,
144146
revision: String,
145-
hubApi: HubApi = .shared
147+
hubApi: HubApi = .shared,
148+
skipModelConfig: Bool = false,
146149
) async throws -> Configurations {
147-
let filesToDownload = ["config.json", "tokenizer_config.json", "chat_template.jinja", "chat_template.json", "tokenizer.json"]
150+
let modelConfig = skipModelConfig ? [] : ["config.json"]
151+
let filesToDownload = modelConfig + ["tokenizer_config.json", "chat_template.jinja", "chat_template.json", "tokenizer.json"]
148152
let repo = Hub.Repo(id: modelName)
149153

150154
do {

Sources/Tokenizers/Tokenizer.swift

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -630,7 +630,7 @@ public extension AutoTokenizer {
630630
hubApi: HubApi = .shared,
631631
strict: Bool = true
632632
) async throws -> Tokenizer {
633-
let config = LanguageModelConfigurationFromHub(modelName: model, hubApi: hubApi)
633+
let config = LanguageModelConfigurationFromHub(modelName: model, hubApi: hubApi, skipModelConfig: true)
634634
guard let tokenizerConfig = try await config.tokenizerConfig else { throw TokenizerError.missingConfig }
635635
let tokenizerData = try await config.tokenizerData
636636

@@ -642,7 +642,7 @@ public extension AutoTokenizer {
642642
hubApi: HubApi = .shared,
643643
strict: Bool = true
644644
) async throws -> Tokenizer {
645-
let config = LanguageModelConfigurationFromHub(modelFolder: modelFolder, hubApi: hubApi)
645+
let config = LanguageModelConfigurationFromHub(modelFolder: modelFolder, hubApi: hubApi, skipModelConfig: true)
646646
guard let tokenizerConfig = try await config.tokenizerConfig else { throw TokenizerError.missingConfig }
647647
let tokenizerData = try await config.tokenizerData
648648

0 commit comments

Comments (0)