You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
parser.add_argument('--eps', default='5.0e-06', help='RMS norm eps (use 1e-5 for LLaMA2)')
231
-
parser.add_argument('--context-length', '-c', type=int, default=2048, help='Default max context length')
230
+
parser.add_argument('--eps', default='5.0e-06', help='RMS norm eps: Use 1e-6 for LLaMA1 and OpenLLaMA, use 1e-5 for LLaMA2')
231
+
parser.add_argument('--context-length', '-c', type=int, default=2048, help='Default max context length: LLaMA1 is typically 2048, LLaMA2 is typically 4096')
232
232
returnparser.parse_args()
233
233
234
234
def main():
    """Run the GGML-to-GGUF conversion from the command line.

    Reads the run configuration from ``handle_args()``, memory-maps the
    input file named by ``cfg.input``, scans it with ``GGMLV3Model``,
    and hands the loaded model to ``GGMLToGGUF`` to write the result.
    Progress and a best-effort warning are printed to stdout.
    """
    cfg = handle_args()
    print(f'* Using config: {cfg}')
    print('\n=== WARNING === Be aware that this conversion script is best-effort. Special tokens may not be converted correctly. Use a native GGUF model if possible. === WARNING ===\n')

    # Map the input read-only instead of reading it into memory up front.
    data = np.memmap(cfg.input, mode='r')

    model = GGMLV3Model()
    print('* Scanning GGML input file')
    # Start scanning at offset 0. The returned value is kept under the
    # original name although nothing in the visible part of this function
    # reads it afterwards.
    offset = model.load(data, 0)
    print(f'* GGML model hyperparameters: {model.hyperparameters}')

    converter = GGMLToGGUF(model, data, cfg)
    converter.save()
    print(f'* Successful completion. Output saved to: {cfg.output}')
0 commit comments