mirror of
https://github.com/oobabooga/text-generation-webui.git
synced 2024-11-25 09:19:23 +01:00
Read rope_theta for DBRX model (thanks turboderp)
This commit is contained in:
parent
db5f6cd1d8
commit
9ab7365b56
@@ -84,6 +84,8 @@ def get_model_metadata(model):
|
|||||||
|
|
||||||
if 'rope_theta' in metadata:
|
if 'rope_theta' in metadata:
|
||||||
model_settings['rope_freq_base'] = metadata['rope_theta']
|
model_settings['rope_freq_base'] = metadata['rope_theta']
|
||||||
|
elif 'attn_config' in metadata and 'rope_theta' in metadata['attn_config']:
|
||||||
|
model_settings['rope_freq_base'] = metadata['attn_config']['rope_theta']
|
||||||
|
|
||||||
if 'rope_scaling' in metadata and type(metadata['rope_scaling']) is dict and all(key in metadata['rope_scaling'] for key in ('type', 'factor')):
|
if 'rope_scaling' in metadata and type(metadata['rope_scaling']) is dict and all(key in metadata['rope_scaling'] for key in ('type', 'factor')):
|
||||||
if metadata['rope_scaling']['type'] == 'linear':
|
if metadata['rope_scaling']['type'] == 'linear':
|
||||||
|
Loading…
Reference in New Issue
Block a user