| from huggingface_hub import snapshot_download | |
| import json | |
| import os | |
# Identifier of the model repository passed to snapshot_download().
REPO_ID = "mosaicml/mosaic-bert-base-seqlen-2048"

# Local directory the snapshot is downloaded into; the config.json that gets
# patched afterwards is looked up inside this directory.
MODEL_DIRECTORY = "mosaic-bert-base-seqlen-2048"
def main():
    """Download the model snapshot and patch its ``config.json`` in place.

    Downloads ``REPO_ID`` into ``MODEL_DIRECTORY`` via ``snapshot_download``,
    then loads ``config.json`` from that directory, overrides a fixed set of
    fields, and writes the result back to the same path.

    Raises:
        FileNotFoundError: if the downloaded snapshot has no ``config.json``.
        json.JSONDecodeError: if ``config.json`` is not valid JSON.

    Any exception raised by ``snapshot_download`` propagates unchanged.
    """
    snapshot_download(repo_id=REPO_ID, local_dir=MODEL_DIRECTORY)

    # modify the model's config.json file to satisfy our requirements
    config_file_path = os.path.join(MODEL_DIRECTORY, 'config.json')

    # Read with an explicit encoding (JSON is UTF-8) and close the handle
    # deterministically instead of relying on garbage collection.
    with open(config_file_path, encoding='utf-8') as config_file:
        contents = json.load(config_file)

    contents['architectures'] = ['BertModel']
    # Create the 'auto_map' section when the config lacks one, so setting the
    # AutoModel entry cannot fail with a KeyError.
    contents.setdefault('auto_map', {})['AutoModel'] = 'bert_layers.BertModel'
    contents['torch_dtype'] = 'bfloat16'
    contents['transformers_version'] = '4.28.1'
    contents['_name_or_path'] = 'mosaic-bert-base-seqlen-2048'

    # The context manager guarantees the patched config is flushed and the
    # file closed before main() returns.
    with open(config_file_path, 'w', encoding='utf-8') as config_file:
        json.dump(contents, config_file, ensure_ascii=True)
# Script entry point: run the download-and-patch step only when this file is
# executed directly, not when it is imported as a module.
if __name__ == '__main__':
    main()