# InternLM/tools/convert2llama.py

# Copyright (c) InternLM. All rights reserved.
import argparse
import json
import os

import torch
from einops import rearrange
from tqdm import tqdm
from transformers import AutoConfig, LlamaConfig, LlamaTokenizer


def weight_load(fp, **kwargs):
    """Load the weights stored in a checkpoint file.

    Args:
        fp: Path of the weight file to read.
        **kwargs: ``is_safetensors`` (bool, default ``False``) selects the
            reader and is consumed here. All remaining keywords are
            forwarded to ``torch.load``; they are not used when reading a
            safetensors file.

    Returns:
        For safetensors files, a dict mapping every key in the file to its
        tensor. Otherwise, whatever ``torch.load`` returns for ``fp``.

    Raises:
        ImportError: If ``is_safetensors`` is true but the ``safetensors``
            package is not installed.
    """
    is_safetensors = kwargs.pop('is_safetensors', False)

    if not is_safetensors:
        # NOTE(review): depending on the torch version / `weights_only`
        # setting, torch.load may unpickle arbitrary objects -- only point
        # this at checkpoints you trust.
        return torch.load(fp, **kwargs)

    try:
        from safetensors import safe_open
    except ImportError as err:
        raise ImportError(
            'Before loading ckpts in the `safetensors` format, '
            'please install the `safetensors` package first.') from err

    # Use the handle as a context manager so the underlying file is released
    # as soon as every tensor has been read out of it.
    with safe_open(fp, framework='pt') as model:
        return {k: model.get_tensor(k) for k in model.keys()}


def save_conifg(config, tgt):
    """Write a ``LlamaConfig`` derived from ``config`` into ``tgt``.

    The source config is dumped to a dict, a fixed set of keys is dropped,
    ``bias`` is re-exposed as ``attention_bias`` and ``architectures`` is set
    to ``['LlamaForCausalLM']`` before the result is saved.

    Args:
        config: Source config object; must provide ``to_dict()`` and contain
            a ``bias`` entry.
        tgt: Output folder handed to ``save_pretrained``.
    """
    llama_kwargs = config.to_dict()

    # Keys that are removed before building the Llama config.
    for stale_key in (
            '_name_or_path',
            'auto_map',
            'transformers_version',
            'model_type',
            'architectures',
            'tokenizer_class',
            'attn_implementation',
    ):
        llama_kwargs.pop(stale_key, None)

    llama_kwargs.update(
        attention_bias=llama_kwargs.pop('bias'),
        architectures=['LlamaForCausalLM'],
    )
    LlamaConfig(**llama_kwargs).save_pretrained(tgt)


# Shard-index files that are probed (in this order), each paired with the
# suffix of the weight files it describes.
_INDEX_FILES = (
    ('pytorch_model.bin.index.json', '.bin'),
    ('model.safetensors.index.json', '.safetensors'),
)

# Substring renames applied to state-dict keys; the first match wins.
_KEY_RENAMES = (
    ('attention.wo', 'self_attn.o_proj'),
    ('feed_forward.w1', 'mlp.gate_proj'),
    ('feed_forward.w2', 'mlp.down_proj'),
    ('feed_forward.w3', 'mlp.up_proj'),
    ('attention_norm', 'input_layernorm'),
    ('ffn_norm', 'post_attention_layernorm'),
)


def _load_index(src):
    """Load the first shard index found in ``src`` with an emptied weight map.

    Returns:
        ``(index_file, index_dict, weight_suffix)``, or
        ``(None, None, None)`` when ``src`` contains no index file.
    """
    for index_file, weight_suffix in _INDEX_FILES:
        index_path = os.path.join(src, index_file)
        if not os.path.exists(index_path):
            continue
        with open(index_path, encoding='utf-8') as fp:
            index_dict = json.load(fp)
        # The map is rebuilt from the converted shards, whose keys differ.
        index_dict['weight_map'] = {}
        return index_file, index_dict, weight_suffix
    return None, None, None


def _to_llama_states(states, head_dim, num_key_value_groups):
    """Return a new state dict with keys (and fused QKV) in Llama layout."""
    llama_states = {}
    for k, v in states.items():
        if 'wqkv' in k:
            # View the fused rows as (h, slot, head_dim): every `h` group
            # (presumably one per KV head) holds `num_key_value_groups`
            # query slots followed by one key slot and one value slot.
            v = rearrange(
                v,
                '(h gs d) dim -> h gs d dim',
                gs=2 + num_key_value_groups,
                d=head_dim,
            )
            wq, wk, wv = torch.split(v, [num_key_value_groups, 1, 1], dim=1)
            _prefix = k.split('attention')[0]
            for proj, w in (('q_proj', wq), ('k_proj', wk), ('v_proj', wv)):
                w = rearrange(w, 'h gs d dim -> (h gs d) dim')
                # Clone so each projection is saved as an independent tensor
                # rather than (possibly) a view into the fused one.
                llama_states[f'{_prefix}self_attn.{proj}.weight'] = w.clone()
            continue

        for old, new in _KEY_RENAMES:
            if old in k:
                llama_states[k.replace(old, new)] = v
                break
        else:
            if 'tok_embeddings' in k:
                llama_states['model.embed_tokens.weight'] = v
            elif 'output' in k:
                llama_states['lm_head.weight'] = v
            else:
                llama_states[k] = v
    return llama_states


def convert(src, tgt):
    """Convert InternLM2 huggingface checkpoints to Llama-style.

    Every ``.bin`` / ``.safetensors`` file in ``src`` is loaded, its keys are
    remapped and the result is saved under the same file name in ``tgt``.
    A shard index (if present), the tokenizer and a Llama config are written
    to ``tgt`` as well.

    Args:
        src: Folder holding the InternLM2 huggingface checkpoint.
        tgt: Output folder; created if it does not exist.

    Raises:
        AssertionError: If the source config has ``bias`` enabled.
    """

    print('Convert InternLM2 huggingface checkpoints to Llama...')

    config = AutoConfig.from_pretrained(src, trust_remote_code=True)
    # Raised explicitly (instead of `assert`) so the check survives `-O`.
    if config.bias:
        raise AssertionError(
            'Cannot convert InternLM Model with bias to LLaMA.')

    head_dim = config.hidden_size // config.num_attention_heads
    num_key_value_groups = \
        config.num_attention_heads // config.num_key_value_heads

    index_file, index_dict, index_suffix = _load_index(src)

    os.makedirs(tgt, exist_ok=True)
    for filename in tqdm(os.listdir(src)):
        if not filename.endswith(('.bin', '.safetensors')):
            continue

        src_path = os.path.join(src, filename)
        tgt_path = os.path.join(tgt, filename)
        is_safetensors = filename.endswith('.safetensors')

        print(f'Loading {src_path}...', flush=True)
        states = weight_load(src_path, is_safetensors=is_safetensors)
        llama_states = _to_llama_states(states, head_dim,
                                        num_key_value_groups)
        del states

        # Only shards of the format the index describes belong in its map;
        # otherwise a folder holding both formats would yield an index that
        # points at files of the wrong type.
        if index_dict is not None and filename.endswith(index_suffix):
            for k in llama_states:
                index_dict['weight_map'][k] = filename

        print(f'Saving to {tgt_path}...', flush=True)
        if is_safetensors:
            from safetensors.torch import save_file
            save_file(llama_states, tgt_path, metadata={'format': 'pt'})
        else:
            torch.save(llama_states, tgt_path)

    print('Saving config and tokenizer...', flush=True)
    # index.json
    if index_dict is not None:
        with open(os.path.join(tgt, index_file), 'w',
                  encoding='utf-8') as fp:
            json.dump(index_dict, fp, indent=2)
    # tokenizer
    tokenizer = LlamaTokenizer.from_pretrained(src)
    # Drop the `auto_map` entry (if any) before saving the tokenizer.
    tokenizer.init_kwargs.pop('auto_map', None)
    tokenizer.save_pretrained(tgt)
    # config
    save_conifg(config, tgt)

    print('Done!', flush=True)


def parse_args():
    """Parse the command-line options of the converter.

    Returns:
        An ``argparse.Namespace`` with ``src`` (input folder) and ``tgt``
        (output folder).

    Both options are required so that a missing path is reported by argparse
    as a usage error instead of reaching the conversion code as ``None``.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('--src', type=str, required=True,
                        help='Input folder')
    parser.add_argument('--tgt', type=str, required=True,
                        help='Output folder')

    return parser.parse_args()


if __name__ == '__main__':
    # Script entry point: read --src / --tgt and run the conversion.
    cli_args = parse_args()
    convert(src=cli_args.src, tgt=cli_args.tgt)
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`# Copyright (c) InternLM. All rights reserved.`
			`import argparse`
			`import json`
			`import os`

			`import torch`
			`from einops import rearrange`
			`from tqdm import tqdm`
			`from transformers import AutoConfig, LlamaConfig, LlamaTokenizer`


[Tool]: Update tools/convert2llama.py to support `safetensors` format (#730) 2024-04-10 09:06:18 +00:00			`def weight_load(fp, **kwargs):`
			`"""Load weights from a file."""`
			`is_safetensors = kwargs.pop('is_safetensors', False)`

			`if is_safetensors:`
			`try:`
			`from safetensors import safe_open`
			`except ImportError:`
			`raise ImportError(`
			'Before loading ckpts in the `safetensors` format, '
			'please install the `safetensors` package first.')

			`model = safe_open(fp, framework='pt')`
			`state_dict = {}`
			`for k in model.keys():`
			`state_dict[k] = model.get_tensor(k)`
			`return state_dict`

			`else:`
			`return torch.load(fp, **kwargs)`


[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`def save_conifg(config, tgt):`
			`config_dict = config.to_dict()`
			`unnecessary_keys = [`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`'_name_or_path',`
			`'auto_map',`
			`'transformers_version',`
			`'model_type',`
			`'architectures',`
			`'tokenizer_class',`
			`'attn_implementation',`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`]`
			`for k in unnecessary_keys:`
			`config_dict.pop(k, None)`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`config_dict['attention_bias'] = config_dict.pop('bias')`
			`config_dict['architectures'] = ['LlamaForCausalLM']`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`llama_config = LlamaConfig(**config_dict)`
			`llama_config.save_pretrained(tgt)`


			`def convert(src, tgt):`
			`"""Convert InternLM2 huggingface checkpoints to Llama-style."""`

[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`print('Convert InternLM2 huggingface checkpoints to Llama...')`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00
			`config = AutoConfig.from_pretrained(src, trust_remote_code=True)`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`assert not config.bias, 'Cannot convert InternLM Model with bias to LLaMA.'`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00
			`head_dim = config.hidden_size // config.num_attention_heads`
[Update] InternLM2.5 (#752) Co-authored-by: zhangwenwei <zhangwenwei@pjlab.org.cn> Co-authored-by: ZwwWayne <wayne.zw@outlook.com> Co-authored-by: 张硕 <zhangshuo@pjlab.org.cn> Co-authored-by: zhangsongyang <zhangsongyang@pjlab.org.cn> Co-authored-by: 王子奕 <wangziyi@pjlab.org.cn> Co-authored-by: 曹巍瀚 <caoweihan@pjlab.org.cn> Co-authored-by: tonysy <sy.zhangbuaa@gmail.com> Co-authored-by: 李博文 <libowen@pjlab.org.cn> 2024-07-03 12:28:08 +00:00			`num_key_value_groups = \`
			`config.num_attention_heads // config.num_key_value_heads`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00
			`# load index json file`
[Tool]: Update tools/convert2llama.py to support `safetensors` format (#730) 2024-04-10 09:06:18 +00:00			`index_file = 'pytorch_model.bin.index.json'`
			`if os.path.exists(os.path.join(src, index_file)):`
			`with open(os.path.join(src, index_file)) as fp:`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`index_dict = json.load(fp)`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`index_dict['weight_map'] = {}`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`else:`
[Tool]: Update tools/convert2llama.py to support `safetensors` format (#730) 2024-04-10 09:06:18 +00:00			`index_file = 'model.safetensors.index.json'`
			`if os.path.exists(os.path.join(src, index_file)):`
			`with open(os.path.join(src, index_file)) as fp:`
			`index_dict = json.load(fp)`
			`index_dict['weight_map'] = {}`
			`else:`
			`index_dict = None`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00
			`os.makedirs(tgt, exist_ok=True)`
			`for filename in tqdm(os.listdir(src)):`
[Tool]: Update tools/convert2llama.py to support `safetensors` format (#730) 2024-04-10 09:06:18 +00:00			`if not any(filename.endswith(ext) for ext in ('.bin', '.safetensors')):`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`continue`
[Tool]: Update tools/convert2llama.py to support `safetensors` format (#730) 2024-04-10 09:06:18 +00:00
			`print(f'Loading {os.path.join(src, filename)}...', flush=True)`
			`states = weight_load(os.path.join(src, filename),`
			`is_safetensors=filename.endswith('.safetensors'))`

[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`llama_states = {}`
			`for k, v in states.copy().items():`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`if 'wqkv' in k:`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`v = rearrange(`
			`v,`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`'(h gs d) dim -> h gs d dim',`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`gs=2 + num_key_value_groups,`
			`d=head_dim,`
			`)`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`wq, wk, wv = torch.split(v, [num_key_value_groups, 1, 1],`
			`dim=1)`
			`wq = rearrange(wq, 'h gs d dim -> (h gs d) dim')`
			`wk = rearrange(wk, 'h gs d dim -> (h gs d) dim')`
			`wv = rearrange(wv, 'h gs d dim -> (h gs d) dim')`
			`_prefix = k.split('attention')[0]`
			`wq_key = _prefix + 'self_attn.q_proj.weight'`
			`wk_key = _prefix + 'self_attn.k_proj.weight'`
			`wv_key = _prefix + 'self_attn.v_proj.weight'`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`llama_states[wq_key] = wq.clone()`
			`llama_states[wk_key] = wk.clone()`
			`llama_states[wv_key] = wv.clone()`

[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`elif 'attention.wo' in k:`
			`new_k = k.replace('attention.wo', 'self_attn.o_proj')`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`llama_states[new_k] = v`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`elif 'feed_forward.w1' in k:`
			`new_k = k.replace('feed_forward.w1', 'mlp.gate_proj')`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`llama_states[new_k] = v`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`elif 'feed_forward.w2' in k:`
			`new_k = k.replace('feed_forward.w2', 'mlp.down_proj')`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`llama_states[new_k] = v`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`elif 'feed_forward.w3' in k:`
			`new_k = k.replace('feed_forward.w3', 'mlp.up_proj')`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`llama_states[new_k] = v`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`elif 'attention_norm' in k:`
			`new_k = k.replace('attention_norm', 'input_layernorm')`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`llama_states[new_k] = v`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`elif 'ffn_norm' in k:`
			`new_k = k.replace('ffn_norm', 'post_attention_layernorm')`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`llama_states[new_k] = v`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`elif 'tok_embeddings' in k:`
			`llama_states['model.embed_tokens.weight'] = v`
			`elif 'output' in k:`
			`llama_states['lm_head.weight'] = v`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`else:`
			`llama_states[k] = v`

			`if index_dict is not None:`
			`for k in llama_states:`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`index_dict['weight_map'][k] = filename`
[Tool]: Update tools/convert2llama.py to support `safetensors` format (#730) 2024-04-10 09:06:18 +00:00
			`print(f'Saving to {os.path.join(tgt, filename)}...', flush=True)`
[Tool]: Fix the issue of safetensors conversion LLama error (#732) 2024-04-11 06:54:55 +00:00			`if filename.endswith('.safetensors'):`
			`from safetensors.torch import save_file`
[Update] InternLM2.5 (#752) Co-authored-by: zhangwenwei <zhangwenwei@pjlab.org.cn> Co-authored-by: ZwwWayne <wayne.zw@outlook.com> Co-authored-by: 张硕 <zhangshuo@pjlab.org.cn> Co-authored-by: zhangsongyang <zhangsongyang@pjlab.org.cn> Co-authored-by: 王子奕 <wangziyi@pjlab.org.cn> Co-authored-by: 曹巍瀚 <caoweihan@pjlab.org.cn> Co-authored-by: tonysy <sy.zhangbuaa@gmail.com> Co-authored-by: 李博文 <libowen@pjlab.org.cn> 2024-07-03 12:28:08 +00:00			`save_file(llama_states,`
			`os.path.join(tgt, filename),`
			`metadata={'format': 'pt'})`
[Tool]: Fix the issue of safetensors conversion LLama error (#732) 2024-04-11 06:54:55 +00:00			`else:`
			`torch.save(llama_states, os.path.join(tgt, filename))`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`del states`

[Tool]: Update tools/convert2llama.py to support `safetensors` format (#730) 2024-04-10 09:06:18 +00:00			`print('Saving config and tokenizer...', flush=True)`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`# index.json`
			`if index_dict is not None:`
[Tool]: Update tools/convert2llama.py to support `safetensors` format (#730) 2024-04-10 09:06:18 +00:00			`with open(os.path.join(tgt, index_file), 'w') as fp:`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`json.dump(index_dict, fp, indent=2)`
			`# tokenizer`
			`tokenizer = LlamaTokenizer.from_pretrained(src)`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`tokenizer.init_kwargs.pop('auto_map', None)`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`tokenizer.save_pretrained(tgt)`
			`# config`
			`save_conifg(config, tgt)`
[Tool]: Update tools/convert2llama.py to support `safetensors` format (#730) 2024-04-10 09:06:18 +00:00
			`print('Done!', flush=True)`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00

			`def parse_args():`
			`parser = argparse.ArgumentParser()`
[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`parser.add_argument('--src', type=str, help='Input folder')`
			`parser.add_argument('--tgt', type=str, help='Output folder')`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00
			`args = parser.parse_args()`

			`return args`


[CI]: fix and pass pre-commit hook (#666) 2024-01-26 09:26:04 +00:00			`if __name__ == '__main__':`
[Tool]: Support converting InternLM2 to Llama format (#627) Co-authored-by: x54-729 <whxiaohao@163.com> 2024-01-19 11:47:28 +00:00			`args = parse_args()`

			`convert(args.src, args.tgt)`