From cf8073eb420588e170f6430359afded42addbe6e Mon Sep 17 00:00:00 2001 From: Junyoung Park Date: Tue, 10 Dec 2024 16:37:58 +0900 Subject: [PATCH] [24/12/10] Implementation error on internvideo2_clip.py --- .DS_Store | Bin 0 -> 6148 bytes InternVideo2/.DS_Store | Bin 0 -> 6148 bytes .../multi_modality/models/internvideo2_clip.py | 10 ++++++---- 3 files changed, 6 insertions(+), 4 deletions(-) create mode 100644 .DS_Store create mode 100644 InternVideo2/.DS_Store diff --git a/.DS_Store b/.DS_Store new file mode 100644 index 0000000000000000000000000000000000000000..6eeded1515140e6de0d33e7b9dba5ab21605e1be GIT binary patch literal 6148 zcmeHK!EVz)5S?ueaaxdapb|o=WU1GvBo@$CT--D{RDvGrsvH0X8%JQ(^;U_~9HL0R z1K+~EAJTv63Eu2(rN(VVPYBT+Y4*+T&a<`8_O6GBL}#3|i5f)Y!Wo?qa5>@#QaNtTX^R_k0WEIJP!*4&!A?0yWt%1Ky6#dy?- zhVQv|AY~R`#!-Bj4krD^lO35CQJN2iijXD)q=Q~q+Uh0Z^*d%oa(fX%xyf?x4?Berli8Ss4&pAcJCB0Z>GC^ z?^bRXY!$Ey{7C`cA3Qi?V6fDvwhlC^1OPf1R)$#p`U5>400st2jTnImO$BPIFeQdC zm4nc9%m*gF)Trqs)SYo1b7x^H6k!Sv;i+^IfkxX}1*`(|3M}ewgU|oo?e+gW$@Z)Q zR)POY0pWDRZU;*;XX~}a@mcG^Kf&2Juhgh0Xv}e}0zQhL!j)mp;{X^KEHz>TW`6{f M47RZf{8a^h1F+1H)c^nh literal 0 HcmV?d00001 diff --git a/InternVideo2/.DS_Store b/InternVideo2/.DS_Store new file mode 100644 index 0000000000000000000000000000000000000000..aca79d1df3e8c7da33d5a61cadd255ebb264161d GIT binary patch literal 6148 zcmeHKO>fgc5S?vI<4{3!00|)>S>hU{NkoCF7dNB_4qR#k2a19nht#U;tzxGUiX! zM5;i+W5_|2$_O40XT>sL8Tj8B;BU7=F-aOcO&7l3J@hocDN&Pf=q)8QqI@au(^B3| zI-v=rR3N(#TVnJOeuBum#aeOiZ)&4yerooY&(Ud`TbBNgCjW& zim;gE-EjPhz2{P<(YYN)FOuQ3U%&N4W<{7}!?7wz;vrHFUnW^Br(HS8;#}1Ry2Gux zwSN8XY}VOscN*T#gVwy^&DxzuI}Pt~>*0J}b8p|@+CAtWrze^GptvG|{ZPpbgXi!O z#%~!q3&vS0vk~%mj2a!#KJ8JDo&lTSGhX8GE3$rEr%lSib%vEnY52z#c)wH)*UE}8 zVBS%8V@2j`r)e3m3|yW8-XAIwjK5LNm!sb|`K3l(PC`8yLEOpPQuq{Tg!lDV3C1}cI$lp@BjM# zzgT2F%YbFzN--duUeN1eO6F|6FgZSJJ?I-K3+I&@RS6n%94mv5;yX|!==0bB`UXpl Rh(PR*fTF=RmVtlDz;|A`l`jAQ literal 0 HcmV?d00001 diff --git a/InternVideo2/multi_modality/models/internvideo2_clip.py b/InternVideo2/multi_modality/models/internvideo2_clip.py index 45a465c..299ab63 100644 --- a/InternVideo2/multi_modality/models/internvideo2_clip.py +++ b/InternVideo2/multi_modality/models/internvideo2_clip.py @@ -228,12 +228,14 @@ def load_checkpoint(self, vision_ckpt_path=None, text_ckpt_path=None, extra_ckpt # load text_encoder logger.info(f"Load text_encoder checkpoint from {text_ckpt_path}") - test_ckpt = torch.load(text_ckpt_path, map_location='cpu') - if 'module' in test_ckpt.keys(): - test_ckpt = test_ckpt['module'] - for k, v in test_ckpt.items(): + text_ckpt = torch.load(text_ckpt_path, map_location='cpu') + if 'module' in text_ckpt.keys(): + text_ckpt = text_ckpt['module'] + for k, v in text_ckpt.items(): if k.startswith('transformer.') or k == 'text_projection': new_k = "text_encoder." + k + if ("q_proj" in k or "v_proj" in k) and "lora" not in k: + new_k = new_k.replace("_proj.", "_proj.base_layer.") else: continue new_ckpt[new_k] = v