try
Browse files
meanaudio/model/utils/features_utils.py
CHANGED
@@ -63,8 +63,8 @@ class FeaturesUtils(nn.Module):
|
|
63 |
self.text_encoder = T5EncoderModel.from_pretrained('google/flan-t5-large').eval()
|
64 |
|
65 |
elif encoder_name == 't5_clap' or encoder_name == 't5_clap_cat':
|
66 |
-
self.tokenizer = AutoTokenizer.from_pretrained('google/flan-t5-large')
|
67 |
-
self.text_encoder = T5EncoderModel.from_pretrained('google/flan-t5-large').eval()
|
68 |
self.laion_clap_model = laion_clap.CLAP_Module(enable_fusion=False, amodel='HTSAT-base').eval()
|
69 |
self._clap_ckpt_path = "./weights/music_speech_audioset_epoch_15_esc_89.98.pt"
|
70 |
self.laion_clap_model.load_ckpt(self._clap_ckpt_path, verbose=False)
|
|
|
63 |
self.text_encoder = T5EncoderModel.from_pretrained('google/flan-t5-large').eval()
|
64 |
|
65 |
elif encoder_name == 't5_clap' or encoder_name == 't5_clap_cat':
|
66 |
+
self.tokenizer = AutoTokenizer.from_pretrained('google/flan-t5-large',revision="main")
|
67 |
+
self.text_encoder = T5EncoderModel.from_pretrained('google/flan-t5-large',revision="main").eval()
|
68 |
self.laion_clap_model = laion_clap.CLAP_Module(enable_fusion=False, amodel='HTSAT-base').eval()
|
69 |
self._clap_ckpt_path = "./weights/music_speech_audioset_epoch_15_esc_89.98.pt"
|
70 |
self.laion_clap_model.load_ckpt(self._clap_ckpt_path, verbose=False)
|