funasr/datasets/llm_datasets/datasets.py
@@ -39,8 +39,7 @@ self.float_pad_value = float_pad_value self.prompt = kwargs.get("prompt", "Transcribe speech to text.") self.prompt_pre = "USER: \nINSTRUCTION: {}\nINPUT: ".format( self.prompt) # "USER: \nINSTRUCTION: {}\nnINPUT: {}\nASSISTANT: " self.prompt_pre = "USER: \nINSTRUCTION: {}\nINPUT: ".format(self.prompt) # "USER: \nINSTRUCTION: {}\nnINPUT: {}\nASSISTANT: " self.prompt_af = "" self.IGNORE_INDEX = kwargs.get("IGNORE_INDEX", -100) self.int_pad_value = self.IGNORE_INDEX