mirror of
https://github.com/modelscope/FunASR
synced 2025-09-15 14:48:36 +08:00
add inference prepare func (#1848)
This commit is contained in:
parent
d9bdd0eb67
commit
e3eb52f8bf
@ -1241,7 +1241,8 @@ class LLMASR4(nn.Module):
|
||||
|
||||
return output
|
||||
|
||||
def inference(
|
||||
|
||||
def inference_prepare(
|
||||
self,
|
||||
data_in,
|
||||
data_lengths=None,
|
||||
@ -1319,6 +1320,22 @@ class LLMASR4(nn.Module):
|
||||
] = speech_token
|
||||
|
||||
speech_idx += 1
|
||||
return inputs_embeds, contents, batch, source_ids, meta_data
|
||||
|
||||
|
||||
def inference(
|
||||
self,
|
||||
data_in,
|
||||
data_lengths=None,
|
||||
key: list = None,
|
||||
tokenizer=None,
|
||||
frontend=None,
|
||||
**kwargs,
|
||||
):
|
||||
|
||||
inputs_embeds, contents, batch, source_ids, meta_data = self.inference_prepare(
|
||||
data_in, data_lengths, key, tokenizer, frontend, **kwargs
|
||||
)
|
||||
|
||||
llm_dtype = kwargs.get("llm_dtype", "fp32")
|
||||
if llm_dtype == "fp32":
|
||||
|
||||
Loading…
Reference in New Issue
Block a user