yuzaa commited on
Commit
e652c6b
·
1 Parent(s): b282589

add omni case for inference

Browse files
Files changed (3) hide show
  1. .gitattributes +1 -0
  2. README.md +6 -1
  3. assets/Skiing.mp4 +3 -0
.gitattributes CHANGED
@@ -37,3 +37,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
37
  *jpg filter=lfs diff=lfs merge=lfs -text
38
  *gif filter=lfs diff=lfs merge=lfs -text
39
  *.wav filter=lfs diff=lfs merge=lfs -text
 
 
37
  *jpg filter=lfs diff=lfs merge=lfs -text
38
  *gif filter=lfs diff=lfs merge=lfs -text
39
  *.wav filter=lfs diff=lfs merge=lfs -text
40
+ assets/Skiing.mp4 filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -1029,7 +1029,7 @@ def get_video_chunk_content(video_path, flatten=True):
1029
 
1030
  return contents
1031
 
1032
- video_path="/path/to/video"
1033
  # if use voice clone prompt, please set ref_audio
1034
  ref_audio_path = 'assets/demo.wav'
1035
  ref_audio, _ = librosa.load(ref_audio_path, sr=16000, mono=True)
@@ -1060,6 +1060,11 @@ res = model.chat(
1060
  return_dict=True
1061
  )
1062
  print(res)
 
 
 
 
 
1063
  ```
1064
  #### Streaming inference
1065
  ```python
 
1029
 
1030
  return contents
1031
 
1032
+ video_path="assets/Skiing.mp4"
1033
  # if use voice clone prompt, please set ref_audio
1034
  ref_audio_path = 'assets/demo.wav'
1035
  ref_audio, _ = librosa.load(ref_audio_path, sr=16000, mono=True)
 
1060
  return_dict=True
1061
  )
1062
  print(res)
1063
+
1064
+ ## You will get the answer: The person in the picture is skiing down a snowy slope.
1065
+ # import IPython
1066
+ # IPython.display.Audio('output.wav')
1067
+
1068
  ```
1069
  #### Streaming inference
1070
  ```python
assets/Skiing.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:479ace116d6ac92487ad90f415b3ef817cd019bba4521043ef0d5faaa1a8415d
3
+ size 8534409