Spaces:
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -14,6 +14,8 @@ from PIL import Image
|
|
| 14 |
from torchaudio.functional import resample
|
| 15 |
from os.path import join
|
| 16 |
|
|
|
|
|
|
|
| 17 |
from DenseAV.denseav.train import LitAVAligner
|
| 18 |
from DenseAV.denseav.plotting import plot_attention_video, plot_2head_attention_video, plot_feature_video
|
| 19 |
from DenseAV.denseav.shared import norm, crop_to_divisor, blur_dim
|
|
@@ -81,14 +83,14 @@ def process_video(video, model_option):
|
|
| 81 |
original_frames, audio, info = torchvision.io.read_video(video, end_pts=10, pts_unit='sec')
|
| 82 |
sample_rate = 16000
|
| 83 |
|
| 84 |
-
print("---"*20)
|
| 85 |
-
print(type(info["video_fps"]))
|
| 86 |
-
print("---"*20)
|
| 87 |
-
|
| 88 |
if info["audio_fps"] != sample_rate:
|
| 89 |
audio = resample(audio, info["audio_fps"], sample_rate)
|
| 90 |
audio = audio[0].unsqueeze(0)
|
| 91 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 92 |
img_transform = T.Compose([
|
| 93 |
T.Resize(load_size, Image.BILINEAR),
|
| 94 |
lambda x: crop_to_divisor(x, 8),
|
|
|
|
| 14 |
from torchaudio.functional import resample
|
| 15 |
from os.path import join
|
| 16 |
|
| 17 |
+
from fractions import Fraction
|
| 18 |
+
|
| 19 |
from DenseAV.denseav.train import LitAVAligner
|
| 20 |
from DenseAV.denseav.plotting import plot_attention_video, plot_2head_attention_video, plot_feature_video
|
| 21 |
from DenseAV.denseav.shared import norm, crop_to_divisor, blur_dim
|
|
|
|
| 83 |
original_frames, audio, info = torchvision.io.read_video(video, end_pts=10, pts_unit='sec')
|
| 84 |
sample_rate = 16000
|
| 85 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 86 |
if info["audio_fps"] != sample_rate:
|
| 87 |
audio = resample(audio, info["audio_fps"], sample_rate)
|
| 88 |
audio = audio[0].unsqueeze(0)
|
| 89 |
|
| 90 |
+
info["video_fps"] = Fraction(info["video_fps"]).limit_denominator(1000)
|
| 91 |
+
|
| 92 |
+
print(info["video_fps"].numerator)
|
| 93 |
+
|
| 94 |
img_transform = T.Compose([
|
| 95 |
T.Resize(load_size, Image.BILINEAR),
|
| 96 |
lambda x: crop_to_divisor(x, 8),
|