Spaces:
Sleeping
Sleeping
Upload 29 files
Browse files- stf/.DS_Store +0 -0
- stf/TEMP/.DS_Store +3 -0
- stf/TEMP/Cam2_2309071202_0012_Natural_Looped.mp4 +3 -0
- stf/TEMP/front_config_v3.json +3 -0
- stf/TEMP/ref.jpg +3 -0
- stf/convert.py +20 -0
- stf/front_config.json +19 -0
- stf/front_config_v3.json +25 -0
- stf/nasilhong_f.jpg +0 -0
- stf/temp.mp4 +0 -0
- stf/templates/front_one_piece_dress_nodded_cut.webm +3 -0
- stf/test.py +30 -0
- stf/works/.DS_Store +0 -0
- stf/works/preprocess/.DS_Store +0 -0
- stf/works/preprocess/Ian_v3_front/.DS_Store +3 -0
- stf/works/preprocess/Ian_v3_front/Cam2_2309071202_0012_Natural_Looped.zip +3 -0
- stf/works/preprocess/Ian_v3_front/crop_video_Cam2_2309071202_0012_Natural_Looped.zip +3 -0
- stf/works/preprocess/Ian_v3_front/df_anchor_i/Cam2_2309071202_0012_Natural_Looped_000.pickle +3 -0
- stf/works/preprocess/Ian_v3_front/df_face_info/Cam2_2309071202_0012_Natural_Looped.pickle +3 -0
- stf/works/preprocess/Ian_v3_front/metadata.json +3 -0
- stf/works/preprocess/nasilhong_f_v1_front/.DS_Store +3 -0
- stf/works/preprocess/nasilhong_f_v1_front/crop_video_front_one_piece_dress_nodded_cut.zip +3 -0
- stf/works/preprocess/nasilhong_f_v1_front/df_anchor_i/front_golf_wear_nodded_cut_000.pickle +3 -0
- stf/works/preprocess/nasilhong_f_v1_front/df_anchor_i/front_one_piece_dress_nodded_cut_000.pickle +3 -0
- stf/works/preprocess/nasilhong_f_v1_front/df_face_info/front_golf_wear_nodded_cut.pickle +3 -0
- stf/works/preprocess/nasilhong_f_v1_front/df_face_info/front_one_piece_dress_nodded_cut.pickle +3 -0
- stf/works/preprocess/nasilhong_f_v1_front/front_golf_wear_nodded_cut.webm +3 -0
- stf/works/preprocess/nasilhong_f_v1_front/front_one_piece_dress_nodded_cut.zip +3 -0
- stf/works/preprocess/nasilhong_f_v1_front/metadata.json +3 -0
stf/.DS_Store
ADDED
Binary file (10.2 kB). View file
|
|
stf/TEMP/.DS_Store
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d65165279105ca6773180500688df4bdc69a2c7b771752f0a46ef120b7fd8ec3
|
3 |
+
size 6148
|
stf/TEMP/Cam2_2309071202_0012_Natural_Looped.mp4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fed2d0f258d12caf91e35e0aeb5d7117fc21af282d2e6ed7f0437348079bece1
|
3 |
+
size 231354130
|
stf/TEMP/front_config_v3.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93b430287a06ce92cbb21a5cb96f576a0dea77cfd30c7b5ec3f8fbb6eea68b5e
|
3 |
+
size 521
|
stf/TEMP/ref.jpg
ADDED
Git LFS Details
|
stf/convert.py
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import torch
|
2 |
+
import numpy as np
|
3 |
+
|
4 |
+
def convert():
|
5 |
+
state_dict = torch.load("mnist_cnn.pt")
|
6 |
+
|
7 |
+
tensor = {
|
8 |
+
key: tensor.cpu().numpy() for key, tensor in state_dict.items()
|
9 |
+
}
|
10 |
+
|
11 |
+
for key, value in tensor.items():
|
12 |
+
print(key, value.shape)
|
13 |
+
|
14 |
+
np.savez("mnist.npz", **tensor)
|
15 |
+
|
16 |
+
def main():
|
17 |
+
convert()
|
18 |
+
|
19 |
+
if __name__ == "__main__":
|
20 |
+
main()
|
stf/front_config.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "nasilhong_f_v1_front",
|
3 |
+
"batch_size": 16,
|
4 |
+
"num_workers": 16,
|
5 |
+
"mel_step_size": 108,
|
6 |
+
"mel_ps": 80,
|
7 |
+
"img_size": 352,
|
8 |
+
"mask_ver": "pwb_front_v39_1_2",
|
9 |
+
"num_ips": 2,
|
10 |
+
"mask_img_trsf_ver": 0,
|
11 |
+
"mel_trsf_ver": -1,
|
12 |
+
"mel_norm_ver": -1,
|
13 |
+
"lr": 1,
|
14 |
+
"crop_offset_y": 0.08,
|
15 |
+
"crop_margin": 0.35,
|
16 |
+
"crop_start_frame": 3,
|
17 |
+
"model_type": "stf_v3"
|
18 |
+
}
|
19 |
+
|
stf/front_config_v3.json
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"name": "Ian_v3_front",
|
3 |
+
"batch_size": 16,
|
4 |
+
"num_workers": 16,
|
5 |
+
"mel_step_size": 108,
|
6 |
+
"mel_ps": 80,
|
7 |
+
"img_size": 352,
|
8 |
+
"mask_ver": "pwb_front_v39_1_wide",
|
9 |
+
"num_ips": 2,
|
10 |
+
"mask_img_trsf_ver": 0,
|
11 |
+
"mel_trsf_ver": -1,
|
12 |
+
"mel_norm_ver": -1,
|
13 |
+
"lr": 1,
|
14 |
+
"crop_offset_y": 0.08,
|
15 |
+
"crop_margin": 0.35,
|
16 |
+
"crop_start_frame": 3,
|
17 |
+
"model_type":"stf_v3",
|
18 |
+
"compose":"compose_smooth",
|
19 |
+
"image_resize":"True",
|
20 |
+
"compose_box": "face_only",
|
21 |
+
"compose_args": {
|
22 |
+
"blur_ratio": 0.3,
|
23 |
+
"dilate_ratio": 0.3
|
24 |
+
}
|
25 |
+
}
|
stf/nasilhong_f.jpg
ADDED
stf/temp.mp4
ADDED
Binary file (77.4 kB). View file
|
|
stf/templates/front_one_piece_dress_nodded_cut.webm
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f992d7c247e0b75995818d08b5e3a26ec117ccf4f47aac62bda126d444d29f2
|
3 |
+
size 12800728
|
stf/test.py
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
from time import time
|
2 |
+
from datasets import load_dataset
|
3 |
+
from faster_whisper import WhisperModel
|
4 |
+
# from transformers import WhisperForConditionalGeneration, WhisperProcessor
|
5 |
+
|
6 |
+
ds = load_dataset("hf-internal-testing/librispeech_asr_dummy", "clean", split="validation", cache_dir=".")
|
7 |
+
|
8 |
+
# processor = WhisperProcessor.from_pretrained("openai/whisper-large-v3")
|
9 |
+
# model = WhisperForConditionalGeneration.from_pretrained("openai/whisper-large-v3").to("mps")
|
10 |
+
model = WhisperModel("large-v3", device="cuda", compute_type="float16", download_root=".")
|
11 |
+
|
12 |
+
audio_sample = ds[0]["audio"]
|
13 |
+
waveform = audio_sample["array"]
|
14 |
+
sampling_rate = audio_sample["sampling_rate"]
|
15 |
+
|
16 |
+
tic = time()
|
17 |
+
# input_features = processor(
|
18 |
+
# waveform, sampling_rate=sampling_rate, return_tensors="pt"
|
19 |
+
# ).input_features
|
20 |
+
segments, info = model.transcribe(waveform, beam_size=5)
|
21 |
+
# predicted_ids = model.generate(input_features.to("mps"))
|
22 |
+
|
23 |
+
# transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
|
24 |
+
|
25 |
+
toc = time()
|
26 |
+
|
27 |
+
# print(transcription[0])
|
28 |
+
for segment in segments:
|
29 |
+
print("[%.2fs -> %.2fs] %s" % (segment.start, segment.end, segment.text))
|
30 |
+
print(toc - tic)
|
stf/works/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
stf/works/preprocess/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
stf/works/preprocess/Ian_v3_front/.DS_Store
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2bab5852e3a44786fd245355a3533ec9d21267ec58697abca3a1f9bb552775b
|
3 |
+
size 6148
|
stf/works/preprocess/Ian_v3_front/Cam2_2309071202_0012_Natural_Looped.zip
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52b01f710ebe61088b0a5f22b7c4b2490023d370acc783573d935a4cbdadb8db
|
3 |
+
size 511705088
|
stf/works/preprocess/Ian_v3_front/crop_video_Cam2_2309071202_0012_Natural_Looped.zip
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df3c585610ab66e232ae971be8ed43ce472b9a792fad05b7826c4396d2c64b77
|
3 |
+
size 73588867
|
stf/works/preprocess/Ian_v3_front/df_anchor_i/Cam2_2309071202_0012_Natural_Looped_000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:410850fc627f0c2cd6699f1825ccaee3e4a5ee26d54708e3bcceeeb511fd553e
|
3 |
+
size 31559
|
stf/works/preprocess/Ian_v3_front/df_face_info/Cam2_2309071202_0012_Natural_Looped.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c73c0b3704e01331bcd7ee7a0e5fab0d55823d9158f8b81fa46fd3dad3241ea1
|
3 |
+
size 117457
|
stf/works/preprocess/Ian_v3_front/metadata.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:615681285dec4805f5dd7886b7ee1c9a348ee0bb8efc38e91841bccf835bdccd
|
3 |
+
size 42
|
stf/works/preprocess/nasilhong_f_v1_front/.DS_Store
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c2786dddebbe68bf137be2a3005ceb4092317c279e75b605c5dc22ac16032e8
|
3 |
+
size 6148
|
stf/works/preprocess/nasilhong_f_v1_front/crop_video_front_one_piece_dress_nodded_cut.zip
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bfefccf14d9b8411262eda85d2bac67679f7bd1015866a5fe8c92ae2a226a7d
|
3 |
+
size 242568709
|
stf/works/preprocess/nasilhong_f_v1_front/df_anchor_i/front_golf_wear_nodded_cut_000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9371a6b8c525a2eb9f90ca286145c97143e76f546afe24aa99e61ca33b34dcee
|
3 |
+
size 38482
|
stf/works/preprocess/nasilhong_f_v1_front/df_anchor_i/front_one_piece_dress_nodded_cut_000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd4704c0a9c32b22b14deac1e966127d5a2727d957cfb1547f88b68ea18abdae
|
3 |
+
size 38566
|
stf/works/preprocess/nasilhong_f_v1_front/df_face_info/front_golf_wear_nodded_cut.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44408b86e82431f50b069d3a3d408e62706f106f0d7e79bcd7118723cda145fc
|
3 |
+
size 143627
|
stf/works/preprocess/nasilhong_f_v1_front/df_face_info/front_one_piece_dress_nodded_cut.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05d953518ca36c9243168c56058b37a46aeb0cad940dec75cf0626ae75ec5f8f
|
3 |
+
size 143591
|
stf/works/preprocess/nasilhong_f_v1_front/front_golf_wear_nodded_cut.webm
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc3f6f0e5ab11b1db1c12fc397391e66b4152a0272b31528998b52fffc416fa9
|
3 |
+
size 12855848
|
stf/works/preprocess/nasilhong_f_v1_front/front_one_piece_dress_nodded_cut.zip
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb6e8fe920cdd7132c3824579159a77dd79f0b1afa56ad37ce3263fb018f8927
|
3 |
+
size 902495052
|
stf/works/preprocess/nasilhong_f_v1_front/metadata.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06c2997fe0bba05ca3922fd09d0ce435fb175d94de722d4027a6f82bdfeb6946
|
3 |
+
size 42
|