yerang committed on
Commit
e86dc78
1 Parent(s): 3b6df21

Upload 29 files

Browse files
Files changed (29) hide show
  1. stf/.DS_Store +0 -0
  2. stf/TEMP/.DS_Store +3 -0
  3. stf/TEMP/Cam2_2309071202_0012_Natural_Looped.mp4 +3 -0
  4. stf/TEMP/front_config_v3.json +3 -0
  5. stf/TEMP/ref.jpg +3 -0
  6. stf/convert.py +20 -0
  7. stf/front_config.json +19 -0
  8. stf/front_config_v3.json +25 -0
  9. stf/nasilhong_f.jpg +0 -0
  10. stf/temp.mp4 +0 -0
  11. stf/templates/front_one_piece_dress_nodded_cut.webm +3 -0
  12. stf/test.py +30 -0
  13. stf/works/.DS_Store +0 -0
  14. stf/works/preprocess/.DS_Store +0 -0
  15. stf/works/preprocess/Ian_v3_front/.DS_Store +3 -0
  16. stf/works/preprocess/Ian_v3_front/Cam2_2309071202_0012_Natural_Looped.zip +3 -0
  17. stf/works/preprocess/Ian_v3_front/crop_video_Cam2_2309071202_0012_Natural_Looped.zip +3 -0
  18. stf/works/preprocess/Ian_v3_front/df_anchor_i/Cam2_2309071202_0012_Natural_Looped_000.pickle +3 -0
  19. stf/works/preprocess/Ian_v3_front/df_face_info/Cam2_2309071202_0012_Natural_Looped.pickle +3 -0
  20. stf/works/preprocess/Ian_v3_front/metadata.json +3 -0
  21. stf/works/preprocess/nasilhong_f_v1_front/.DS_Store +3 -0
  22. stf/works/preprocess/nasilhong_f_v1_front/crop_video_front_one_piece_dress_nodded_cut.zip +3 -0
  23. stf/works/preprocess/nasilhong_f_v1_front/df_anchor_i/front_golf_wear_nodded_cut_000.pickle +3 -0
  24. stf/works/preprocess/nasilhong_f_v1_front/df_anchor_i/front_one_piece_dress_nodded_cut_000.pickle +3 -0
  25. stf/works/preprocess/nasilhong_f_v1_front/df_face_info/front_golf_wear_nodded_cut.pickle +3 -0
  26. stf/works/preprocess/nasilhong_f_v1_front/df_face_info/front_one_piece_dress_nodded_cut.pickle +3 -0
  27. stf/works/preprocess/nasilhong_f_v1_front/front_golf_wear_nodded_cut.webm +3 -0
  28. stf/works/preprocess/nasilhong_f_v1_front/front_one_piece_dress_nodded_cut.zip +3 -0
  29. stf/works/preprocess/nasilhong_f_v1_front/metadata.json +3 -0
stf/.DS_Store ADDED
Binary file (10.2 kB). View file
 
stf/TEMP/.DS_Store ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d65165279105ca6773180500688df4bdc69a2c7b771752f0a46ef120b7fd8ec3
3
+ size 6148
stf/TEMP/Cam2_2309071202_0012_Natural_Looped.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fed2d0f258d12caf91e35e0aeb5d7117fc21af282d2e6ed7f0437348079bece1
3
+ size 231354130
stf/TEMP/front_config_v3.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93b430287a06ce92cbb21a5cb96f576a0dea77cfd30c7b5ec3f8fbb6eea68b5e
3
+ size 521
stf/TEMP/ref.jpg ADDED

Git LFS Details

  • SHA256: 93c0efca983b94e18dab683e73db1a125c9bd35bef758a9c3c6b9f8e08b19265
  • Pointer size: 130 Bytes
  • Size of remote file: 36 kB
stf/convert.py ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ import numpy as np
3
+
4
def convert(src="mnist_cnn.pt", dst="mnist.npz"):
    """Convert a PyTorch state-dict checkpoint into a NumPy ``.npz`` archive.

    Every entry of the loaded mapping is moved to the CPU, converted to a
    NumPy array, reported on stdout as ``key shape`` and stored in the
    archive under its original key.

    Args:
        src: Path of the checkpoint read with ``torch.load``.
        dst: Path of the archive written with ``np.savez`` (NumPy appends
            ``.npz`` when the name does not already end with it).
    """
    # SECURITY: torch.load unpickles the file; only use it on trusted
    # checkpoints. map_location="cpu" lets checkpoints that were saved from
    # a GPU load on hosts without one.
    state_dict = torch.load(src, map_location="cpu")

    # detach() keeps the conversion working for entries that still require
    # grad (e.g. raw parameters), where Tensor.numpy() would otherwise raise.
    arrays = {
        key: value.detach().cpu().numpy() for key, value in state_dict.items()
    }

    for key, value in arrays.items():
        print(key, value.shape)

    np.savez(dst, **arrays)
15
+
16
def main():
    """Script entry point: run the checkpoint conversion."""
    convert()


# Only convert when executed directly, not when imported as a module.
if __name__ == "__main__":
    main()
stf/front_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "nasilhong_f_v1_front",
3
+ "batch_size": 16,
4
+ "num_workers": 16,
5
+ "mel_step_size": 108,
6
+ "mel_ps": 80,
7
+ "img_size": 352,
8
+ "mask_ver": "pwb_front_v39_1_2",
9
+ "num_ips": 2,
10
+ "mask_img_trsf_ver": 0,
11
+ "mel_trsf_ver": -1,
12
+ "mel_norm_ver": -1,
13
+ "lr": 1,
14
+ "crop_offset_y": 0.08,
15
+ "crop_margin": 0.35,
16
+ "crop_start_frame": 3,
17
+ "model_type": "stf_v3"
18
+ }
19
+
stf/front_config_v3.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "Ian_v3_front",
3
+ "batch_size": 16,
4
+ "num_workers": 16,
5
+ "mel_step_size": 108,
6
+ "mel_ps": 80,
7
+ "img_size": 352,
8
+ "mask_ver": "pwb_front_v39_1_wide",
9
+ "num_ips": 2,
10
+ "mask_img_trsf_ver": 0,
11
+ "mel_trsf_ver": -1,
12
+ "mel_norm_ver": -1,
13
+ "lr": 1,
14
+ "crop_offset_y": 0.08,
15
+ "crop_margin": 0.35,
16
+ "crop_start_frame": 3,
17
+ "model_type":"stf_v3",
18
+ "compose":"compose_smooth",
19
+ "image_resize":"True",
20
+ "compose_box": "face_only",
21
+ "compose_args": {
22
+ "blur_ratio": 0.3,
23
+ "dilate_ratio": 0.3
24
+ }
25
+ }
stf/nasilhong_f.jpg ADDED
stf/temp.mp4 ADDED
Binary file (77.4 kB). View file
 
stf/templates/front_one_piece_dress_nodded_cut.webm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f992d7c247e0b75995818d08b5e3a26ec117ccf4f47aac62bda126d444d29f2
3
+ size 12800728
stf/test.py ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
"""Time a faster-whisper ``large-v3`` transcription of one dummy LibriSpeech clip."""
from time import time

from datasets import load_dataset
from faster_whisper import WhisperModel

# Dummy LibriSpeech validation split; the dataset cache lives in the current directory.
ds = load_dataset("hf-internal-testing/librispeech_asr_dummy", "clean", split="validation", cache_dir=".")

# Model weights are likewise downloaded into the current directory.
model = WhisperModel("large-v3", device="cuda", compute_type="float16", download_root=".")

audio_sample = ds[0]["audio"]
waveform = audio_sample["array"]
# Kept for reference only; it is not passed to transcribe().
# NOTE(review): faster-whisper presumably assumes 16 kHz for raw arrays - confirm.
sampling_rate = audio_sample["sampling_rate"]

tic = time()
segments, info = model.transcribe(waveform, beam_size=5)
# transcribe() returns a lazy generator: decoding only runs while the
# segments are iterated, so consume them before stopping the timer.
segments = list(segments)
toc = time()

for segment in segments:
    print("[%.2fs -> %.2fs] %s" % (segment.start, segment.end, segment.text))
print(toc - tic)
stf/works/.DS_Store ADDED
Binary file (6.15 kB). View file
 
stf/works/preprocess/.DS_Store ADDED
Binary file (6.15 kB). View file
 
stf/works/preprocess/Ian_v3_front/.DS_Store ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2bab5852e3a44786fd245355a3533ec9d21267ec58697abca3a1f9bb552775b
3
+ size 6148
stf/works/preprocess/Ian_v3_front/Cam2_2309071202_0012_Natural_Looped.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52b01f710ebe61088b0a5f22b7c4b2490023d370acc783573d935a4cbdadb8db
3
+ size 511705088
stf/works/preprocess/Ian_v3_front/crop_video_Cam2_2309071202_0012_Natural_Looped.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df3c585610ab66e232ae971be8ed43ce472b9a792fad05b7826c4396d2c64b77
3
+ size 73588867
stf/works/preprocess/Ian_v3_front/df_anchor_i/Cam2_2309071202_0012_Natural_Looped_000.pickle ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:410850fc627f0c2cd6699f1825ccaee3e4a5ee26d54708e3bcceeeb511fd553e
3
+ size 31559
stf/works/preprocess/Ian_v3_front/df_face_info/Cam2_2309071202_0012_Natural_Looped.pickle ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c73c0b3704e01331bcd7ee7a0e5fab0d55823d9158f8b81fa46fd3dad3241ea1
3
+ size 117457
stf/works/preprocess/Ian_v3_front/metadata.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:615681285dec4805f5dd7886b7ee1c9a348ee0bb8efc38e91841bccf835bdccd
3
+ size 42
stf/works/preprocess/nasilhong_f_v1_front/.DS_Store ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c2786dddebbe68bf137be2a3005ceb4092317c279e75b605c5dc22ac16032e8
3
+ size 6148
stf/works/preprocess/nasilhong_f_v1_front/crop_video_front_one_piece_dress_nodded_cut.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bfefccf14d9b8411262eda85d2bac67679f7bd1015866a5fe8c92ae2a226a7d
3
+ size 242568709
stf/works/preprocess/nasilhong_f_v1_front/df_anchor_i/front_golf_wear_nodded_cut_000.pickle ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9371a6b8c525a2eb9f90ca286145c97143e76f546afe24aa99e61ca33b34dcee
3
+ size 38482
stf/works/preprocess/nasilhong_f_v1_front/df_anchor_i/front_one_piece_dress_nodded_cut_000.pickle ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd4704c0a9c32b22b14deac1e966127d5a2727d957cfb1547f88b68ea18abdae
3
+ size 38566
stf/works/preprocess/nasilhong_f_v1_front/df_face_info/front_golf_wear_nodded_cut.pickle ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44408b86e82431f50b069d3a3d408e62706f106f0d7e79bcd7118723cda145fc
3
+ size 143627
stf/works/preprocess/nasilhong_f_v1_front/df_face_info/front_one_piece_dress_nodded_cut.pickle ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05d953518ca36c9243168c56058b37a46aeb0cad940dec75cf0626ae75ec5f8f
3
+ size 143591
stf/works/preprocess/nasilhong_f_v1_front/front_golf_wear_nodded_cut.webm ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc3f6f0e5ab11b1db1c12fc397391e66b4152a0272b31528998b52fffc416fa9
3
+ size 12855848
stf/works/preprocess/nasilhong_f_v1_front/front_one_piece_dress_nodded_cut.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb6e8fe920cdd7132c3824579159a77dd79f0b1afa56ad37ce3263fb018f8927
3
+ size 902495052
stf/works/preprocess/nasilhong_f_v1_front/metadata.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06c2997fe0bba05ca3922fd09d0ce435fb175d94de722d4027a6f82bdfeb6946
3
+ size 42