Skip to content

Commit 3591556

Browse files
committed
sd
1 parent d4ca2c5 commit 3591556

File tree

7 files changed

+29
-17
lines changed

7 files changed

+29
-17
lines changed

audio_curation/scraping/youtube.py

+2 -1
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,8 @@
1919
'restrictfilenames': True,
2020
"nooverwrites": True,
2121
"continuedl": True,
22-
"outtmpl": {"default": "ST_%(upload_date)s_%(title).50s"}
22+
"outtmpl": {"default": "ST_%(upload_date)s_%(title).50s"},
23+
'ignoreerrors': True
2324
}
2425

2526

audio_curation_projects/shaastra_audio/archive_yt.py

+20 -9
Original file line number | Diff line number | Diff line change
@@ -9,7 +9,7 @@
99
from audio_utils import mp3_utility
1010
from audio_curation.scraping import youtube
1111

12-
UPANYASA_BASE = "/media/vvasuki/vData/audio/learning/upanyAsAH"
12+
ARCHIVE_BASE = "/media/vvasuki/vData/audio/curation/archive"
1313
YT_BASE = "/media/vvasuki/vData/audio/curation/archive/yt-curation"
1414
DESCRIPTION_BASE = """
1515
श्रवणसौकर्याय-रक्ष्यमाणम् अत्र।
@@ -19,18 +19,23 @@
1919
def shrii_vaishnava():
2020
# youtube.get_all(url="https://www.youtube.com/@Ramayanaforus/videos", dest_dir=os.path.join(YT_BASE, "duShyanth-shrIdhar-talks"), postprocessor_args={"metadata": {"albumartist": "dushyanth shrIdhar"}})
2121
# archive_utility.update_item(item_id="duShyanth-shrIdhar-talks", dir_path=os.path.join(YT_BASE, "duShyanth-shrIdhar-talks"))
22+
23+
24+
# youtube.get_all(url="https://www.youtube.com/@gspk/videos", dest_dir=os.path.join(YT_BASE, "gspk_stotra-pArAyaNa-kainkaryam"), postprocessor_args={"metadata": {"albumartist": "GSPK"}})
2225
# archive_utility.update_item(item_id="gspk_stotra-pArAyaNa-kainkaryam", dir_path=os.path.join(YT_BASE, "gspk_stotra-pArAyaNa-kainkaryam"))
2326

2427
# youtube.get_all(url="https://www.youtube.com/@ramanujadaya8750/videos", dest_dir=os.path.join(YT_BASE, "rAmAnuja-dayA"), postprocessor_args={"metadata": {"albumartist": "rAmAnuja-dayA"}})
2528
# archive_utility.update_item(item_id="rAmAnuja-dayA-audio", dir_path=os.path.join(YT_BASE, "rAmAnuja-dayA"))
29+
30+
2631
# archive_utility.update_item(item_id="tattva-muktA-kalApaH_ALvAr", dir_path=os.path.join(YT_BASE, "tattva-muktA-kalApaH_ALvAr"), metadata={"title": "tattva-muktA-kalApaH - ALvAr", "description": "तत्त्व-मुक्ता-कलापः - आळ्वार्-पाठः\n\n" + DESCRIPTION_BASE})
2732

2833
# youtube.get_all(url="https://www.youtube.com/@parankushacharinstituteofvedic/videos", dest_dir=os.path.join(YT_BASE, "PISV"), postprocessor_args={"metadata": {"albumartist": "pisvTalks"}})
2934
# archive_utility.update_item(item_id="pisvTalks", dir_path=os.path.join(YT_BASE, "PISV"), metadata={"title": "PISV Talks", "description": "पराङ्कुशाचार्य-वैदिक-शोध-संस्था-धारा-भाषणानि\n\n" + DESCRIPTION_BASE})
3035

3136

3237
# youtube.get_all(url="https://www.youtube.com/@desikadaily/videos", dest_dir=os.path.join(YT_BASE, "deshika-daily"), postprocessor_args={"metadata": {"albumartist": "deshika-daily"}})
33-
# archive_utility.update_item(item_id="deshika-daily", dir_path=os.path.join(YT_BASE, "deshika-daily"), metadata={"title": "deshika-daily talks", "description": "देशिक-दैनिक-धारा-भाषणानि\n\n" + DESCRIPTION_BASE})
38+
archive_utility.update_item(item_id="deshika-daily", dir_path=os.path.join(YT_BASE, "deshika-daily"), metadata={"title": "deshika-daily talks", "description": "देशिक-दैनिक-धारा-भाषणानि\n\n" + DESCRIPTION_BASE})
3439

3540
# youtube.get_all(url="https://www.youtube.com/playlist?list=PLFLowj4VMohUI_zCFA0ZadHDEARgm8J7B", dest_dir=os.path.join(YT_BASE, "nArAyaNAchArya/mbh"), postprocessor_args={"metadata": {"albumartist": "KS nArAyaNAchArya"}})
3641

@@ -40,10 +45,15 @@ def shrii_vaishnava():
4045
pass
4146

4247

43-
def naaTTeri():
44-
item = audio_archive_utility.ArchiveAudioItem(archive_id="natteri-guru-paramparA_tamiL")
45-
base_dir = os.path.join(UPANYASA_BASE, "nATTeri")
46-
item.download_original_files(destination_dir=base_dir)
48+
def naaTTeri(dry_run=False):
49+
archive_id = "natteri-guru-paramparA_tamiL"
50+
base_dir = os.path.join(ARCHIVE_BASE, "nATTeri")
51+
item = audio_archive_utility.ArchiveAudioItem(archive_id=archive_id, repo_base=base_dir)
52+
# archive_audio_item.update_metadata(metadata=metadata)
53+
# item.download_original_files(destination_dir=base_dir)
54+
item.update_from_dir(dry_run=dry_run)
55+
item.delete_unaccounted_for_files(all_files_or_dir=base_dir, dry_run=dry_run)
56+
4757

4858
def dhaarmika_lectureicts():
4959
pass
@@ -55,14 +65,15 @@ def dhaarmika_lectureicts():
5565

5666
def misc():
5767
pass
58-
archive_utility.update_item(item_id="paNDita-parichayaH", dir_path=os.path.join(YT_BASE, "../paNDita-parichayaH"))
68+
# archive_utility.update_item(item_id="paNDita-parichayaH", dir_path=os.path.join(YT_BASE, "../paNDita-parichayaH"))
69+
archive_utility.update_item(item_id="MA-lakShmI-tAtAchAryaH", dir_path=os.path.join(YT_BASE, "../paNDita-parichayaH/laxmI-tAtAryaH"))
5970
# archive_utility.update_item(item_id="vyAsarAja-maTha-lectures", dir_path=os.path.join(YT_BASE, "vyAsarAjamaTha"))
6071
# archive_utility.update_item(item_id="viShNu-purANa-taylor", dir_path=os.path.join(YT_BASE, "../viShNu-purANa-taylor"))
6172

6273

6374
if __name__ == "__main__":
6475
# shrii_vaishnava()
65-
# naaTTeri()
76+
naaTTeri(dry_run=False)
6677
# dhaarmika_lectures()
67-
misc()
78+
# misc()
6879
pass

audio_curation_projects/shaastra_audio/palaveri_misc.py

+2 -2
Original file line number | Diff line number | Diff line change
@@ -54,7 +54,7 @@ def rts():
5454

5555

5656
def tirukkural():
57-
repo = RepoBase(archive_id="laxmI-narasiMhaH_RTS", dir_path=os.path.join(BASE_DIR, "tiruk-kuraL"), album_id="tiruk-kuraL तिरुक्-कुरळ्", desc=f"{GENERIC_DESCRIPTION}\n\nतिरुक्-कुरळ्।")
57+
repo = RepoBase(archive_id="laxmI-narasiMhaH_tirukkuraL", dir_path=os.path.join(BASE_DIR, "tiruk-kuraL"), album_id="tiruk-kuraL तिरुक्-कुरळ्", desc=f"{GENERIC_DESCRIPTION}\n\nतिरुक्-कुरळ्।")
5858
repo.update_derivatives(dry_run=False)
5959
# archive_audio_item.update_metadata(metadata=NormalizedFilesRepo.metadata)
6060
repo.archive_audio_item.update_from_dir(file_patterns=["*.mp3"], overwrite_all=False)
@@ -78,7 +78,7 @@ def misc():
7878

7979
if __name__ == '__main__':
8080
# bhagavad_vishayam()
81-
rts()
81+
# rts()
8282
# tirukkural()
8383
# bs()
8484
# misc()

audio_curation_projects/veda/jaimini_paravastu/gopal_2014.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -72,7 +72,7 @@ def update_gopal_2014(dry_run=False):
7272
archive_audio_item.update_metadata(metadata=metadata)
7373
repo = Gopal2014RepoBase(repo_paths=[os.path.join("/home/vvasuki/veda-audio/jaiminIya-sAma-paravastu", "jaiminIya-sAma-gAna-paravastu-tradition-gopAla-2014")], archive_audio_item=archive_audio_item, git_remote_origin_basepath="[email protected]:veda-audio")
7474
repo.reprocess_files(mp3_files=repo.get_unnormalized_files(), update_git=False, dry_run=dry_run, normalize_files=False)
75-
repo.delete_unaccounted_for_files(all_files=repo.get_unnormalized_files(), dry_run=dry_run)
75+
repo.delete_unaccounted_for_files(all_files_or_dir=repo.get_unnormalized_files(), dry_run=dry_run)
7676
# gmusic_client.upload(mp3_files=repo.get_unnormalized_files(), dry_run=True)
7777

7878

audio_curation_projects/veda/jaimini_paravastu/gopal_2018.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -72,7 +72,7 @@ def update_gopal_2018(dry_run=False):
7272
archive_audio_item.update_metadata(metadata=metadata)
7373
repo = Gopal2018RepoBase(repo_paths=[os.path.join("/home/vvasuki/veda-audio/jaiminIya-sAma-paravastu", "jaiminIya-sAma-gAna-paravastu-tradition-gopAla-2018")], archive_audio_item=archive_audio_item, git_remote_origin_basepath="[email protected]:veda-audio")
7474
repo.reprocess_files(mp3_files=repo.get_unnormalized_files(), update_git=False, dry_run=dry_run, normalize_files=False)
75-
repo.delete_unaccounted_for_files(all_files=repo.get_unnormalized_files(), dry_run=dry_run)
75+
repo.delete_unaccounted_for_files(all_files_or_dir=repo.get_unnormalized_files(), dry_run=dry_run)
7676
# gmusic_client.upload(mp3_files=repo.get_unnormalized_files(), dry_run=True)
7777

7878

audio_curation_projects/veda/jaimini_paravastu/gopal_compilations.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -72,7 +72,7 @@ def update_gopal_compilation(dry_run=False):
7272
archive_audio_item.update_metadata(metadata=metadata)
7373
repo = GopalcompilationRepoBase(repo_paths=[os.path.join("/home/vvasuki/veda-audio/jaiminIya-sAma-paravastu", "jaiminIya-sAma-gAna-paravastu-tradition-gopAla-compilation")], archive_audio_item=archive_audio_item, git_remote_origin_basepath="[email protected]:veda-audio")
7474
repo.reprocess_files(mp3_files=repo.get_unnormalized_files(), update_git=False, dry_run=dry_run, normalize_files=False)
75-
repo.delete_unaccounted_for_files(all_files=repo.get_unnormalized_files(), dry_run=dry_run)
75+
repo.delete_unaccounted_for_files(all_files_or_dir=repo.get_unnormalized_files(), dry_run=dry_run)
7676
# gmusic_client.upload(mp3_files=repo.get_unnormalized_files(), dry_run=True)
7777

7878

audio_curation_projects/veda/rgveda.py

+2 -2
Original file line number | Diff line number | Diff line change
@@ -46,7 +46,7 @@ def update_rgveda_sriranga():
4646
# repo.update_git(collapse_history=False, first_push=True)
4747
# exit(1)
4848
repo.archive_item.update_metadata(metadata=metadata)
49-
# repo.archive_item.delete_unaccounted_for_files(all_files=repo.get_unnormalized_files())
49+
# repo.archive_item.delete_unaccounted_for_files(all_files_or_dir=repo.get_unnormalized_files())
5050
# repo.update_archive_item(mp3_files_in=repo.get_unnormalized_files(), overwrite_all=False)
5151

5252

@@ -68,7 +68,7 @@ def update_rgveda_auro():
6868
# repo.update_git(collapse_history=False, first_push=True)
6969
# exit(1)
7070
# repo.archive_item.update_metadata(metadata=metadata)
71-
# repo.archive_item.delete_unaccounted_for_files(all_files=repo.get_unnormalized_files())
71+
# repo.archive_item.delete_unaccounted_for_files(all_files_or_dir=repo.get_unnormalized_files())
7272

7373

7474
if __name__ == "__main__":

0 commit comments

Comments
 (0)