vikramvasudevan committed on
Commit
cc0b1f9
·
verified ·
1 Parent(s): b1790fa

Upload folder using huggingface_hub

Browse files
modules/config/bhagavat_gita.py CHANGED
@@ -23,7 +23,7 @@ bhagavat_gita_config = {
23
  "word_by_word_native": "word_by_word_meaning",
24
  "translation": "translation",
25
  "author": lambda doc: f"Maharishi Vedvyas Ji",
26
- "chapter_name": "chapter_title",
27
  "relative_path": lambda doc: f"{doc.get("chapter_title","")}-{doc.get("relative_verse_number","")}",
28
  },
29
  "metadata_fields": [
 
23
  "word_by_word_native": "word_by_word_meaning",
24
  "translation": "translation",
25
  "author": lambda doc: f"Maharishi Vedvyas Ji",
26
+ # "chapter_name": "chapter_title",
27
  "relative_path": lambda doc: f"{doc.get("chapter_title","")}-{doc.get("relative_verse_number","")}",
28
  },
29
  "metadata_fields": [
modules/config/chathusloki.py CHANGED
@@ -16,7 +16,7 @@ chathusloki_config = {
16
  "transliteration": "sloka_english_transliteration",
17
  "word_by_word_native": "meaning",
18
  "author": lambda doc: f"Sri Aalavandhaar",
19
- "relative_path": lambda doc: f"Chathusloki-{doc.get("sloka_number","")}",
20
  },
21
  "metadata_fields": [
22
  {
 
16
  "transliteration": "sloka_english_transliteration",
17
  "word_by_word_native": "meaning",
18
  "author": lambda doc: f"Sri Aalavandhaar",
19
+ "relative_path": lambda doc: f"॥ चतुः श्लोकी ॥ {doc.get("sloka_number","")}",
20
  },
21
  "metadata_fields": [
22
  {
modules/config/divya_prabandham.py CHANGED
@@ -20,7 +20,7 @@ divya_prabandham_config = {
20
  "transliteration": "pasuram_en",
21
  "reference_link": "html_url",
22
  "author": "azhwar_name",
23
- "chapter_name": "prabandham_name",
24
  "relative_path": lambda doc: "-".join(
25
  filter(
26
  None,
 
20
  "transliteration": "pasuram_en",
21
  "reference_link": "html_url",
22
  "author": "azhwar_name",
23
+ # "chapter_name": "prabandham_name",
24
  "relative_path": lambda doc: "-".join(
25
  filter(
26
  None,
modules/config/kamba_ramayanam.py CHANGED
@@ -9,14 +9,14 @@ kamba_ramayanam_config = {
9
  "collection_name": "kamba_ramayanam",
10
  "unit": "chunk",
11
  "unit_field": "chunk_index",
12
- "field_mapping": {
13
- "chapter_name": lambda doc: f"{doc.get('kandam','')}",
14
- "title": lambda doc: f"{doc.get('padalam_ta','')} - {doc.get('padalam_en','')}".strip(),
15
- "author": lambda doc: "Kamban",
16
- "unit_index": "chunk_index",
17
- "verse": lambda doc: int(doc.get("verse_number", "0")),
18
- "relative_path": lambda doc: f"{doc.get('padalam_ta','')} - {doc.get('padalam_en','')}".strip(),
19
- },
20
  "metadata_fields": [
21
  {
22
  "name": "chunk_index",
 
9
  "collection_name": "kamba_ramayanam",
10
  "unit": "chunk",
11
  "unit_field": "chunk_index",
12
+ # "field_mapping": {
13
+ # "chapter_name": lambda doc: f"{doc.get('kandam','')}",
14
+ # "title": lambda doc: f"{doc.get('padalam_ta','')} - {doc.get('padalam_en','')}".strip(),
15
+ # "author": lambda doc: "Kamban",
16
+ # "unit_index": "chunk_index",
17
+ # "verse": lambda doc: int(doc.get("verse_number", "0")),
18
+ # "relative_path": lambda doc: f"{doc.get('padalam_ta','')} - {doc.get('padalam_en','')}".strip(),
19
+ # },
20
  "metadata_fields": [
21
  {
22
  "name": "chunk_index",
modules/config/katakam.py CHANGED
@@ -21,9 +21,9 @@ katakam_config = {
21
  else "॥ काठकम् ॥"
22
  ),
23
  "relative_path": lambda doc: (
24
- "-"
25
  if not doc.get("panchadhi") or doc.get("panchadhi") == "-"
26
- else f"{doc.get('prapaatakam')}.{doc.get('anuvakam')}.{doc.get('panchadhi_index')} || {doc.get('panchadhi_sa')} ||"
27
  ),
28
  },
29
  "metadata_fields": [
 
21
  else "॥ काठकम् ॥"
22
  ),
23
  "relative_path": lambda doc: (
24
+ "॥ काठकम् ॥"
25
  if not doc.get("panchadhi") or doc.get("panchadhi") == "-"
26
+ else f"॥ काठकम् ॥ {doc.get('prapaatakam')}.{doc.get('anuvakam')}.{doc.get('panchadhi_index')} || {doc.get('panchadhi_sa')} ||"
27
  ),
28
  },
29
  "metadata_fields": [
modules/config/pancha_sooktham.py CHANGED
@@ -17,7 +17,7 @@ pancha_sooktham_config = {
17
  "text": "sanskrit",
18
  "unit_index": "relative_verse_number",
19
  "transliteration": lambda doc: f"English: \n{doc.get('english')}\n\nதமிழ்: \n{doc.get('tamil')}\n\nతెలుగు: \n{doc.get('telugu')}\n\nಕನ್ನಡ: \n{doc.get('kannada')}",
20
- "chapter_name": "chapter_title",
21
  "relative_path": lambda doc: f"{doc.get('chapter_title',"")}-{doc.get('relative_verse_number',"")}",
22
  },
23
  "metadata_fields": [
 
17
  "text": "sanskrit",
18
  "unit_index": "relative_verse_number",
19
  "transliteration": lambda doc: f"English: \n{doc.get('english')}\n\nதமிழ்: \n{doc.get('tamil')}\n\nతెలుగు: \n{doc.get('telugu')}\n\nಕನ್ನಡ: \n{doc.get('kannada')}",
20
+ # "chapter_name": "chapter_title",
21
  "relative_path": lambda doc: f"{doc.get('chapter_title',"")}-{doc.get('relative_verse_number',"")}",
22
  },
23
  "metadata_fields": [
modules/config/shanthi_panchakam.py CHANGED
@@ -18,8 +18,8 @@ shanthi_panchakam_config = {
18
  "text": "sanskrit",
19
  "unit_index": "relative_verse_number",
20
  "transliteration": lambda doc: f"English: \n{doc.get('english')}\n\nதமிழ்: \n{doc.get('tamil')}\n\nతెలుగు: \n{doc.get('telugu')}\n\nಕನ್ನಡ: \n{doc.get('kannada')}",
21
- "chapter_name": "chapter_title",
22
- "relative_path": lambda doc: f"{doc.get('chapter_title',"")}-{doc.get('relative_verse_number',"")}",
23
  },
24
  "metadata_fields": [
25
  {
 
18
  "text": "sanskrit",
19
  "unit_index": "relative_verse_number",
20
  "transliteration": lambda doc: f"English: \n{doc.get('english')}\n\nதமிழ்: \n{doc.get('tamil')}\n\nతెలుగు: \n{doc.get('telugu')}\n\nಕನ್ನಡ: \n{doc.get('kannada')}",
21
+ # "chapter_name": "chapter_title",
22
+ "relative_path": lambda doc: f"॥ शान्ति पञ्चकम् ॥ {doc.get('chapter_title')}.{doc.get('relative_verse_number',"")}",
23
  },
24
  "metadata_fields": [
25
  {
modules/config/sri_stavam.py CHANGED
@@ -13,12 +13,12 @@ sri_stavam_config = {
13
  "text": "sanskrit",
14
  "title": lambda doc: f"Verse {doc.get('sloka_number','')}",
15
  "unit_index": "sloka_number",
16
- "chapter" : "chapter",
17
  "transliteration": "transliteration",
18
  "word_by_word_native": "meaning_short",
19
  "translation" : "commentary",
20
  "author": lambda doc: "Sri Koorathazhwan" if 1 <= doc.get("sloka_number", 0) <= 11 else "-",
21
- "relative_path": lambda doc: f"Sri Stavam-{doc.get("sloka_number","")}" if 1 <= doc.get("sloka_number", 0) <= 11 else "-",
22
  },
23
  "metadata_fields": [
24
  {
 
13
  "text": "sanskrit",
14
  "title": lambda doc: f"Verse {doc.get('sloka_number','')}",
15
  "unit_index": "sloka_number",
16
+ "chapter_name" : "chapter",
17
  "transliteration": "transliteration",
18
  "word_by_word_native": "meaning_short",
19
  "translation" : "commentary",
20
  "author": lambda doc: "Sri Koorathazhwan" if 1 <= doc.get("sloka_number", 0) <= 11 else "-",
21
+ "relative_path": lambda doc: f" श्री:स्तव: ॥ {doc.get("sloka_number",'')}",
22
  },
23
  "metadata_fields": [
24
  {
modules/config/taitriya_brahmanam.py CHANGED
@@ -25,9 +25,9 @@ taitriya_brahmanam_config = {
25
  )
26
  ),
27
  "relative_path": lambda doc: (
28
- "-"
29
  if not doc.get("panchadhi") or doc.get("panchadhi") == "-"
30
- else f"{doc.get('ashtakam')}.{doc.get('prapaatakam')}.{doc.get('anuvakam')}.{doc.get('panchadhi_index')} || {doc.get('panchadhi_sa')} ||"
31
  ),
32
  },
33
  "metadata_fields": [
 
25
  )
26
  ),
27
  "relative_path": lambda doc: (
28
+ "॥ तैत्तिरीय-ब्राह्मणम् ॥"
29
  if not doc.get("panchadhi") or doc.get("panchadhi") == "-"
30
+ else f"॥ तैत्तिरीय-ब्राह्मणम् ॥ {doc.get('ashtakam')}.{doc.get('prapaatakam')}.{doc.get('anuvakam')}.{doc.get('panchadhi_index')} || {doc.get('panchadhi_sa')} ||"
31
  ),
32
  },
33
  "metadata_fields": [
modules/config/taitriya_samhitha.py CHANGED
@@ -25,9 +25,9 @@ taitriya_samhitha_config = {
25
  )
26
  ),
27
  "relative_path": lambda doc: (
28
- "-"
29
  if not doc.get("panchadhi") or doc.get("panchadhi") == "-"
30
- else f"{doc.get('kandam')}.{doc.get('prashnam')}.{doc.get('anuvakam')}.{doc.get('panchadhi_index')} || {doc.get('panchadhi_sa')} ||"
31
  ),
32
  },
33
  "metadata_fields": [
 
25
  )
26
  ),
27
  "relative_path": lambda doc: (
28
+ "॥ तैत्तिरीय-संहिता ॥"
29
  if not doc.get("panchadhi") or doc.get("panchadhi") == "-"
30
+ else f"॥ तैत्तिरीय-संहिता ॥ {doc.get('kandam')}.{doc.get('prashnam')}.{doc.get('anuvakam')}.{doc.get('panchadhi_index')} || {doc.get('panchadhi_sa')} ||"
31
  ),
32
  },
33
  "metadata_fields": [
modules/config/taitriya_upanishad.py CHANGED
@@ -18,8 +18,8 @@ taitriya_upanishad_config = {
18
  "text": "sanskrit",
19
  "unit_index": "relative_verse_number",
20
  "transliteration": lambda doc: f"English: \n{doc.get('english')}\n\nதமிழ்: \n{doc.get('tamil')}\n\nతెలుగు: \n{doc.get('telugu')}\n\nಕನ್ನಡ: \n{doc.get('kannada')}",
21
- "chapter_name": "chapter_title",
22
- "relative_path": lambda doc: f"{doc.get('chapter_title',"")}-{doc.get('relative_verse_number',"")}",
23
  },
24
  "metadata_fields": [
25
  {
 
18
  "text": "sanskrit",
19
  "unit_index": "relative_verse_number",
20
  "transliteration": lambda doc: f"English: \n{doc.get('english')}\n\nதமிழ்: \n{doc.get('tamil')}\n\nతెలుగు: \n{doc.get('telugu')}\n\nಕನ್ನಡ: \n{doc.get('kannada')}",
21
+ # "chapter_name": "chapter_title",
22
+ "relative_path": lambda doc: f"{doc.get('chapter_title')}{doc.get('relative_verse_number','')}",
23
  },
24
  "metadata_fields": [
25
  {
modules/config/vishnu_sahasranamam.py CHANGED
@@ -20,8 +20,8 @@ vishnu_sahasranamam_config = {
20
  "transliteration": "transliteration",
21
  "translation": "translation",
22
  "author": lambda doc: f"Sage Vyasa",
23
- "chapter_name": "chapter",
24
- "relative_path": lambda doc: f"{doc.get("chapter","")}-{doc.get("verse","")}",
25
  },
26
  "metadata_fields": [
27
  {
 
20
  "transliteration": "transliteration",
21
  "translation": "translation",
22
  "author": lambda doc: f"Sage Vyasa",
23
+ # "chapter_name": "chapter",
24
+ "relative_path": lambda doc: f"{doc.get("chapter","")}{doc.get("verse","")}",
25
  },
26
  "metadata_fields": [
27
  {
modules/config/yt_metadata.py CHANGED
@@ -11,7 +11,7 @@ yt_metadata_config = {
11
  "unit": "video",
12
  "field_mapping": {
13
  "text": "description",
14
- "title": "video_title",
15
  "author": "channel_title",
16
  "reference_link": lambda doc: f"https://www.youtube.com/watch?v={doc.get('video_id','')}",
17
  },
 
11
  "unit": "video",
12
  "field_mapping": {
13
  "text": "description",
14
+ "relative_path": "video_title",
15
  "author": "channel_title",
16
  "reference_link": lambda doc: f"https://www.youtube.com/watch?v={doc.get('video_id','')}",
17
  },