Hi Kaśyap,
This is a good idea, but I doubt there will be a single format that meets everyone's needs.
For the verses I give to my students, the data is stored in a JSON format (see below) that has proven both easy to generate from Google Documents and easy to modify manually, after the fact, if required. Some of the tagging is a bit idiosyncratic and not well standardized, and the glossing of compounds leaves something to be desired, but the grammatical information is stored in such a way as to make (automated) dictionary lookups and the use of Dhaval's Prakriyā generator straightforward.
Andrew
{
"data": {
"metadata": {
"title": "Śakuntalā",
"passage": "5.4",
"meter": "vasantatilakam",
"description": "Inexplicable nostalgia.",
"slug": "abhijna-5-4",
"tags": {
"syntax": [
"relative-correlative"
],
"nmorphology": [
"aD-antam",
"s-antam",
"u-antam"
],
"vmorphology": [
"LyaP",
"bhvādi",
"laṭ",
"parasmaipadam",
"cvi"
],
"compounds": [
"karmadhārayaḥ",
"vibhaktitatpuruṣaḥ"
]
},
"author": "Kālidāsaḥ"
},
"unanalyzed": {
"pada_a": "ramyāṇi vīkṣya madhurāṁś ca niśamya śabdān",
"pada_b": "paryutsukībhavati yat sukhitō ’pi jantuḥ",
"pada_c": "tac cētasā smarati nūnam abōdhapūrvaṁ",
"pada_d": "bhāvasthirāṇi jananāntarasauhr̥dāni "
},
"analyzed": [
{
"word": "ramyāṇi",
"meaning": {
"def": "pleasing, lovely"
},
"morphology": {
"class": "adj",
"stem": "ramya-",
"gender": "n",
"number": "pl",
"case": "2"
}
},
{
"word": "vīkṣya",
"meaning": {
"def": "having seen",
"note": "lyap suffix (converb/absolutive/gerund)"
},
"morphology": {
"class": "indecl"
}
},
{
"word": "madhurān",
"meaning": {
"def": "pleasant, charming"
},
"morphology": {
"class": "adj",
"stem": "madhura-",
"gender": "m",
"number": "pl",
"case": "2"
}
},
{
"word": "ca",
"meaning": {
"def": "and"
},
"morphology": {
"class": "particle"
}
},
{
"word": "niśamya",
"meaning": {
"def": "having heard",
"note": "lyap suffix (converb/absolutive/gerund)"
},
"morphology": {
"class": "indecl"
}
},
{
"word": "śabdān",
"meaning": {
"def": "sounds, words"
},
"morphology": {
"class": "noun",
"stem": "śabda-",
"gender": "m",
"number": "pl",
"case": "2"
}
},
{
"punct": "odd_pada"
},
{
"word": "paryutsukībhavati",
"meaning": {
"def": "he becomes sorrowful or regretful",
"note": "cvi suffix"
},
"morphology": {
"class": "verb",
"root": "bhū",
"gana": "bhvadi",
"person": "3rd",
"number": "sg",
"padam": "parasmai",
"l": "laṭ",
"preverb": "paryutsuka"
}
},
{
"word": "yat",
"meaning": {
"def": "which"
},
"morphology": {
"class": "pron",
"stem": "yad-",
"gender": "n",
"number": "sg",
"case": "1"
}
},
{
"word": "sukhitaḥ",
"meaning": {
"def": "happy"
},
"morphology": {
"class": "adj",
"stem": "sukhita-",
"gender": "m",
"number": "sg",
"case": "1"
}
},
{
"word": "api",
"meaning": {
"def": "even"
},
"morphology": {
"class": "particle"
}
},
{
"word": "jantuḥ",
"meaning": {
"def": "a person"
},
"morphology": {
"class": "noun",
"stem": "jantu-",
"gender": "m",
"number": "sg",
"case": "1"
}
},
{
"punct": "even_pada"
},
{
"word": "tat",
"meaning": {
"def": "that"
},
"morphology": {
"class": "pron",
"stem": "tad-",
"gender": "n",
"number": "sg",
"case": "1"
}
},
{
"word": "cētasā",
"meaning": {
"def": "by the mind"
},
"morphology": {
"class": "noun",
"stem": "cētas-",
"gender": "n",
"number": "sg",
"case": "3"
}
},
{
"word": "smarati",
"meaning": {
"def": "he remembers, recollects"
},
"morphology": {
"class": "verb",
"root": "smṛ",
"gana": "bhvadi",
"person": "3rd",
"number": "sg",
"padam": "parasmai",
"l": "laṭ",
"preverb": ""
}
},
{
"word": "nūnam",
"meaning": {
"def": "certainly"
},
"morphology": {
"class": "particle"
}
},
{
"word": "abōdha-pūrvam",
"meaning": {
"def": "previously unknowingly, in a manner that was unknown before ",
"note": "pūrvam na abōdhyata"
},
"morphology": {
"class": "adv"
},
"compound": {
"type": "k",
"head": "pūrvam",
"dep": "abōdham"
}
},
{
"punct": "odd_pada"
},
{
"word": "bhāva-sthirāṇi",
"meaning": {
"def": "fixed in the heart"
},
"morphology": {
"class": "adj",
"stem": "bhāvasthira-",
"gender": "n",
"number": "pl",
"case": "2"
},
"compound": {
"type": "t7",
"head": "sthirāṇi",
"dep": "bhāve"
}
},
{
"word": "janana-antara-sauhr̥dāni ",
"meaning": {
"def": "friendships from [previous] births"
},
"morphology": {
"class": "noun",
"stem": "sauhr̥da- ",
"gender": "n",
"number": "pl",
"case": "2"
},
"compound": {
"type": "t5",
"head": "sauhr̥dāni ",
"dep": "jananānām antarāt"
}
}
]
}
}