Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9,113 changes: 4,503 additions & 4,610 deletions scriptshifter/tables/data/bengali.yml → scriptshifter/tables/data/_bengali_base.yml

Large diffs are not rendered by default.

5 changes: 4 additions & 1 deletion scriptshifter/tables/data/_gurmukhi_base.yml
Original file line number Diff line number Diff line change
@@ -1,9 +1,12 @@
---
general:
name: Gurmukhi base
case_sensitive: false
description: Bidirectional base mapping for the Gurmukhi script.
version: 1.0.0
date: 2025-12-07
parents:
- _ignore_base
case_sensitive: false

roman_to_script:
# Nasalization hook has no value here. It must be added to the individual
Expand Down
7 changes: 7 additions & 0 deletions scriptshifter/tables/data/_ignore_base.yml
Original file line number Diff line number Diff line change
@@ -1,15 +1,22 @@
---
general:
name: Common ignore list.
description: List of Latin strings not converted.
version: 1.0.0
date: 2025-12-03

roman_to_script:
ignore:
- "At head of title"
- "at head of title"
- "Colophon"
- "colophon"
- "Cover title"
- "date of publication not identified"
- "place of publication not identified"
- "publisher not identified"
- "and one other"
- "and others"
- "et al."
ignore_ptn:
- "and ([a-z0-9]+ )?others"
Expand Down
18 changes: 18 additions & 0 deletions scriptshifter/tables/data/abazin_cyrillic.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,18 @@
---
general:
name: Abazin (Cyrillic)
description: Abazin language in the Cyrillic script
version: 1.0.0
date: 2025-11-29
parents:
- cyrillic_generic

roman_to_script:
map:
"H\u0307": "\u04C0"
"h\u0307": "\u04CF"

script_to_roman:
map:
"\u04C0": "H\u0307"
"\u04CF": "h\u0307"
176 changes: 96 additions & 80 deletions scriptshifter/tables/data/abkhaz_cyrillic.yml
Original file line number Diff line number Diff line change
@@ -1,80 +1,96 @@
general:
name: Abkhaz (Cyrillic)
parents:
- cyrillic_generic

roman_to_script:
map:
"T\uFE20S\uFE21\u0307": "\u04B4"
"T\uFE20s\uFE21\u0307": "\u04B4"
"t\uFE20s\uFE21\u0307": "\u04B5"
"T\uFE20\u0307S\uFE21": "\u04B4"
"T\uFE20\u0307s\uFE21": "\u04B4"
"t\uFE20\u0307s\uFE21": "\u04B5"
"T\u0307\uFE20S\uFE21": "\u04B4"
"T\u0307\uFE20s\uFE21": "\u04B4"
"t\u0307\uFE20s\uFE21": "\u04B5"
"C\u0301h\u0301": "\u04BE"
"C\u0301H\u0301": "\u04BE"
"c\u0301h\u0301": "\u04BF"
"C\u0301h": "\u04BC"
"C\u0301H": "\u04BC"
"c\u0301h": "\u04BD"
"C\u0307h": "\u04B6"
"C\u0307H": "\u04B6"
"c\u0307h": "\u04B7"
"D\uFE20Z\uFE21": "\u04E0"
"D\uFE20z\uFE21": "\u04E0"
"d\uFE20z\uFE21": "\u04E1"
"GH": "\u0494"
"Gh": "\u0494"
"gh": "\u0495"
"H\u0307": "\u04FC"
"h\u0307": "\u04FD"
"Kh": "\u04C3"
"KH": "\u04C3"
"kh": "\u04C4"
"PH": "\u0524"
"Ph": "\u0524"
"ph": "\u0525"
"W\u0307": "\u04D8"
"w\u0307": "\u04D9"
"J": "\u040F"
"j": "\u045F"
"Q": "\u049C"
"q": "\u049D"
"W": "\u04A8"
"w": "\u04A9"
"Z": "\u0417"
"z": "\u0437"

script_to_roman:
map:
"\u040F": "J"
"\u0417": "Z"
"\u0437": "z"
"\u045F": "j"
"\u0494": "GH"
"\u0495": "gh"
"\u049C": "Q"
"\u049D": "q"
"\u04A8": "W"
"\u04A9": "w"
"\u04B4": "T\uFE20S\uFE21\u0307"
"\u04B5": "t\uFE20s\uFE21\u0307"
"\u04B6": "C\u0307h"
"\u04B7": "c\u0307h"
"\u04BC": "C\u0301h"
"\u04BD": "c\u0301h"
"\u04BE": "C\u0301h\u0301"
"\u04BF": "c\u0301h\u0301"
"\u04C3": "Kh"
"\u04C4": "kh"
"\u04D8": "W\u0307"
"\u04D9": "w\u0307"
"\u04E0": "D\uFE20Z\uFE21"
"\u04E1": "d\uFE20z\uFE21"
"\u04FC": "H\u0307"
"\u04FD": "h\u0307"
"\u0524": "Ph"
"\u0525": "ph"
---
general:
name: Abkhaz (Cyrillic)
description: Abkhaz language in Cyrillic script
version: 1.0.0
date: 2025-11-29
parents:
- cyrillic_generic

roman_to_script:
map:
"T\uFE20S\uFE21\u0307": "\u04B4"
"T\u0361S\u0307": "\u04B4"
"T\uFE20s\uFE21\u0307": "\u04B4"
"T\u0361s\u0307": "\u04B4"
"t\uFE20s\uFE21\u0307": "\u04B5"
"t\u0361s\u0307": "\u04B5"
"T\uFE20\u0307S\uFE21": "\u04B4"
"T\u0361\u0307S": "\u04B4"
"T\uFE20\u0307s\uFE21": "\u04B4"
"T\u0361\u0307s": "\u04B4"
"t\uFE20\u0307s\uFE21": "\u04B5"
"t\u0361\u0307s": "\u04B5"
"T\u0307\uFE20S\uFE21": "\u04B4"
"T\u0307\u0361S": "\u04B4"
"T\u0307\uFE20s\uFE21": "\u04B4"
"T\u0307\u0361s": "\u04B4"
"t\u0307\uFE20s\uFE21": "\u04B5"
"t\u0307\u0361s": "\u04B5"
"C\u0301h\u0301": "\u04BE"
"C\u0301H\u0301": "\u04BE"
"c\u0301h\u0301": "\u04BF"
"C\u0301h": "\u04BC"
"C\u0301H": "\u04BC"
"c\u0301h": "\u04BD"
"C\u0307h": "\u04B6"
"C\u0307H": "\u04B6"
"c\u0307h": "\u04B7"
"D\uFE20Z\uFE21": "\u04E0"
"D\u0361Z": "\u04E0"
"D\uFE20z\uFE21": "\u04E0"
"D\u0361z": "\u04E0"
"d\uFE20z\uFE21": "\u04E1"
"d\u0361z": "\u04E1"
"GH": "\u0494"
"Gh": "\u0494"
"gh": "\u0495"
"H\u0307": "\u04FC"
"h\u0307": "\u04FD"
"Kh": "\u04C3"
"KH": "\u04C3"
"kh": "\u04C4"
"PH": "\u0524"
"Ph": "\u0524"
"ph": "\u0525"
"W\u0307": "\u04D8"
"w\u0307": "\u04D9"
"J": "\u040F"
"j": "\u045F"
"Q": "\u049C"
"q": "\u049D"
"W": "\u04A8"
"w": "\u04A9"
"Z": "\u0417"
"z": "\u0437"

script_to_roman:
map:
"\u040F": "J"
"\u0417": "Z"
"\u0437": "z"
"\u045F": "j"
"\u0494": "GH"
"\u0495": "gh"
"\u049C": "Q"
"\u049D": "q"
"\u04A8": "W"
"\u04A9": "w"
"\u04B4": "T\u0361S\u0307"
"\u04B5": "t\u0361s\u0307"
"\u04B6": "C\u0307h"
"\u04B7": "c\u0307h"
"\u04BC": "C\u0301h"
"\u04BD": "c\u0301h"
"\u04BE": "C\u0301h\u0301"
"\u04BF": "c\u0301h\u0301"
"\u04C3": "Kh"
"\u04C4": "kh"
"\u04D8": "W\u0307"
"\u04D9": "w\u0307"
"\u04E0": "D\u0361Z"
"\u04E1": "d\u0361z"
"\u04FC": "H\u0307"
"\u04FD": "h\u0307"
"\u0524": "Ph"
"\u0525": "ph"
18 changes: 18 additions & 0 deletions scriptshifter/tables/data/adygei_cyrillic.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,18 @@
---
general:
name: Adygei (Cyrillic)
description: Adygei language in the Cyrillic script
version: 1.0.0
date: 2025-11-29
parents:
- cyrillic_generic

roman_to_script:
map:
"H\u0307": "\u04C0"
"h\u0307": "\u04CF"

script_to_roman:
map:
"\u04C0": "H\u0307"
"\u04CF": "h\u0307"
61 changes: 34 additions & 27 deletions scriptshifter/tables/data/altai_cyrillic.yml
Original file line number Diff line number Diff line change
@@ -1,27 +1,34 @@
general:
name: Altai (Cyrillic)
parents:
- cyrillic_generic

roman_to_script:
map:
"N\uFE20G\uFE21": "\u04A4"
"N\uFE20g\uFE21": "\u04A4"
"n\uFE20g\uFE21": "\u04A5"
"D\u0301": "\u0408"
"d\u0301": "\u0458"
"O\u0307": "\u04E6"
"o\u0307": "\u04E7"
"U\u0307": "\u04F0"
"u\u0307": "\u04F1"

script_to_roman:
map:
"\u0408": "D\u0301"
"\u0458": "d\u0301"
"\u04A4": "N\uFE20G\uFE21"
"\u04A5": "n\uFE20g\uFE21"
"\u04E6": "O\u0307"
"\u04E7": "o\u0307"
"\u04F0": "U\u0307"
"\u04F1": "u\u0307"
---
general:
name: Altai (Cyrillic)
description: Altai language in Cyrillic script
version: 1.0.0
date: 2025-11-29
parents:
- cyrillic_generic

roman_to_script:
map:
"N\uFE20G\uFE21": "\u04A4"
"N\u0361G": "\u04A4"
"N\uFE20g\uFE21": "\u04A4"
"N\u0361g": "\u04A4"
"n\uFE20g\uFE21": "\u04A5"
"n\u0361g": "\u04A5"
"D\u0301": "\u0408"
"d\u0301": "\u0458"
"O\u0307": "\u04E6"
"o\u0307": "\u04E7"
"U\u0307": "\u04F0"
"u\u0307": "\u04F1"

script_to_roman:
map:
"\u0408": "D\u0301"
"\u0458": "d\u0301"
"\u04A4": "N\u0361G"
"\u04A5": "n\u0361g"
"\u04E6": "O\u0307"
"\u04E7": "o\u0307"
"\u04F0": "U\u0307"
"\u04F1": "u\u0307"
18 changes: 0 additions & 18 deletions scriptshifter/tables/data/amharic.yml

This file was deleted.

Loading