Skip to content

Commit

Permalink
Add homophones and other exceptions
Browse files Browse the repository at this point in the history
  • Loading branch information
ibleaman committed Jan 24, 2024
1 parent 1629d8a commit e37a6ca
Show file tree
Hide file tree
Showing 3 changed files with 12 additions and 2 deletions.
2 changes: 1 addition & 1 deletion LICENSE.md
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
- Copyright 2021-2023 Isaac L. Bleaman
+ Copyright 2021-2024 Isaac L. Bleaman

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

Expand Down
2 changes: 1 addition & 1 deletion setup.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@

setup(
name='yiddish',
- version='0.0.15',
+ version='0.0.16',
author='Isaac L. Bleaman',
author_email='[email protected]',
description='A Python library for processing Yiddish text',
Expand Down
10 changes: 10 additions & 0 deletions yiddish/yiddish.py
Original file line number Diff line number Diff line change
Expand Up @@ -260,6 +260,7 @@ def transliterate(string, loshn_koydesh=False):
(r'\bumeydel', 'אומאײדעל'), # אומאײדעלע
(r'\bureynikl', 'אוראײניקל'),
(r'\bbaayn', 'באַאײַנ'), # באַאײַנדרוקן, באַאײַנפֿלוסן
(r'\bbaumr', 'באַאומר'), # באַאומרויִקן
(r'geayn', 'געאײַנ'), # געאײַנפֿלוסט
(r'tsuayn', 'צואײַנ'),
(r'durkhayl', 'דורכאײַל'), # דורכאײַלן
Expand All @@ -279,6 +280,7 @@ def transliterate(string, loshn_koydesh=False):
(r'\bforur', 'פֿאָראור'), # פֿאָראורטל
(r'\bfaribl', 'פֿאַראיבל'),
(r'\bfarinteres', 'פֿאַראינטערעס'), # פֿאַראינטערעסירן
(r'\bvoltst', 'װאָלטסט'),

# ay != ײַ
(r'\brayon\b', 'ראַיאָן'),
Expand Down Expand Up @@ -325,6 +327,7 @@ def transliterate(string, loshn_koydesh=False):
(r'umloyal', 'אומלאָיאַל'),
(r'loyal', 'לאָיאַל'),
(r'paranoye', 'פּאַראַנאָיע'),
(r'poyezd', 'פּאָיעזד'),

# ts != צ
(r'tstu\b', 'טסטו'),
Expand All @@ -349,6 +352,7 @@ def transliterate(string, loshn_koydesh=False):
(r'\brekhts\b', 'רעכטס'),
(r'du shatst', 'דו שאַטסט'), # cf. ער שאַצט
(r'\bforverts\b', 'פֿאָרװערטס'),
(r'\bayngemakhts', 'אײַנגעמאַכטס'),

# kh != כ
(r'\bpikhol', 'פּיקהאָל'), # פּיקהאָלץ, פּיקהאָלצן
Expand All @@ -372,20 +376,26 @@ def transliterate(string, loshn_koydesh=False):
'דינע',
'װײס',
'װעסט',
'זאַל',
'זאָל',
'טאָמער',
'טו',
'לױט',
'לײען',
'מאָגן',
'מאַסע',
'מאַן',
'מוטער',
'מײַנע',
'מע',
'נעמען',
'עלעף',
'עמער',
'פּױלן',
'קעלער',
'קעץ',
'קערן',
'רוס',
'שװאַך',
'שיִער',
'שנײ',
Expand Down

0 comments on commit e37a6ca

Please sign in to comment.