File size: 371 Bytes
d093ea4
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
# -*- coding: utf-8 -*-
from pysbd.abbreviation_replacer import AbbreviationReplacer
from pysbd.lang.common import Common, Standard

class Burmese(Common, Standard):
    """Language definition for Burmese (ISO 639-1 code ``my``).

    The class declares data only: a language code, the list of
    sentence-terminating characters, and the regex used to carve text
    into sentence-sized pieces. It defines no methods of its own, so any
    behaviour is inherited from ``Common`` and ``Standard``.
    """

    # Two-letter language code for this definition.
    iso_code = 'my'

    # Characters treated as sentence terminators. The same four characters
    # appear in the character class of SENTENCE_BOUNDARY_REGEX below; keep
    # the two in sync when editing either one.
    Punctuations = [
        '။',
        '၏',
        '?',
        '!',
    ]

    # Two alternatives, tried in order:
    #   1. the shortest run of characters ending in one of ။ ၏ ! ?
    #   2. otherwise, the shortest run of characters reaching `$`
    #      (so trailing text without a terminator is still matched).
    SENTENCE_BOUNDARY_REGEX = r'.*?[။၏!\?]|.*?$'

    class AbbreviationReplacer(AbbreviationReplacer):
        """Burmese variant of the imported ``AbbreviationReplacer``.

        Only ``SENTENCE_STARTERS`` is overridden; everything else is
        inherited from the base class of the same name.
        """

        # Empty on purpose: no sentence-starter words are declared here.
        # NOTE(review): presumably the base class uses this list to decide
        # whether a period after an abbreviation ends a sentence; confirm
        # against pysbd.abbreviation_replacer.
        SENTENCE_STARTERS = []