Ari Nubar Boyacıoğlu
add files
d093ea4
raw
history blame contribute delete
364 Bytes
# -*- coding: utf-8 -*-
from pysbd.abbreviation_replacer import AbbreviationReplacer
from pysbd.lang.common import Common, Standard
class Urdu(Common, Standard):
    """Language definition for Urdu.

    Combines the shared ``Common`` and ``Standard`` bases and overrides only
    the class-level constants declared below.
    """

    # Language code identifying this definition.
    iso_code = "ur"

    # First alternative: the shortest run of characters ending in one of
    # '۔', '؟', '!' or '?'. Second alternative: the shortest run reaching
    # the end-of-string anchor, which picks up text that has no terminator.
    SENTENCE_BOUNDARY_REGEX = r'.*?[۔؟!\?]|.*?$'

    # Sentence-ending marks: the two ASCII ones plus the Urdu full stop
    # and the Arabic question mark.
    # NOTE(review): the consumers of this list live outside this file.
    Punctuations = [
        '?',
        '!',
        '۔',
        '؟',
    ]

    class AbbreviationReplacer(AbbreviationReplacer):
        """Urdu-specific variant of the imported ``AbbreviationReplacer``.

        The base in the parentheses resolves to the module-level import,
        because this nested name is not yet bound while the class statement
        is being evaluated.
        """

        # No sentence-starter words are declared for Urdu.
        SENTENCE_STARTERS = []