14 lines
364 B
Python
14 lines
364 B
Python
# -*- coding: utf-8 -*-
|
||
from pysbd.abbreviation_replacer import AbbreviationReplacer
|
||
from pysbd.lang.common import Common, Standard
|
||
|
||
class Urdu(Common, Standard):
    """Language settings for Urdu (ISO 639-1 code ``ur``).

    Inherits from ``Common`` and ``Standard`` and overrides the
    sentence-terminating punctuation, the sentence boundary pattern and the
    nested ``AbbreviationReplacer`` configuration.
    """

    iso_code = 'ur'

    # Sentence-ending marks: ASCII '?' and '!', plus the Arabic-script
    # full stop (U+06D4) and question mark (U+061F).
    Punctuations = ['?', '!', '۔', '؟']

    # First alternative: the shortest run of characters ending in one of the
    # four terminators above. Second alternative: the shortest run reaching
    # the end of the string, used when no terminator follows.
    SENTENCE_BOUNDARY_REGEX = r'.*?[۔؟!\?]|.*?$'

    class AbbreviationReplacer(AbbreviationReplacer):
        """Abbreviation replacer variant used for Urdu."""

        # Empty list: no sentence-starter words are configured here.
        # NOTE(review): presumably this overrides a non-empty default on the
        # imported base class -- confirm against pysbd.abbreviation_replacer.
        SENTENCE_STARTERS = []
|