14 lines
364 B
Python
14 lines
364 B
Python
|
# -*- coding: utf-8 -*-
|
|||
|
from pysbd.abbreviation_replacer import AbbreviationReplacer
|
|||
|
from pysbd.lang.common import Common, Standard
|
|||
|
|
|||
|
class Urdu(Common, Standard):
    """Urdu-specific settings layered on top of ``Common`` and ``Standard``.

    Overrides the language code, the sentence-terminating punctuation
    marks, the sentence boundary pattern, and the abbreviation replacer's
    sentence starters.
    """

    # Language code for Urdu.
    iso_code = 'ur'

    # Marks treated as sentence-ending punctuation.
    Punctuations = [
        '?',  # ASCII question mark
        '!',  # ASCII exclamation mark
        '۔',  # U+06D4 ARABIC FULL STOP
        '؟',  # U+061F ARABIC QUESTION MARK
    ]

    # First alternative: the shortest run of characters ending in one of
    # the four marks above. Second alternative: a lazy run up to the `$`
    # anchor, which picks up trailing text that has no terminator.
    # NOTE(review): the flags used when this pattern is compiled are set
    # by the caller and are not visible here.
    SENTENCE_BOUNDARY_REGEX = r'.*?[۔؟!\?]|.*?$'

    class AbbreviationReplacer(AbbreviationReplacer):
        """Abbreviation replacer variant with no sentence starters."""

        # Deliberately empty for Urdu; how the base class consumes this
        # list is defined in pysbd.abbreviation_replacer.
        SENTENCE_STARTERS = []
|