'''
Created on 22/07/2010
@Created by: Muhammad Altabba
'''
from Models.Lexicon.RootsAndPatternsRepository import *;
from Models.Lexicon.SpecialWords.StandAloneParticle import *;
from Models.Lexicon.SpecialWords.ProperNoun import *;
from Controllers.TextEntities.TextEncapsulator import *;
from Controllers.TextEntities.Word import *;
from Controllers.Tokenization.Tokenizer import *;
from Controllers.Normalization.Normalizer import *;
from Controllers.Morphology.AffixParser import *;
from Controllers.Morphology.MorphologicalAnalyzer import *;
import codecs;
import io;
# Test driver: loads the clitic transducer definitions, runs tokenization,
# normalization and clitic parsing over a sample text file, then prints the
# clitic analysis between two separator lines.

# Paths are relative to the current working directory.
procliticsXmlFile = '../../Data/MorphologyTransducers/Proclitics.xml'
encliticsXmlFile = '../../Data/MorphologyTransducers/Enclitics.xml'

text = TextEncapsulator()
# Only the proclitics/enclitics files are supplied; the remaining four
# arguments are passed as None.
# NOTE(review): presumably None means "do not load that resource" - confirm
# against TextEncapsulator.LoadFromFiles.
text.LoadFromFiles(None, None,
                   procliticsXmlFile, encliticsXmlFile,
                   None,
                   None)

# The with-block guarantees the file is closed even if read() raises.
with codecs.open('../../Data/Cliticalization_test.txt', 'r', 'utf-8') as f:
    string = f.read()

text.String = string
text.Tokenize()
# NOTE(review): the meaning of the argument 2 is defined by
# TextEncapsulator.Normalize - confirm there.
text.Normalize(2)
text.ParseClitics()

print('---------------------------------------------------------------------------')
text.PrintForClitics()
print('---------------------------------------------------------------------------')
|