# NOT RUN {
# Because extracting bg-en.tgz from the Europarl corpus is time consuming,
# the unzipped files have been temporarily made available at
# http://www.um.ac.ir/~sarmad/... .
# }
# NOT RUN {
# All four examples read the same pair of remote files, so the URLs are
# defined once and reused instead of being repeated in every call.
bg_url <- "http://www.um.ac.ir/~sarmad/word.a/euro.bg"
en_url <- "http://www.um.ac.ir/~sarmad/word.a/euro.en"

# align.ibm1 with n = 30 and the source-file encoding declared as UTF-8.
w1 <- align.ibm1(bg_url, en_url, n = 30, encode.sorc = "UTF-8")

# Same call with remove.pt = FALSE (presumably keeps punctuation marks in
# the text -- confirm against the align.ibm1 documentation).
w2 <- align.ibm1(
  bg_url, en_url,
  n = 30, encode.sorc = "UTF-8", remove.pt = FALSE
)

# align.symmet with n = 200, leaving `method` at its default.
S1 <- align.symmet(bg_url, en_url, n = 200, encode.sorc = "UTF-8")

# Same call, explicitly selecting method = "grow-diag".
S2 <- align.symmet(
  bg_url, en_url,
  n = 200, encode.sorc = "UTF-8", method = "grow-diag"
)
# }
# Run the code above in your browser using DataLab